lp_rast.c revision 5e6a9005100ec2636ce9734a5e4535216494cf60
1d614ced756f2cca64ec83b122da4cd028c08c0ebJosé Fonseca/**************************************************************************
2d614ced756f2cca64ec83b122da4cd028c08c0ebJosé Fonseca *
3d614ced756f2cca64ec83b122da4cd028c08c0ebJosé Fonseca * Copyright 2009 VMware, Inc.
4d614ced756f2cca64ec83b122da4cd028c08c0ebJosé Fonseca * All Rights Reserved.
5d614ced756f2cca64ec83b122da4cd028c08c0ebJosé Fonseca *
6d614ced756f2cca64ec83b122da4cd028c08c0ebJosé Fonseca * Permission is hereby granted, free of charge, to any person obtaining a
7d614ced756f2cca64ec83b122da4cd028c08c0ebJosé Fonseca * copy of this software and associated documentation files (the
8d614ced756f2cca64ec83b122da4cd028c08c0ebJosé Fonseca * "Software"), to deal in the Software without restriction, including
9d614ced756f2cca64ec83b122da4cd028c08c0ebJosé Fonseca * without limitation the rights to use, copy, modify, merge, publish,
10d614ced756f2cca64ec83b122da4cd028c08c0ebJosé Fonseca * distribute, sub license, and/or sell copies of the Software, and to
11d614ced756f2cca64ec83b122da4cd028c08c0ebJosé Fonseca * permit persons to whom the Software is furnished to do so, subject to
12d614ced756f2cca64ec83b122da4cd028c08c0ebJosé Fonseca * the following conditions:
13d614ced756f2cca64ec83b122da4cd028c08c0ebJosé Fonseca *
14d614ced756f2cca64ec83b122da4cd028c08c0ebJosé Fonseca * The above copyright notice and this permission notice (including the
15d614ced756f2cca64ec83b122da4cd028c08c0ebJosé Fonseca * next paragraph) shall be included in all copies or substantial portions
16d614ced756f2cca64ec83b122da4cd028c08c0ebJosé Fonseca * of the Software.
17d614ced756f2cca64ec83b122da4cd028c08c0ebJosé Fonseca *
18d614ced756f2cca64ec83b122da4cd028c08c0ebJosé Fonseca * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
19d614ced756f2cca64ec83b122da4cd028c08c0ebJosé Fonseca * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
20d614ced756f2cca64ec83b122da4cd028c08c0ebJosé Fonseca * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT.
21d614ced756f2cca64ec83b122da4cd028c08c0ebJosé Fonseca * IN NO EVENT SHALL VMWARE AND/OR ITS SUPPLIERS BE LIABLE FOR
22d614ced756f2cca64ec83b122da4cd028c08c0ebJosé Fonseca * ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
23d614ced756f2cca64ec83b122da4cd028c08c0ebJosé Fonseca * TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
24d614ced756f2cca64ec83b122da4cd028c08c0ebJosé Fonseca * SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
25d614ced756f2cca64ec83b122da4cd028c08c0ebJosé Fonseca *
26d614ced756f2cca64ec83b122da4cd028c08c0ebJosé Fonseca **************************************************************************/
27d614ced756f2cca64ec83b122da4cd028c08c0ebJosé Fonseca
28ab9438193083b7f9a3180cb9cea45e269131048aBrian Paul#include <limits.h>
29d614ced756f2cca64ec83b122da4cd028c08c0ebJosé Fonseca#include "util/u_memory.h"
30aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul#include "util/u_math.h"
317f457acabcbeea6a27b4f375f55e318fff52445fJosé Fonseca#include "util/u_cpu_detect.h"
32156eabbaf996f471458ee2a69078674277b89067Brian Paul#include "util/u_surface.h"
33d614ced756f2cca64ec83b122da4cd028c08c0ebJosé Fonseca
34663750d5564a225b4720f7ee8bea93ffb309fc88Keith Whitwell#include "lp_scene_queue.h"
35a08d6302168341001003da32d42cfcff2311fa04Brian Paul#include "lp_debug.h"
364b70af918dd9040a6987c6a55e76e49f0e3f90bfBrian Paul#include "lp_fence.h"
374aeacdf8530d69d543cb2b997c1e65edb71ae01aBrian Paul#include "lp_perf.h"
38d614ced756f2cca64ec83b122da4cd028c08c0ebJosé Fonseca#include "lp_rast.h"
39921584181eb2f3b2849d150295dfce1dae25dd11José Fonseca#include "lp_rast_priv.h"
40921584181eb2f3b2849d150295dfce1dae25dd11José Fonseca#include "lp_tile_soa.h"
41c61bf363937f40624a5632745630d4f2b9907082Zack Rusin#include "gallivm/lp_bld_debug.h"
42663750d5564a225b4720f7ee8bea93ffb309fc88Keith Whitwell#include "lp_scene.h"
43d614ced756f2cca64ec83b122da4cd028c08c0ebJosé Fonseca
4489498d01531cd515c769e570bf799c39fbafc8fbKeith Whitwell
457505510c7b7c33f3c571647c0398da7e1b823806Brian Paul/**
467505510c7b7c33f3c571647c0398da7e1b823806Brian Paul * Begin the rasterization phase.
477505510c7b7c33f3c571647c0398da7e1b823806Brian Paul * Map the framebuffer surfaces.  Initialize the 'rast' state.
487505510c7b7c33f3c571647c0398da7e1b823806Brian Paul */
4901b1900084152dbacd4025a31ced25f75666ce59Brian Paulstatic boolean
5001b1900084152dbacd4025a31ced25f75666ce59Brian Paullp_rast_begin( struct lp_rasterizer *rast,
51156eabbaf996f471458ee2a69078674277b89067Brian Paul               const struct pipe_framebuffer_state *fb,
52156eabbaf996f471458ee2a69078674277b89067Brian Paul               boolean write_color,
53156eabbaf996f471458ee2a69078674277b89067Brian Paul               boolean write_zstencil )
5484ab7dcf48e87350c0622c533e51aa495f7256c2Keith Whitwell{
55e0e2008f1dcd73a59a184e0ef4c1dd77ac2a1cbfKeith Whitwell   struct pipe_screen *screen = rast->screen;
56156eabbaf996f471458ee2a69078674277b89067Brian Paul   struct pipe_surface *cbuf, *zsbuf;
57c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell   int i;
58e0e2008f1dcd73a59a184e0ef4c1dd77ac2a1cbfKeith Whitwell
59156eabbaf996f471458ee2a69078674277b89067Brian Paul   LP_DBG(DEBUG_RAST, "%s\n", __FUNCTION__);
604e1334ced68dd25b151250a44af25e8e0d5a33feKeith Whitwell
61156eabbaf996f471458ee2a69078674277b89067Brian Paul   util_copy_framebuffer_state(&rast->state.fb, fb);
62e0e2008f1dcd73a59a184e0ef4c1dd77ac2a1cbfKeith Whitwell
63e0e2008f1dcd73a59a184e0ef4c1dd77ac2a1cbfKeith Whitwell   rast->state.write_zstencil = write_zstencil;
64e0e2008f1dcd73a59a184e0ef4c1dd77ac2a1cbfKeith Whitwell   rast->state.write_color = write_color;
65e0e2008f1dcd73a59a184e0ef4c1dd77ac2a1cbfKeith Whitwell
66156eabbaf996f471458ee2a69078674277b89067Brian Paul   rast->check_for_clipped_tiles = (fb->width % TILE_SIZE != 0 ||
67156eabbaf996f471458ee2a69078674277b89067Brian Paul                                    fb->height % TILE_SIZE != 0);
6884ab7dcf48e87350c0622c533e51aa495f7256c2Keith Whitwell
69c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell
70c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell   for (i = 0; i < rast->state.fb.nr_cbufs; i++) {
71c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell      cbuf = rast->state.fb.cbufs[i];
72c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell      if (cbuf) {
73c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell	 rast->cbuf_transfer[i] = screen->get_tex_transfer(rast->screen,
74c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell							   cbuf->texture,
75c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell							   cbuf->face,
76c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell							   cbuf->level,
77c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell							   cbuf->zslice,
78c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell							   PIPE_TRANSFER_READ_WRITE,
79c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell							   0, 0,
80c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell							   cbuf->width,
81c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell							   cbuf->height);
82c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell	 if (!rast->cbuf_transfer[i])
83c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell	    goto fail;
84c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell
85c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell	 rast->cbuf_map[i] = screen->transfer_map(rast->screen,
86c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell						  rast->cbuf_transfer[i]);
87c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell	 if (!rast->cbuf_map[i])
88c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell	    goto fail;
89c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell      }
90e0e2008f1dcd73a59a184e0ef4c1dd77ac2a1cbfKeith Whitwell   }
914e1334ced68dd25b151250a44af25e8e0d5a33feKeith Whitwell
92156eabbaf996f471458ee2a69078674277b89067Brian Paul   zsbuf = rast->state.fb.zsbuf;
9351663f0506ed2534e57b798cdfaf8a0d376eb7a2Brian Paul   if (zsbuf) {
9451663f0506ed2534e57b798cdfaf8a0d376eb7a2Brian Paul      rast->zsbuf_transfer = screen->get_tex_transfer(rast->screen,
95156eabbaf996f471458ee2a69078674277b89067Brian Paul                                                      zsbuf->texture,
96156eabbaf996f471458ee2a69078674277b89067Brian Paul                                                      zsbuf->face,
97156eabbaf996f471458ee2a69078674277b89067Brian Paul                                                      zsbuf->level,
98156eabbaf996f471458ee2a69078674277b89067Brian Paul                                                      zsbuf->zslice,
99156eabbaf996f471458ee2a69078674277b89067Brian Paul                                                      PIPE_TRANSFER_READ_WRITE,
100156eabbaf996f471458ee2a69078674277b89067Brian Paul                                                      0, 0,
101c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell                                                      zsbuf->width,
102c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell						      zsbuf->height);
10351663f0506ed2534e57b798cdfaf8a0d376eb7a2Brian Paul      if (!rast->zsbuf_transfer)
104c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell         goto fail;
10551663f0506ed2534e57b798cdfaf8a0d376eb7a2Brian Paul
10651663f0506ed2534e57b798cdfaf8a0d376eb7a2Brian Paul      rast->zsbuf_map = screen->transfer_map(rast->screen,
10751663f0506ed2534e57b798cdfaf8a0d376eb7a2Brian Paul                                            rast->zsbuf_transfer);
10851663f0506ed2534e57b798cdfaf8a0d376eb7a2Brian Paul      if (!rast->zsbuf_map)
109c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell	 goto fail;
11051663f0506ed2534e57b798cdfaf8a0d376eb7a2Brian Paul   }
11151663f0506ed2534e57b798cdfaf8a0d376eb7a2Brian Paul
112e0e2008f1dcd73a59a184e0ef4c1dd77ac2a1cbfKeith Whitwell   return TRUE;
113c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell
114c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwellfail:
115c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell   /* Unmap and release transfers?
116c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell    */
117c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell   return FALSE;
1180718c7700533a965d7cd06b4f67b82bbae6e66a1Keith Whitwell}
1190718c7700533a965d7cd06b4f67b82bbae6e66a1Keith Whitwell
120e0e2008f1dcd73a59a184e0ef4c1dd77ac2a1cbfKeith Whitwell
1217505510c7b7c33f3c571647c0398da7e1b823806Brian Paul/**
1227505510c7b7c33f3c571647c0398da7e1b823806Brian Paul * Finish the rasterization phase.
1237505510c7b7c33f3c571647c0398da7e1b823806Brian Paul * Unmap framebuffer surfaces.
1247505510c7b7c33f3c571647c0398da7e1b823806Brian Paul */
12501b1900084152dbacd4025a31ced25f75666ce59Brian Paulstatic void
12601b1900084152dbacd4025a31ced25f75666ce59Brian Paullp_rast_end( struct lp_rasterizer *rast )
1270718c7700533a965d7cd06b4f67b82bbae6e66a1Keith Whitwell{
128e0e2008f1dcd73a59a184e0ef4c1dd77ac2a1cbfKeith Whitwell   struct pipe_screen *screen = rast->screen;
129c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell   unsigned i;
1304e1334ced68dd25b151250a44af25e8e0d5a33feKeith Whitwell
131c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell   for (i = 0; i < rast->state.fb.nr_cbufs; i++) {
132c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell      if (rast->cbuf_map[i])
133c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell	 screen->transfer_unmap(screen, rast->cbuf_transfer[i]);
134c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell
135c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell      if (rast->cbuf_transfer[i])
136c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell	 screen->tex_transfer_destroy(rast->cbuf_transfer[i]);
137c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell
138c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell      rast->cbuf_transfer[i] = NULL;
139c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell      rast->cbuf_map[i] = NULL;
140c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell   }
141e0e2008f1dcd73a59a184e0ef4c1dd77ac2a1cbfKeith Whitwell
142e0e2008f1dcd73a59a184e0ef4c1dd77ac2a1cbfKeith Whitwell   if (rast->zsbuf_map)
143e0e2008f1dcd73a59a184e0ef4c1dd77ac2a1cbfKeith Whitwell      screen->transfer_unmap(screen, rast->zsbuf_transfer);
144e0e2008f1dcd73a59a184e0ef4c1dd77ac2a1cbfKeith Whitwell
145e0e2008f1dcd73a59a184e0ef4c1dd77ac2a1cbfKeith Whitwell   if (rast->zsbuf_transfer)
14651663f0506ed2534e57b798cdfaf8a0d376eb7a2Brian Paul      screen->tex_transfer_destroy(rast->zsbuf_transfer);
147e0e2008f1dcd73a59a184e0ef4c1dd77ac2a1cbfKeith Whitwell
148e0e2008f1dcd73a59a184e0ef4c1dd77ac2a1cbfKeith Whitwell   rast->zsbuf_transfer = NULL;
149e0e2008f1dcd73a59a184e0ef4c1dd77ac2a1cbfKeith Whitwell   rast->zsbuf_map = NULL;
15089498d01531cd515c769e570bf799c39fbafc8fbKeith Whitwell}
15189498d01531cd515c769e570bf799c39fbafc8fbKeith Whitwell
152d0c918b87a9fb0e86d6b3efedf3ef505e04c527fKeith Whitwell
1537505510c7b7c33f3c571647c0398da7e1b823806Brian Paul/**
1547505510c7b7c33f3c571647c0398da7e1b823806Brian Paul * Begining rasterization of a tile.
1557505510c7b7c33f3c571647c0398da7e1b823806Brian Paul * \param x  window X position of the tile, in pixels
1567505510c7b7c33f3c571647c0398da7e1b823806Brian Paul * \param y  window Y position of the tile, in pixels
15789498d01531cd515c769e570bf799c39fbafc8fbKeith Whitwell */
158b533b56750aca8c7e8cb22af93a0fc2a0cfc0d97Brian Paulstatic void
159b533b56750aca8c7e8cb22af93a0fc2a0cfc0d97Brian Paullp_rast_start_tile( struct lp_rasterizer *rast,
1603a06c113c76355fc9622adfe7565c18d9787e9a8Brian Paul                    unsigned thread_index,
161b533b56750aca8c7e8cb22af93a0fc2a0cfc0d97Brian Paul                    unsigned x, unsigned y )
16289498d01531cd515c769e570bf799c39fbafc8fbKeith Whitwell{
163a08d6302168341001003da32d42cfcff2311fa04Brian Paul   LP_DBG(DEBUG_RAST, "%s %d,%d\n", __FUNCTION__, x, y);
1644e1334ced68dd25b151250a44af25e8e0d5a33feKeith Whitwell
1653a06c113c76355fc9622adfe7565c18d9787e9a8Brian Paul   rast->tasks[thread_index].x = x;
1663a06c113c76355fc9622adfe7565c18d9787e9a8Brian Paul   rast->tasks[thread_index].y = y;
16789498d01531cd515c769e570bf799c39fbafc8fbKeith Whitwell}
16889498d01531cd515c769e570bf799c39fbafc8fbKeith Whitwell
1697505510c7b7c33f3c571647c0398da7e1b823806Brian Paul
1707505510c7b7c33f3c571647c0398da7e1b823806Brian Paul/**
1717505510c7b7c33f3c571647c0398da7e1b823806Brian Paul * Clear the rasterizer's current color tile.
172ffd0759973165368ac8ce07d9bcffeb0acf88e6fBrian Paul * This is a bin command called during bin processing.
1737505510c7b7c33f3c571647c0398da7e1b823806Brian Paul */
174d0c918b87a9fb0e86d6b3efedf3ef505e04c527fKeith Whitwellvoid lp_rast_clear_color( struct lp_rasterizer *rast,
1753a06c113c76355fc9622adfe7565c18d9787e9a8Brian Paul                          unsigned thread_index,
1764cdd10cb4b60d85f6c231a26739f7d5e264a05e5Keith Whitwell                          const union lp_rast_cmd_arg arg )
17789498d01531cd515c769e570bf799c39fbafc8fbKeith Whitwell{
1784cdd10cb4b60d85f6c231a26739f7d5e264a05e5Keith Whitwell   const uint8_t *clear_color = arg.clear_color;
179c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell   uint8_t **color_tile = rast->tasks[thread_index].tile.color;
180c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell   unsigned i;
181c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell
182a08d6302168341001003da32d42cfcff2311fa04Brian Paul   LP_DBG(DEBUG_RAST, "%s 0x%x,0x%x,0x%x,0x%x\n", __FUNCTION__,
183295aea04895676aae5b67a7016c62bab8e40b996Keith Whitwell              clear_color[0],
184295aea04895676aae5b67a7016c62bab8e40b996Keith Whitwell              clear_color[1],
185295aea04895676aae5b67a7016c62bab8e40b996Keith Whitwell              clear_color[2],
186295aea04895676aae5b67a7016c62bab8e40b996Keith Whitwell              clear_color[3]);
1874e1334ced68dd25b151250a44af25e8e0d5a33feKeith Whitwell
18837b86aa55c6bb520997c00dbf1a2b38d4aed38ebJosé Fonseca   if (clear_color[0] == clear_color[1] &&
18937b86aa55c6bb520997c00dbf1a2b38d4aed38ebJosé Fonseca       clear_color[1] == clear_color[2] &&
19037b86aa55c6bb520997c00dbf1a2b38d4aed38ebJosé Fonseca       clear_color[2] == clear_color[3]) {
191f94a99170ecdc3286408b3628fbae9f45518007eBrian Paul      /* clear to grayscale value {x, x, x, x} */
192c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell      for (i = 0; i < rast->state.fb.nr_cbufs; i++) {
193c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell	 memset(color_tile[i], clear_color[0], TILE_SIZE * TILE_SIZE * 4);
194c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell      }
19537b86aa55c6bb520997c00dbf1a2b38d4aed38ebJosé Fonseca   }
19637b86aa55c6bb520997c00dbf1a2b38d4aed38ebJosé Fonseca   else {
197f94a99170ecdc3286408b3628fbae9f45518007eBrian Paul      /* Non-gray color.
198f94a99170ecdc3286408b3628fbae9f45518007eBrian Paul       * Note: if the swizzled tile layout changes (see TILE_PIXEL) this code
199f94a99170ecdc3286408b3628fbae9f45518007eBrian Paul       * will need to change.  It'll be pretty obvious when clearing no longer
200f94a99170ecdc3286408b3628fbae9f45518007eBrian Paul       * works.
201f94a99170ecdc3286408b3628fbae9f45518007eBrian Paul       */
202f94a99170ecdc3286408b3628fbae9f45518007eBrian Paul      const unsigned chunk = TILE_SIZE / 4;
203f94a99170ecdc3286408b3628fbae9f45518007eBrian Paul      for (i = 0; i < rast->state.fb.nr_cbufs; i++) {
204f94a99170ecdc3286408b3628fbae9f45518007eBrian Paul         uint8_t *c = color_tile[i];
205f94a99170ecdc3286408b3628fbae9f45518007eBrian Paul         unsigned j;
206f94a99170ecdc3286408b3628fbae9f45518007eBrian Paul         for (j = 0; j < 4 * TILE_SIZE; j++) {
207f94a99170ecdc3286408b3628fbae9f45518007eBrian Paul            memset(c, clear_color[0], chunk);
208f94a99170ecdc3286408b3628fbae9f45518007eBrian Paul            c += chunk;
209f94a99170ecdc3286408b3628fbae9f45518007eBrian Paul            memset(c, clear_color[1], chunk);
210f94a99170ecdc3286408b3628fbae9f45518007eBrian Paul            c += chunk;
211f94a99170ecdc3286408b3628fbae9f45518007eBrian Paul            memset(c, clear_color[2], chunk);
212f94a99170ecdc3286408b3628fbae9f45518007eBrian Paul            c += chunk;
213f94a99170ecdc3286408b3628fbae9f45518007eBrian Paul            memset(c, clear_color[3], chunk);
214f94a99170ecdc3286408b3628fbae9f45518007eBrian Paul            c += chunk;
215f94a99170ecdc3286408b3628fbae9f45518007eBrian Paul         }
216f94a99170ecdc3286408b3628fbae9f45518007eBrian Paul         assert(c - color_tile[i] == TILE_SIZE * TILE_SIZE * 4);
217f94a99170ecdc3286408b3628fbae9f45518007eBrian Paul      }
21837b86aa55c6bb520997c00dbf1a2b38d4aed38ebJosé Fonseca   }
2194aeacdf8530d69d543cb2b997c1e65edb71ae01aBrian Paul
2204aeacdf8530d69d543cb2b997c1e65edb71ae01aBrian Paul   LP_COUNT(nr_color_tile_clear);
22189498d01531cd515c769e570bf799c39fbafc8fbKeith Whitwell}
22289498d01531cd515c769e570bf799c39fbafc8fbKeith Whitwell
2237505510c7b7c33f3c571647c0398da7e1b823806Brian Paul
2247505510c7b7c33f3c571647c0398da7e1b823806Brian Paul/**
2257505510c7b7c33f3c571647c0398da7e1b823806Brian Paul * Clear the rasterizer's current z/stencil tile.
226ffd0759973165368ac8ce07d9bcffeb0acf88e6fBrian Paul * This is a bin command called during bin processing.
2277505510c7b7c33f3c571647c0398da7e1b823806Brian Paul */
228d0c918b87a9fb0e86d6b3efedf3ef505e04c527fKeith Whitwellvoid lp_rast_clear_zstencil( struct lp_rasterizer *rast,
2293a06c113c76355fc9622adfe7565c18d9787e9a8Brian Paul                             unsigned thread_index,
2304cdd10cb4b60d85f6c231a26739f7d5e264a05e5Keith Whitwell                             const union lp_rast_cmd_arg arg)
23189498d01531cd515c769e570bf799c39fbafc8fbKeith Whitwell{
2325e6a9005100ec2636ce9734a5e4535216494cf60José Fonseca   struct lp_rasterizer_task *task = &rast->tasks[thread_index];
2335e6a9005100ec2636ce9734a5e4535216494cf60José Fonseca   const unsigned tile_x = task->x;
2345e6a9005100ec2636ce9734a5e4535216494cf60José Fonseca   const unsigned tile_y = task->y;
2355e6a9005100ec2636ce9734a5e4535216494cf60José Fonseca   const unsigned height = TILE_SIZE/TILE_VECTOR_HEIGHT;
2365e6a9005100ec2636ce9734a5e4535216494cf60José Fonseca   const unsigned width = TILE_SIZE*TILE_VECTOR_HEIGHT;
2375e6a9005100ec2636ce9734a5e4535216494cf60José Fonseca   unsigned block_size = util_format_get_blocksize(rast->zsbuf_transfer->texture->format);
2385e6a9005100ec2636ce9734a5e4535216494cf60José Fonseca   uint8_t *dst;
2395e6a9005100ec2636ce9734a5e4535216494cf60José Fonseca   unsigned dst_stride = rast->zsbuf_transfer->stride*TILE_VECTOR_HEIGHT;
2405e6a9005100ec2636ce9734a5e4535216494cf60José Fonseca   unsigned i, j;
2415e6a9005100ec2636ce9734a5e4535216494cf60José Fonseca
242a08d6302168341001003da32d42cfcff2311fa04Brian Paul   LP_DBG(DEBUG_RAST, "%s 0x%x\n", __FUNCTION__, arg.clear_zstencil);
2434e1334ced68dd25b151250a44af25e8e0d5a33feKeith Whitwell
2445e6a9005100ec2636ce9734a5e4535216494cf60José Fonseca   assert(rast->zsbuf_map);
2455e6a9005100ec2636ce9734a5e4535216494cf60José Fonseca   if (!rast->zsbuf_map)
2465e6a9005100ec2636ce9734a5e4535216494cf60José Fonseca      return;
2475e6a9005100ec2636ce9734a5e4535216494cf60José Fonseca
2485e6a9005100ec2636ce9734a5e4535216494cf60José Fonseca   LP_DBG(DEBUG_RAST, "%s\n", __FUNCTION__);
2495e6a9005100ec2636ce9734a5e4535216494cf60José Fonseca
2505e6a9005100ec2636ce9734a5e4535216494cf60José Fonseca   /*
2515e6a9005100ec2636ce9734a5e4535216494cf60José Fonseca    * Clear the aera of the swizzled depth/depth buffer matching this tile, in
2525e6a9005100ec2636ce9734a5e4535216494cf60José Fonseca    * stripes of TILE_VECTOR_HEIGHT x TILE_SIZE at a time.
2535e6a9005100ec2636ce9734a5e4535216494cf60José Fonseca    *
2545e6a9005100ec2636ce9734a5e4535216494cf60José Fonseca    * The swizzled depth format is such that the depths for
2555e6a9005100ec2636ce9734a5e4535216494cf60José Fonseca    * TILE_VECTOR_HEIGHT x TILE_VECTOR_WIDTH pixels have consecutive offsets.
2565e6a9005100ec2636ce9734a5e4535216494cf60José Fonseca    */
2575e6a9005100ec2636ce9734a5e4535216494cf60José Fonseca
2585e6a9005100ec2636ce9734a5e4535216494cf60José Fonseca   dst = lp_rast_depth_pointer(rast, tile_x, tile_y);
2595e6a9005100ec2636ce9734a5e4535216494cf60José Fonseca
2605e6a9005100ec2636ce9734a5e4535216494cf60José Fonseca   switch (block_size) {
2615e6a9005100ec2636ce9734a5e4535216494cf60José Fonseca   case 1:
2625e6a9005100ec2636ce9734a5e4535216494cf60José Fonseca      memset(dst, (uint8_t) arg.clear_zstencil, height * width);
2635e6a9005100ec2636ce9734a5e4535216494cf60José Fonseca      break;
2645e6a9005100ec2636ce9734a5e4535216494cf60José Fonseca   case 2:
2655e6a9005100ec2636ce9734a5e4535216494cf60José Fonseca      for (i = 0; i < height; i++) {
2665e6a9005100ec2636ce9734a5e4535216494cf60José Fonseca         uint16_t *row = (uint16_t *)dst;
2675e6a9005100ec2636ce9734a5e4535216494cf60José Fonseca         for (j = 0; j < width; j++)
2685e6a9005100ec2636ce9734a5e4535216494cf60José Fonseca            *row++ = (uint16_t) arg.clear_zstencil;
2695e6a9005100ec2636ce9734a5e4535216494cf60José Fonseca         dst += dst_stride;
2705e6a9005100ec2636ce9734a5e4535216494cf60José Fonseca      }
2715e6a9005100ec2636ce9734a5e4535216494cf60José Fonseca      break;
2725e6a9005100ec2636ce9734a5e4535216494cf60José Fonseca   case 4:
2735e6a9005100ec2636ce9734a5e4535216494cf60José Fonseca      for (i = 0; i < height; i++) {
2745e6a9005100ec2636ce9734a5e4535216494cf60José Fonseca         uint32_t *row = (uint32_t *)dst;
2755e6a9005100ec2636ce9734a5e4535216494cf60José Fonseca         for (j = 0; j < width; j++)
2765e6a9005100ec2636ce9734a5e4535216494cf60José Fonseca            *row++ = arg.clear_zstencil;
2775e6a9005100ec2636ce9734a5e4535216494cf60José Fonseca         dst += dst_stride;
2785e6a9005100ec2636ce9734a5e4535216494cf60José Fonseca      }
2795e6a9005100ec2636ce9734a5e4535216494cf60José Fonseca      break;
2805e6a9005100ec2636ce9734a5e4535216494cf60José Fonseca   default:
2815e6a9005100ec2636ce9734a5e4535216494cf60José Fonseca         assert(0);
2825e6a9005100ec2636ce9734a5e4535216494cf60José Fonseca         break;
2835e6a9005100ec2636ce9734a5e4535216494cf60José Fonseca   }
28489498d01531cd515c769e570bf799c39fbafc8fbKeith Whitwell}
28589498d01531cd515c769e570bf799c39fbafc8fbKeith Whitwell
28689498d01531cd515c769e570bf799c39fbafc8fbKeith Whitwell
287ffd0759973165368ac8ce07d9bcffeb0acf88e6fBrian Paul/**
288ffd0759973165368ac8ce07d9bcffeb0acf88e6fBrian Paul * Load tile color from the framebuffer surface.
289ffd0759973165368ac8ce07d9bcffeb0acf88e6fBrian Paul * This is a bin command called during bin processing.
290ffd0759973165368ac8ce07d9bcffeb0acf88e6fBrian Paul */
291d0c918b87a9fb0e86d6b3efedf3ef505e04c527fKeith Whitwellvoid lp_rast_load_color( struct lp_rasterizer *rast,
2923a06c113c76355fc9622adfe7565c18d9787e9a8Brian Paul                         unsigned thread_index,
2934cdd10cb4b60d85f6c231a26739f7d5e264a05e5Keith Whitwell                         const union lp_rast_cmd_arg arg)
29489498d01531cd515c769e570bf799c39fbafc8fbKeith Whitwell{
29592dc0f92b0f0fa2f3e4ba832ef2232169ce19ce8Brian Paul   struct lp_rasterizer_task *task = &rast->tasks[thread_index];
29692dc0f92b0f0fa2f3e4ba832ef2232169ce19ce8Brian Paul   const unsigned x = task->x;
29792dc0f92b0f0fa2f3e4ba832ef2232169ce19ce8Brian Paul   const unsigned y = task->y;
298c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell   unsigned i;
29992dc0f92b0f0fa2f3e4ba832ef2232169ce19ce8Brian Paul
30092dc0f92b0f0fa2f3e4ba832ef2232169ce19ce8Brian Paul   LP_DBG(DEBUG_RAST, "%s at %u, %u\n", __FUNCTION__, x, y);
30192dc0f92b0f0fa2f3e4ba832ef2232169ce19ce8Brian Paul
302c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell   for (i = 0; i < rast->state.fb.nr_cbufs; i++) {
303c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell      struct pipe_transfer *transfer = rast->cbuf_transfer[i];
304c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell      int w = TILE_SIZE;
305c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell      int h = TILE_SIZE;
30692dc0f92b0f0fa2f3e4ba832ef2232169ce19ce8Brian Paul
307c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell      if (x >= transfer->width)
308c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell	 continue;
30992dc0f92b0f0fa2f3e4ba832ef2232169ce19ce8Brian Paul
310c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell      if (y >= transfer->height)
311c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell	 continue;
312c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell
313c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell      assert(w >= 0);
314c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell      assert(h >= 0);
315c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell      assert(w <= TILE_SIZE);
316c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell      assert(h <= TILE_SIZE);
317c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell
318c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell      lp_tile_read_4ub(transfer->texture->format,
319ec459f2aeca39e51f495cde455ba18d0a9489caaBrian Paul		       task->tile.color[i],
320c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell		       rast->cbuf_map[i],
321c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell		       transfer->stride,
322c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell		       x, y,
323c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell		       w, h);
3244aeacdf8530d69d543cb2b997c1e65edb71ae01aBrian Paul
3254aeacdf8530d69d543cb2b997c1e65edb71ae01aBrian Paul      LP_COUNT(nr_color_tile_load);
326c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell   }
32789498d01531cd515c769e570bf799c39fbafc8fbKeith Whitwell}
32889498d01531cd515c769e570bf799c39fbafc8fbKeith Whitwell
329ffd0759973165368ac8ce07d9bcffeb0acf88e6fBrian Paul
330ffd0759973165368ac8ce07d9bcffeb0acf88e6fBrian Paulvoid lp_rast_set_state( struct lp_rasterizer *rast,
3313a06c113c76355fc9622adfe7565c18d9787e9a8Brian Paul                        unsigned thread_index,
332ffd0759973165368ac8ce07d9bcffeb0acf88e6fBrian Paul                        const union lp_rast_cmd_arg arg )
333ffd0759973165368ac8ce07d9bcffeb0acf88e6fBrian Paul{
334e2f46344560f8f1193b311ad41883011e67eea00Brian Paul   const struct lp_rast_state *state = arg.set_state;
335e2f46344560f8f1193b311ad41883011e67eea00Brian Paul
336a08d6302168341001003da32d42cfcff2311fa04Brian Paul   LP_DBG(DEBUG_RAST, "%s %p\n", __FUNCTION__, (void *) state);
337ffd0759973165368ac8ce07d9bcffeb0acf88e6fBrian Paul
338b1659b9213f3eeee440590dfe379f0d193948307Brian Paul   /* just set the current state pointer for this rasterizer */
3393a06c113c76355fc9622adfe7565c18d9787e9a8Brian Paul   rast->tasks[thread_index].current_state = state;
340ffd0759973165368ac8ce07d9bcffeb0acf88e6fBrian Paul}
341ffd0759973165368ac8ce07d9bcffeb0acf88e6fBrian Paul
342ffd0759973165368ac8ce07d9bcffeb0acf88e6fBrian Paul
343ffd0759973165368ac8ce07d9bcffeb0acf88e6fBrian Paul
344ffd0759973165368ac8ce07d9bcffeb0acf88e6fBrian Paul/**
345ffd0759973165368ac8ce07d9bcffeb0acf88e6fBrian Paul * Run the shader on all blocks in a tile.  This is used when a tile is
346ffd0759973165368ac8ce07d9bcffeb0acf88e6fBrian Paul * completely contained inside a triangle.
347ffd0759973165368ac8ce07d9bcffeb0acf88e6fBrian Paul * This is a bin command called during bin processing.
348ffd0759973165368ac8ce07d9bcffeb0acf88e6fBrian Paul */
34989498d01531cd515c769e570bf799c39fbafc8fbKeith Whitwellvoid lp_rast_shade_tile( struct lp_rasterizer *rast,
3503a06c113c76355fc9622adfe7565c18d9787e9a8Brian Paul                         unsigned thread_index,
3514cdd10cb4b60d85f6c231a26739f7d5e264a05e5Keith Whitwell                         const union lp_rast_cmd_arg arg )
35289498d01531cd515c769e570bf799c39fbafc8fbKeith Whitwell{
353ec459f2aeca39e51f495cde455ba18d0a9489caaBrian Paul   struct lp_rasterizer_task *task = &rast->tasks[thread_index];
354ec459f2aeca39e51f495cde455ba18d0a9489caaBrian Paul   const struct lp_rast_state *state = task->current_state;
355ec459f2aeca39e51f495cde455ba18d0a9489caaBrian Paul   struct lp_rast_tile *tile = &task->tile;
3564cdd10cb4b60d85f6c231a26739f7d5e264a05e5Keith Whitwell   const struct lp_rast_shader_inputs *inputs = arg.shade_tile;
357ec459f2aeca39e51f495cde455ba18d0a9489caaBrian Paul   const unsigned tile_x = task->x;
358ec459f2aeca39e51f495cde455ba18d0a9489caaBrian Paul   const unsigned tile_y = task->y;
35986dba3e4142276d76ecffc0cd238506df5efe9afJosé Fonseca   unsigned x, y;
36089498d01531cd515c769e570bf799c39fbafc8fbKeith Whitwell
361a08d6302168341001003da32d42cfcff2311fa04Brian Paul   LP_DBG(DEBUG_RAST, "%s\n", __FUNCTION__);
3624e1334ced68dd25b151250a44af25e8e0d5a33feKeith Whitwell
3632797f2bf57562c95a601a67edca3089641215cc4Brian Paul   /* render the whole 64x64 tile in 4x4 chunks */
3642797f2bf57562c95a601a67edca3089641215cc4Brian Paul   for (y = 0; y < TILE_SIZE; y += 4){
3652797f2bf57562c95a601a67edca3089641215cc4Brian Paul      for (x = 0; x < TILE_SIZE; x += 4) {
3662797f2bf57562c95a601a67edca3089641215cc4Brian Paul         uint8_t *color[PIPE_MAX_COLOR_BUFS];
3672797f2bf57562c95a601a67edca3089641215cc4Brian Paul         uint32_t *depth;
3682797f2bf57562c95a601a67edca3089641215cc4Brian Paul         unsigned block_offset, i;
3692797f2bf57562c95a601a67edca3089641215cc4Brian Paul
3702797f2bf57562c95a601a67edca3089641215cc4Brian Paul         /* offset of the 16x16 pixel block within the tile */
3712797f2bf57562c95a601a67edca3089641215cc4Brian Paul         block_offset = ((y / 4) * (16 * 16) + (x / 4) * 16);
3722797f2bf57562c95a601a67edca3089641215cc4Brian Paul
3732797f2bf57562c95a601a67edca3089641215cc4Brian Paul         /* color buffer */
3742797f2bf57562c95a601a67edca3089641215cc4Brian Paul         for (i = 0; i < rast->state.fb.nr_cbufs; i++)
3752797f2bf57562c95a601a67edca3089641215cc4Brian Paul            color[i] = tile->color[i] + 4 * block_offset;
3762797f2bf57562c95a601a67edca3089641215cc4Brian Paul
3772797f2bf57562c95a601a67edca3089641215cc4Brian Paul         /* depth buffer */
3785e6a9005100ec2636ce9734a5e4535216494cf60José Fonseca         depth = lp_rast_depth_pointer(rast, tile_x + x, tile_y + y);
3792797f2bf57562c95a601a67edca3089641215cc4Brian Paul
3802797f2bf57562c95a601a67edca3089641215cc4Brian Paul         /* run shader */
3812797f2bf57562c95a601a67edca3089641215cc4Brian Paul         state->jit_function[0]( &state->jit_context,
3822797f2bf57562c95a601a67edca3089641215cc4Brian Paul                                 tile_x + x, tile_y + y,
3832797f2bf57562c95a601a67edca3089641215cc4Brian Paul                                 inputs->a0,
3842797f2bf57562c95a601a67edca3089641215cc4Brian Paul                                 inputs->dadx,
3852797f2bf57562c95a601a67edca3089641215cc4Brian Paul                                 inputs->dady,
3862797f2bf57562c95a601a67edca3089641215cc4Brian Paul                                 color,
3872797f2bf57562c95a601a67edca3089641215cc4Brian Paul                                 depth,
3882797f2bf57562c95a601a67edca3089641215cc4Brian Paul                                 INT_MIN, INT_MIN, INT_MIN,
3892797f2bf57562c95a601a67edca3089641215cc4Brian Paul                                 NULL, NULL, NULL );
3902797f2bf57562c95a601a67edca3089641215cc4Brian Paul      }
3912797f2bf57562c95a601a67edca3089641215cc4Brian Paul   }
39289498d01531cd515c769e570bf799c39fbafc8fbKeith Whitwell}
39389498d01531cd515c769e570bf799c39fbafc8fbKeith Whitwell
394a6676d896ed18426ed3d7e6340347974c1694ca2José Fonseca
395866e6856d39efe9b1ec739587f420a640ad8618eBrian Paul/**
396866e6856d39efe9b1ec739587f420a640ad8618eBrian Paul * Compute shading for a 4x4 block of pixels.
397ffd0759973165368ac8ce07d9bcffeb0acf88e6fBrian Paul * This is a bin command called during bin processing.
398866e6856d39efe9b1ec739587f420a640ad8618eBrian Paul */
399ab76b2a8b896edc1e972de108d044b70310b4324José Fonsecavoid lp_rast_shade_quads( struct lp_rasterizer *rast,
4003a06c113c76355fc9622adfe7565c18d9787e9a8Brian Paul                          unsigned thread_index,
401ab76b2a8b896edc1e972de108d044b70310b4324José Fonseca                          const struct lp_rast_shader_inputs *inputs,
402ab76b2a8b896edc1e972de108d044b70310b4324José Fonseca                          unsigned x, unsigned y,
403ab9438193083b7f9a3180cb9cea45e269131048aBrian Paul                          int32_t c1, int32_t c2, int32_t c3)
404a6676d896ed18426ed3d7e6340347974c1694ca2José Fonseca{
405ec459f2aeca39e51f495cde455ba18d0a9489caaBrian Paul   struct lp_rasterizer_task *task = &rast->tasks[thread_index];
406ec459f2aeca39e51f495cde455ba18d0a9489caaBrian Paul   const struct lp_rast_state *state = task->current_state;
407ec459f2aeca39e51f495cde455ba18d0a9489caaBrian Paul   struct lp_rast_tile *tile = &task->tile;
408c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell   uint8_t *color[PIPE_MAX_COLOR_BUFS];
40986dba3e4142276d76ecffc0cd238506df5efe9afJosé Fonseca   void *depth;
410c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell   unsigned i;
4117b116e13a2aa28a699e30c907c1b1ae5e04cab28Keith Whitwell   unsigned ix, iy;
412866e6856d39efe9b1ec739587f420a640ad8618eBrian Paul   int block_offset;
413a6676d896ed18426ed3d7e6340347974c1694ca2José Fonseca
414ab9438193083b7f9a3180cb9cea45e269131048aBrian Paul#ifdef DEBUG
415b1659b9213f3eeee440590dfe379f0d193948307Brian Paul   assert(state);
416b1659b9213f3eeee440590dfe379f0d193948307Brian Paul
417a6676d896ed18426ed3d7e6340347974c1694ca2José Fonseca   /* Sanity checks */
418a6676d896ed18426ed3d7e6340347974c1694ca2José Fonseca   assert(x % TILE_VECTOR_WIDTH == 0);
419a6676d896ed18426ed3d7e6340347974c1694ca2José Fonseca   assert(y % TILE_VECTOR_HEIGHT == 0);
420a6676d896ed18426ed3d7e6340347974c1694ca2José Fonseca
421cdbcd96fdfe2c4d09e9b34cb083664d6b6e0558bBrian Paul   assert((x % 4) == 0);
422cdbcd96fdfe2c4d09e9b34cb083664d6b6e0558bBrian Paul   assert((y % 4) == 0);
423ab9438193083b7f9a3180cb9cea45e269131048aBrian Paul#endif
424866e6856d39efe9b1ec739587f420a640ad8618eBrian Paul
42561f3eeb6403e404d297bdcd924c215ed36060945José Fonseca   ix = x % TILE_SIZE;
42661f3eeb6403e404d297bdcd924c215ed36060945José Fonseca   iy = y % TILE_SIZE;
42761f3eeb6403e404d297bdcd924c215ed36060945José Fonseca
428866e6856d39efe9b1ec739587f420a640ad8618eBrian Paul   /* offset of the 16x16 pixel block within the tile */
4292797f2bf57562c95a601a67edca3089641215cc4Brian Paul   block_offset = ((iy / 4) * (16 * 16) + (ix / 4) * 16);
430866e6856d39efe9b1ec739587f420a640ad8618eBrian Paul
431a6676d896ed18426ed3d7e6340347974c1694ca2José Fonseca   /* color buffer */
432c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell   for (i = 0; i < rast->state.fb.nr_cbufs; i++)
433c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell      color[i] = tile->color[i] + 4 * block_offset;
434a6676d896ed18426ed3d7e6340347974c1694ca2José Fonseca
435a6676d896ed18426ed3d7e6340347974c1694ca2José Fonseca   /* depth buffer */
4365e6a9005100ec2636ce9734a5e4535216494cf60José Fonseca   depth = lp_rast_depth_pointer(rast, x, y);
437a6676d896ed18426ed3d7e6340347974c1694ca2José Fonseca
438c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell
439c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell
440ab9438193083b7f9a3180cb9cea45e269131048aBrian Paul#ifdef DEBUG
441c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell   assert(lp_check_alignment(tile->color[0], 16));
44285999695829823e459e11822b4846ed1db5c055dJosé Fonseca   assert(lp_check_alignment(state->jit_context.blend_color, 16));
443a6676d896ed18426ed3d7e6340347974c1694ca2José Fonseca
444ab9438193083b7f9a3180cb9cea45e269131048aBrian Paul   assert(lp_check_alignment(inputs->step[0], 16));
445ab9438193083b7f9a3180cb9cea45e269131048aBrian Paul   assert(lp_check_alignment(inputs->step[1], 16));
446ab9438193083b7f9a3180cb9cea45e269131048aBrian Paul   assert(lp_check_alignment(inputs->step[2], 16));
447ab9438193083b7f9a3180cb9cea45e269131048aBrian Paul#endif
448ab9438193083b7f9a3180cb9cea45e269131048aBrian Paul
449a6676d896ed18426ed3d7e6340347974c1694ca2José Fonseca   /* run shader */
4502797f2bf57562c95a601a67edca3089641215cc4Brian Paul   state->jit_function[1]( &state->jit_context,
45161f3eeb6403e404d297bdcd924c215ed36060945José Fonseca                        x, y,
45285999695829823e459e11822b4846ed1db5c055dJosé Fonseca                        inputs->a0,
45385999695829823e459e11822b4846ed1db5c055dJosé Fonseca                        inputs->dadx,
45485999695829823e459e11822b4846ed1db5c055dJosé Fonseca                        inputs->dady,
45585999695829823e459e11822b4846ed1db5c055dJosé Fonseca                        color,
456ab9438193083b7f9a3180cb9cea45e269131048aBrian Paul                        depth,
457ab9438193083b7f9a3180cb9cea45e269131048aBrian Paul                        c1, c2, c3,
458c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell                        inputs->step[0], inputs->step[1], inputs->step[2]);
459a6676d896ed18426ed3d7e6340347974c1694ca2José Fonseca}
460a6676d896ed18426ed3d7e6340347974c1694ca2José Fonseca
461a6676d896ed18426ed3d7e6340347974c1694ca2José Fonseca
46262623c4dc5d8b646942bc65e8de350e812945ad1Brian Paul/**
46362623c4dc5d8b646942bc65e8de350e812945ad1Brian Paul * Set top row and left column of the tile's pixels to white.  For debugging.
46462623c4dc5d8b646942bc65e8de350e812945ad1Brian Paul */
46562623c4dc5d8b646942bc65e8de350e812945ad1Brian Paulstatic void
46662623c4dc5d8b646942bc65e8de350e812945ad1Brian Pauloutline_tile(uint8_t *tile)
46762623c4dc5d8b646942bc65e8de350e812945ad1Brian Paul{
46862623c4dc5d8b646942bc65e8de350e812945ad1Brian Paul   const uint8_t val = 0xff;
46962623c4dc5d8b646942bc65e8de350e812945ad1Brian Paul   unsigned i;
47062623c4dc5d8b646942bc65e8de350e812945ad1Brian Paul
47162623c4dc5d8b646942bc65e8de350e812945ad1Brian Paul   for (i = 0; i < TILE_SIZE; i++) {
47262623c4dc5d8b646942bc65e8de350e812945ad1Brian Paul      TILE_PIXEL(tile, i, 0, 0) = val;
47362623c4dc5d8b646942bc65e8de350e812945ad1Brian Paul      TILE_PIXEL(tile, i, 0, 1) = val;
47462623c4dc5d8b646942bc65e8de350e812945ad1Brian Paul      TILE_PIXEL(tile, i, 0, 2) = val;
47562623c4dc5d8b646942bc65e8de350e812945ad1Brian Paul      TILE_PIXEL(tile, i, 0, 3) = val;
47662623c4dc5d8b646942bc65e8de350e812945ad1Brian Paul
47762623c4dc5d8b646942bc65e8de350e812945ad1Brian Paul      TILE_PIXEL(tile, 0, i, 0) = val;
47862623c4dc5d8b646942bc65e8de350e812945ad1Brian Paul      TILE_PIXEL(tile, 0, i, 1) = val;
47962623c4dc5d8b646942bc65e8de350e812945ad1Brian Paul      TILE_PIXEL(tile, 0, i, 2) = val;
48062623c4dc5d8b646942bc65e8de350e812945ad1Brian Paul      TILE_PIXEL(tile, 0, i, 3) = val;
48162623c4dc5d8b646942bc65e8de350e812945ad1Brian Paul   }
48262623c4dc5d8b646942bc65e8de350e812945ad1Brian Paul}
48362623c4dc5d8b646942bc65e8de350e812945ad1Brian Paul
48462623c4dc5d8b646942bc65e8de350e812945ad1Brian Paul
48562623c4dc5d8b646942bc65e8de350e812945ad1Brian Paul/**
48662623c4dc5d8b646942bc65e8de350e812945ad1Brian Paul * Draw grid of gray lines at 16-pixel intervals across the tile to
48762623c4dc5d8b646942bc65e8de350e812945ad1Brian Paul * show the sub-tile boundaries.  For debugging.
48862623c4dc5d8b646942bc65e8de350e812945ad1Brian Paul */
48962623c4dc5d8b646942bc65e8de350e812945ad1Brian Paulstatic void
49062623c4dc5d8b646942bc65e8de350e812945ad1Brian Pauloutline_subtiles(uint8_t *tile)
49162623c4dc5d8b646942bc65e8de350e812945ad1Brian Paul{
49262623c4dc5d8b646942bc65e8de350e812945ad1Brian Paul   const uint8_t val = 0x80;
49362623c4dc5d8b646942bc65e8de350e812945ad1Brian Paul   const unsigned step = 16;
49462623c4dc5d8b646942bc65e8de350e812945ad1Brian Paul   unsigned i, j;
49562623c4dc5d8b646942bc65e8de350e812945ad1Brian Paul
4960fccfc9cc0cb7699598f1739d8cd3811175cdf13Brian Paul   for (i = 0; i < TILE_SIZE; i += step) {
49762623c4dc5d8b646942bc65e8de350e812945ad1Brian Paul      for (j = 0; j < TILE_SIZE; j++) {
49862623c4dc5d8b646942bc65e8de350e812945ad1Brian Paul         TILE_PIXEL(tile, i, j, 0) = val;
49962623c4dc5d8b646942bc65e8de350e812945ad1Brian Paul         TILE_PIXEL(tile, i, j, 1) = val;
50062623c4dc5d8b646942bc65e8de350e812945ad1Brian Paul         TILE_PIXEL(tile, i, j, 2) = val;
50162623c4dc5d8b646942bc65e8de350e812945ad1Brian Paul         TILE_PIXEL(tile, i, j, 3) = val;
50262623c4dc5d8b646942bc65e8de350e812945ad1Brian Paul
50362623c4dc5d8b646942bc65e8de350e812945ad1Brian Paul         TILE_PIXEL(tile, j, i, 0) = val;
50462623c4dc5d8b646942bc65e8de350e812945ad1Brian Paul         TILE_PIXEL(tile, j, i, 1) = val;
50562623c4dc5d8b646942bc65e8de350e812945ad1Brian Paul         TILE_PIXEL(tile, j, i, 2) = val;
50662623c4dc5d8b646942bc65e8de350e812945ad1Brian Paul         TILE_PIXEL(tile, j, i, 3) = val;
50762623c4dc5d8b646942bc65e8de350e812945ad1Brian Paul      }
50862623c4dc5d8b646942bc65e8de350e812945ad1Brian Paul   }
50962623c4dc5d8b646942bc65e8de350e812945ad1Brian Paul
51062623c4dc5d8b646942bc65e8de350e812945ad1Brian Paul   outline_tile(tile);
51162623c4dc5d8b646942bc65e8de350e812945ad1Brian Paul}
51262623c4dc5d8b646942bc65e8de350e812945ad1Brian Paul
51337b86aa55c6bb520997c00dbf1a2b38d4aed38ebJosé Fonseca
51437b86aa55c6bb520997c00dbf1a2b38d4aed38ebJosé Fonseca
5157505510c7b7c33f3c571647c0398da7e1b823806Brian Paul/**
5167505510c7b7c33f3c571647c0398da7e1b823806Brian Paul * Write the rasterizer's color tile to the framebuffer.
5177505510c7b7c33f3c571647c0398da7e1b823806Brian Paul */
5183a06c113c76355fc9622adfe7565c18d9787e9a8Brian Paulstatic void lp_rast_store_color( struct lp_rasterizer *rast,
5193a06c113c76355fc9622adfe7565c18d9787e9a8Brian Paul                                 unsigned thread_index)
52089498d01531cd515c769e570bf799c39fbafc8fbKeith Whitwell{
521ec459f2aeca39e51f495cde455ba18d0a9489caaBrian Paul   struct lp_rasterizer_task *task = &rast->tasks[thread_index];
522ec459f2aeca39e51f495cde455ba18d0a9489caaBrian Paul   const unsigned x = task->x;
523ec459f2aeca39e51f495cde455ba18d0a9489caaBrian Paul   const unsigned y = task->y;
524c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell   unsigned i;
52505131f7502150968d7ee19673676f74d4c2fd22bKeith Whitwell
526c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell   for (i = 0; i < rast->state.fb.nr_cbufs; i++) {
527c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell      struct pipe_transfer *transfer = rast->cbuf_transfer[i];
528c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell      int w = TILE_SIZE;
529c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell      int h = TILE_SIZE;
53073e13c33fd0a9b8574d00d01d301b9d4f88d4051Brian Paul
531c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell      if (x >= transfer->width)
532c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell	 continue;
53305131f7502150968d7ee19673676f74d4c2fd22bKeith Whitwell
534c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell      if (y >= transfer->height)
535c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell	 continue;
53689498d01531cd515c769e570bf799c39fbafc8fbKeith Whitwell
537c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell      LP_DBG(DEBUG_RAST, "%s [%u] %d,%d %dx%d\n", __FUNCTION__,
538c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell	     thread_index, x, y, w, h);
539c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell
54062623c4dc5d8b646942bc65e8de350e812945ad1Brian Paul      if (LP_DEBUG & DEBUG_SHOW_SUBTILES)
541ec459f2aeca39e51f495cde455ba18d0a9489caaBrian Paul         outline_subtiles(task->tile.color[i]);
54262623c4dc5d8b646942bc65e8de350e812945ad1Brian Paul      else if (LP_DEBUG & DEBUG_SHOW_TILES)
543ec459f2aeca39e51f495cde455ba18d0a9489caaBrian Paul         outline_tile(task->tile.color[i]);
54462623c4dc5d8b646942bc65e8de350e812945ad1Brian Paul
545c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell      lp_tile_write_4ub(transfer->texture->format,
546ec459f2aeca39e51f495cde455ba18d0a9489caaBrian Paul			task->tile.color[i],
547c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell			rast->cbuf_map[i],
548c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell			transfer->stride,
549c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell			x, y,
550c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell			w, h);
5514aeacdf8530d69d543cb2b997c1e65edb71ae01aBrian Paul
5524aeacdf8530d69d543cb2b997c1e65edb71ae01aBrian Paul      LP_COUNT(nr_color_tile_store);
553c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell   }
55489498d01531cd515c769e570bf799c39fbafc8fbKeith Whitwell}
55589498d01531cd515c769e570bf799c39fbafc8fbKeith Whitwell
55647510040a68f5f672aee22eac6c01fb4dd60ec67José Fonseca
5577505510c7b7c33f3c571647c0398da7e1b823806Brian Paul/**
5587505510c7b7c33f3c571647c0398da7e1b823806Brian Paul * Write the rasterizer's tiles to the framebuffer.
5597505510c7b7c33f3c571647c0398da7e1b823806Brian Paul */
560b533b56750aca8c7e8cb22af93a0fc2a0cfc0d97Brian Paulstatic void
5613a06c113c76355fc9622adfe7565c18d9787e9a8Brian Paullp_rast_end_tile( struct lp_rasterizer *rast,
5623a06c113c76355fc9622adfe7565c18d9787e9a8Brian Paul                  unsigned thread_index )
56347510040a68f5f672aee22eac6c01fb4dd60ec67José Fonseca{
564a08d6302168341001003da32d42cfcff2311fa04Brian Paul   LP_DBG(DEBUG_RAST, "%s\n", __FUNCTION__);
5654e1334ced68dd25b151250a44af25e8e0d5a33feKeith Whitwell
56647510040a68f5f672aee22eac6c01fb4dd60ec67José Fonseca   if (rast->state.write_color)
5673a06c113c76355fc9622adfe7565c18d9787e9a8Brian Paul      lp_rast_store_color(rast, thread_index);
56847510040a68f5f672aee22eac6c01fb4dd60ec67José Fonseca}
56947510040a68f5f672aee22eac6c01fb4dd60ec67José Fonseca
57047510040a68f5f672aee22eac6c01fb4dd60ec67José Fonseca
571b533b56750aca8c7e8cb22af93a0fc2a0cfc0d97Brian Paul/**
5724b70af918dd9040a6987c6a55e76e49f0e3f90bfBrian Paul * Signal on a fence.  This is called during bin execution/rasterization.
5734b70af918dd9040a6987c6a55e76e49f0e3f90bfBrian Paul * Called per thread.
5744b70af918dd9040a6987c6a55e76e49f0e3f90bfBrian Paul */
5754b70af918dd9040a6987c6a55e76e49f0e3f90bfBrian Paulvoid lp_rast_fence( struct lp_rasterizer *rast,
5764b70af918dd9040a6987c6a55e76e49f0e3f90bfBrian Paul                    unsigned thread_index,
5774b70af918dd9040a6987c6a55e76e49f0e3f90bfBrian Paul                    const union lp_rast_cmd_arg arg )
5784b70af918dd9040a6987c6a55e76e49f0e3f90bfBrian Paul{
5794b70af918dd9040a6987c6a55e76e49f0e3f90bfBrian Paul   struct lp_fence *fence = arg.fence;
5804b70af918dd9040a6987c6a55e76e49f0e3f90bfBrian Paul
5814b70af918dd9040a6987c6a55e76e49f0e3f90bfBrian Paul   pipe_mutex_lock( fence->mutex );
5824b70af918dd9040a6987c6a55e76e49f0e3f90bfBrian Paul
5834b70af918dd9040a6987c6a55e76e49f0e3f90bfBrian Paul   fence->count++;
5844b70af918dd9040a6987c6a55e76e49f0e3f90bfBrian Paul   assert(fence->count <= fence->rank);
5854b70af918dd9040a6987c6a55e76e49f0e3f90bfBrian Paul
5864b70af918dd9040a6987c6a55e76e49f0e3f90bfBrian Paul   LP_DBG(DEBUG_RAST, "%s count=%u rank=%u\n", __FUNCTION__,
5874b70af918dd9040a6987c6a55e76e49f0e3f90bfBrian Paul          fence->count, fence->rank);
5884b70af918dd9040a6987c6a55e76e49f0e3f90bfBrian Paul
5894b70af918dd9040a6987c6a55e76e49f0e3f90bfBrian Paul   pipe_condvar_signal( fence->signalled );
5904b70af918dd9040a6987c6a55e76e49f0e3f90bfBrian Paul
5914b70af918dd9040a6987c6a55e76e49f0e3f90bfBrian Paul   pipe_mutex_unlock( fence->mutex );
5924b70af918dd9040a6987c6a55e76e49f0e3f90bfBrian Paul}
5934b70af918dd9040a6987c6a55e76e49f0e3f90bfBrian Paul
5944b70af918dd9040a6987c6a55e76e49f0e3f90bfBrian Paul
5954b70af918dd9040a6987c6a55e76e49f0e3f90bfBrian Paul/**
596663750d5564a225b4720f7ee8bea93ffb309fc88Keith Whitwell * When all the threads are done rasterizing a scene, one thread will
597663750d5564a225b4720f7ee8bea93ffb309fc88Keith Whitwell * call this function to reset the scene and put it onto the empty queue.
5982bce5c195f94e2cce8f67c6a8066b0ae408487ceBrian Paul */
5992bce5c195f94e2cce8f67c6a8066b0ae408487ceBrian Paulstatic void
600663750d5564a225b4720f7ee8bea93ffb309fc88Keith Whitwellrelease_scene( struct lp_rasterizer *rast,
601663750d5564a225b4720f7ee8bea93ffb309fc88Keith Whitwell	       struct lp_scene *scene )
6022bce5c195f94e2cce8f67c6a8066b0ae408487ceBrian Paul{
603663750d5564a225b4720f7ee8bea93ffb309fc88Keith Whitwell   util_unreference_framebuffer_state( &scene->fb );
6042bce5c195f94e2cce8f67c6a8066b0ae408487ceBrian Paul
605663750d5564a225b4720f7ee8bea93ffb309fc88Keith Whitwell   lp_scene_reset( scene );
606663750d5564a225b4720f7ee8bea93ffb309fc88Keith Whitwell   lp_scene_enqueue( rast->empty_scenes, scene );
607663750d5564a225b4720f7ee8bea93ffb309fc88Keith Whitwell   rast->curr_scene = NULL;
6082bce5c195f94e2cce8f67c6a8066b0ae408487ceBrian Paul}
6092bce5c195f94e2cce8f67c6a8066b0ae408487ceBrian Paul
6102bce5c195f94e2cce8f67c6a8066b0ae408487ceBrian Paul
6112bce5c195f94e2cce8f67c6a8066b0ae408487ceBrian Paul/**
612b533b56750aca8c7e8cb22af93a0fc2a0cfc0d97Brian Paul * Rasterize commands for a single bin.
61301b1900084152dbacd4025a31ced25f75666ce59Brian Paul * \param x, y  position of the bin's tile in the framebuffer
614b533b56750aca8c7e8cb22af93a0fc2a0cfc0d97Brian Paul * Must be called between lp_rast_begin() and lp_rast_end().
6159509f73c2147a9e225b5ef69a646e5dd711573f5Brian Paul * Called per thread.
616b533b56750aca8c7e8cb22af93a0fc2a0cfc0d97Brian Paul */
61701b1900084152dbacd4025a31ced25f75666ce59Brian Paulstatic void
61801b1900084152dbacd4025a31ced25f75666ce59Brian Paulrasterize_bin( struct lp_rasterizer *rast,
6193a06c113c76355fc9622adfe7565c18d9787e9a8Brian Paul               unsigned thread_index,
62001b1900084152dbacd4025a31ced25f75666ce59Brian Paul               const struct cmd_bin *bin,
62101b1900084152dbacd4025a31ced25f75666ce59Brian Paul               int x, int y)
622b533b56750aca8c7e8cb22af93a0fc2a0cfc0d97Brian Paul{
623b533b56750aca8c7e8cb22af93a0fc2a0cfc0d97Brian Paul   const struct cmd_block_list *commands = &bin->commands;
624b533b56750aca8c7e8cb22af93a0fc2a0cfc0d97Brian Paul   struct cmd_block *block;
625b533b56750aca8c7e8cb22af93a0fc2a0cfc0d97Brian Paul   unsigned k;
626b533b56750aca8c7e8cb22af93a0fc2a0cfc0d97Brian Paul
6273a06c113c76355fc9622adfe7565c18d9787e9a8Brian Paul   lp_rast_start_tile( rast, thread_index, x, y );
628b533b56750aca8c7e8cb22af93a0fc2a0cfc0d97Brian Paul
629b533b56750aca8c7e8cb22af93a0fc2a0cfc0d97Brian Paul   /* simply execute each of the commands in the block list */
630b533b56750aca8c7e8cb22af93a0fc2a0cfc0d97Brian Paul   for (block = commands->head; block; block = block->next) {
631b533b56750aca8c7e8cb22af93a0fc2a0cfc0d97Brian Paul      for (k = 0; k < block->count; k++) {
632aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul         block->cmd[k]( rast, thread_index, block->arg[k] );
633b533b56750aca8c7e8cb22af93a0fc2a0cfc0d97Brian Paul      }
634b533b56750aca8c7e8cb22af93a0fc2a0cfc0d97Brian Paul   }
635b533b56750aca8c7e8cb22af93a0fc2a0cfc0d97Brian Paul
6363a06c113c76355fc9622adfe7565c18d9787e9a8Brian Paul   lp_rast_end_tile( rast, thread_index );
637b533b56750aca8c7e8cb22af93a0fc2a0cfc0d97Brian Paul}
638b533b56750aca8c7e8cb22af93a0fc2a0cfc0d97Brian Paul
6394231006e29cbf9fb54c72acf35009f3b18fe62abKeith Whitwell
6404231006e29cbf9fb54c72acf35009f3b18fe62abKeith Whitwell#define RAST(x) { lp_rast_##x, #x }
6414231006e29cbf9fb54c72acf35009f3b18fe62abKeith Whitwell
6424231006e29cbf9fb54c72acf35009f3b18fe62abKeith Whitwellstatic struct {
6434231006e29cbf9fb54c72acf35009f3b18fe62abKeith Whitwell   lp_rast_cmd cmd;
6444231006e29cbf9fb54c72acf35009f3b18fe62abKeith Whitwell   const char *name;
6454231006e29cbf9fb54c72acf35009f3b18fe62abKeith Whitwell} cmd_names[] =
6464231006e29cbf9fb54c72acf35009f3b18fe62abKeith Whitwell{
6474231006e29cbf9fb54c72acf35009f3b18fe62abKeith Whitwell   RAST(load_color),
6484231006e29cbf9fb54c72acf35009f3b18fe62abKeith Whitwell   RAST(clear_color),
6494231006e29cbf9fb54c72acf35009f3b18fe62abKeith Whitwell   RAST(clear_zstencil),
6504231006e29cbf9fb54c72acf35009f3b18fe62abKeith Whitwell   RAST(triangle),
6514231006e29cbf9fb54c72acf35009f3b18fe62abKeith Whitwell   RAST(shade_tile),
6524231006e29cbf9fb54c72acf35009f3b18fe62abKeith Whitwell   RAST(set_state),
6534231006e29cbf9fb54c72acf35009f3b18fe62abKeith Whitwell   RAST(fence),
6544231006e29cbf9fb54c72acf35009f3b18fe62abKeith Whitwell};
6554231006e29cbf9fb54c72acf35009f3b18fe62abKeith Whitwell
6564231006e29cbf9fb54c72acf35009f3b18fe62abKeith Whitwellstatic void
6574231006e29cbf9fb54c72acf35009f3b18fe62abKeith Whitwelldebug_bin( const struct cmd_bin *bin )
6584231006e29cbf9fb54c72acf35009f3b18fe62abKeith Whitwell{
6594231006e29cbf9fb54c72acf35009f3b18fe62abKeith Whitwell   const struct cmd_block *head = bin->commands.head;
6604231006e29cbf9fb54c72acf35009f3b18fe62abKeith Whitwell   int i, j;
6614231006e29cbf9fb54c72acf35009f3b18fe62abKeith Whitwell
6624231006e29cbf9fb54c72acf35009f3b18fe62abKeith Whitwell   for (i = 0; i < head->count; i++) {
6634231006e29cbf9fb54c72acf35009f3b18fe62abKeith Whitwell      debug_printf("%d: ", i);
6644231006e29cbf9fb54c72acf35009f3b18fe62abKeith Whitwell      for (j = 0; j < Elements(cmd_names); j++) {
6654231006e29cbf9fb54c72acf35009f3b18fe62abKeith Whitwell         if (head->cmd[i] == cmd_names[j].cmd) {
6664231006e29cbf9fb54c72acf35009f3b18fe62abKeith Whitwell            debug_printf("%s\n", cmd_names[j].name);
6674231006e29cbf9fb54c72acf35009f3b18fe62abKeith Whitwell            break;
6684231006e29cbf9fb54c72acf35009f3b18fe62abKeith Whitwell         }
6694231006e29cbf9fb54c72acf35009f3b18fe62abKeith Whitwell      }
6704231006e29cbf9fb54c72acf35009f3b18fe62abKeith Whitwell      if (j == Elements(cmd_names))
6714231006e29cbf9fb54c72acf35009f3b18fe62abKeith Whitwell         debug_printf("...other\n");
6724231006e29cbf9fb54c72acf35009f3b18fe62abKeith Whitwell   }
6734231006e29cbf9fb54c72acf35009f3b18fe62abKeith Whitwell
6744231006e29cbf9fb54c72acf35009f3b18fe62abKeith Whitwell}
6754231006e29cbf9fb54c72acf35009f3b18fe62abKeith Whitwell
676db83ad4b4353ea6f9c755f18bf1455ea78b5bf12Keith Whitwell/* An empty bin is one that just loads the contents of the tile and
677db83ad4b4353ea6f9c755f18bf1455ea78b5bf12Keith Whitwell * stores them again unchanged.  This typically happens when bins have
678db83ad4b4353ea6f9c755f18bf1455ea78b5bf12Keith Whitwell * been flushed for some reason in the middle of a frame, or when
679db83ad4b4353ea6f9c755f18bf1455ea78b5bf12Keith Whitwell * incremental updates are being made to a render target.
680db83ad4b4353ea6f9c755f18bf1455ea78b5bf12Keith Whitwell *
681db83ad4b4353ea6f9c755f18bf1455ea78b5bf12Keith Whitwell * Try to avoid doing pointless work in this case.
682db83ad4b4353ea6f9c755f18bf1455ea78b5bf12Keith Whitwell */
683da45f49cc63fff06513dc28d9616084fc81798d4Keith Whitwellstatic boolean
684db83ad4b4353ea6f9c755f18bf1455ea78b5bf12Keith Whitwellis_empty_bin( const struct cmd_bin *bin )
685da45f49cc63fff06513dc28d9616084fc81798d4Keith Whitwell{
686da45f49cc63fff06513dc28d9616084fc81798d4Keith Whitwell   const struct cmd_block *head = bin->commands.head;
687da45f49cc63fff06513dc28d9616084fc81798d4Keith Whitwell   int i;
6884231006e29cbf9fb54c72acf35009f3b18fe62abKeith Whitwell
6894231006e29cbf9fb54c72acf35009f3b18fe62abKeith Whitwell   if (0)
6904231006e29cbf9fb54c72acf35009f3b18fe62abKeith Whitwell      debug_bin(bin);
6914231006e29cbf9fb54c72acf35009f3b18fe62abKeith Whitwell
692db83ad4b4353ea6f9c755f18bf1455ea78b5bf12Keith Whitwell   /* We emit at most two load-tile commands at the start of the first
6934231006e29cbf9fb54c72acf35009f3b18fe62abKeith Whitwell    * command block.  In addition we seem to emit a couple of
6944231006e29cbf9fb54c72acf35009f3b18fe62abKeith Whitwell    * set-state commands even in empty bins.
6954231006e29cbf9fb54c72acf35009f3b18fe62abKeith Whitwell    *
6964231006e29cbf9fb54c72acf35009f3b18fe62abKeith Whitwell    * As a heuristic, if a bin has more than 4 commands, consider it
6974231006e29cbf9fb54c72acf35009f3b18fe62abKeith Whitwell    * non-empty.
698db83ad4b4353ea6f9c755f18bf1455ea78b5bf12Keith Whitwell    */
699da45f49cc63fff06513dc28d9616084fc81798d4Keith Whitwell   if (head->next != NULL ||
7004231006e29cbf9fb54c72acf35009f3b18fe62abKeith Whitwell       head->count > 4) {
701da45f49cc63fff06513dc28d9616084fc81798d4Keith Whitwell      return FALSE;
7024231006e29cbf9fb54c72acf35009f3b18fe62abKeith Whitwell   }
703da45f49cc63fff06513dc28d9616084fc81798d4Keith Whitwell
704da45f49cc63fff06513dc28d9616084fc81798d4Keith Whitwell   for (i = 0; i < head->count; i++)
705da45f49cc63fff06513dc28d9616084fc81798d4Keith Whitwell      if (head->cmd[i] != lp_rast_load_color &&
7064231006e29cbf9fb54c72acf35009f3b18fe62abKeith Whitwell          head->cmd[i] != lp_rast_set_state) {
707da45f49cc63fff06513dc28d9616084fc81798d4Keith Whitwell         return FALSE;
7084231006e29cbf9fb54c72acf35009f3b18fe62abKeith Whitwell      }
709da45f49cc63fff06513dc28d9616084fc81798d4Keith Whitwell
710da45f49cc63fff06513dc28d9616084fc81798d4Keith Whitwell   return TRUE;
711da45f49cc63fff06513dc28d9616084fc81798d4Keith Whitwell}
712da45f49cc63fff06513dc28d9616084fc81798d4Keith Whitwell
713da45f49cc63fff06513dc28d9616084fc81798d4Keith Whitwell
714b533b56750aca8c7e8cb22af93a0fc2a0cfc0d97Brian Paul
71501b1900084152dbacd4025a31ced25f75666ce59Brian Paul/**
716663750d5564a225b4720f7ee8bea93ffb309fc88Keith Whitwell * Rasterize/execute all bins within a scene.
7179509f73c2147a9e225b5ef69a646e5dd711573f5Brian Paul * Called per thread.
71801b1900084152dbacd4025a31ced25f75666ce59Brian Paul */
719aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paulstatic void
720663750d5564a225b4720f7ee8bea93ffb309fc88Keith Whitwellrasterize_scene( struct lp_rasterizer *rast,
721aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul                unsigned thread_index,
722663750d5564a225b4720f7ee8bea93ffb309fc88Keith Whitwell                struct lp_scene *scene,
723aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul                bool write_depth )
724aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul{
725663750d5564a225b4720f7ee8bea93ffb309fc88Keith Whitwell   /* loop over scene bins, rasterize each */
726aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul#if 0
727aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul   {
728aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul      unsigned i, j;
729663750d5564a225b4720f7ee8bea93ffb309fc88Keith Whitwell      for (i = 0; i < scene->tiles_x; i++) {
730663750d5564a225b4720f7ee8bea93ffb309fc88Keith Whitwell         for (j = 0; j < scene->tiles_y; j++) {
731663750d5564a225b4720f7ee8bea93ffb309fc88Keith Whitwell            struct cmd_bin *bin = lp_get_bin(scene, i, j);
732aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul            rasterize_bin( rast, thread_index,
733aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul                           bin, i * TILE_SIZE, j * TILE_SIZE );
734aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul         }
735aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul      }
736aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul   }
737aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul#else
738aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul   {
739aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul      struct cmd_bin *bin;
740aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul      int x, y;
741aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul
742663750d5564a225b4720f7ee8bea93ffb309fc88Keith Whitwell      assert(scene);
743663750d5564a225b4720f7ee8bea93ffb309fc88Keith Whitwell      while ((bin = lp_scene_bin_iter_next(scene, &x, &y))) {
744db83ad4b4353ea6f9c755f18bf1455ea78b5bf12Keith Whitwell         if (!is_empty_bin( bin ))
745da45f49cc63fff06513dc28d9616084fc81798d4Keith Whitwell            rasterize_bin( rast, thread_index, bin, x * TILE_SIZE, y * TILE_SIZE);
746aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul      }
747aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul   }
748aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul#endif
749aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul}
750aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul
751aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul
752aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul/**
7534e67f10331bfd87560e2900e66f3b942902bc65cBrian Paul * Called by setup module when it has something for us to render.
754aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul */
75501b1900084152dbacd4025a31ced25f75666ce59Brian Paulvoid
756663750d5564a225b4720f7ee8bea93ffb309fc88Keith Whitwelllp_rasterize_scene( struct lp_rasterizer *rast,
757663750d5564a225b4720f7ee8bea93ffb309fc88Keith Whitwell                   struct lp_scene *scene,
75801b1900084152dbacd4025a31ced25f75666ce59Brian Paul                   const struct pipe_framebuffer_state *fb,
75901b1900084152dbacd4025a31ced25f75666ce59Brian Paul                   bool write_depth )
76001b1900084152dbacd4025a31ced25f75666ce59Brian Paul{
76196689d451a24753e088f40fb167c3cb26d8045acBrian Paul   boolean debug = false;
76296689d451a24753e088f40fb167c3cb26d8045acBrian Paul
76301b1900084152dbacd4025a31ced25f75666ce59Brian Paul   LP_DBG(DEBUG_SETUP, "%s\n", __FUNCTION__);
76401b1900084152dbacd4025a31ced25f75666ce59Brian Paul
76596689d451a24753e088f40fb167c3cb26d8045acBrian Paul   if (debug) {
76696689d451a24753e088f40fb167c3cb26d8045acBrian Paul      unsigned x, y;
767a1af8eec66c5f7ec421e8011b41c1a7c36319f9fJosé Fonseca      debug_printf("rasterize scene:\n");
768a1af8eec66c5f7ec421e8011b41c1a7c36319f9fJosé Fonseca      debug_printf("  data size: %u\n", lp_scene_data_size(scene));
769663750d5564a225b4720f7ee8bea93ffb309fc88Keith Whitwell      for (y = 0; y < scene->tiles_y; y++) {
770663750d5564a225b4720f7ee8bea93ffb309fc88Keith Whitwell         for (x = 0; x < scene->tiles_x; x++) {
771a1af8eec66c5f7ec421e8011b41c1a7c36319f9fJosé Fonseca            debug_printf("  bin %u, %u size: %u\n", x, y,
772a1af8eec66c5f7ec421e8011b41c1a7c36319f9fJosé Fonseca                         lp_scene_bin_size(scene, x, y));
77396689d451a24753e088f40fb167c3cb26d8045acBrian Paul         }
77496689d451a24753e088f40fb167c3cb26d8045acBrian Paul      }
77596689d451a24753e088f40fb167c3cb26d8045acBrian Paul   }
77696689d451a24753e088f40fb167c3cb26d8045acBrian Paul
7772bce5c195f94e2cce8f67c6a8066b0ae408487ceBrian Paul   /* save framebuffer state in the bin */
778663750d5564a225b4720f7ee8bea93ffb309fc88Keith Whitwell   util_copy_framebuffer_state(&scene->fb, fb);
779663750d5564a225b4720f7ee8bea93ffb309fc88Keith Whitwell   scene->write_depth = write_depth;
780aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul
781aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul   if (rast->num_threads == 0) {
782aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul      /* no threading */
7832bce5c195f94e2cce8f67c6a8066b0ae408487ceBrian Paul
7842bce5c195f94e2cce8f67c6a8066b0ae408487ceBrian Paul      lp_rast_begin( rast, fb,
785c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell                     fb->nr_cbufs != 0, /* always write color if cbufs present */
7862bce5c195f94e2cce8f67c6a8066b0ae408487ceBrian Paul                     fb->zsbuf != NULL && write_depth );
7872bce5c195f94e2cce8f67c6a8066b0ae408487ceBrian Paul
788663750d5564a225b4720f7ee8bea93ffb309fc88Keith Whitwell      lp_scene_bin_iter_begin( scene );
789663750d5564a225b4720f7ee8bea93ffb309fc88Keith Whitwell      rasterize_scene( rast, 0, scene, write_depth );
7903bee8c2e7c17893f91f6b62e2db090ef495dca9dBrian Paul
791663750d5564a225b4720f7ee8bea93ffb309fc88Keith Whitwell      release_scene( rast, scene );
7922bce5c195f94e2cce8f67c6a8066b0ae408487ceBrian Paul
7932bce5c195f94e2cce8f67c6a8066b0ae408487ceBrian Paul      lp_rast_end( rast );
79401b1900084152dbacd4025a31ced25f75666ce59Brian Paul   }
795aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul   else {
796aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul      /* threaded rendering! */
797aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul      unsigned i;
798aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul
799663750d5564a225b4720f7ee8bea93ffb309fc88Keith Whitwell      lp_scene_enqueue( rast->full_scenes, scene );
8009509f73c2147a9e225b5ef69a646e5dd711573f5Brian Paul
801aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul      /* signal the threads that there's work to do */
802aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul      for (i = 0; i < rast->num_threads; i++) {
803aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul         pipe_semaphore_signal(&rast->tasks[i].work_ready);
804aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul      }
805aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul
806aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul      /* wait for work to complete */
807aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul      for (i = 0; i < rast->num_threads; i++) {
808aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul         pipe_semaphore_wait(&rast->tasks[i].work_done);
809cdaea049c95031338040b31ff31944c8a001a1ddBrian Paul      }
810cdaea049c95031338040b31ff31944c8a001a1ddBrian Paul   }
81101b1900084152dbacd4025a31ced25f75666ce59Brian Paul
81201b1900084152dbacd4025a31ced25f75666ce59Brian Paul   LP_DBG(DEBUG_SETUP, "%s done \n", __FUNCTION__);
81301b1900084152dbacd4025a31ced25f75666ce59Brian Paul}
81401b1900084152dbacd4025a31ced25f75666ce59Brian Paul
81501b1900084152dbacd4025a31ced25f75666ce59Brian Paul
816aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul/**
817aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul * This is the thread's main entrypoint.
818aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul * It's a simple loop:
819aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul *   1. wait for work
820aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul *   2. do work
821aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul *   3. signal that we're done
822aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul */
823a1af8eec66c5f7ec421e8011b41c1a7c36319f9fJosé Fonsecastatic PIPE_THREAD_ROUTINE( thread_func, init_data )
824aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul{
825aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul   struct lp_rasterizer_task *task = (struct lp_rasterizer_task *) init_data;
826aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul   struct lp_rasterizer *rast = task->rast;
8279509f73c2147a9e225b5ef69a646e5dd711573f5Brian Paul   boolean debug = false;
828aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul
829aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul   while (1) {
830aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul      /* wait for work */
831aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul      if (debug)
832aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul         debug_printf("thread %d waiting for work\n", task->thread_index);
833aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul      pipe_semaphore_wait(&task->work_ready);
834aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul
8352bce5c195f94e2cce8f67c6a8066b0ae408487ceBrian Paul      if (task->thread_index == 0) {
8362bce5c195f94e2cce8f67c6a8066b0ae408487ceBrian Paul         /* thread[0]:
837663750d5564a225b4720f7ee8bea93ffb309fc88Keith Whitwell          *  - get next scene to rasterize
8382bce5c195f94e2cce8f67c6a8066b0ae408487ceBrian Paul          *  - map the framebuffer surfaces
8392bce5c195f94e2cce8f67c6a8066b0ae408487ceBrian Paul          */
8402bce5c195f94e2cce8f67c6a8066b0ae408487ceBrian Paul         const struct pipe_framebuffer_state *fb;
8412bce5c195f94e2cce8f67c6a8066b0ae408487ceBrian Paul         boolean write_depth;
8422bce5c195f94e2cce8f67c6a8066b0ae408487ceBrian Paul
843591401ff05f878ff1607a1a34db1319103025d8fKeith Whitwell         rast->curr_scene = lp_scene_dequeue( rast->full_scenes, TRUE );
8442bce5c195f94e2cce8f67c6a8066b0ae408487ceBrian Paul
845663750d5564a225b4720f7ee8bea93ffb309fc88Keith Whitwell         lp_scene_bin_iter_begin( rast->curr_scene );
8462bce5c195f94e2cce8f67c6a8066b0ae408487ceBrian Paul
847663750d5564a225b4720f7ee8bea93ffb309fc88Keith Whitwell         fb = &rast->curr_scene->fb;
848663750d5564a225b4720f7ee8bea93ffb309fc88Keith Whitwell         write_depth = rast->curr_scene->write_depth;
8492bce5c195f94e2cce8f67c6a8066b0ae408487ceBrian Paul
8502bce5c195f94e2cce8f67c6a8066b0ae408487ceBrian Paul         lp_rast_begin( rast, fb,
851c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell                        fb->nr_cbufs != 0,
8522bce5c195f94e2cce8f67c6a8066b0ae408487ceBrian Paul                        fb->zsbuf != NULL && write_depth );
8532bce5c195f94e2cce8f67c6a8066b0ae408487ceBrian Paul      }
8542bce5c195f94e2cce8f67c6a8066b0ae408487ceBrian Paul
8552bce5c195f94e2cce8f67c6a8066b0ae408487ceBrian Paul      /* Wait for all threads to get here so that threads[1+] don't
856663750d5564a225b4720f7ee8bea93ffb309fc88Keith Whitwell       * get a null rast->curr_scene pointer.
8572bce5c195f94e2cce8f67c6a8066b0ae408487ceBrian Paul       */
8582bce5c195f94e2cce8f67c6a8066b0ae408487ceBrian Paul      pipe_barrier_wait( &rast->barrier );
8599509f73c2147a9e225b5ef69a646e5dd711573f5Brian Paul
860aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul      /* do work */
861aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul      if (debug)
862aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul         debug_printf("thread %d doing work\n", task->thread_index);
863663750d5564a225b4720f7ee8bea93ffb309fc88Keith Whitwell      rasterize_scene(rast,
864663750d5564a225b4720f7ee8bea93ffb309fc88Keith Whitwell		     task->thread_index,
865663750d5564a225b4720f7ee8bea93ffb309fc88Keith Whitwell                     rast->curr_scene,
866663750d5564a225b4720f7ee8bea93ffb309fc88Keith Whitwell		     rast->curr_scene->write_depth);
8679509f73c2147a9e225b5ef69a646e5dd711573f5Brian Paul
868663750d5564a225b4720f7ee8bea93ffb309fc88Keith Whitwell      /* wait for all threads to finish with this scene */
8692bce5c195f94e2cce8f67c6a8066b0ae408487ceBrian Paul      pipe_barrier_wait( &rast->barrier );
8702bce5c195f94e2cce8f67c6a8066b0ae408487ceBrian Paul
8712bce5c195f94e2cce8f67c6a8066b0ae408487ceBrian Paul      if (task->thread_index == 0) {
8722bce5c195f94e2cce8f67c6a8066b0ae408487ceBrian Paul         /* thread[0]:
873663750d5564a225b4720f7ee8bea93ffb309fc88Keith Whitwell          * - release the scene object
8742bce5c195f94e2cce8f67c6a8066b0ae408487ceBrian Paul          * - unmap the framebuffer surfaces
8752bce5c195f94e2cce8f67c6a8066b0ae408487ceBrian Paul          */
876663750d5564a225b4720f7ee8bea93ffb309fc88Keith Whitwell         release_scene( rast, rast->curr_scene );
8772bce5c195f94e2cce8f67c6a8066b0ae408487ceBrian Paul         lp_rast_end( rast );
8782bce5c195f94e2cce8f67c6a8066b0ae408487ceBrian Paul      }
879aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul
880aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul      /* signal done with work */
881aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul      if (debug)
882aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul         debug_printf("thread %d done working\n", task->thread_index);
883aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul      pipe_semaphore_signal(&task->work_done);
884aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul   }
885aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul
886aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul   return NULL;
887aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul}
888aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul
889aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul
890aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul/**
891aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul * Initialize semaphores and spawn the threads.
892aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul */
893aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paulstatic void
894aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paulcreate_rast_threads(struct lp_rasterizer *rast)
895aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul{
896aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul   unsigned i;
897aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul
898ad60552ca19bce657eadaffd31db752e34e9cda3José Fonseca#ifdef PIPE_OS_WINDOWS
899ad60552ca19bce657eadaffd31db752e34e9cda3José Fonseca   /* Multithreading not supported on windows until conditions and barriers are
900ad60552ca19bce657eadaffd31db752e34e9cda3José Fonseca    * properly implemented. */
901ad60552ca19bce657eadaffd31db752e34e9cda3José Fonseca   rast->num_threads = 0;
902ad60552ca19bce657eadaffd31db752e34e9cda3José Fonseca#else
9037f457acabcbeea6a27b4f375f55e318fff52445fJosé Fonseca   rast->num_threads = util_cpu_caps.nr_cpus;
9047f457acabcbeea6a27b4f375f55e318fff52445fJosé Fonseca   rast->num_threads = debug_get_num_option("LP_NUM_THREADS", rast->num_threads);
905aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul   rast->num_threads = MIN2(rast->num_threads, MAX_THREADS);
906ad60552ca19bce657eadaffd31db752e34e9cda3José Fonseca#endif
907aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul
908aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul   /* NOTE: if num_threads is zero, we won't use any threads */
909aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul   for (i = 0; i < rast->num_threads; i++) {
910aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul      pipe_semaphore_init(&rast->tasks[i].work_ready, 0);
911aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul      pipe_semaphore_init(&rast->tasks[i].work_done, 0);
912aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul      rast->threads[i] = pipe_thread_create(thread_func,
913aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul                                            (void *) &rast->tasks[i]);
914aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul   }
915aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul}
916aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul
917aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul
918aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul
919d7dbc666367438ee9efe748505907b36bba6b66aBrian Paul/**
920d7dbc666367438ee9efe748505907b36bba6b66aBrian Paul * Create new lp_rasterizer.
921663750d5564a225b4720f7ee8bea93ffb309fc88Keith Whitwell * \param empty  the queue to put empty scenes on after we've finished
922d7dbc666367438ee9efe748505907b36bba6b66aBrian Paul *               processing them.
923d7dbc666367438ee9efe748505907b36bba6b66aBrian Paul */
924d7dbc666367438ee9efe748505907b36bba6b66aBrian Paulstruct lp_rasterizer *
925663750d5564a225b4720f7ee8bea93ffb309fc88Keith Whitwelllp_rast_create( struct pipe_screen *screen, struct lp_scene_queue *empty )
926aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul{
927aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul   struct lp_rasterizer *rast;
928c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell   unsigned i, cbuf;
929aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul
930aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul   rast = CALLOC_STRUCT(lp_rasterizer);
931aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul   if(!rast)
932aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul      return NULL;
933aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul
934aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul   rast->screen = screen;
935aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul
936663750d5564a225b4720f7ee8bea93ffb309fc88Keith Whitwell   rast->empty_scenes = empty;
937663750d5564a225b4720f7ee8bea93ffb309fc88Keith Whitwell   rast->full_scenes = lp_scene_queue_create();
938d7dbc666367438ee9efe748505907b36bba6b66aBrian Paul
939aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul   for (i = 0; i < Elements(rast->tasks); i++) {
940ec459f2aeca39e51f495cde455ba18d0a9489caaBrian Paul      struct lp_rasterizer_task *task = &rast->tasks[i];
941ec459f2aeca39e51f495cde455ba18d0a9489caaBrian Paul
942c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell      for (cbuf = 0; cbuf < PIPE_MAX_COLOR_BUFS; cbuf++ )
943ec459f2aeca39e51f495cde455ba18d0a9489caaBrian Paul	 task->tile.color[cbuf] = align_malloc(TILE_SIZE * TILE_SIZE * 4, 16);
944c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell
945ec459f2aeca39e51f495cde455ba18d0a9489caaBrian Paul      task->rast = rast;
946ec459f2aeca39e51f495cde455ba18d0a9489caaBrian Paul      task->thread_index = i;
947aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul   }
948aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul
949aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul   create_rast_threads(rast);
950aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul
9512bce5c195f94e2cce8f67c6a8066b0ae408487ceBrian Paul   /* for synchronizing rasterization threads */
9522bce5c195f94e2cce8f67c6a8066b0ae408487ceBrian Paul   pipe_barrier_init( &rast->barrier, rast->num_threads );
9532bce5c195f94e2cce8f67c6a8066b0ae408487ceBrian Paul
954aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul   return rast;
955aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul}
956aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul
957b533b56750aca8c7e8cb22af93a0fc2a0cfc0d97Brian Paul
95889498d01531cd515c769e570bf799c39fbafc8fbKeith Whitwell/* Shutdown:
95989498d01531cd515c769e570bf799c39fbafc8fbKeith Whitwell */
96089498d01531cd515c769e570bf799c39fbafc8fbKeith Whitwellvoid lp_rast_destroy( struct lp_rasterizer *rast )
96189498d01531cd515c769e570bf799c39fbafc8fbKeith Whitwell{
962c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell   unsigned i, cbuf;
9633a06c113c76355fc9622adfe7565c18d9787e9a8Brian Paul
964156eabbaf996f471458ee2a69078674277b89067Brian Paul   util_unreference_framebuffer_state(&rast->state.fb);
9653a06c113c76355fc9622adfe7565c18d9787e9a8Brian Paul
9663a06c113c76355fc9622adfe7565c18d9787e9a8Brian Paul   for (i = 0; i < Elements(rast->tasks); i++) {
967c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell      for (cbuf = 0; cbuf < PIPE_MAX_COLOR_BUFS; cbuf++ )
968c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell	 align_free(rast->tasks[i].tile.color[cbuf]);
9693a06c113c76355fc9622adfe7565c18d9787e9a8Brian Paul   }
9703a06c113c76355fc9622adfe7565c18d9787e9a8Brian Paul
9712bce5c195f94e2cce8f67c6a8066b0ae408487ceBrian Paul   /* for synchronizing rasterization threads */
9722bce5c195f94e2cce8f67c6a8066b0ae408487ceBrian Paul   pipe_barrier_destroy( &rast->barrier );
9732bce5c195f94e2cce8f67c6a8066b0ae408487ceBrian Paul
97489498d01531cd515c769e570bf799c39fbafc8fbKeith Whitwell   FREE(rast);
97589498d01531cd515c769e570bf799c39fbafc8fbKeith Whitwell}
97689498d01531cd515c769e570bf799c39fbafc8fbKeith Whitwell
977932374073863379e9da862d6115410889f038154Brian Paul
978932374073863379e9da862d6115410889f038154Brian Paul/** Return number of rasterization threads */
979932374073863379e9da862d6115410889f038154Brian Paulunsigned
980932374073863379e9da862d6115410889f038154Brian Paullp_rast_get_num_threads( struct lp_rasterizer *rast )
981932374073863379e9da862d6115410889f038154Brian Paul{
982932374073863379e9da862d6115410889f038154Brian Paul   return rast->num_threads;
983932374073863379e9da862d6115410889f038154Brian Paul}
984