lp_rast.c revision 5e6a9005100ec2636ce9734a5e4535216494cf60
1d614ced756f2cca64ec83b122da4cd028c08c0ebJosé Fonseca/************************************************************************** 2d614ced756f2cca64ec83b122da4cd028c08c0ebJosé Fonseca * 3d614ced756f2cca64ec83b122da4cd028c08c0ebJosé Fonseca * Copyright 2009 VMware, Inc. 4d614ced756f2cca64ec83b122da4cd028c08c0ebJosé Fonseca * All Rights Reserved. 5d614ced756f2cca64ec83b122da4cd028c08c0ebJosé Fonseca * 6d614ced756f2cca64ec83b122da4cd028c08c0ebJosé Fonseca * Permission is hereby granted, free of charge, to any person obtaining a 7d614ced756f2cca64ec83b122da4cd028c08c0ebJosé Fonseca * copy of this software and associated documentation files (the 8d614ced756f2cca64ec83b122da4cd028c08c0ebJosé Fonseca * "Software"), to deal in the Software without restriction, including 9d614ced756f2cca64ec83b122da4cd028c08c0ebJosé Fonseca * without limitation the rights to use, copy, modify, merge, publish, 10d614ced756f2cca64ec83b122da4cd028c08c0ebJosé Fonseca * distribute, sub license, and/or sell copies of the Software, and to 11d614ced756f2cca64ec83b122da4cd028c08c0ebJosé Fonseca * permit persons to whom the Software is furnished to do so, subject to 12d614ced756f2cca64ec83b122da4cd028c08c0ebJosé Fonseca * the following conditions: 13d614ced756f2cca64ec83b122da4cd028c08c0ebJosé Fonseca * 14d614ced756f2cca64ec83b122da4cd028c08c0ebJosé Fonseca * The above copyright notice and this permission notice (including the 15d614ced756f2cca64ec83b122da4cd028c08c0ebJosé Fonseca * next paragraph) shall be included in all copies or substantial portions 16d614ced756f2cca64ec83b122da4cd028c08c0ebJosé Fonseca * of the Software. 17d614ced756f2cca64ec83b122da4cd028c08c0ebJosé Fonseca * 18d614ced756f2cca64ec83b122da4cd028c08c0ebJosé Fonseca * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS 19d614ced756f2cca64ec83b122da4cd028c08c0ebJosé Fonseca * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF 20d614ced756f2cca64ec83b122da4cd028c08c0ebJosé Fonseca * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. 21d614ced756f2cca64ec83b122da4cd028c08c0ebJosé Fonseca * IN NO EVENT SHALL VMWARE AND/OR ITS SUPPLIERS BE LIABLE FOR 22d614ced756f2cca64ec83b122da4cd028c08c0ebJosé Fonseca * ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, 23d614ced756f2cca64ec83b122da4cd028c08c0ebJosé Fonseca * TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE 24d614ced756f2cca64ec83b122da4cd028c08c0ebJosé Fonseca * SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE. 25d614ced756f2cca64ec83b122da4cd028c08c0ebJosé Fonseca * 26d614ced756f2cca64ec83b122da4cd028c08c0ebJosé Fonseca **************************************************************************/ 27d614ced756f2cca64ec83b122da4cd028c08c0ebJosé Fonseca 28ab9438193083b7f9a3180cb9cea45e269131048aBrian Paul#include <limits.h> 29d614ced756f2cca64ec83b122da4cd028c08c0ebJosé Fonseca#include "util/u_memory.h" 30aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul#include "util/u_math.h" 317f457acabcbeea6a27b4f375f55e318fff52445fJosé Fonseca#include "util/u_cpu_detect.h" 32156eabbaf996f471458ee2a69078674277b89067Brian Paul#include "util/u_surface.h" 33d614ced756f2cca64ec83b122da4cd028c08c0ebJosé Fonseca 34663750d5564a225b4720f7ee8bea93ffb309fc88Keith Whitwell#include "lp_scene_queue.h" 35a08d6302168341001003da32d42cfcff2311fa04Brian Paul#include "lp_debug.h" 364b70af918dd9040a6987c6a55e76e49f0e3f90bfBrian Paul#include "lp_fence.h" 374aeacdf8530d69d543cb2b997c1e65edb71ae01aBrian Paul#include "lp_perf.h" 38d614ced756f2cca64ec83b122da4cd028c08c0ebJosé Fonseca#include "lp_rast.h" 39921584181eb2f3b2849d150295dfce1dae25dd11José Fonseca#include "lp_rast_priv.h" 40921584181eb2f3b2849d150295dfce1dae25dd11José Fonseca#include "lp_tile_soa.h" 41c61bf363937f40624a5632745630d4f2b9907082Zack Rusin#include "gallivm/lp_bld_debug.h" 42663750d5564a225b4720f7ee8bea93ffb309fc88Keith Whitwell#include "lp_scene.h" 43d614ced756f2cca64ec83b122da4cd028c08c0ebJosé Fonseca 4489498d01531cd515c769e570bf799c39fbafc8fbKeith Whitwell 457505510c7b7c33f3c571647c0398da7e1b823806Brian Paul/** 467505510c7b7c33f3c571647c0398da7e1b823806Brian Paul * Begin the rasterization phase. 477505510c7b7c33f3c571647c0398da7e1b823806Brian Paul * Map the framebuffer surfaces. Initialize the 'rast' state. 487505510c7b7c33f3c571647c0398da7e1b823806Brian Paul */ 4901b1900084152dbacd4025a31ced25f75666ce59Brian Paulstatic boolean 5001b1900084152dbacd4025a31ced25f75666ce59Brian Paullp_rast_begin( struct lp_rasterizer *rast, 51156eabbaf996f471458ee2a69078674277b89067Brian Paul const struct pipe_framebuffer_state *fb, 52156eabbaf996f471458ee2a69078674277b89067Brian Paul boolean write_color, 53156eabbaf996f471458ee2a69078674277b89067Brian Paul boolean write_zstencil ) 5484ab7dcf48e87350c0622c533e51aa495f7256c2Keith Whitwell{ 55e0e2008f1dcd73a59a184e0ef4c1dd77ac2a1cbfKeith Whitwell struct pipe_screen *screen = rast->screen; 56156eabbaf996f471458ee2a69078674277b89067Brian Paul struct pipe_surface *cbuf, *zsbuf; 57c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell int i; 58e0e2008f1dcd73a59a184e0ef4c1dd77ac2a1cbfKeith Whitwell 59156eabbaf996f471458ee2a69078674277b89067Brian Paul LP_DBG(DEBUG_RAST, "%s\n", __FUNCTION__); 604e1334ced68dd25b151250a44af25e8e0d5a33feKeith Whitwell 61156eabbaf996f471458ee2a69078674277b89067Brian Paul util_copy_framebuffer_state(&rast->state.fb, fb); 62e0e2008f1dcd73a59a184e0ef4c1dd77ac2a1cbfKeith Whitwell 63e0e2008f1dcd73a59a184e0ef4c1dd77ac2a1cbfKeith Whitwell rast->state.write_zstencil = write_zstencil; 64e0e2008f1dcd73a59a184e0ef4c1dd77ac2a1cbfKeith Whitwell rast->state.write_color = write_color; 65e0e2008f1dcd73a59a184e0ef4c1dd77ac2a1cbfKeith Whitwell 66156eabbaf996f471458ee2a69078674277b89067Brian Paul rast->check_for_clipped_tiles = (fb->width % TILE_SIZE != 0 || 67156eabbaf996f471458ee2a69078674277b89067Brian Paul fb->height % TILE_SIZE != 0); 6884ab7dcf48e87350c0622c533e51aa495f7256c2Keith Whitwell 69c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell 70c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell for (i = 0; i < rast->state.fb.nr_cbufs; i++) { 71c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell cbuf = rast->state.fb.cbufs[i]; 72c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell if (cbuf) { 73c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell rast->cbuf_transfer[i] = screen->get_tex_transfer(rast->screen, 74c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell cbuf->texture, 75c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell cbuf->face, 76c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell cbuf->level, 77c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell cbuf->zslice, 78c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell PIPE_TRANSFER_READ_WRITE, 79c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell 0, 0, 80c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell cbuf->width, 81c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell cbuf->height); 82c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell if (!rast->cbuf_transfer[i]) 83c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell goto fail; 84c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell 85c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell rast->cbuf_map[i] = screen->transfer_map(rast->screen, 86c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell rast->cbuf_transfer[i]); 87c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell if (!rast->cbuf_map[i]) 88c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell goto fail; 89c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell } 90e0e2008f1dcd73a59a184e0ef4c1dd77ac2a1cbfKeith Whitwell } 914e1334ced68dd25b151250a44af25e8e0d5a33feKeith Whitwell 92156eabbaf996f471458ee2a69078674277b89067Brian Paul zsbuf = rast->state.fb.zsbuf; 9351663f0506ed2534e57b798cdfaf8a0d376eb7a2Brian Paul if (zsbuf) { 9451663f0506ed2534e57b798cdfaf8a0d376eb7a2Brian Paul rast->zsbuf_transfer = screen->get_tex_transfer(rast->screen, 95156eabbaf996f471458ee2a69078674277b89067Brian Paul zsbuf->texture, 96156eabbaf996f471458ee2a69078674277b89067Brian Paul zsbuf->face, 97156eabbaf996f471458ee2a69078674277b89067Brian Paul zsbuf->level, 98156eabbaf996f471458ee2a69078674277b89067Brian Paul zsbuf->zslice, 99156eabbaf996f471458ee2a69078674277b89067Brian Paul PIPE_TRANSFER_READ_WRITE, 100156eabbaf996f471458ee2a69078674277b89067Brian Paul 0, 0, 101c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell zsbuf->width, 102c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell zsbuf->height); 10351663f0506ed2534e57b798cdfaf8a0d376eb7a2Brian Paul if (!rast->zsbuf_transfer) 104c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell goto fail; 10551663f0506ed2534e57b798cdfaf8a0d376eb7a2Brian Paul 10651663f0506ed2534e57b798cdfaf8a0d376eb7a2Brian Paul rast->zsbuf_map = screen->transfer_map(rast->screen, 10751663f0506ed2534e57b798cdfaf8a0d376eb7a2Brian Paul rast->zsbuf_transfer); 10851663f0506ed2534e57b798cdfaf8a0d376eb7a2Brian Paul if (!rast->zsbuf_map) 109c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell goto fail; 11051663f0506ed2534e57b798cdfaf8a0d376eb7a2Brian Paul } 11151663f0506ed2534e57b798cdfaf8a0d376eb7a2Brian Paul 112e0e2008f1dcd73a59a184e0ef4c1dd77ac2a1cbfKeith Whitwell return TRUE; 113c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell 114c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwellfail: 115c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell /* Unmap and release transfers? 116c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell */ 117c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell return FALSE; 1180718c7700533a965d7cd06b4f67b82bbae6e66a1Keith Whitwell} 1190718c7700533a965d7cd06b4f67b82bbae6e66a1Keith Whitwell 120e0e2008f1dcd73a59a184e0ef4c1dd77ac2a1cbfKeith Whitwell 1217505510c7b7c33f3c571647c0398da7e1b823806Brian Paul/** 1227505510c7b7c33f3c571647c0398da7e1b823806Brian Paul * Finish the rasterization phase. 1237505510c7b7c33f3c571647c0398da7e1b823806Brian Paul * Unmap framebuffer surfaces. 1247505510c7b7c33f3c571647c0398da7e1b823806Brian Paul */ 12501b1900084152dbacd4025a31ced25f75666ce59Brian Paulstatic void 12601b1900084152dbacd4025a31ced25f75666ce59Brian Paullp_rast_end( struct lp_rasterizer *rast ) 1270718c7700533a965d7cd06b4f67b82bbae6e66a1Keith Whitwell{ 128e0e2008f1dcd73a59a184e0ef4c1dd77ac2a1cbfKeith Whitwell struct pipe_screen *screen = rast->screen; 129c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell unsigned i; 1304e1334ced68dd25b151250a44af25e8e0d5a33feKeith Whitwell 131c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell for (i = 0; i < rast->state.fb.nr_cbufs; i++) { 132c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell if (rast->cbuf_map[i]) 133c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell screen->transfer_unmap(screen, rast->cbuf_transfer[i]); 134c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell 135c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell if (rast->cbuf_transfer[i]) 136c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell screen->tex_transfer_destroy(rast->cbuf_transfer[i]); 137c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell 138c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell rast->cbuf_transfer[i] = NULL; 139c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell rast->cbuf_map[i] = NULL; 140c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell } 141e0e2008f1dcd73a59a184e0ef4c1dd77ac2a1cbfKeith Whitwell 142e0e2008f1dcd73a59a184e0ef4c1dd77ac2a1cbfKeith Whitwell if (rast->zsbuf_map) 143e0e2008f1dcd73a59a184e0ef4c1dd77ac2a1cbfKeith Whitwell screen->transfer_unmap(screen, rast->zsbuf_transfer); 144e0e2008f1dcd73a59a184e0ef4c1dd77ac2a1cbfKeith Whitwell 145e0e2008f1dcd73a59a184e0ef4c1dd77ac2a1cbfKeith Whitwell if (rast->zsbuf_transfer) 14651663f0506ed2534e57b798cdfaf8a0d376eb7a2Brian Paul screen->tex_transfer_destroy(rast->zsbuf_transfer); 147e0e2008f1dcd73a59a184e0ef4c1dd77ac2a1cbfKeith Whitwell 148e0e2008f1dcd73a59a184e0ef4c1dd77ac2a1cbfKeith Whitwell rast->zsbuf_transfer = NULL; 149e0e2008f1dcd73a59a184e0ef4c1dd77ac2a1cbfKeith Whitwell rast->zsbuf_map = NULL; 15089498d01531cd515c769e570bf799c39fbafc8fbKeith Whitwell} 15189498d01531cd515c769e570bf799c39fbafc8fbKeith Whitwell 152d0c918b87a9fb0e86d6b3efedf3ef505e04c527fKeith Whitwell 1537505510c7b7c33f3c571647c0398da7e1b823806Brian Paul/** 1547505510c7b7c33f3c571647c0398da7e1b823806Brian Paul * Begining rasterization of a tile. 1557505510c7b7c33f3c571647c0398da7e1b823806Brian Paul * \param x window X position of the tile, in pixels 1567505510c7b7c33f3c571647c0398da7e1b823806Brian Paul * \param y window Y position of the tile, in pixels 15789498d01531cd515c769e570bf799c39fbafc8fbKeith Whitwell */ 158b533b56750aca8c7e8cb22af93a0fc2a0cfc0d97Brian Paulstatic void 159b533b56750aca8c7e8cb22af93a0fc2a0cfc0d97Brian Paullp_rast_start_tile( struct lp_rasterizer *rast, 1603a06c113c76355fc9622adfe7565c18d9787e9a8Brian Paul unsigned thread_index, 161b533b56750aca8c7e8cb22af93a0fc2a0cfc0d97Brian Paul unsigned x, unsigned y ) 16289498d01531cd515c769e570bf799c39fbafc8fbKeith Whitwell{ 163a08d6302168341001003da32d42cfcff2311fa04Brian Paul LP_DBG(DEBUG_RAST, "%s %d,%d\n", __FUNCTION__, x, y); 1644e1334ced68dd25b151250a44af25e8e0d5a33feKeith Whitwell 1653a06c113c76355fc9622adfe7565c18d9787e9a8Brian Paul rast->tasks[thread_index].x = x; 1663a06c113c76355fc9622adfe7565c18d9787e9a8Brian Paul rast->tasks[thread_index].y = y; 16789498d01531cd515c769e570bf799c39fbafc8fbKeith Whitwell} 16889498d01531cd515c769e570bf799c39fbafc8fbKeith Whitwell 1697505510c7b7c33f3c571647c0398da7e1b823806Brian Paul 1707505510c7b7c33f3c571647c0398da7e1b823806Brian Paul/** 1717505510c7b7c33f3c571647c0398da7e1b823806Brian Paul * Clear the rasterizer's current color tile. 172ffd0759973165368ac8ce07d9bcffeb0acf88e6fBrian Paul * This is a bin command called during bin processing. 1737505510c7b7c33f3c571647c0398da7e1b823806Brian Paul */ 174d0c918b87a9fb0e86d6b3efedf3ef505e04c527fKeith Whitwellvoid lp_rast_clear_color( struct lp_rasterizer *rast, 1753a06c113c76355fc9622adfe7565c18d9787e9a8Brian Paul unsigned thread_index, 1764cdd10cb4b60d85f6c231a26739f7d5e264a05e5Keith Whitwell const union lp_rast_cmd_arg arg ) 17789498d01531cd515c769e570bf799c39fbafc8fbKeith Whitwell{ 1784cdd10cb4b60d85f6c231a26739f7d5e264a05e5Keith Whitwell const uint8_t *clear_color = arg.clear_color; 179c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell uint8_t **color_tile = rast->tasks[thread_index].tile.color; 180c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell unsigned i; 181c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell 182a08d6302168341001003da32d42cfcff2311fa04Brian Paul LP_DBG(DEBUG_RAST, "%s 0x%x,0x%x,0x%x,0x%x\n", __FUNCTION__, 183295aea04895676aae5b67a7016c62bab8e40b996Keith Whitwell clear_color[0], 184295aea04895676aae5b67a7016c62bab8e40b996Keith Whitwell clear_color[1], 185295aea04895676aae5b67a7016c62bab8e40b996Keith Whitwell clear_color[2], 186295aea04895676aae5b67a7016c62bab8e40b996Keith Whitwell clear_color[3]); 1874e1334ced68dd25b151250a44af25e8e0d5a33feKeith Whitwell 18837b86aa55c6bb520997c00dbf1a2b38d4aed38ebJosé Fonseca if (clear_color[0] == clear_color[1] && 18937b86aa55c6bb520997c00dbf1a2b38d4aed38ebJosé Fonseca clear_color[1] == clear_color[2] && 19037b86aa55c6bb520997c00dbf1a2b38d4aed38ebJosé Fonseca clear_color[2] == clear_color[3]) { 191f94a99170ecdc3286408b3628fbae9f45518007eBrian Paul /* clear to grayscale value {x, x, x, x} */ 192c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell for (i = 0; i < rast->state.fb.nr_cbufs; i++) { 193c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell memset(color_tile[i], clear_color[0], TILE_SIZE * TILE_SIZE * 4); 194c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell } 19537b86aa55c6bb520997c00dbf1a2b38d4aed38ebJosé Fonseca } 19637b86aa55c6bb520997c00dbf1a2b38d4aed38ebJosé Fonseca else { 197f94a99170ecdc3286408b3628fbae9f45518007eBrian Paul /* Non-gray color. 198f94a99170ecdc3286408b3628fbae9f45518007eBrian Paul * Note: if the swizzled tile layout changes (see TILE_PIXEL) this code 199f94a99170ecdc3286408b3628fbae9f45518007eBrian Paul * will need to change. It'll be pretty obvious when clearing no longer 200f94a99170ecdc3286408b3628fbae9f45518007eBrian Paul * works. 201f94a99170ecdc3286408b3628fbae9f45518007eBrian Paul */ 202f94a99170ecdc3286408b3628fbae9f45518007eBrian Paul const unsigned chunk = TILE_SIZE / 4; 203f94a99170ecdc3286408b3628fbae9f45518007eBrian Paul for (i = 0; i < rast->state.fb.nr_cbufs; i++) { 204f94a99170ecdc3286408b3628fbae9f45518007eBrian Paul uint8_t *c = color_tile[i]; 205f94a99170ecdc3286408b3628fbae9f45518007eBrian Paul unsigned j; 206f94a99170ecdc3286408b3628fbae9f45518007eBrian Paul for (j = 0; j < 4 * TILE_SIZE; j++) { 207f94a99170ecdc3286408b3628fbae9f45518007eBrian Paul memset(c, clear_color[0], chunk); 208f94a99170ecdc3286408b3628fbae9f45518007eBrian Paul c += chunk; 209f94a99170ecdc3286408b3628fbae9f45518007eBrian Paul memset(c, clear_color[1], chunk); 210f94a99170ecdc3286408b3628fbae9f45518007eBrian Paul c += chunk; 211f94a99170ecdc3286408b3628fbae9f45518007eBrian Paul memset(c, clear_color[2], chunk); 212f94a99170ecdc3286408b3628fbae9f45518007eBrian Paul c += chunk; 213f94a99170ecdc3286408b3628fbae9f45518007eBrian Paul memset(c, clear_color[3], chunk); 214f94a99170ecdc3286408b3628fbae9f45518007eBrian Paul c += chunk; 215f94a99170ecdc3286408b3628fbae9f45518007eBrian Paul } 216f94a99170ecdc3286408b3628fbae9f45518007eBrian Paul assert(c - color_tile[i] == TILE_SIZE * TILE_SIZE * 4); 217f94a99170ecdc3286408b3628fbae9f45518007eBrian Paul } 21837b86aa55c6bb520997c00dbf1a2b38d4aed38ebJosé Fonseca } 2194aeacdf8530d69d543cb2b997c1e65edb71ae01aBrian Paul 2204aeacdf8530d69d543cb2b997c1e65edb71ae01aBrian Paul LP_COUNT(nr_color_tile_clear); 22189498d01531cd515c769e570bf799c39fbafc8fbKeith Whitwell} 22289498d01531cd515c769e570bf799c39fbafc8fbKeith Whitwell 2237505510c7b7c33f3c571647c0398da7e1b823806Brian Paul 2247505510c7b7c33f3c571647c0398da7e1b823806Brian Paul/** 2257505510c7b7c33f3c571647c0398da7e1b823806Brian Paul * Clear the rasterizer's current z/stencil tile. 226ffd0759973165368ac8ce07d9bcffeb0acf88e6fBrian Paul * This is a bin command called during bin processing. 2277505510c7b7c33f3c571647c0398da7e1b823806Brian Paul */ 228d0c918b87a9fb0e86d6b3efedf3ef505e04c527fKeith Whitwellvoid lp_rast_clear_zstencil( struct lp_rasterizer *rast, 2293a06c113c76355fc9622adfe7565c18d9787e9a8Brian Paul unsigned thread_index, 2304cdd10cb4b60d85f6c231a26739f7d5e264a05e5Keith Whitwell const union lp_rast_cmd_arg arg) 23189498d01531cd515c769e570bf799c39fbafc8fbKeith Whitwell{ 2325e6a9005100ec2636ce9734a5e4535216494cf60José Fonseca struct lp_rasterizer_task *task = &rast->tasks[thread_index]; 2335e6a9005100ec2636ce9734a5e4535216494cf60José Fonseca const unsigned tile_x = task->x; 2345e6a9005100ec2636ce9734a5e4535216494cf60José Fonseca const unsigned tile_y = task->y; 2355e6a9005100ec2636ce9734a5e4535216494cf60José Fonseca const unsigned height = TILE_SIZE/TILE_VECTOR_HEIGHT; 2365e6a9005100ec2636ce9734a5e4535216494cf60José Fonseca const unsigned width = TILE_SIZE*TILE_VECTOR_HEIGHT; 2375e6a9005100ec2636ce9734a5e4535216494cf60José Fonseca unsigned block_size = util_format_get_blocksize(rast->zsbuf_transfer->texture->format); 2385e6a9005100ec2636ce9734a5e4535216494cf60José Fonseca uint8_t *dst; 2395e6a9005100ec2636ce9734a5e4535216494cf60José Fonseca unsigned dst_stride = rast->zsbuf_transfer->stride*TILE_VECTOR_HEIGHT; 2405e6a9005100ec2636ce9734a5e4535216494cf60José Fonseca unsigned i, j; 2415e6a9005100ec2636ce9734a5e4535216494cf60José Fonseca 242a08d6302168341001003da32d42cfcff2311fa04Brian Paul LP_DBG(DEBUG_RAST, "%s 0x%x\n", __FUNCTION__, arg.clear_zstencil); 2434e1334ced68dd25b151250a44af25e8e0d5a33feKeith Whitwell 2445e6a9005100ec2636ce9734a5e4535216494cf60José Fonseca assert(rast->zsbuf_map); 2455e6a9005100ec2636ce9734a5e4535216494cf60José Fonseca if (!rast->zsbuf_map) 2465e6a9005100ec2636ce9734a5e4535216494cf60José Fonseca return; 2475e6a9005100ec2636ce9734a5e4535216494cf60José Fonseca 2485e6a9005100ec2636ce9734a5e4535216494cf60José Fonseca LP_DBG(DEBUG_RAST, "%s\n", __FUNCTION__); 2495e6a9005100ec2636ce9734a5e4535216494cf60José Fonseca 2505e6a9005100ec2636ce9734a5e4535216494cf60José Fonseca /* 2515e6a9005100ec2636ce9734a5e4535216494cf60José Fonseca * Clear the aera of the swizzled depth/depth buffer matching this tile, in 2525e6a9005100ec2636ce9734a5e4535216494cf60José Fonseca * stripes of TILE_VECTOR_HEIGHT x TILE_SIZE at a time. 2535e6a9005100ec2636ce9734a5e4535216494cf60José Fonseca * 2545e6a9005100ec2636ce9734a5e4535216494cf60José Fonseca * The swizzled depth format is such that the depths for 2555e6a9005100ec2636ce9734a5e4535216494cf60José Fonseca * TILE_VECTOR_HEIGHT x TILE_VECTOR_WIDTH pixels have consecutive offsets. 2565e6a9005100ec2636ce9734a5e4535216494cf60José Fonseca */ 2575e6a9005100ec2636ce9734a5e4535216494cf60José Fonseca 2585e6a9005100ec2636ce9734a5e4535216494cf60José Fonseca dst = lp_rast_depth_pointer(rast, tile_x, tile_y); 2595e6a9005100ec2636ce9734a5e4535216494cf60José Fonseca 2605e6a9005100ec2636ce9734a5e4535216494cf60José Fonseca switch (block_size) { 2615e6a9005100ec2636ce9734a5e4535216494cf60José Fonseca case 1: 2625e6a9005100ec2636ce9734a5e4535216494cf60José Fonseca memset(dst, (uint8_t) arg.clear_zstencil, height * width); 2635e6a9005100ec2636ce9734a5e4535216494cf60José Fonseca break; 2645e6a9005100ec2636ce9734a5e4535216494cf60José Fonseca case 2: 2655e6a9005100ec2636ce9734a5e4535216494cf60José Fonseca for (i = 0; i < height; i++) { 2665e6a9005100ec2636ce9734a5e4535216494cf60José Fonseca uint16_t *row = (uint16_t *)dst; 2675e6a9005100ec2636ce9734a5e4535216494cf60José Fonseca for (j = 0; j < width; j++) 2685e6a9005100ec2636ce9734a5e4535216494cf60José Fonseca *row++ = (uint16_t) arg.clear_zstencil; 2695e6a9005100ec2636ce9734a5e4535216494cf60José Fonseca dst += dst_stride; 2705e6a9005100ec2636ce9734a5e4535216494cf60José Fonseca } 2715e6a9005100ec2636ce9734a5e4535216494cf60José Fonseca break; 2725e6a9005100ec2636ce9734a5e4535216494cf60José Fonseca case 4: 2735e6a9005100ec2636ce9734a5e4535216494cf60José Fonseca for (i = 0; i < height; i++) { 2745e6a9005100ec2636ce9734a5e4535216494cf60José Fonseca uint32_t *row = (uint32_t *)dst; 2755e6a9005100ec2636ce9734a5e4535216494cf60José Fonseca for (j = 0; j < width; j++) 2765e6a9005100ec2636ce9734a5e4535216494cf60José Fonseca *row++ = arg.clear_zstencil; 2775e6a9005100ec2636ce9734a5e4535216494cf60José Fonseca dst += dst_stride; 2785e6a9005100ec2636ce9734a5e4535216494cf60José Fonseca } 2795e6a9005100ec2636ce9734a5e4535216494cf60José Fonseca break; 2805e6a9005100ec2636ce9734a5e4535216494cf60José Fonseca default: 2815e6a9005100ec2636ce9734a5e4535216494cf60José Fonseca assert(0); 2825e6a9005100ec2636ce9734a5e4535216494cf60José Fonseca break; 2835e6a9005100ec2636ce9734a5e4535216494cf60José Fonseca } 28489498d01531cd515c769e570bf799c39fbafc8fbKeith Whitwell} 28589498d01531cd515c769e570bf799c39fbafc8fbKeith Whitwell 28689498d01531cd515c769e570bf799c39fbafc8fbKeith Whitwell 287ffd0759973165368ac8ce07d9bcffeb0acf88e6fBrian Paul/** 288ffd0759973165368ac8ce07d9bcffeb0acf88e6fBrian Paul * Load tile color from the framebuffer surface. 289ffd0759973165368ac8ce07d9bcffeb0acf88e6fBrian Paul * This is a bin command called during bin processing. 290ffd0759973165368ac8ce07d9bcffeb0acf88e6fBrian Paul */ 291d0c918b87a9fb0e86d6b3efedf3ef505e04c527fKeith Whitwellvoid lp_rast_load_color( struct lp_rasterizer *rast, 2923a06c113c76355fc9622adfe7565c18d9787e9a8Brian Paul unsigned thread_index, 2934cdd10cb4b60d85f6c231a26739f7d5e264a05e5Keith Whitwell const union lp_rast_cmd_arg arg) 29489498d01531cd515c769e570bf799c39fbafc8fbKeith Whitwell{ 29592dc0f92b0f0fa2f3e4ba832ef2232169ce19ce8Brian Paul struct lp_rasterizer_task *task = &rast->tasks[thread_index]; 29692dc0f92b0f0fa2f3e4ba832ef2232169ce19ce8Brian Paul const unsigned x = task->x; 29792dc0f92b0f0fa2f3e4ba832ef2232169ce19ce8Brian Paul const unsigned y = task->y; 298c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell unsigned i; 29992dc0f92b0f0fa2f3e4ba832ef2232169ce19ce8Brian Paul 30092dc0f92b0f0fa2f3e4ba832ef2232169ce19ce8Brian Paul LP_DBG(DEBUG_RAST, "%s at %u, %u\n", __FUNCTION__, x, y); 30192dc0f92b0f0fa2f3e4ba832ef2232169ce19ce8Brian Paul 302c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell for (i = 0; i < rast->state.fb.nr_cbufs; i++) { 303c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell struct pipe_transfer *transfer = rast->cbuf_transfer[i]; 304c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell int w = TILE_SIZE; 305c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell int h = TILE_SIZE; 30692dc0f92b0f0fa2f3e4ba832ef2232169ce19ce8Brian Paul 307c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell if (x >= transfer->width) 308c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell continue; 30992dc0f92b0f0fa2f3e4ba832ef2232169ce19ce8Brian Paul 310c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell if (y >= transfer->height) 311c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell continue; 312c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell 313c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell assert(w >= 0); 314c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell assert(h >= 0); 315c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell assert(w <= TILE_SIZE); 316c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell assert(h <= TILE_SIZE); 317c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell 318c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell lp_tile_read_4ub(transfer->texture->format, 319ec459f2aeca39e51f495cde455ba18d0a9489caaBrian Paul task->tile.color[i], 320c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell rast->cbuf_map[i], 321c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell transfer->stride, 322c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell x, y, 323c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell w, h); 3244aeacdf8530d69d543cb2b997c1e65edb71ae01aBrian Paul 3254aeacdf8530d69d543cb2b997c1e65edb71ae01aBrian Paul LP_COUNT(nr_color_tile_load); 326c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell } 32789498d01531cd515c769e570bf799c39fbafc8fbKeith Whitwell} 32889498d01531cd515c769e570bf799c39fbafc8fbKeith Whitwell 329ffd0759973165368ac8ce07d9bcffeb0acf88e6fBrian Paul 330ffd0759973165368ac8ce07d9bcffeb0acf88e6fBrian Paulvoid lp_rast_set_state( struct lp_rasterizer *rast, 3313a06c113c76355fc9622adfe7565c18d9787e9a8Brian Paul unsigned thread_index, 332ffd0759973165368ac8ce07d9bcffeb0acf88e6fBrian Paul const union lp_rast_cmd_arg arg ) 333ffd0759973165368ac8ce07d9bcffeb0acf88e6fBrian Paul{ 334e2f46344560f8f1193b311ad41883011e67eea00Brian Paul const struct lp_rast_state *state = arg.set_state; 335e2f46344560f8f1193b311ad41883011e67eea00Brian Paul 336a08d6302168341001003da32d42cfcff2311fa04Brian Paul LP_DBG(DEBUG_RAST, "%s %p\n", __FUNCTION__, (void *) state); 337ffd0759973165368ac8ce07d9bcffeb0acf88e6fBrian Paul 338b1659b9213f3eeee440590dfe379f0d193948307Brian Paul /* just set the current state pointer for this rasterizer */ 3393a06c113c76355fc9622adfe7565c18d9787e9a8Brian Paul rast->tasks[thread_index].current_state = state; 340ffd0759973165368ac8ce07d9bcffeb0acf88e6fBrian Paul} 341ffd0759973165368ac8ce07d9bcffeb0acf88e6fBrian Paul 342ffd0759973165368ac8ce07d9bcffeb0acf88e6fBrian Paul 343ffd0759973165368ac8ce07d9bcffeb0acf88e6fBrian Paul 344ffd0759973165368ac8ce07d9bcffeb0acf88e6fBrian Paul/** 345ffd0759973165368ac8ce07d9bcffeb0acf88e6fBrian Paul * Run the shader on all blocks in a tile. This is used when a tile is 346ffd0759973165368ac8ce07d9bcffeb0acf88e6fBrian Paul * completely contained inside a triangle. 347ffd0759973165368ac8ce07d9bcffeb0acf88e6fBrian Paul * This is a bin command called during bin processing. 348ffd0759973165368ac8ce07d9bcffeb0acf88e6fBrian Paul */ 34989498d01531cd515c769e570bf799c39fbafc8fbKeith Whitwellvoid lp_rast_shade_tile( struct lp_rasterizer *rast, 3503a06c113c76355fc9622adfe7565c18d9787e9a8Brian Paul unsigned thread_index, 3514cdd10cb4b60d85f6c231a26739f7d5e264a05e5Keith Whitwell const union lp_rast_cmd_arg arg ) 35289498d01531cd515c769e570bf799c39fbafc8fbKeith Whitwell{ 353ec459f2aeca39e51f495cde455ba18d0a9489caaBrian Paul struct lp_rasterizer_task *task = &rast->tasks[thread_index]; 354ec459f2aeca39e51f495cde455ba18d0a9489caaBrian Paul const struct lp_rast_state *state = task->current_state; 355ec459f2aeca39e51f495cde455ba18d0a9489caaBrian Paul struct lp_rast_tile *tile = &task->tile; 3564cdd10cb4b60d85f6c231a26739f7d5e264a05e5Keith Whitwell const struct lp_rast_shader_inputs *inputs = arg.shade_tile; 357ec459f2aeca39e51f495cde455ba18d0a9489caaBrian Paul const unsigned tile_x = task->x; 358ec459f2aeca39e51f495cde455ba18d0a9489caaBrian Paul const unsigned tile_y = task->y; 35986dba3e4142276d76ecffc0cd238506df5efe9afJosé Fonseca unsigned x, y; 36089498d01531cd515c769e570bf799c39fbafc8fbKeith Whitwell 361a08d6302168341001003da32d42cfcff2311fa04Brian Paul LP_DBG(DEBUG_RAST, "%s\n", __FUNCTION__); 3624e1334ced68dd25b151250a44af25e8e0d5a33feKeith Whitwell 3632797f2bf57562c95a601a67edca3089641215cc4Brian Paul /* render the whole 64x64 tile in 4x4 chunks */ 3642797f2bf57562c95a601a67edca3089641215cc4Brian Paul for (y = 0; y < TILE_SIZE; y += 4){ 3652797f2bf57562c95a601a67edca3089641215cc4Brian Paul for (x = 0; x < TILE_SIZE; x += 4) { 3662797f2bf57562c95a601a67edca3089641215cc4Brian Paul uint8_t *color[PIPE_MAX_COLOR_BUFS]; 3672797f2bf57562c95a601a67edca3089641215cc4Brian Paul uint32_t *depth; 3682797f2bf57562c95a601a67edca3089641215cc4Brian Paul unsigned block_offset, i; 3692797f2bf57562c95a601a67edca3089641215cc4Brian Paul 3702797f2bf57562c95a601a67edca3089641215cc4Brian Paul /* offset of the 16x16 pixel block within the tile */ 3712797f2bf57562c95a601a67edca3089641215cc4Brian Paul block_offset = ((y / 4) * (16 * 16) + (x / 4) * 16); 3722797f2bf57562c95a601a67edca3089641215cc4Brian Paul 3732797f2bf57562c95a601a67edca3089641215cc4Brian Paul /* color buffer */ 3742797f2bf57562c95a601a67edca3089641215cc4Brian Paul for (i = 0; i < rast->state.fb.nr_cbufs; i++) 3752797f2bf57562c95a601a67edca3089641215cc4Brian Paul color[i] = tile->color[i] + 4 * block_offset; 3762797f2bf57562c95a601a67edca3089641215cc4Brian Paul 3772797f2bf57562c95a601a67edca3089641215cc4Brian Paul /* depth buffer */ 3785e6a9005100ec2636ce9734a5e4535216494cf60José Fonseca depth = lp_rast_depth_pointer(rast, tile_x + x, tile_y + y); 3792797f2bf57562c95a601a67edca3089641215cc4Brian Paul 3802797f2bf57562c95a601a67edca3089641215cc4Brian Paul /* run shader */ 3812797f2bf57562c95a601a67edca3089641215cc4Brian Paul state->jit_function[0]( &state->jit_context, 3822797f2bf57562c95a601a67edca3089641215cc4Brian Paul tile_x + x, tile_y + y, 3832797f2bf57562c95a601a67edca3089641215cc4Brian Paul inputs->a0, 3842797f2bf57562c95a601a67edca3089641215cc4Brian Paul inputs->dadx, 3852797f2bf57562c95a601a67edca3089641215cc4Brian Paul inputs->dady, 3862797f2bf57562c95a601a67edca3089641215cc4Brian Paul color, 3872797f2bf57562c95a601a67edca3089641215cc4Brian Paul depth, 3882797f2bf57562c95a601a67edca3089641215cc4Brian Paul INT_MIN, INT_MIN, INT_MIN, 3892797f2bf57562c95a601a67edca3089641215cc4Brian Paul NULL, NULL, NULL ); 3902797f2bf57562c95a601a67edca3089641215cc4Brian Paul } 3912797f2bf57562c95a601a67edca3089641215cc4Brian Paul } 39289498d01531cd515c769e570bf799c39fbafc8fbKeith Whitwell} 39389498d01531cd515c769e570bf799c39fbafc8fbKeith Whitwell 394a6676d896ed18426ed3d7e6340347974c1694ca2José Fonseca 395866e6856d39efe9b1ec739587f420a640ad8618eBrian Paul/** 396866e6856d39efe9b1ec739587f420a640ad8618eBrian Paul * Compute shading for a 4x4 block of pixels. 397ffd0759973165368ac8ce07d9bcffeb0acf88e6fBrian Paul * This is a bin command called during bin processing. 398866e6856d39efe9b1ec739587f420a640ad8618eBrian Paul */ 399ab76b2a8b896edc1e972de108d044b70310b4324José Fonsecavoid lp_rast_shade_quads( struct lp_rasterizer *rast, 4003a06c113c76355fc9622adfe7565c18d9787e9a8Brian Paul unsigned thread_index, 401ab76b2a8b896edc1e972de108d044b70310b4324José Fonseca const struct lp_rast_shader_inputs *inputs, 402ab76b2a8b896edc1e972de108d044b70310b4324José Fonseca unsigned x, unsigned y, 403ab9438193083b7f9a3180cb9cea45e269131048aBrian Paul int32_t c1, int32_t c2, int32_t c3) 404a6676d896ed18426ed3d7e6340347974c1694ca2José Fonseca{ 405ec459f2aeca39e51f495cde455ba18d0a9489caaBrian Paul struct lp_rasterizer_task *task = &rast->tasks[thread_index]; 406ec459f2aeca39e51f495cde455ba18d0a9489caaBrian Paul const struct lp_rast_state *state = task->current_state; 407ec459f2aeca39e51f495cde455ba18d0a9489caaBrian Paul struct lp_rast_tile *tile = &task->tile; 408c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell uint8_t *color[PIPE_MAX_COLOR_BUFS]; 40986dba3e4142276d76ecffc0cd238506df5efe9afJosé Fonseca void *depth; 410c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell unsigned i; 4117b116e13a2aa28a699e30c907c1b1ae5e04cab28Keith Whitwell unsigned ix, iy; 412866e6856d39efe9b1ec739587f420a640ad8618eBrian Paul int block_offset; 413a6676d896ed18426ed3d7e6340347974c1694ca2José Fonseca 414ab9438193083b7f9a3180cb9cea45e269131048aBrian Paul#ifdef DEBUG 415b1659b9213f3eeee440590dfe379f0d193948307Brian Paul assert(state); 416b1659b9213f3eeee440590dfe379f0d193948307Brian Paul 417a6676d896ed18426ed3d7e6340347974c1694ca2José Fonseca /* Sanity checks */ 418a6676d896ed18426ed3d7e6340347974c1694ca2José Fonseca assert(x % TILE_VECTOR_WIDTH == 0); 419a6676d896ed18426ed3d7e6340347974c1694ca2José Fonseca assert(y % TILE_VECTOR_HEIGHT == 0); 420a6676d896ed18426ed3d7e6340347974c1694ca2José Fonseca 421cdbcd96fdfe2c4d09e9b34cb083664d6b6e0558bBrian Paul assert((x % 4) == 0); 422cdbcd96fdfe2c4d09e9b34cb083664d6b6e0558bBrian Paul assert((y % 4) == 0); 423ab9438193083b7f9a3180cb9cea45e269131048aBrian Paul#endif 424866e6856d39efe9b1ec739587f420a640ad8618eBrian Paul 42561f3eeb6403e404d297bdcd924c215ed36060945José Fonseca ix = x % TILE_SIZE; 42661f3eeb6403e404d297bdcd924c215ed36060945José Fonseca iy = y % TILE_SIZE; 42761f3eeb6403e404d297bdcd924c215ed36060945José Fonseca 428866e6856d39efe9b1ec739587f420a640ad8618eBrian Paul /* offset of the 16x16 pixel block within the tile */ 4292797f2bf57562c95a601a67edca3089641215cc4Brian Paul block_offset = ((iy / 4) * (16 * 16) + (ix / 4) * 16); 430866e6856d39efe9b1ec739587f420a640ad8618eBrian Paul 431a6676d896ed18426ed3d7e6340347974c1694ca2José Fonseca /* color buffer */ 432c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell for (i = 0; i < rast->state.fb.nr_cbufs; i++) 433c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell color[i] = tile->color[i] + 4 * block_offset; 434a6676d896ed18426ed3d7e6340347974c1694ca2José Fonseca 435a6676d896ed18426ed3d7e6340347974c1694ca2José Fonseca /* depth buffer */ 4365e6a9005100ec2636ce9734a5e4535216494cf60José Fonseca depth = lp_rast_depth_pointer(rast, x, y); 437a6676d896ed18426ed3d7e6340347974c1694ca2José Fonseca 438c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell 439c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell 440ab9438193083b7f9a3180cb9cea45e269131048aBrian Paul#ifdef DEBUG 441c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell assert(lp_check_alignment(tile->color[0], 16)); 44285999695829823e459e11822b4846ed1db5c055dJosé Fonseca assert(lp_check_alignment(state->jit_context.blend_color, 16)); 443a6676d896ed18426ed3d7e6340347974c1694ca2José Fonseca 444ab9438193083b7f9a3180cb9cea45e269131048aBrian Paul assert(lp_check_alignment(inputs->step[0], 16)); 445ab9438193083b7f9a3180cb9cea45e269131048aBrian Paul assert(lp_check_alignment(inputs->step[1], 16)); 446ab9438193083b7f9a3180cb9cea45e269131048aBrian Paul assert(lp_check_alignment(inputs->step[2], 16)); 447ab9438193083b7f9a3180cb9cea45e269131048aBrian Paul#endif 448ab9438193083b7f9a3180cb9cea45e269131048aBrian Paul 449a6676d896ed18426ed3d7e6340347974c1694ca2José Fonseca /* run shader */ 4502797f2bf57562c95a601a67edca3089641215cc4Brian Paul state->jit_function[1]( &state->jit_context, 45161f3eeb6403e404d297bdcd924c215ed36060945José Fonseca x, y, 45285999695829823e459e11822b4846ed1db5c055dJosé Fonseca inputs->a0, 45385999695829823e459e11822b4846ed1db5c055dJosé Fonseca inputs->dadx, 45485999695829823e459e11822b4846ed1db5c055dJosé Fonseca inputs->dady, 45585999695829823e459e11822b4846ed1db5c055dJosé Fonseca color, 456ab9438193083b7f9a3180cb9cea45e269131048aBrian Paul depth, 457ab9438193083b7f9a3180cb9cea45e269131048aBrian Paul c1, c2, c3, 458c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell inputs->step[0], inputs->step[1], inputs->step[2]); 459a6676d896ed18426ed3d7e6340347974c1694ca2José Fonseca} 460a6676d896ed18426ed3d7e6340347974c1694ca2José Fonseca 461a6676d896ed18426ed3d7e6340347974c1694ca2José Fonseca 46262623c4dc5d8b646942bc65e8de350e812945ad1Brian Paul/** 46362623c4dc5d8b646942bc65e8de350e812945ad1Brian Paul * Set top row and left column of the tile's pixels to white. For debugging. 46462623c4dc5d8b646942bc65e8de350e812945ad1Brian Paul */ 46562623c4dc5d8b646942bc65e8de350e812945ad1Brian Paulstatic void 46662623c4dc5d8b646942bc65e8de350e812945ad1Brian Pauloutline_tile(uint8_t *tile) 46762623c4dc5d8b646942bc65e8de350e812945ad1Brian Paul{ 46862623c4dc5d8b646942bc65e8de350e812945ad1Brian Paul const uint8_t val = 0xff; 46962623c4dc5d8b646942bc65e8de350e812945ad1Brian Paul unsigned i; 47062623c4dc5d8b646942bc65e8de350e812945ad1Brian Paul 47162623c4dc5d8b646942bc65e8de350e812945ad1Brian Paul for (i = 0; i < TILE_SIZE; i++) { 47262623c4dc5d8b646942bc65e8de350e812945ad1Brian Paul TILE_PIXEL(tile, i, 0, 0) = val; 47362623c4dc5d8b646942bc65e8de350e812945ad1Brian Paul TILE_PIXEL(tile, i, 0, 1) = val; 47462623c4dc5d8b646942bc65e8de350e812945ad1Brian Paul TILE_PIXEL(tile, i, 0, 2) = val; 47562623c4dc5d8b646942bc65e8de350e812945ad1Brian Paul TILE_PIXEL(tile, i, 0, 3) = val; 47662623c4dc5d8b646942bc65e8de350e812945ad1Brian Paul 47762623c4dc5d8b646942bc65e8de350e812945ad1Brian Paul TILE_PIXEL(tile, 0, i, 0) = val; 47862623c4dc5d8b646942bc65e8de350e812945ad1Brian Paul TILE_PIXEL(tile, 0, i, 1) = val; 47962623c4dc5d8b646942bc65e8de350e812945ad1Brian Paul TILE_PIXEL(tile, 0, i, 2) = val; 48062623c4dc5d8b646942bc65e8de350e812945ad1Brian Paul TILE_PIXEL(tile, 0, i, 3) = val; 48162623c4dc5d8b646942bc65e8de350e812945ad1Brian Paul } 48262623c4dc5d8b646942bc65e8de350e812945ad1Brian Paul} 48362623c4dc5d8b646942bc65e8de350e812945ad1Brian Paul 48462623c4dc5d8b646942bc65e8de350e812945ad1Brian Paul 48562623c4dc5d8b646942bc65e8de350e812945ad1Brian Paul/** 48662623c4dc5d8b646942bc65e8de350e812945ad1Brian Paul * Draw grid of gray lines at 16-pixel intervals across the tile to 48762623c4dc5d8b646942bc65e8de350e812945ad1Brian Paul * show the sub-tile boundaries. For debugging. 48862623c4dc5d8b646942bc65e8de350e812945ad1Brian Paul */ 48962623c4dc5d8b646942bc65e8de350e812945ad1Brian Paulstatic void 49062623c4dc5d8b646942bc65e8de350e812945ad1Brian Pauloutline_subtiles(uint8_t *tile) 49162623c4dc5d8b646942bc65e8de350e812945ad1Brian Paul{ 49262623c4dc5d8b646942bc65e8de350e812945ad1Brian Paul const uint8_t val = 0x80; 49362623c4dc5d8b646942bc65e8de350e812945ad1Brian Paul const unsigned step = 16; 49462623c4dc5d8b646942bc65e8de350e812945ad1Brian Paul unsigned i, j; 49562623c4dc5d8b646942bc65e8de350e812945ad1Brian Paul 4960fccfc9cc0cb7699598f1739d8cd3811175cdf13Brian Paul for (i = 0; i < TILE_SIZE; i += step) { 49762623c4dc5d8b646942bc65e8de350e812945ad1Brian Paul for (j = 0; j < TILE_SIZE; j++) { 49862623c4dc5d8b646942bc65e8de350e812945ad1Brian Paul TILE_PIXEL(tile, i, j, 0) = val; 49962623c4dc5d8b646942bc65e8de350e812945ad1Brian Paul TILE_PIXEL(tile, i, j, 1) = val; 50062623c4dc5d8b646942bc65e8de350e812945ad1Brian Paul TILE_PIXEL(tile, i, j, 2) = val; 50162623c4dc5d8b646942bc65e8de350e812945ad1Brian Paul TILE_PIXEL(tile, i, j, 3) = val; 50262623c4dc5d8b646942bc65e8de350e812945ad1Brian Paul 50362623c4dc5d8b646942bc65e8de350e812945ad1Brian Paul TILE_PIXEL(tile, j, i, 0) = val; 50462623c4dc5d8b646942bc65e8de350e812945ad1Brian Paul TILE_PIXEL(tile, j, i, 1) = val; 50562623c4dc5d8b646942bc65e8de350e812945ad1Brian Paul TILE_PIXEL(tile, j, i, 2) = val; 50662623c4dc5d8b646942bc65e8de350e812945ad1Brian Paul TILE_PIXEL(tile, j, i, 3) = val; 50762623c4dc5d8b646942bc65e8de350e812945ad1Brian Paul } 50862623c4dc5d8b646942bc65e8de350e812945ad1Brian Paul } 50962623c4dc5d8b646942bc65e8de350e812945ad1Brian Paul 51062623c4dc5d8b646942bc65e8de350e812945ad1Brian Paul outline_tile(tile); 51162623c4dc5d8b646942bc65e8de350e812945ad1Brian Paul} 51262623c4dc5d8b646942bc65e8de350e812945ad1Brian Paul 51337b86aa55c6bb520997c00dbf1a2b38d4aed38ebJosé Fonseca 51437b86aa55c6bb520997c00dbf1a2b38d4aed38ebJosé Fonseca 5157505510c7b7c33f3c571647c0398da7e1b823806Brian Paul/** 5167505510c7b7c33f3c571647c0398da7e1b823806Brian Paul * Write the rasterizer's color tile to the framebuffer. 5177505510c7b7c33f3c571647c0398da7e1b823806Brian Paul */ 5183a06c113c76355fc9622adfe7565c18d9787e9a8Brian Paulstatic void lp_rast_store_color( struct lp_rasterizer *rast, 5193a06c113c76355fc9622adfe7565c18d9787e9a8Brian Paul unsigned thread_index) 52089498d01531cd515c769e570bf799c39fbafc8fbKeith Whitwell{ 521ec459f2aeca39e51f495cde455ba18d0a9489caaBrian Paul struct lp_rasterizer_task *task = &rast->tasks[thread_index]; 522ec459f2aeca39e51f495cde455ba18d0a9489caaBrian Paul const unsigned x = task->x; 523ec459f2aeca39e51f495cde455ba18d0a9489caaBrian Paul const unsigned y = task->y; 524c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell unsigned i; 52505131f7502150968d7ee19673676f74d4c2fd22bKeith Whitwell 526c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell for (i = 0; i < rast->state.fb.nr_cbufs; i++) { 527c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell struct pipe_transfer *transfer = rast->cbuf_transfer[i]; 528c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell int w = TILE_SIZE; 529c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell int h = TILE_SIZE; 53073e13c33fd0a9b8574d00d01d301b9d4f88d4051Brian Paul 531c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell if (x >= transfer->width) 532c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell continue; 53305131f7502150968d7ee19673676f74d4c2fd22bKeith Whitwell 534c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell if (y >= transfer->height) 535c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell continue; 53689498d01531cd515c769e570bf799c39fbafc8fbKeith Whitwell 537c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell LP_DBG(DEBUG_RAST, "%s [%u] %d,%d %dx%d\n", __FUNCTION__, 538c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell thread_index, x, y, w, h); 539c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell 54062623c4dc5d8b646942bc65e8de350e812945ad1Brian Paul if (LP_DEBUG & DEBUG_SHOW_SUBTILES) 541ec459f2aeca39e51f495cde455ba18d0a9489caaBrian Paul outline_subtiles(task->tile.color[i]); 54262623c4dc5d8b646942bc65e8de350e812945ad1Brian Paul else if (LP_DEBUG & DEBUG_SHOW_TILES) 543ec459f2aeca39e51f495cde455ba18d0a9489caaBrian Paul outline_tile(task->tile.color[i]); 54462623c4dc5d8b646942bc65e8de350e812945ad1Brian Paul 545c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell lp_tile_write_4ub(transfer->texture->format, 546ec459f2aeca39e51f495cde455ba18d0a9489caaBrian Paul task->tile.color[i], 547c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell rast->cbuf_map[i], 548c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell transfer->stride, 549c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell x, y, 550c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell w, h); 5514aeacdf8530d69d543cb2b997c1e65edb71ae01aBrian Paul 5524aeacdf8530d69d543cb2b997c1e65edb71ae01aBrian Paul LP_COUNT(nr_color_tile_store); 553c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell } 55489498d01531cd515c769e570bf799c39fbafc8fbKeith Whitwell} 55589498d01531cd515c769e570bf799c39fbafc8fbKeith Whitwell 55647510040a68f5f672aee22eac6c01fb4dd60ec67José Fonseca 5577505510c7b7c33f3c571647c0398da7e1b823806Brian Paul/** 5587505510c7b7c33f3c571647c0398da7e1b823806Brian Paul * Write the rasterizer's tiles to the framebuffer. 5597505510c7b7c33f3c571647c0398da7e1b823806Brian Paul */ 560b533b56750aca8c7e8cb22af93a0fc2a0cfc0d97Brian Paulstatic void 5613a06c113c76355fc9622adfe7565c18d9787e9a8Brian Paullp_rast_end_tile( struct lp_rasterizer *rast, 5623a06c113c76355fc9622adfe7565c18d9787e9a8Brian Paul unsigned thread_index ) 56347510040a68f5f672aee22eac6c01fb4dd60ec67José Fonseca{ 564a08d6302168341001003da32d42cfcff2311fa04Brian Paul LP_DBG(DEBUG_RAST, "%s\n", __FUNCTION__); 5654e1334ced68dd25b151250a44af25e8e0d5a33feKeith Whitwell 56647510040a68f5f672aee22eac6c01fb4dd60ec67José Fonseca if (rast->state.write_color) 5673a06c113c76355fc9622adfe7565c18d9787e9a8Brian Paul lp_rast_store_color(rast, thread_index); 56847510040a68f5f672aee22eac6c01fb4dd60ec67José Fonseca} 56947510040a68f5f672aee22eac6c01fb4dd60ec67José Fonseca 57047510040a68f5f672aee22eac6c01fb4dd60ec67José Fonseca 571b533b56750aca8c7e8cb22af93a0fc2a0cfc0d97Brian Paul/** 5724b70af918dd9040a6987c6a55e76e49f0e3f90bfBrian Paul * Signal on a fence. This is called during bin execution/rasterization. 5734b70af918dd9040a6987c6a55e76e49f0e3f90bfBrian Paul * Called per thread. 5744b70af918dd9040a6987c6a55e76e49f0e3f90bfBrian Paul */ 5754b70af918dd9040a6987c6a55e76e49f0e3f90bfBrian Paulvoid lp_rast_fence( struct lp_rasterizer *rast, 5764b70af918dd9040a6987c6a55e76e49f0e3f90bfBrian Paul unsigned thread_index, 5774b70af918dd9040a6987c6a55e76e49f0e3f90bfBrian Paul const union lp_rast_cmd_arg arg ) 5784b70af918dd9040a6987c6a55e76e49f0e3f90bfBrian Paul{ 5794b70af918dd9040a6987c6a55e76e49f0e3f90bfBrian Paul struct lp_fence *fence = arg.fence; 5804b70af918dd9040a6987c6a55e76e49f0e3f90bfBrian Paul 5814b70af918dd9040a6987c6a55e76e49f0e3f90bfBrian Paul pipe_mutex_lock( fence->mutex ); 5824b70af918dd9040a6987c6a55e76e49f0e3f90bfBrian Paul 5834b70af918dd9040a6987c6a55e76e49f0e3f90bfBrian Paul fence->count++; 5844b70af918dd9040a6987c6a55e76e49f0e3f90bfBrian Paul assert(fence->count <= fence->rank); 5854b70af918dd9040a6987c6a55e76e49f0e3f90bfBrian Paul 5864b70af918dd9040a6987c6a55e76e49f0e3f90bfBrian Paul LP_DBG(DEBUG_RAST, "%s count=%u rank=%u\n", __FUNCTION__, 5874b70af918dd9040a6987c6a55e76e49f0e3f90bfBrian Paul fence->count, fence->rank); 5884b70af918dd9040a6987c6a55e76e49f0e3f90bfBrian Paul 5894b70af918dd9040a6987c6a55e76e49f0e3f90bfBrian Paul pipe_condvar_signal( fence->signalled ); 5904b70af918dd9040a6987c6a55e76e49f0e3f90bfBrian Paul 5914b70af918dd9040a6987c6a55e76e49f0e3f90bfBrian Paul pipe_mutex_unlock( fence->mutex ); 5924b70af918dd9040a6987c6a55e76e49f0e3f90bfBrian Paul} 5934b70af918dd9040a6987c6a55e76e49f0e3f90bfBrian Paul 5944b70af918dd9040a6987c6a55e76e49f0e3f90bfBrian Paul 5954b70af918dd9040a6987c6a55e76e49f0e3f90bfBrian Paul/** 596663750d5564a225b4720f7ee8bea93ffb309fc88Keith Whitwell * When all the threads are done rasterizing a scene, one thread will 597663750d5564a225b4720f7ee8bea93ffb309fc88Keith Whitwell * call this function to reset the scene and put it onto the empty queue. 5982bce5c195f94e2cce8f67c6a8066b0ae408487ceBrian Paul */ 5992bce5c195f94e2cce8f67c6a8066b0ae408487ceBrian Paulstatic void 600663750d5564a225b4720f7ee8bea93ffb309fc88Keith Whitwellrelease_scene( struct lp_rasterizer *rast, 601663750d5564a225b4720f7ee8bea93ffb309fc88Keith Whitwell struct lp_scene *scene ) 6022bce5c195f94e2cce8f67c6a8066b0ae408487ceBrian Paul{ 603663750d5564a225b4720f7ee8bea93ffb309fc88Keith Whitwell util_unreference_framebuffer_state( &scene->fb ); 6042bce5c195f94e2cce8f67c6a8066b0ae408487ceBrian Paul 605663750d5564a225b4720f7ee8bea93ffb309fc88Keith Whitwell lp_scene_reset( scene ); 606663750d5564a225b4720f7ee8bea93ffb309fc88Keith Whitwell lp_scene_enqueue( rast->empty_scenes, scene ); 607663750d5564a225b4720f7ee8bea93ffb309fc88Keith Whitwell rast->curr_scene = NULL; 6082bce5c195f94e2cce8f67c6a8066b0ae408487ceBrian Paul} 6092bce5c195f94e2cce8f67c6a8066b0ae408487ceBrian Paul 6102bce5c195f94e2cce8f67c6a8066b0ae408487ceBrian Paul 6112bce5c195f94e2cce8f67c6a8066b0ae408487ceBrian Paul/** 612b533b56750aca8c7e8cb22af93a0fc2a0cfc0d97Brian Paul * Rasterize commands for a single bin. 61301b1900084152dbacd4025a31ced25f75666ce59Brian Paul * \param x, y position of the bin's tile in the framebuffer 614b533b56750aca8c7e8cb22af93a0fc2a0cfc0d97Brian Paul * Must be called between lp_rast_begin() and lp_rast_end(). 6159509f73c2147a9e225b5ef69a646e5dd711573f5Brian Paul * Called per thread. 616b533b56750aca8c7e8cb22af93a0fc2a0cfc0d97Brian Paul */ 61701b1900084152dbacd4025a31ced25f75666ce59Brian Paulstatic void 61801b1900084152dbacd4025a31ced25f75666ce59Brian Paulrasterize_bin( struct lp_rasterizer *rast, 6193a06c113c76355fc9622adfe7565c18d9787e9a8Brian Paul unsigned thread_index, 62001b1900084152dbacd4025a31ced25f75666ce59Brian Paul const struct cmd_bin *bin, 62101b1900084152dbacd4025a31ced25f75666ce59Brian Paul int x, int y) 622b533b56750aca8c7e8cb22af93a0fc2a0cfc0d97Brian Paul{ 623b533b56750aca8c7e8cb22af93a0fc2a0cfc0d97Brian Paul const struct cmd_block_list *commands = &bin->commands; 624b533b56750aca8c7e8cb22af93a0fc2a0cfc0d97Brian Paul struct cmd_block *block; 625b533b56750aca8c7e8cb22af93a0fc2a0cfc0d97Brian Paul unsigned k; 626b533b56750aca8c7e8cb22af93a0fc2a0cfc0d97Brian Paul 6273a06c113c76355fc9622adfe7565c18d9787e9a8Brian Paul lp_rast_start_tile( rast, thread_index, x, y ); 628b533b56750aca8c7e8cb22af93a0fc2a0cfc0d97Brian Paul 629b533b56750aca8c7e8cb22af93a0fc2a0cfc0d97Brian Paul /* simply execute each of the commands in the block list */ 630b533b56750aca8c7e8cb22af93a0fc2a0cfc0d97Brian Paul for (block = commands->head; block; block = block->next) { 631b533b56750aca8c7e8cb22af93a0fc2a0cfc0d97Brian Paul for (k = 0; k < block->count; k++) { 632aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul block->cmd[k]( rast, thread_index, block->arg[k] ); 633b533b56750aca8c7e8cb22af93a0fc2a0cfc0d97Brian Paul } 634b533b56750aca8c7e8cb22af93a0fc2a0cfc0d97Brian Paul } 635b533b56750aca8c7e8cb22af93a0fc2a0cfc0d97Brian Paul 6363a06c113c76355fc9622adfe7565c18d9787e9a8Brian Paul lp_rast_end_tile( rast, thread_index ); 637b533b56750aca8c7e8cb22af93a0fc2a0cfc0d97Brian Paul} 638b533b56750aca8c7e8cb22af93a0fc2a0cfc0d97Brian Paul 6394231006e29cbf9fb54c72acf35009f3b18fe62abKeith Whitwell 6404231006e29cbf9fb54c72acf35009f3b18fe62abKeith Whitwell#define RAST(x) { lp_rast_##x, #x } 6414231006e29cbf9fb54c72acf35009f3b18fe62abKeith Whitwell 6424231006e29cbf9fb54c72acf35009f3b18fe62abKeith Whitwellstatic struct { 6434231006e29cbf9fb54c72acf35009f3b18fe62abKeith Whitwell lp_rast_cmd cmd; 6444231006e29cbf9fb54c72acf35009f3b18fe62abKeith Whitwell const char *name; 6454231006e29cbf9fb54c72acf35009f3b18fe62abKeith Whitwell} cmd_names[] = 6464231006e29cbf9fb54c72acf35009f3b18fe62abKeith Whitwell{ 6474231006e29cbf9fb54c72acf35009f3b18fe62abKeith Whitwell RAST(load_color), 6484231006e29cbf9fb54c72acf35009f3b18fe62abKeith Whitwell RAST(clear_color), 6494231006e29cbf9fb54c72acf35009f3b18fe62abKeith Whitwell RAST(clear_zstencil), 6504231006e29cbf9fb54c72acf35009f3b18fe62abKeith Whitwell RAST(triangle), 6514231006e29cbf9fb54c72acf35009f3b18fe62abKeith Whitwell RAST(shade_tile), 6524231006e29cbf9fb54c72acf35009f3b18fe62abKeith Whitwell RAST(set_state), 6534231006e29cbf9fb54c72acf35009f3b18fe62abKeith Whitwell RAST(fence), 6544231006e29cbf9fb54c72acf35009f3b18fe62abKeith Whitwell}; 6554231006e29cbf9fb54c72acf35009f3b18fe62abKeith Whitwell 6564231006e29cbf9fb54c72acf35009f3b18fe62abKeith Whitwellstatic void 6574231006e29cbf9fb54c72acf35009f3b18fe62abKeith Whitwelldebug_bin( const struct cmd_bin *bin ) 6584231006e29cbf9fb54c72acf35009f3b18fe62abKeith Whitwell{ 6594231006e29cbf9fb54c72acf35009f3b18fe62abKeith Whitwell const struct cmd_block *head = bin->commands.head; 6604231006e29cbf9fb54c72acf35009f3b18fe62abKeith Whitwell int i, j; 6614231006e29cbf9fb54c72acf35009f3b18fe62abKeith Whitwell 6624231006e29cbf9fb54c72acf35009f3b18fe62abKeith Whitwell for (i = 0; i < head->count; i++) { 6634231006e29cbf9fb54c72acf35009f3b18fe62abKeith Whitwell debug_printf("%d: ", i); 6644231006e29cbf9fb54c72acf35009f3b18fe62abKeith Whitwell for (j = 0; j < Elements(cmd_names); j++) { 6654231006e29cbf9fb54c72acf35009f3b18fe62abKeith Whitwell if (head->cmd[i] == cmd_names[j].cmd) { 6664231006e29cbf9fb54c72acf35009f3b18fe62abKeith Whitwell debug_printf("%s\n", cmd_names[j].name); 6674231006e29cbf9fb54c72acf35009f3b18fe62abKeith Whitwell break; 6684231006e29cbf9fb54c72acf35009f3b18fe62abKeith Whitwell } 6694231006e29cbf9fb54c72acf35009f3b18fe62abKeith Whitwell } 6704231006e29cbf9fb54c72acf35009f3b18fe62abKeith Whitwell if (j == Elements(cmd_names)) 6714231006e29cbf9fb54c72acf35009f3b18fe62abKeith Whitwell debug_printf("...other\n"); 6724231006e29cbf9fb54c72acf35009f3b18fe62abKeith Whitwell } 6734231006e29cbf9fb54c72acf35009f3b18fe62abKeith Whitwell 6744231006e29cbf9fb54c72acf35009f3b18fe62abKeith Whitwell} 6754231006e29cbf9fb54c72acf35009f3b18fe62abKeith Whitwell 676db83ad4b4353ea6f9c755f18bf1455ea78b5bf12Keith Whitwell/* An empty bin is one that just loads the contents of the tile and 677db83ad4b4353ea6f9c755f18bf1455ea78b5bf12Keith Whitwell * stores them again unchanged. This typically happens when bins have 678db83ad4b4353ea6f9c755f18bf1455ea78b5bf12Keith Whitwell * been flushed for some reason in the middle of a frame, or when 679db83ad4b4353ea6f9c755f18bf1455ea78b5bf12Keith Whitwell * incremental updates are being made to a render target. 680db83ad4b4353ea6f9c755f18bf1455ea78b5bf12Keith Whitwell * 681db83ad4b4353ea6f9c755f18bf1455ea78b5bf12Keith Whitwell * Try to avoid doing pointless work in this case. 682db83ad4b4353ea6f9c755f18bf1455ea78b5bf12Keith Whitwell */ 683da45f49cc63fff06513dc28d9616084fc81798d4Keith Whitwellstatic boolean 684db83ad4b4353ea6f9c755f18bf1455ea78b5bf12Keith Whitwellis_empty_bin( const struct cmd_bin *bin ) 685da45f49cc63fff06513dc28d9616084fc81798d4Keith Whitwell{ 686da45f49cc63fff06513dc28d9616084fc81798d4Keith Whitwell const struct cmd_block *head = bin->commands.head; 687da45f49cc63fff06513dc28d9616084fc81798d4Keith Whitwell int i; 6884231006e29cbf9fb54c72acf35009f3b18fe62abKeith Whitwell 6894231006e29cbf9fb54c72acf35009f3b18fe62abKeith Whitwell if (0) 6904231006e29cbf9fb54c72acf35009f3b18fe62abKeith Whitwell debug_bin(bin); 6914231006e29cbf9fb54c72acf35009f3b18fe62abKeith Whitwell 692db83ad4b4353ea6f9c755f18bf1455ea78b5bf12Keith Whitwell /* We emit at most two load-tile commands at the start of the first 6934231006e29cbf9fb54c72acf35009f3b18fe62abKeith Whitwell * command block. In addition we seem to emit a couple of 6944231006e29cbf9fb54c72acf35009f3b18fe62abKeith Whitwell * set-state commands even in empty bins. 6954231006e29cbf9fb54c72acf35009f3b18fe62abKeith Whitwell * 6964231006e29cbf9fb54c72acf35009f3b18fe62abKeith Whitwell * As a heuristic, if a bin has more than 4 commands, consider it 6974231006e29cbf9fb54c72acf35009f3b18fe62abKeith Whitwell * non-empty. 698db83ad4b4353ea6f9c755f18bf1455ea78b5bf12Keith Whitwell */ 699da45f49cc63fff06513dc28d9616084fc81798d4Keith Whitwell if (head->next != NULL || 7004231006e29cbf9fb54c72acf35009f3b18fe62abKeith Whitwell head->count > 4) { 701da45f49cc63fff06513dc28d9616084fc81798d4Keith Whitwell return FALSE; 7024231006e29cbf9fb54c72acf35009f3b18fe62abKeith Whitwell } 703da45f49cc63fff06513dc28d9616084fc81798d4Keith Whitwell 704da45f49cc63fff06513dc28d9616084fc81798d4Keith Whitwell for (i = 0; i < head->count; i++) 705da45f49cc63fff06513dc28d9616084fc81798d4Keith Whitwell if (head->cmd[i] != lp_rast_load_color && 7064231006e29cbf9fb54c72acf35009f3b18fe62abKeith Whitwell head->cmd[i] != lp_rast_set_state) { 707da45f49cc63fff06513dc28d9616084fc81798d4Keith Whitwell return FALSE; 7084231006e29cbf9fb54c72acf35009f3b18fe62abKeith Whitwell } 709da45f49cc63fff06513dc28d9616084fc81798d4Keith Whitwell 710da45f49cc63fff06513dc28d9616084fc81798d4Keith Whitwell return TRUE; 711da45f49cc63fff06513dc28d9616084fc81798d4Keith Whitwell} 712da45f49cc63fff06513dc28d9616084fc81798d4Keith Whitwell 713da45f49cc63fff06513dc28d9616084fc81798d4Keith Whitwell 714b533b56750aca8c7e8cb22af93a0fc2a0cfc0d97Brian Paul 71501b1900084152dbacd4025a31ced25f75666ce59Brian Paul/** 716663750d5564a225b4720f7ee8bea93ffb309fc88Keith Whitwell * Rasterize/execute all bins within a scene. 7179509f73c2147a9e225b5ef69a646e5dd711573f5Brian Paul * Called per thread. 71801b1900084152dbacd4025a31ced25f75666ce59Brian Paul */ 719aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paulstatic void 720663750d5564a225b4720f7ee8bea93ffb309fc88Keith Whitwellrasterize_scene( struct lp_rasterizer *rast, 721aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul unsigned thread_index, 722663750d5564a225b4720f7ee8bea93ffb309fc88Keith Whitwell struct lp_scene *scene, 723aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul bool write_depth ) 724aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul{ 725663750d5564a225b4720f7ee8bea93ffb309fc88Keith Whitwell /* loop over scene bins, rasterize each */ 726aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul#if 0 727aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul { 728aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul unsigned i, j; 729663750d5564a225b4720f7ee8bea93ffb309fc88Keith Whitwell for (i = 0; i < scene->tiles_x; i++) { 730663750d5564a225b4720f7ee8bea93ffb309fc88Keith Whitwell for (j = 0; j < scene->tiles_y; j++) { 731663750d5564a225b4720f7ee8bea93ffb309fc88Keith Whitwell struct cmd_bin *bin = lp_get_bin(scene, i, j); 732aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul rasterize_bin( rast, thread_index, 733aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul bin, i * TILE_SIZE, j * TILE_SIZE ); 734aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul } 735aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul } 736aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul } 737aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul#else 738aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul { 739aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul struct cmd_bin *bin; 740aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul int x, y; 741aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul 742663750d5564a225b4720f7ee8bea93ffb309fc88Keith Whitwell assert(scene); 743663750d5564a225b4720f7ee8bea93ffb309fc88Keith Whitwell while ((bin = lp_scene_bin_iter_next(scene, &x, &y))) { 744db83ad4b4353ea6f9c755f18bf1455ea78b5bf12Keith Whitwell if (!is_empty_bin( bin )) 745da45f49cc63fff06513dc28d9616084fc81798d4Keith Whitwell rasterize_bin( rast, thread_index, bin, x * TILE_SIZE, y * TILE_SIZE); 746aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul } 747aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul } 748aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul#endif 749aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul} 750aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul 751aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul 752aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul/** 7534e67f10331bfd87560e2900e66f3b942902bc65cBrian Paul * Called by setup module when it has something for us to render. 754aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul */ 75501b1900084152dbacd4025a31ced25f75666ce59Brian Paulvoid 756663750d5564a225b4720f7ee8bea93ffb309fc88Keith Whitwelllp_rasterize_scene( struct lp_rasterizer *rast, 757663750d5564a225b4720f7ee8bea93ffb309fc88Keith Whitwell struct lp_scene *scene, 75801b1900084152dbacd4025a31ced25f75666ce59Brian Paul const struct pipe_framebuffer_state *fb, 75901b1900084152dbacd4025a31ced25f75666ce59Brian Paul bool write_depth ) 76001b1900084152dbacd4025a31ced25f75666ce59Brian Paul{ 76196689d451a24753e088f40fb167c3cb26d8045acBrian Paul boolean debug = false; 76296689d451a24753e088f40fb167c3cb26d8045acBrian Paul 76301b1900084152dbacd4025a31ced25f75666ce59Brian Paul LP_DBG(DEBUG_SETUP, "%s\n", __FUNCTION__); 76401b1900084152dbacd4025a31ced25f75666ce59Brian Paul 76596689d451a24753e088f40fb167c3cb26d8045acBrian Paul if (debug) { 76696689d451a24753e088f40fb167c3cb26d8045acBrian Paul unsigned x, y; 767a1af8eec66c5f7ec421e8011b41c1a7c36319f9fJosé Fonseca debug_printf("rasterize scene:\n"); 768a1af8eec66c5f7ec421e8011b41c1a7c36319f9fJosé Fonseca debug_printf(" data size: %u\n", lp_scene_data_size(scene)); 769663750d5564a225b4720f7ee8bea93ffb309fc88Keith Whitwell for (y = 0; y < scene->tiles_y; y++) { 770663750d5564a225b4720f7ee8bea93ffb309fc88Keith Whitwell for (x = 0; x < scene->tiles_x; x++) { 771a1af8eec66c5f7ec421e8011b41c1a7c36319f9fJosé Fonseca debug_printf(" bin %u, %u size: %u\n", x, y, 772a1af8eec66c5f7ec421e8011b41c1a7c36319f9fJosé Fonseca lp_scene_bin_size(scene, x, y)); 77396689d451a24753e088f40fb167c3cb26d8045acBrian Paul } 77496689d451a24753e088f40fb167c3cb26d8045acBrian Paul } 77596689d451a24753e088f40fb167c3cb26d8045acBrian Paul } 77696689d451a24753e088f40fb167c3cb26d8045acBrian Paul 7772bce5c195f94e2cce8f67c6a8066b0ae408487ceBrian Paul /* save framebuffer state in the bin */ 778663750d5564a225b4720f7ee8bea93ffb309fc88Keith Whitwell util_copy_framebuffer_state(&scene->fb, fb); 779663750d5564a225b4720f7ee8bea93ffb309fc88Keith Whitwell scene->write_depth = write_depth; 780aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul 781aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul if (rast->num_threads == 0) { 782aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul /* no threading */ 7832bce5c195f94e2cce8f67c6a8066b0ae408487ceBrian Paul 7842bce5c195f94e2cce8f67c6a8066b0ae408487ceBrian Paul lp_rast_begin( rast, fb, 785c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell fb->nr_cbufs != 0, /* always write color if cbufs present */ 7862bce5c195f94e2cce8f67c6a8066b0ae408487ceBrian Paul fb->zsbuf != NULL && write_depth ); 7872bce5c195f94e2cce8f67c6a8066b0ae408487ceBrian Paul 788663750d5564a225b4720f7ee8bea93ffb309fc88Keith Whitwell lp_scene_bin_iter_begin( scene ); 789663750d5564a225b4720f7ee8bea93ffb309fc88Keith Whitwell rasterize_scene( rast, 0, scene, write_depth ); 7903bee8c2e7c17893f91f6b62e2db090ef495dca9dBrian Paul 791663750d5564a225b4720f7ee8bea93ffb309fc88Keith Whitwell release_scene( rast, scene ); 7922bce5c195f94e2cce8f67c6a8066b0ae408487ceBrian Paul 7932bce5c195f94e2cce8f67c6a8066b0ae408487ceBrian Paul lp_rast_end( rast ); 79401b1900084152dbacd4025a31ced25f75666ce59Brian Paul } 795aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul else { 796aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul /* threaded rendering! */ 797aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul unsigned i; 798aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul 799663750d5564a225b4720f7ee8bea93ffb309fc88Keith Whitwell lp_scene_enqueue( rast->full_scenes, scene ); 8009509f73c2147a9e225b5ef69a646e5dd711573f5Brian Paul 801aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul /* signal the threads that there's work to do */ 802aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul for (i = 0; i < rast->num_threads; i++) { 803aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul pipe_semaphore_signal(&rast->tasks[i].work_ready); 804aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul } 805aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul 806aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul /* wait for work to complete */ 807aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul for (i = 0; i < rast->num_threads; i++) { 808aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul pipe_semaphore_wait(&rast->tasks[i].work_done); 809cdaea049c95031338040b31ff31944c8a001a1ddBrian Paul } 810cdaea049c95031338040b31ff31944c8a001a1ddBrian Paul } 81101b1900084152dbacd4025a31ced25f75666ce59Brian Paul 81201b1900084152dbacd4025a31ced25f75666ce59Brian Paul LP_DBG(DEBUG_SETUP, "%s done \n", __FUNCTION__); 81301b1900084152dbacd4025a31ced25f75666ce59Brian Paul} 81401b1900084152dbacd4025a31ced25f75666ce59Brian Paul 81501b1900084152dbacd4025a31ced25f75666ce59Brian Paul 816aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul/** 817aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul * This is the thread's main entrypoint. 818aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul * It's a simple loop: 819aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul * 1. wait for work 820aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul * 2. do work 821aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul * 3. signal that we're done 822aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul */ 823a1af8eec66c5f7ec421e8011b41c1a7c36319f9fJosé Fonsecastatic PIPE_THREAD_ROUTINE( thread_func, init_data ) 824aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul{ 825aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul struct lp_rasterizer_task *task = (struct lp_rasterizer_task *) init_data; 826aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul struct lp_rasterizer *rast = task->rast; 8279509f73c2147a9e225b5ef69a646e5dd711573f5Brian Paul boolean debug = false; 828aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul 829aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul while (1) { 830aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul /* wait for work */ 831aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul if (debug) 832aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul debug_printf("thread %d waiting for work\n", task->thread_index); 833aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul pipe_semaphore_wait(&task->work_ready); 834aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul 8352bce5c195f94e2cce8f67c6a8066b0ae408487ceBrian Paul if (task->thread_index == 0) { 8362bce5c195f94e2cce8f67c6a8066b0ae408487ceBrian Paul /* thread[0]: 837663750d5564a225b4720f7ee8bea93ffb309fc88Keith Whitwell * - get next scene to rasterize 8382bce5c195f94e2cce8f67c6a8066b0ae408487ceBrian Paul * - map the framebuffer surfaces 8392bce5c195f94e2cce8f67c6a8066b0ae408487ceBrian Paul */ 8402bce5c195f94e2cce8f67c6a8066b0ae408487ceBrian Paul const struct pipe_framebuffer_state *fb; 8412bce5c195f94e2cce8f67c6a8066b0ae408487ceBrian Paul boolean write_depth; 8422bce5c195f94e2cce8f67c6a8066b0ae408487ceBrian Paul 843591401ff05f878ff1607a1a34db1319103025d8fKeith Whitwell rast->curr_scene = lp_scene_dequeue( rast->full_scenes, TRUE ); 8442bce5c195f94e2cce8f67c6a8066b0ae408487ceBrian Paul 845663750d5564a225b4720f7ee8bea93ffb309fc88Keith Whitwell lp_scene_bin_iter_begin( rast->curr_scene ); 8462bce5c195f94e2cce8f67c6a8066b0ae408487ceBrian Paul 847663750d5564a225b4720f7ee8bea93ffb309fc88Keith Whitwell fb = &rast->curr_scene->fb; 848663750d5564a225b4720f7ee8bea93ffb309fc88Keith Whitwell write_depth = rast->curr_scene->write_depth; 8492bce5c195f94e2cce8f67c6a8066b0ae408487ceBrian Paul 8502bce5c195f94e2cce8f67c6a8066b0ae408487ceBrian Paul lp_rast_begin( rast, fb, 851c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell fb->nr_cbufs != 0, 8522bce5c195f94e2cce8f67c6a8066b0ae408487ceBrian Paul fb->zsbuf != NULL && write_depth ); 8532bce5c195f94e2cce8f67c6a8066b0ae408487ceBrian Paul } 8542bce5c195f94e2cce8f67c6a8066b0ae408487ceBrian Paul 8552bce5c195f94e2cce8f67c6a8066b0ae408487ceBrian Paul /* Wait for all threads to get here so that threads[1+] don't 856663750d5564a225b4720f7ee8bea93ffb309fc88Keith Whitwell * get a null rast->curr_scene pointer. 8572bce5c195f94e2cce8f67c6a8066b0ae408487ceBrian Paul */ 8582bce5c195f94e2cce8f67c6a8066b0ae408487ceBrian Paul pipe_barrier_wait( &rast->barrier ); 8599509f73c2147a9e225b5ef69a646e5dd711573f5Brian Paul 860aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul /* do work */ 861aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul if (debug) 862aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul debug_printf("thread %d doing work\n", task->thread_index); 863663750d5564a225b4720f7ee8bea93ffb309fc88Keith Whitwell rasterize_scene(rast, 864663750d5564a225b4720f7ee8bea93ffb309fc88Keith Whitwell task->thread_index, 865663750d5564a225b4720f7ee8bea93ffb309fc88Keith Whitwell rast->curr_scene, 866663750d5564a225b4720f7ee8bea93ffb309fc88Keith Whitwell rast->curr_scene->write_depth); 8679509f73c2147a9e225b5ef69a646e5dd711573f5Brian Paul 868663750d5564a225b4720f7ee8bea93ffb309fc88Keith Whitwell /* wait for all threads to finish with this scene */ 8692bce5c195f94e2cce8f67c6a8066b0ae408487ceBrian Paul pipe_barrier_wait( &rast->barrier ); 8702bce5c195f94e2cce8f67c6a8066b0ae408487ceBrian Paul 8712bce5c195f94e2cce8f67c6a8066b0ae408487ceBrian Paul if (task->thread_index == 0) { 8722bce5c195f94e2cce8f67c6a8066b0ae408487ceBrian Paul /* thread[0]: 873663750d5564a225b4720f7ee8bea93ffb309fc88Keith Whitwell * - release the scene object 8742bce5c195f94e2cce8f67c6a8066b0ae408487ceBrian Paul * - unmap the framebuffer surfaces 8752bce5c195f94e2cce8f67c6a8066b0ae408487ceBrian Paul */ 876663750d5564a225b4720f7ee8bea93ffb309fc88Keith Whitwell release_scene( rast, rast->curr_scene ); 8772bce5c195f94e2cce8f67c6a8066b0ae408487ceBrian Paul lp_rast_end( rast ); 8782bce5c195f94e2cce8f67c6a8066b0ae408487ceBrian Paul } 879aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul 880aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul /* signal done with work */ 881aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul if (debug) 882aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul debug_printf("thread %d done working\n", task->thread_index); 883aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul pipe_semaphore_signal(&task->work_done); 884aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul } 885aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul 886aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul return NULL; 887aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul} 888aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul 889aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul 890aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul/** 891aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul * Initialize semaphores and spawn the threads. 892aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul */ 893aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paulstatic void 894aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paulcreate_rast_threads(struct lp_rasterizer *rast) 895aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul{ 896aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul unsigned i; 897aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul 898ad60552ca19bce657eadaffd31db752e34e9cda3José Fonseca#ifdef PIPE_OS_WINDOWS 899ad60552ca19bce657eadaffd31db752e34e9cda3José Fonseca /* Multithreading not supported on windows until conditions and barriers are 900ad60552ca19bce657eadaffd31db752e34e9cda3José Fonseca * properly implemented. */ 901ad60552ca19bce657eadaffd31db752e34e9cda3José Fonseca rast->num_threads = 0; 902ad60552ca19bce657eadaffd31db752e34e9cda3José Fonseca#else 9037f457acabcbeea6a27b4f375f55e318fff52445fJosé Fonseca rast->num_threads = util_cpu_caps.nr_cpus; 9047f457acabcbeea6a27b4f375f55e318fff52445fJosé Fonseca rast->num_threads = debug_get_num_option("LP_NUM_THREADS", rast->num_threads); 905aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul rast->num_threads = MIN2(rast->num_threads, MAX_THREADS); 906ad60552ca19bce657eadaffd31db752e34e9cda3José Fonseca#endif 907aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul 908aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul /* NOTE: if num_threads is zero, we won't use any threads */ 909aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul for (i = 0; i < rast->num_threads; i++) { 910aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul pipe_semaphore_init(&rast->tasks[i].work_ready, 0); 911aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul pipe_semaphore_init(&rast->tasks[i].work_done, 0); 912aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul rast->threads[i] = pipe_thread_create(thread_func, 913aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul (void *) &rast->tasks[i]); 914aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul } 915aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul} 916aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul 917aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul 918aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul 919d7dbc666367438ee9efe748505907b36bba6b66aBrian Paul/** 920d7dbc666367438ee9efe748505907b36bba6b66aBrian Paul * Create new lp_rasterizer. 921663750d5564a225b4720f7ee8bea93ffb309fc88Keith Whitwell * \param empty the queue to put empty scenes on after we've finished 922d7dbc666367438ee9efe748505907b36bba6b66aBrian Paul * processing them. 923d7dbc666367438ee9efe748505907b36bba6b66aBrian Paul */ 924d7dbc666367438ee9efe748505907b36bba6b66aBrian Paulstruct lp_rasterizer * 925663750d5564a225b4720f7ee8bea93ffb309fc88Keith Whitwelllp_rast_create( struct pipe_screen *screen, struct lp_scene_queue *empty ) 926aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul{ 927aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul struct lp_rasterizer *rast; 928c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell unsigned i, cbuf; 929aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul 930aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul rast = CALLOC_STRUCT(lp_rasterizer); 931aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul if(!rast) 932aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul return NULL; 933aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul 934aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul rast->screen = screen; 935aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul 936663750d5564a225b4720f7ee8bea93ffb309fc88Keith Whitwell rast->empty_scenes = empty; 937663750d5564a225b4720f7ee8bea93ffb309fc88Keith Whitwell rast->full_scenes = lp_scene_queue_create(); 938d7dbc666367438ee9efe748505907b36bba6b66aBrian Paul 939aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul for (i = 0; i < Elements(rast->tasks); i++) { 940ec459f2aeca39e51f495cde455ba18d0a9489caaBrian Paul struct lp_rasterizer_task *task = &rast->tasks[i]; 941ec459f2aeca39e51f495cde455ba18d0a9489caaBrian Paul 942c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell for (cbuf = 0; cbuf < PIPE_MAX_COLOR_BUFS; cbuf++ ) 943ec459f2aeca39e51f495cde455ba18d0a9489caaBrian Paul task->tile.color[cbuf] = align_malloc(TILE_SIZE * TILE_SIZE * 4, 16); 944c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell 945ec459f2aeca39e51f495cde455ba18d0a9489caaBrian Paul task->rast = rast; 946ec459f2aeca39e51f495cde455ba18d0a9489caaBrian Paul task->thread_index = i; 947aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul } 948aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul 949aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul create_rast_threads(rast); 950aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul 9512bce5c195f94e2cce8f67c6a8066b0ae408487ceBrian Paul /* for synchronizing rasterization threads */ 9522bce5c195f94e2cce8f67c6a8066b0ae408487ceBrian Paul pipe_barrier_init( &rast->barrier, rast->num_threads ); 9532bce5c195f94e2cce8f67c6a8066b0ae408487ceBrian Paul 954aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul return rast; 955aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul} 956aab1ceceecbd6449eebce7f5f5b356b1a51552e7Brian Paul 957b533b56750aca8c7e8cb22af93a0fc2a0cfc0d97Brian Paul 95889498d01531cd515c769e570bf799c39fbafc8fbKeith Whitwell/* Shutdown: 95989498d01531cd515c769e570bf799c39fbafc8fbKeith Whitwell */ 96089498d01531cd515c769e570bf799c39fbafc8fbKeith Whitwellvoid lp_rast_destroy( struct lp_rasterizer *rast ) 96189498d01531cd515c769e570bf799c39fbafc8fbKeith Whitwell{ 962c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell unsigned i, cbuf; 9633a06c113c76355fc9622adfe7565c18d9787e9a8Brian Paul 964156eabbaf996f471458ee2a69078674277b89067Brian Paul util_unreference_framebuffer_state(&rast->state.fb); 9653a06c113c76355fc9622adfe7565c18d9787e9a8Brian Paul 9663a06c113c76355fc9622adfe7565c18d9787e9a8Brian Paul for (i = 0; i < Elements(rast->tasks); i++) { 967c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell for (cbuf = 0; cbuf < PIPE_MAX_COLOR_BUFS; cbuf++ ) 968c1a04416023e24621e4992caf593e8dfe8d7a2fcKeith Whitwell align_free(rast->tasks[i].tile.color[cbuf]); 9693a06c113c76355fc9622adfe7565c18d9787e9a8Brian Paul } 9703a06c113c76355fc9622adfe7565c18d9787e9a8Brian Paul 9712bce5c195f94e2cce8f67c6a8066b0ae408487ceBrian Paul /* for synchronizing rasterization threads */ 9722bce5c195f94e2cce8f67c6a8066b0ae408487ceBrian Paul pipe_barrier_destroy( &rast->barrier ); 9732bce5c195f94e2cce8f67c6a8066b0ae408487ceBrian Paul 97489498d01531cd515c769e570bf799c39fbafc8fbKeith Whitwell FREE(rast); 97589498d01531cd515c769e570bf799c39fbafc8fbKeith Whitwell} 97689498d01531cd515c769e570bf799c39fbafc8fbKeith Whitwell 977932374073863379e9da862d6115410889f038154Brian Paul 978932374073863379e9da862d6115410889f038154Brian Paul/** Return number of rasterization threads */ 979932374073863379e9da862d6115410889f038154Brian Paulunsigned 980932374073863379e9da862d6115410889f038154Brian Paullp_rast_get_num_threads( struct lp_rasterizer *rast ) 981932374073863379e9da862d6115410889f038154Brian Paul{ 982932374073863379e9da862d6115410889f038154Brian Paul return rast->num_threads; 983932374073863379e9da862d6115410889f038154Brian Paul} 984