/* brw_gs.c revision d4976158c7f32705b48c773c3abd1b22bebe9c16 */
1/* 2 Copyright (C) Intel Corp. 2006. All Rights Reserved. 3 Intel funded Tungsten Graphics (http://www.tungstengraphics.com) to 4 develop this 3D driver. 5 6 Permission is hereby granted, free of charge, to any person obtaining 7 a copy of this software and associated documentation files (the 8 "Software"), to deal in the Software without restriction, including 9 without limitation the rights to use, copy, modify, merge, publish, 10 distribute, sublicense, and/or sell copies of the Software, and to 11 permit persons to whom the Software is furnished to do so, subject to 12 the following conditions: 13 14 The above copyright notice and this permission notice (including the 15 next paragraph) shall be included in all copies or substantial 16 portions of the Software. 17 18 THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, 19 EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF 20 MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. 21 IN NO EVENT SHALL THE COPYRIGHT OWNER(S) AND/OR ITS SUPPLIERS BE 22 LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION 23 OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION 24 WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE. 
25 26 **********************************************************************/ 27 /* 28 * Authors: 29 * Keith Whitwell <keith@tungstengraphics.com> 30 */ 31 32#include "main/glheader.h" 33#include "main/macros.h" 34#include "main/enums.h" 35 36#include "intel_batchbuffer.h" 37 38#include "brw_defines.h" 39#include "brw_context.h" 40#include "brw_eu.h" 41#include "brw_util.h" 42#include "brw_state.h" 43#include "brw_gs.h" 44 45#include "glsl/ralloc.h" 46 47static void compile_gs_prog( struct brw_context *brw, 48 struct brw_gs_prog_key *key ) 49{ 50 struct intel_context *intel = &brw->intel; 51 struct brw_gs_compile c; 52 const GLuint *program; 53 void *mem_ctx; 54 GLuint program_size; 55 56 memset(&c, 0, sizeof(c)); 57 58 c.key = *key; 59 /* The geometry shader needs to access the entire VUE. */ 60 struct brw_vue_map vue_map; 61 brw_compute_vue_map(&vue_map, intel, c.key.userclip_active, c.key.attrs); 62 c.nr_regs = (vue_map.num_slots + 1)/2; 63 64 mem_ctx = NULL; 65 66 /* Begin the compilation: 67 */ 68 brw_init_compile(brw, &c.func, mem_ctx); 69 70 c.func.single_program_flow = 1; 71 72 /* For some reason the thread is spawned with only 4 channels 73 * unmasked. 74 */ 75 brw_set_mask_control(&c.func, BRW_MASK_DISABLE); 76 77 if (intel->gen >= 6) { 78 unsigned num_verts; 79 bool check_edge_flag; 80 /* On Sandybridge, we use the GS for implementing transform feedback 81 * (called "Stream Out" in the PRM). 
82 */ 83 switch (key->primitive) { 84 case _3DPRIM_POINTLIST: 85 num_verts = 1; 86 check_edge_flag = false; 87 break; 88 case _3DPRIM_LINELIST: 89 case _3DPRIM_LINESTRIP: 90 case _3DPRIM_LINELOOP: 91 num_verts = 2; 92 check_edge_flag = false; 93 break; 94 case _3DPRIM_TRILIST: 95 case _3DPRIM_TRIFAN: 96 case _3DPRIM_TRISTRIP: 97 case _3DPRIM_RECTLIST: 98 num_verts = 3; 99 check_edge_flag = false; 100 break; 101 case _3DPRIM_QUADLIST: 102 case _3DPRIM_QUADSTRIP: 103 case _3DPRIM_POLYGON: 104 num_verts = 3; 105 check_edge_flag = true; 106 break; 107 default: 108 assert(!"Unexpected primitive type in Gen6 SOL program."); 109 return; 110 } 111 gen6_sol_program(&c, key, num_verts, check_edge_flag); 112 } else { 113 /* On Gen4-5, we use the GS to decompose certain types of primitives. 114 * Note that primitives which don't require a GS program have already 115 * been weeded out by now. 116 */ 117 switch (key->primitive) { 118 case _3DPRIM_QUADLIST: 119 brw_gs_quads( &c, key ); 120 break; 121 case _3DPRIM_QUADSTRIP: 122 brw_gs_quad_strip( &c, key ); 123 break; 124 case _3DPRIM_LINELOOP: 125 brw_gs_lines( &c ); 126 break; 127 default: 128 ralloc_free(mem_ctx); 129 return; 130 } 131 } 132 133 /* get the program 134 */ 135 program = brw_get_program(&c.func, &program_size); 136 137 if (unlikely(INTEL_DEBUG & DEBUG_GS)) { 138 int i; 139 140 printf("gs:\n"); 141 for (i = 0; i < program_size / sizeof(struct brw_instruction); i++) 142 brw_disasm(stdout, &((struct brw_instruction *)program)[i], 143 intel->gen); 144 printf("\n"); 145 } 146 147 brw_upload_cache(&brw->cache, BRW_GS_PROG, 148 &c.key, sizeof(c.key), 149 program, program_size, 150 &c.prog_data, sizeof(c.prog_data), 151 &brw->gs.prog_offset, &brw->gs.prog_data); 152 ralloc_free(mem_ctx); 153} 154 155static void populate_key( struct brw_context *brw, 156 struct brw_gs_prog_key *key ) 157{ 158 struct gl_context *ctx = &brw->intel.ctx; 159 struct intel_context *intel = &brw->intel; 160 161 memset(key, 0, sizeof(*key)); 162 
163 /* CACHE_NEW_VS_PROG */ 164 key->attrs = brw->vs.prog_data->outputs_written; 165 166 /* BRW_NEW_PRIMITIVE */ 167 key->primitive = brw->primitive; 168 169 /* _NEW_LIGHT */ 170 key->pv_first = (ctx->Light.ProvokingVertex == GL_FIRST_VERTEX_CONVENTION); 171 if (key->primitive == _3DPRIM_QUADLIST && ctx->Light.ShadeModel != GL_FLAT) { 172 /* Provide consistent primitive order with brw_set_prim's 173 * optimization of single quads to trifans. 174 */ 175 key->pv_first = true; 176 } 177 178 /* _NEW_TRANSFORM */ 179 key->userclip_active = (ctx->Transform.ClipPlanesEnabled != 0); 180 181 if (intel->gen >= 7) { 182 /* On Gen7 and later, we don't use GS (yet). */ 183 key->need_gs_prog = false; 184 } else if (intel->gen == 6) { 185 /* On Gen6, GS is used for transform feedback. */ 186 /* _NEW_TRANSFORM_FEEDBACK */ 187 key->need_gs_prog = ctx->TransformFeedback.CurrentObject->Active; 188 } else { 189 /* Pre-gen6, GS is used to transform QUADLIST, QUADSTRIP, and LINELOOP 190 * into simpler primitives. 191 */ 192 key->need_gs_prog = (brw->primitive == _3DPRIM_QUADLIST || 193 brw->primitive == _3DPRIM_QUADSTRIP || 194 brw->primitive == _3DPRIM_LINELOOP); 195 } 196 /* For testing, the environment variable INTEL_FORCE_GS can be used to 197 * force a GS program to be used, even if it's not necessary. 198 */ 199 if (getenv("INTEL_FORCE_GS")) 200 key->need_gs_prog = true; 201} 202 203/* Calculate interpolants for triangle and line rasterization. 
204 */ 205static void 206brw_upload_gs_prog(struct brw_context *brw) 207{ 208 struct brw_gs_prog_key key; 209 /* Populate the key: 210 */ 211 populate_key(brw, &key); 212 213 if (brw->gs.prog_active != key.need_gs_prog) { 214 brw->state.dirty.cache |= CACHE_NEW_GS_PROG; 215 brw->gs.prog_active = key.need_gs_prog; 216 } 217 218 if (brw->gs.prog_active) { 219 if (!brw_search_cache(&brw->cache, BRW_GS_PROG, 220 &key, sizeof(key), 221 &brw->gs.prog_offset, &brw->gs.prog_data)) { 222 compile_gs_prog( brw, &key ); 223 } 224 } 225} 226 227 228const struct brw_tracked_state brw_gs_prog = { 229 .dirty = { 230 .mesa = (_NEW_LIGHT | 231 _NEW_TRANSFORM | 232 _NEW_TRANSFORM_FEEDBACK), 233 .brw = BRW_NEW_PRIMITIVE, 234 .cache = CACHE_NEW_VS_PROG 235 }, 236 .emit = brw_upload_gs_prog 237}; 238