programopt.c revision b6e8256899a9a93c665c34e10efcc918f2fcc095
1c6511ab950e2865e606ff13ce87f0ffc782c57adBrian Paul/* 2c6511ab950e2865e606ff13ce87f0ffc782c57adBrian Paul * Mesa 3-D graphics library 3048412473bda3db3e58b9840de5ef82d2ecce3c0Brian * Version: 6.5.3 4c6511ab950e2865e606ff13ce87f0ffc782c57adBrian Paul * 5048412473bda3db3e58b9840de5ef82d2ecce3c0Brian * Copyright (C) 1999-2007 Brian Paul All Rights Reserved. 6c6511ab950e2865e606ff13ce87f0ffc782c57adBrian Paul * 7c6511ab950e2865e606ff13ce87f0ffc782c57adBrian Paul * Permission is hereby granted, free of charge, to any person obtaining a 8c6511ab950e2865e606ff13ce87f0ffc782c57adBrian Paul * copy of this software and associated documentation files (the "Software"), 9c6511ab950e2865e606ff13ce87f0ffc782c57adBrian Paul * to deal in the Software without restriction, including without limitation 10c6511ab950e2865e606ff13ce87f0ffc782c57adBrian Paul * the rights to use, copy, modify, merge, publish, distribute, sublicense, 11c6511ab950e2865e606ff13ce87f0ffc782c57adBrian Paul * and/or sell copies of the Software, and to permit persons to whom the 12c6511ab950e2865e606ff13ce87f0ffc782c57adBrian Paul * Software is furnished to do so, subject to the following conditions: 13c6511ab950e2865e606ff13ce87f0ffc782c57adBrian Paul * 14c6511ab950e2865e606ff13ce87f0ffc782c57adBrian Paul * The above copyright notice and this permission notice shall be included 15c6511ab950e2865e606ff13ce87f0ffc782c57adBrian Paul * in all copies or substantial portions of the Software. 16c6511ab950e2865e606ff13ce87f0ffc782c57adBrian Paul * 17c6511ab950e2865e606ff13ce87f0ffc782c57adBrian Paul * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS 18c6511ab950e2865e606ff13ce87f0ffc782c57adBrian Paul * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, 19c6511ab950e2865e606ff13ce87f0ffc782c57adBrian Paul * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL 20c6511ab950e2865e606ff13ce87f0ffc782c57adBrian Paul * BRIAN PAUL BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN 21c6511ab950e2865e606ff13ce87f0ffc782c57adBrian Paul * AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN 22c6511ab950e2865e606ff13ce87f0ffc782c57adBrian Paul * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE. 23c6511ab950e2865e606ff13ce87f0ffc782c57adBrian Paul */ 24c6511ab950e2865e606ff13ce87f0ffc782c57adBrian Paul 25c6511ab950e2865e606ff13ce87f0ffc782c57adBrian Paul/** 26c6511ab950e2865e606ff13ce87f0ffc782c57adBrian Paul * \file programopt.c 27c6511ab950e2865e606ff13ce87f0ffc782c57adBrian Paul * Vertex/Fragment program optimizations and transformations for program 28c6511ab950e2865e606ff13ce87f0ffc782c57adBrian Paul * options, etc. 29c6511ab950e2865e606ff13ce87f0ffc782c57adBrian Paul * 30c6511ab950e2865e606ff13ce87f0ffc782c57adBrian Paul * \author Brian Paul 31c6511ab950e2865e606ff13ce87f0ffc782c57adBrian Paul */ 32c6511ab950e2865e606ff13ce87f0ffc782c57adBrian Paul 33c6511ab950e2865e606ff13ce87f0ffc782c57adBrian Paul 341f4997c2aaf424c8a12cc6fdb1dd994f66074a1dBrian Paul#include "main/glheader.h" 351f4997c2aaf424c8a12cc6fdb1dd994f66074a1dBrian Paul#include "main/context.h" 3657d9531cd644226d15be4a09ad1492ab647165dcBrian#include "prog_parameter.h" 3757d9531cd644226d15be4a09ad1492ab647165dcBrian#include "prog_statevars.h" 386ca948a303e1af7ae66ea7082af741f6880887f2Brian Paul#include "program.h" 39c6511ab950e2865e606ff13ce87f0ffc782c57adBrian Paul#include "programopt.h" 4057d9531cd644226d15be4a09ad1492ab647165dcBrian#include "prog_instruction.h" 41c6511ab950e2865e606ff13ce87f0ffc782c57adBrian Paul 42c6511ab950e2865e606ff13ce87f0ffc782c57adBrian Paul 43c6511ab950e2865e606ff13ce87f0ffc782c57adBrian Paul/** 443c54e8376d639465277fac745b0b8134d2918a9fBrian Paul * This function inserts instructions for coordinate modelview * projection 453c54e8376d639465277fac745b0b8134d2918a9fBrian Paul * into a vertex program. 463c54e8376d639465277fac745b0b8134d2918a9fBrian Paul * May be used to implement the position_invariant option. 47c6511ab950e2865e606ff13ce87f0ffc782c57adBrian Paul */ 48b6e8256899a9a93c665c34e10efcc918f2fcc095Keith Whitwellstatic void 49b6e8256899a9a93c665c34e10efcc918f2fcc095Keith Whitwell_mesa_insert_mvp_dp4_code(GLcontext *ctx, struct gl_vertex_program *vprog) 50c6511ab950e2865e606ff13ce87f0ffc782c57adBrian Paul{ 513c54e8376d639465277fac745b0b8134d2918a9fBrian Paul struct prog_instruction *newInst; 52c6511ab950e2865e606ff13ce87f0ffc782c57adBrian Paul const GLuint origLen = vprog->Base.NumInstructions; 533c54e8376d639465277fac745b0b8134d2918a9fBrian Paul const GLuint newLen = origLen + 4; 54c6511ab950e2865e606ff13ce87f0ffc782c57adBrian Paul GLuint i; 55c6511ab950e2865e606ff13ce87f0ffc782c57adBrian Paul 56c6511ab950e2865e606ff13ce87f0ffc782c57adBrian Paul /* 57c6511ab950e2865e606ff13ce87f0ffc782c57adBrian Paul * Setup state references for the modelview/projection matrix. 58c6511ab950e2865e606ff13ce87f0ffc782c57adBrian Paul * XXX we should check if these state vars are already declared. 59c6511ab950e2865e606ff13ce87f0ffc782c57adBrian Paul */ 60aa9d22a1c0f3256497088985c290d4046e089456Brian static const gl_state_index mvpState[4][STATE_LENGTH] = { 616531952b3c979be0dc95704beb3c3b9dad1dc37bBrian { STATE_MVP_MATRIX, 0, 0, 0, 0 }, /* state.matrix.mvp.row[0] */ 626531952b3c979be0dc95704beb3c3b9dad1dc37bBrian { STATE_MVP_MATRIX, 0, 1, 1, 0 }, /* state.matrix.mvp.row[1] */ 636531952b3c979be0dc95704beb3c3b9dad1dc37bBrian { STATE_MVP_MATRIX, 0, 2, 2, 0 }, /* state.matrix.mvp.row[2] */ 646531952b3c979be0dc95704beb3c3b9dad1dc37bBrian { STATE_MVP_MATRIX, 0, 3, 3, 0 }, /* state.matrix.mvp.row[3] */ 65c6511ab950e2865e606ff13ce87f0ffc782c57adBrian Paul }; 66c6511ab950e2865e606ff13ce87f0ffc782c57adBrian Paul GLint mvpRef[4]; 67c6511ab950e2865e606ff13ce87f0ffc782c57adBrian Paul 68c6511ab950e2865e606ff13ce87f0ffc782c57adBrian Paul for (i = 0; i < 4; i++) { 69c6511ab950e2865e606ff13ce87f0ffc782c57adBrian Paul mvpRef[i] = _mesa_add_state_reference(vprog->Base.Parameters, 70c6511ab950e2865e606ff13ce87f0ffc782c57adBrian Paul mvpState[i]); 71c6511ab950e2865e606ff13ce87f0ffc782c57adBrian Paul } 72c6511ab950e2865e606ff13ce87f0ffc782c57adBrian Paul 733c54e8376d639465277fac745b0b8134d2918a9fBrian Paul /* Alloc storage for new instructions */ 743c54e8376d639465277fac745b0b8134d2918a9fBrian Paul newInst = _mesa_alloc_instructions(newLen); 753c54e8376d639465277fac745b0b8134d2918a9fBrian Paul if (!newInst) { 763c54e8376d639465277fac745b0b8134d2918a9fBrian Paul _mesa_error(ctx, GL_OUT_OF_MEMORY, 773c54e8376d639465277fac745b0b8134d2918a9fBrian Paul "glProgramString(inserting position_invariant code)"); 783c54e8376d639465277fac745b0b8134d2918a9fBrian Paul return; 793c54e8376d639465277fac745b0b8134d2918a9fBrian Paul } 803c54e8376d639465277fac745b0b8134d2918a9fBrian Paul 81c6511ab950e2865e606ff13ce87f0ffc782c57adBrian Paul /* 82c6511ab950e2865e606ff13ce87f0ffc782c57adBrian Paul * Generated instructions: 83c6511ab950e2865e606ff13ce87f0ffc782c57adBrian Paul * newInst[0] = DP4 result.position.x, mvp.row[0], vertex.position; 84c6511ab950e2865e606ff13ce87f0ffc782c57adBrian Paul * newInst[1] = DP4 result.position.y, mvp.row[1], vertex.position; 85c6511ab950e2865e606ff13ce87f0ffc782c57adBrian Paul * newInst[2] = DP4 result.position.z, mvp.row[2], vertex.position; 86c6511ab950e2865e606ff13ce87f0ffc782c57adBrian Paul * newInst[3] = DP4 result.position.w, mvp.row[3], vertex.position; 87c6511ab950e2865e606ff13ce87f0ffc782c57adBrian Paul */ 88d6272e06172f7ac7a0d6e8062e8ffba33e1ab3baBrian Paul _mesa_init_instructions(newInst, 4); 89c6511ab950e2865e606ff13ce87f0ffc782c57adBrian Paul for (i = 0; i < 4; i++) { 90c6511ab950e2865e606ff13ce87f0ffc782c57adBrian Paul newInst[i].Opcode = OPCODE_DP4; 91c6511ab950e2865e606ff13ce87f0ffc782c57adBrian Paul newInst[i].DstReg.File = PROGRAM_OUTPUT; 92c6511ab950e2865e606ff13ce87f0ffc782c57adBrian Paul newInst[i].DstReg.Index = VERT_RESULT_HPOS; 93c6511ab950e2865e606ff13ce87f0ffc782c57adBrian Paul newInst[i].DstReg.WriteMask = (WRITEMASK_X << i); 94c6511ab950e2865e606ff13ce87f0ffc782c57adBrian Paul newInst[i].SrcReg[0].File = PROGRAM_STATE_VAR; 95c6511ab950e2865e606ff13ce87f0ffc782c57adBrian Paul newInst[i].SrcReg[0].Index = mvpRef[i]; 96c6511ab950e2865e606ff13ce87f0ffc782c57adBrian Paul newInst[i].SrcReg[0].Swizzle = SWIZZLE_NOOP; 97c6511ab950e2865e606ff13ce87f0ffc782c57adBrian Paul newInst[i].SrcReg[1].File = PROGRAM_INPUT; 98c6511ab950e2865e606ff13ce87f0ffc782c57adBrian Paul newInst[i].SrcReg[1].Index = VERT_ATTRIB_POS; 99c6511ab950e2865e606ff13ce87f0ffc782c57adBrian Paul newInst[i].SrcReg[1].Swizzle = SWIZZLE_NOOP; 100c6511ab950e2865e606ff13ce87f0ffc782c57adBrian Paul } 101c6511ab950e2865e606ff13ce87f0ffc782c57adBrian Paul 1023c54e8376d639465277fac745b0b8134d2918a9fBrian Paul /* Append original instructions after new instructions */ 103cfe984dbd0c478906785dbf8a9430504173ae952Oliver McFadden _mesa_copy_instructions (newInst + 4, vprog->Base.Instructions, origLen); 1043c54e8376d639465277fac745b0b8134d2918a9fBrian Paul 1053c54e8376d639465277fac745b0b8134d2918a9fBrian Paul /* free old instructions */ 1066ca948a303e1af7ae66ea7082af741f6880887f2Brian Paul _mesa_free_instructions(vprog->Base.Instructions, origLen); 107c6511ab950e2865e606ff13ce87f0ffc782c57adBrian Paul 1083c54e8376d639465277fac745b0b8134d2918a9fBrian Paul /* install new instructions */ 1093c54e8376d639465277fac745b0b8134d2918a9fBrian Paul vprog->Base.Instructions = newInst; 1103c54e8376d639465277fac745b0b8134d2918a9fBrian Paul vprog->Base.NumInstructions = newLen; 111c6511ab950e2865e606ff13ce87f0ffc782c57adBrian Paul vprog->Base.InputsRead |= VERT_BIT_POS; 112c6511ab950e2865e606ff13ce87f0ffc782c57adBrian Paul vprog->Base.OutputsWritten |= (1 << VERT_RESULT_HPOS); 113c6511ab950e2865e606ff13ce87f0ffc782c57adBrian Paul} 114c6511ab950e2865e606ff13ce87f0ffc782c57adBrian Paul 115c6511ab950e2865e606ff13ce87f0ffc782c57adBrian Paul 116b6e8256899a9a93c665c34e10efcc918f2fcc095Keith Whitwellstatic void 117b6e8256899a9a93c665c34e10efcc918f2fcc095Keith Whitwell_mesa_insert_mvp_mad_code(GLcontext *ctx, struct gl_vertex_program *vprog) 118b6e8256899a9a93c665c34e10efcc918f2fcc095Keith Whitwell{ 119b6e8256899a9a93c665c34e10efcc918f2fcc095Keith Whitwell struct prog_instruction *newInst; 120b6e8256899a9a93c665c34e10efcc918f2fcc095Keith Whitwell const GLuint origLen = vprog->Base.NumInstructions; 121b6e8256899a9a93c665c34e10efcc918f2fcc095Keith Whitwell const GLuint newLen = origLen + 4; 122b6e8256899a9a93c665c34e10efcc918f2fcc095Keith Whitwell GLuint hposTemp; 123b6e8256899a9a93c665c34e10efcc918f2fcc095Keith Whitwell GLuint i; 124b6e8256899a9a93c665c34e10efcc918f2fcc095Keith Whitwell 125b6e8256899a9a93c665c34e10efcc918f2fcc095Keith Whitwell /* 126b6e8256899a9a93c665c34e10efcc918f2fcc095Keith Whitwell * Setup state references for the modelview/projection matrix. 127b6e8256899a9a93c665c34e10efcc918f2fcc095Keith Whitwell * XXX we should check if these state vars are already declared. 128b6e8256899a9a93c665c34e10efcc918f2fcc095Keith Whitwell */ 129b6e8256899a9a93c665c34e10efcc918f2fcc095Keith Whitwell static const gl_state_index mvpState[4][STATE_LENGTH] = { 130b6e8256899a9a93c665c34e10efcc918f2fcc095Keith Whitwell { STATE_MVP_MATRIX, 0, 0, 0, STATE_MATRIX_TRANSPOSE }, 131b6e8256899a9a93c665c34e10efcc918f2fcc095Keith Whitwell { STATE_MVP_MATRIX, 0, 1, 1, STATE_MATRIX_TRANSPOSE }, 132b6e8256899a9a93c665c34e10efcc918f2fcc095Keith Whitwell { STATE_MVP_MATRIX, 0, 2, 2, STATE_MATRIX_TRANSPOSE }, 133b6e8256899a9a93c665c34e10efcc918f2fcc095Keith Whitwell { STATE_MVP_MATRIX, 0, 3, 3, STATE_MATRIX_TRANSPOSE }, 134b6e8256899a9a93c665c34e10efcc918f2fcc095Keith Whitwell }; 135b6e8256899a9a93c665c34e10efcc918f2fcc095Keith Whitwell GLint mvpRef[4]; 136b6e8256899a9a93c665c34e10efcc918f2fcc095Keith Whitwell 137b6e8256899a9a93c665c34e10efcc918f2fcc095Keith Whitwell for (i = 0; i < 4; i++) { 138b6e8256899a9a93c665c34e10efcc918f2fcc095Keith Whitwell mvpRef[i] = _mesa_add_state_reference(vprog->Base.Parameters, 139b6e8256899a9a93c665c34e10efcc918f2fcc095Keith Whitwell mvpState[i]); 140b6e8256899a9a93c665c34e10efcc918f2fcc095Keith Whitwell } 141b6e8256899a9a93c665c34e10efcc918f2fcc095Keith Whitwell 142b6e8256899a9a93c665c34e10efcc918f2fcc095Keith Whitwell /* Alloc storage for new instructions */ 143b6e8256899a9a93c665c34e10efcc918f2fcc095Keith Whitwell newInst = _mesa_alloc_instructions(newLen); 144b6e8256899a9a93c665c34e10efcc918f2fcc095Keith Whitwell if (!newInst) { 145b6e8256899a9a93c665c34e10efcc918f2fcc095Keith Whitwell _mesa_error(ctx, GL_OUT_OF_MEMORY, 146b6e8256899a9a93c665c34e10efcc918f2fcc095Keith Whitwell "glProgramString(inserting position_invariant code)"); 147b6e8256899a9a93c665c34e10efcc918f2fcc095Keith Whitwell return; 148b6e8256899a9a93c665c34e10efcc918f2fcc095Keith Whitwell } 149b6e8256899a9a93c665c34e10efcc918f2fcc095Keith Whitwell 150b6e8256899a9a93c665c34e10efcc918f2fcc095Keith Whitwell /* TEMP hposTemp; */ 151b6e8256899a9a93c665c34e10efcc918f2fcc095Keith Whitwell hposTemp = vprog->Base.NumTemporaries++; 152b6e8256899a9a93c665c34e10efcc918f2fcc095Keith Whitwell 153b6e8256899a9a93c665c34e10efcc918f2fcc095Keith Whitwell /* 154b6e8256899a9a93c665c34e10efcc918f2fcc095Keith Whitwell * Generated instructions: 155b6e8256899a9a93c665c34e10efcc918f2fcc095Keith Whitwell * emit_op2(p, OPCODE_MUL, tmp, 0, swizzle1(src,X), mat[0]); 156b6e8256899a9a93c665c34e10efcc918f2fcc095Keith Whitwell * emit_op3(p, OPCODE_MAD, tmp, 0, swizzle1(src,Y), mat[1], tmp); 157b6e8256899a9a93c665c34e10efcc918f2fcc095Keith Whitwell * emit_op3(p, OPCODE_MAD, tmp, 0, swizzle1(src,Z), mat[2], tmp); 158b6e8256899a9a93c665c34e10efcc918f2fcc095Keith Whitwell * emit_op3(p, OPCODE_MAD, dest, 0, swizzle1(src,W), mat[3], tmp); 159b6e8256899a9a93c665c34e10efcc918f2fcc095Keith Whitwell */ 160b6e8256899a9a93c665c34e10efcc918f2fcc095Keith Whitwell _mesa_init_instructions(newInst, 4); 161b6e8256899a9a93c665c34e10efcc918f2fcc095Keith Whitwell 162b6e8256899a9a93c665c34e10efcc918f2fcc095Keith Whitwell newInst[0].Opcode = OPCODE_MUL; 163b6e8256899a9a93c665c34e10efcc918f2fcc095Keith Whitwell newInst[0].DstReg.File = PROGRAM_TEMPORARY; 164b6e8256899a9a93c665c34e10efcc918f2fcc095Keith Whitwell newInst[0].DstReg.Index = hposTemp; 165b6e8256899a9a93c665c34e10efcc918f2fcc095Keith Whitwell newInst[0].DstReg.WriteMask = WRITEMASK_XYZW; 166b6e8256899a9a93c665c34e10efcc918f2fcc095Keith Whitwell newInst[0].SrcReg[0].File = PROGRAM_INPUT; 167b6e8256899a9a93c665c34e10efcc918f2fcc095Keith Whitwell newInst[0].SrcReg[0].Index = VERT_ATTRIB_POS; 168b6e8256899a9a93c665c34e10efcc918f2fcc095Keith Whitwell newInst[0].SrcReg[0].Swizzle = SWIZZLE_XXXX; 169b6e8256899a9a93c665c34e10efcc918f2fcc095Keith Whitwell newInst[0].SrcReg[1].File = PROGRAM_STATE_VAR; 170b6e8256899a9a93c665c34e10efcc918f2fcc095Keith Whitwell newInst[0].SrcReg[1].Index = mvpRef[0]; 171b6e8256899a9a93c665c34e10efcc918f2fcc095Keith Whitwell newInst[0].SrcReg[1].Swizzle = SWIZZLE_NOOP; 172b6e8256899a9a93c665c34e10efcc918f2fcc095Keith Whitwell 173b6e8256899a9a93c665c34e10efcc918f2fcc095Keith Whitwell for (i = 1; i <= 2; i++) { 174b6e8256899a9a93c665c34e10efcc918f2fcc095Keith Whitwell newInst[i].Opcode = OPCODE_MAD; 175b6e8256899a9a93c665c34e10efcc918f2fcc095Keith Whitwell newInst[i].DstReg.File = PROGRAM_TEMPORARY; 176b6e8256899a9a93c665c34e10efcc918f2fcc095Keith Whitwell newInst[i].DstReg.Index = hposTemp; 177b6e8256899a9a93c665c34e10efcc918f2fcc095Keith Whitwell newInst[i].DstReg.WriteMask = WRITEMASK_XYZW; 178b6e8256899a9a93c665c34e10efcc918f2fcc095Keith Whitwell newInst[i].SrcReg[0].File = PROGRAM_INPUT; 179b6e8256899a9a93c665c34e10efcc918f2fcc095Keith Whitwell newInst[i].SrcReg[0].Index = VERT_ATTRIB_POS; 180b6e8256899a9a93c665c34e10efcc918f2fcc095Keith Whitwell newInst[i].SrcReg[0].Swizzle = MAKE_SWIZZLE4(i,i,i,i); 181b6e8256899a9a93c665c34e10efcc918f2fcc095Keith Whitwell newInst[i].SrcReg[1].File = PROGRAM_STATE_VAR; 182b6e8256899a9a93c665c34e10efcc918f2fcc095Keith Whitwell newInst[i].SrcReg[1].Index = mvpRef[i]; 183b6e8256899a9a93c665c34e10efcc918f2fcc095Keith Whitwell newInst[i].SrcReg[1].Swizzle = SWIZZLE_NOOP; 184b6e8256899a9a93c665c34e10efcc918f2fcc095Keith Whitwell newInst[i].SrcReg[2].File = PROGRAM_TEMPORARY; 185b6e8256899a9a93c665c34e10efcc918f2fcc095Keith Whitwell newInst[i].SrcReg[2].Index = hposTemp; 186b6e8256899a9a93c665c34e10efcc918f2fcc095Keith Whitwell newInst[1].SrcReg[2].Swizzle = SWIZZLE_NOOP; 187b6e8256899a9a93c665c34e10efcc918f2fcc095Keith Whitwell } 188b6e8256899a9a93c665c34e10efcc918f2fcc095Keith Whitwell 189b6e8256899a9a93c665c34e10efcc918f2fcc095Keith Whitwell newInst[3].Opcode = OPCODE_MAD; 190b6e8256899a9a93c665c34e10efcc918f2fcc095Keith Whitwell newInst[3].DstReg.File = PROGRAM_OUTPUT; 191b6e8256899a9a93c665c34e10efcc918f2fcc095Keith Whitwell newInst[3].DstReg.Index = VERT_RESULT_HPOS; 192b6e8256899a9a93c665c34e10efcc918f2fcc095Keith Whitwell newInst[3].DstReg.WriteMask = WRITEMASK_XYZW; 193b6e8256899a9a93c665c34e10efcc918f2fcc095Keith Whitwell newInst[3].SrcReg[0].File = PROGRAM_INPUT; 194b6e8256899a9a93c665c34e10efcc918f2fcc095Keith Whitwell newInst[3].SrcReg[0].Index = VERT_ATTRIB_POS; 195b6e8256899a9a93c665c34e10efcc918f2fcc095Keith Whitwell newInst[3].SrcReg[0].Swizzle = SWIZZLE_WWWW; 196b6e8256899a9a93c665c34e10efcc918f2fcc095Keith Whitwell newInst[3].SrcReg[1].File = PROGRAM_STATE_VAR; 197b6e8256899a9a93c665c34e10efcc918f2fcc095Keith Whitwell newInst[3].SrcReg[1].Index = mvpRef[3]; 198b6e8256899a9a93c665c34e10efcc918f2fcc095Keith Whitwell newInst[3].SrcReg[1].Swizzle = SWIZZLE_NOOP; 199b6e8256899a9a93c665c34e10efcc918f2fcc095Keith Whitwell newInst[3].SrcReg[2].File = PROGRAM_TEMPORARY; 200b6e8256899a9a93c665c34e10efcc918f2fcc095Keith Whitwell newInst[3].SrcReg[2].Index = hposTemp; 201b6e8256899a9a93c665c34e10efcc918f2fcc095Keith Whitwell newInst[3].SrcReg[2].Swizzle = SWIZZLE_NOOP; 202b6e8256899a9a93c665c34e10efcc918f2fcc095Keith Whitwell 203b6e8256899a9a93c665c34e10efcc918f2fcc095Keith Whitwell 204b6e8256899a9a93c665c34e10efcc918f2fcc095Keith Whitwell /* Append original instructions after new instructions */ 205b6e8256899a9a93c665c34e10efcc918f2fcc095Keith Whitwell _mesa_copy_instructions (newInst + 4, vprog->Base.Instructions, origLen); 206b6e8256899a9a93c665c34e10efcc918f2fcc095Keith Whitwell 207b6e8256899a9a93c665c34e10efcc918f2fcc095Keith Whitwell /* free old instructions */ 208b6e8256899a9a93c665c34e10efcc918f2fcc095Keith Whitwell _mesa_free_instructions(vprog->Base.Instructions, origLen); 209b6e8256899a9a93c665c34e10efcc918f2fcc095Keith Whitwell 210b6e8256899a9a93c665c34e10efcc918f2fcc095Keith Whitwell /* install new instructions */ 211b6e8256899a9a93c665c34e10efcc918f2fcc095Keith Whitwell vprog->Base.Instructions = newInst; 212b6e8256899a9a93c665c34e10efcc918f2fcc095Keith Whitwell vprog->Base.NumInstructions = newLen; 213b6e8256899a9a93c665c34e10efcc918f2fcc095Keith Whitwell vprog->Base.InputsRead |= VERT_BIT_POS; 214b6e8256899a9a93c665c34e10efcc918f2fcc095Keith Whitwell vprog->Base.OutputsWritten |= (1 << VERT_RESULT_HPOS); 215b6e8256899a9a93c665c34e10efcc918f2fcc095Keith Whitwell} 216b6e8256899a9a93c665c34e10efcc918f2fcc095Keith Whitwell 217b6e8256899a9a93c665c34e10efcc918f2fcc095Keith Whitwell 218b6e8256899a9a93c665c34e10efcc918f2fcc095Keith Whitwellvoid 219b6e8256899a9a93c665c34e10efcc918f2fcc095Keith Whitwell_mesa_insert_mvp_code(GLcontext *ctx, struct gl_vertex_program *vprog) 220b6e8256899a9a93c665c34e10efcc918f2fcc095Keith Whitwell{ 221b6e8256899a9a93c665c34e10efcc918f2fcc095Keith Whitwell if (ctx->mvp_with_dp4) 222b6e8256899a9a93c665c34e10efcc918f2fcc095Keith Whitwell _mesa_insert_mvp_dp4_code( ctx, vprog ); 223b6e8256899a9a93c665c34e10efcc918f2fcc095Keith Whitwell else 224b6e8256899a9a93c665c34e10efcc918f2fcc095Keith Whitwell _mesa_insert_mvp_mad_code( ctx, vprog ); 225b6e8256899a9a93c665c34e10efcc918f2fcc095Keith Whitwell} 226b6e8256899a9a93c665c34e10efcc918f2fcc095Keith Whitwell 227b6e8256899a9a93c665c34e10efcc918f2fcc095Keith Whitwell 228b6e8256899a9a93c665c34e10efcc918f2fcc095Keith Whitwell 229b6e8256899a9a93c665c34e10efcc918f2fcc095Keith Whitwell 230b6e8256899a9a93c665c34e10efcc918f2fcc095Keith Whitwell 231c6511ab950e2865e606ff13ce87f0ffc782c57adBrian Paul 232c6511ab950e2865e606ff13ce87f0ffc782c57adBrian Paul/** 233c6511ab950e2865e606ff13ce87f0ffc782c57adBrian Paul * Append extra instructions onto the given fragment program to implement 234f5eea0cc7a8c568b00035427294812712c6c6081Brian Paul * the fog mode specified by fprog->FogOption. 235f5eea0cc7a8c568b00035427294812712c6c6081Brian Paul * The fragment.fogcoord input is used to compute the fog blend factor. 236f5eea0cc7a8c568b00035427294812712c6c6081Brian Paul * 237f5eea0cc7a8c568b00035427294812712c6c6081Brian Paul * XXX with a little work, this function could be adapted to add fog code 238f5eea0cc7a8c568b00035427294812712c6c6081Brian Paul * to vertex programs too. 239c6511ab950e2865e606ff13ce87f0ffc782c57adBrian Paul */ 240c6511ab950e2865e606ff13ce87f0ffc782c57adBrian Paulvoid 241c6511ab950e2865e606ff13ce87f0ffc782c57adBrian Paul_mesa_append_fog_code(GLcontext *ctx, struct gl_fragment_program *fprog) 242c6511ab950e2865e606ff13ce87f0ffc782c57adBrian Paul{ 243aa9d22a1c0f3256497088985c290d4046e089456Brian static const gl_state_index fogPStateOpt[STATE_LENGTH] 244776bc9cf55b116e17dddde4d097985b51879c83fBrian = { STATE_INTERNAL, STATE_FOG_PARAMS_OPTIMIZED, 0, 0, 0 }; 245aa9d22a1c0f3256497088985c290d4046e089456Brian static const gl_state_index fogColorState[STATE_LENGTH] 246776bc9cf55b116e17dddde4d097985b51879c83fBrian = { STATE_FOG_COLOR, 0, 0, 0, 0}; 247f5eea0cc7a8c568b00035427294812712c6c6081Brian Paul struct prog_instruction *newInst, *inst; 248f5eea0cc7a8c568b00035427294812712c6c6081Brian Paul const GLuint origLen = fprog->Base.NumInstructions; 249b2d30ca0cb01a80ff440a4a07b293daa16486e12Roland Scheidegger const GLuint newLen = origLen + 5; 250f5eea0cc7a8c568b00035427294812712c6c6081Brian Paul GLuint i; 251b2d30ca0cb01a80ff440a4a07b293daa16486e12Roland Scheidegger GLint fogPRefOpt, fogColorRef; /* state references */ 252f5eea0cc7a8c568b00035427294812712c6c6081Brian Paul GLuint colorTemp, fogFactorTemp; /* temporary registerss */ 253f5eea0cc7a8c568b00035427294812712c6c6081Brian Paul 254abb1430c79024198bdc9816465d3c8bc963adf8bBrian Paul if (fprog->FogOption == GL_NONE) { 255f5eea0cc7a8c568b00035427294812712c6c6081Brian Paul _mesa_problem(ctx, "_mesa_append_fog_code() called for fragment program" 256f5eea0cc7a8c568b00035427294812712c6c6081Brian Paul " with FogOption == GL_NONE"); 257c6511ab950e2865e606ff13ce87f0ffc782c57adBrian Paul return; 258f5eea0cc7a8c568b00035427294812712c6c6081Brian Paul } 259f5eea0cc7a8c568b00035427294812712c6c6081Brian Paul 260f5eea0cc7a8c568b00035427294812712c6c6081Brian Paul /* Alloc storage for new instructions */ 261f5eea0cc7a8c568b00035427294812712c6c6081Brian Paul newInst = _mesa_alloc_instructions(newLen); 262f5eea0cc7a8c568b00035427294812712c6c6081Brian Paul if (!newInst) { 263f5eea0cc7a8c568b00035427294812712c6c6081Brian Paul _mesa_error(ctx, GL_OUT_OF_MEMORY, 264f5eea0cc7a8c568b00035427294812712c6c6081Brian Paul "glProgramString(inserting fog_option code)"); 265c6511ab950e2865e606ff13ce87f0ffc782c57adBrian Paul return; 266c6511ab950e2865e606ff13ce87f0ffc782c57adBrian Paul } 267c6511ab950e2865e606ff13ce87f0ffc782c57adBrian Paul 268f5eea0cc7a8c568b00035427294812712c6c6081Brian Paul /* Copy orig instructions into new instruction buffer */ 26912229f119d754715e0315846fdd8d6e9213e8edfBrian _mesa_copy_instructions(newInst, fprog->Base.Instructions, origLen); 270f5eea0cc7a8c568b00035427294812712c6c6081Brian Paul 271b2d30ca0cb01a80ff440a4a07b293daa16486e12Roland Scheidegger /* PARAM fogParamsRefOpt = internal optimized fog params; */ 272b2d30ca0cb01a80ff440a4a07b293daa16486e12Roland Scheidegger fogPRefOpt 273b2d30ca0cb01a80ff440a4a07b293daa16486e12Roland Scheidegger = _mesa_add_state_reference(fprog->Base.Parameters, fogPStateOpt); 274f5eea0cc7a8c568b00035427294812712c6c6081Brian Paul /* PARAM fogColorRef = state.fog.color; */ 275f5eea0cc7a8c568b00035427294812712c6c6081Brian Paul fogColorRef 276f5eea0cc7a8c568b00035427294812712c6c6081Brian Paul = _mesa_add_state_reference(fprog->Base.Parameters, fogColorState); 277c6511ab950e2865e606ff13ce87f0ffc782c57adBrian Paul 278f5eea0cc7a8c568b00035427294812712c6c6081Brian Paul /* TEMP colorTemp; */ 279f5eea0cc7a8c568b00035427294812712c6c6081Brian Paul colorTemp = fprog->Base.NumTemporaries++; 280f5eea0cc7a8c568b00035427294812712c6c6081Brian Paul /* TEMP fogFactorTemp; */ 281f5eea0cc7a8c568b00035427294812712c6c6081Brian Paul fogFactorTemp = fprog->Base.NumTemporaries++; 282c6511ab950e2865e606ff13ce87f0ffc782c57adBrian Paul 283f5eea0cc7a8c568b00035427294812712c6c6081Brian Paul /* Scan program to find where result.color is written */ 284f5eea0cc7a8c568b00035427294812712c6c6081Brian Paul inst = newInst; 285f5eea0cc7a8c568b00035427294812712c6c6081Brian Paul for (i = 0; i < fprog->Base.NumInstructions; i++) { 286f5eea0cc7a8c568b00035427294812712c6c6081Brian Paul if (inst->Opcode == OPCODE_END) 287f5eea0cc7a8c568b00035427294812712c6c6081Brian Paul break; 288f5eea0cc7a8c568b00035427294812712c6c6081Brian Paul if (inst->DstReg.File == PROGRAM_OUTPUT && 2898d475822e6e19fa79719c856a2db5b6a205db1b9Brian Paul inst->DstReg.Index == FRAG_RESULT_COLOR) { 290f5eea0cc7a8c568b00035427294812712c6c6081Brian Paul /* change the instruction to write to colorTemp w/ clamping */ 291f5eea0cc7a8c568b00035427294812712c6c6081Brian Paul inst->DstReg.File = PROGRAM_TEMPORARY; 292f5eea0cc7a8c568b00035427294812712c6c6081Brian Paul inst->DstReg.Index = colorTemp; 293f5eea0cc7a8c568b00035427294812712c6c6081Brian Paul inst->SaturateMode = SATURATE_ZERO_ONE; 294f5eea0cc7a8c568b00035427294812712c6c6081Brian Paul /* don't break (may be several writes to result.color) */ 295f5eea0cc7a8c568b00035427294812712c6c6081Brian Paul } 296f5eea0cc7a8c568b00035427294812712c6c6081Brian Paul inst++; 297f5eea0cc7a8c568b00035427294812712c6c6081Brian Paul } 298f5eea0cc7a8c568b00035427294812712c6c6081Brian Paul assert(inst->Opcode == OPCODE_END); /* we'll overwrite this inst */ 299f5eea0cc7a8c568b00035427294812712c6c6081Brian Paul 300b2d30ca0cb01a80ff440a4a07b293daa16486e12Roland Scheidegger _mesa_init_instructions(inst, 5); 301f5eea0cc7a8c568b00035427294812712c6c6081Brian Paul 302f5eea0cc7a8c568b00035427294812712c6c6081Brian Paul /* emit instructions to compute fog blending factor */ 303f5eea0cc7a8c568b00035427294812712c6c6081Brian Paul if (fprog->FogOption == GL_LINEAR) { 304b2d30ca0cb01a80ff440a4a07b293daa16486e12Roland Scheidegger /* MAD fogFactorTemp.x, fragment.fogcoord.x, fogPRefOpt.x, fogPRefOpt.y; */ 305b2d30ca0cb01a80ff440a4a07b293daa16486e12Roland Scheidegger inst->Opcode = OPCODE_MAD; 306f5eea0cc7a8c568b00035427294812712c6c6081Brian Paul inst->DstReg.File = PROGRAM_TEMPORARY; 307f5eea0cc7a8c568b00035427294812712c6c6081Brian Paul inst->DstReg.Index = fogFactorTemp; 308f5eea0cc7a8c568b00035427294812712c6c6081Brian Paul inst->DstReg.WriteMask = WRITEMASK_X; 309b2d30ca0cb01a80ff440a4a07b293daa16486e12Roland Scheidegger inst->SrcReg[0].File = PROGRAM_INPUT; 310b2d30ca0cb01a80ff440a4a07b293daa16486e12Roland Scheidegger inst->SrcReg[0].Index = FRAG_ATTRIB_FOGC; 311e0f160663e50d0481afd8a9e1ec90c334be489e1Brian Paul inst->SrcReg[0].Swizzle = SWIZZLE_XXXX; 312f5eea0cc7a8c568b00035427294812712c6c6081Brian Paul inst->SrcReg[1].File = PROGRAM_STATE_VAR; 313b2d30ca0cb01a80ff440a4a07b293daa16486e12Roland Scheidegger inst->SrcReg[1].Index = fogPRefOpt; 314e0f160663e50d0481afd8a9e1ec90c334be489e1Brian Paul inst->SrcReg[1].Swizzle = SWIZZLE_XXXX; 315b2d30ca0cb01a80ff440a4a07b293daa16486e12Roland Scheidegger inst->SrcReg[2].File = PROGRAM_STATE_VAR; 316b2d30ca0cb01a80ff440a4a07b293daa16486e12Roland Scheidegger inst->SrcReg[2].Index = fogPRefOpt; 317e0f160663e50d0481afd8a9e1ec90c334be489e1Brian Paul inst->SrcReg[2].Swizzle = SWIZZLE_YYYY; 3181560de2c3c7f9d4e07b34e805e649769ca5a0cbeBrian inst->SaturateMode = SATURATE_ZERO_ONE; 319f5eea0cc7a8c568b00035427294812712c6c6081Brian Paul inst++; 320f5eea0cc7a8c568b00035427294812712c6c6081Brian Paul } 321f5eea0cc7a8c568b00035427294812712c6c6081Brian Paul else { 322f5eea0cc7a8c568b00035427294812712c6c6081Brian Paul ASSERT(fprog->FogOption == GL_EXP || fprog->FogOption == GL_EXP2); 323b2d30ca0cb01a80ff440a4a07b293daa16486e12Roland Scheidegger /* fogPRefOpt.z = d/ln(2), fogPRefOpt.w = d/sqrt(ln(2) */ 324b2d30ca0cb01a80ff440a4a07b293daa16486e12Roland Scheidegger /* EXP: MUL fogFactorTemp.x, fogPRefOpt.z, fragment.fogcoord.x; */ 325b2d30ca0cb01a80ff440a4a07b293daa16486e12Roland Scheidegger /* EXP2: MUL fogFactorTemp.x, fogPRefOpt.w, fragment.fogcoord.x; */ 326f5eea0cc7a8c568b00035427294812712c6c6081Brian Paul inst->Opcode = OPCODE_MUL; 327f5eea0cc7a8c568b00035427294812712c6c6081Brian Paul inst->DstReg.File = PROGRAM_TEMPORARY; 328f5eea0cc7a8c568b00035427294812712c6c6081Brian Paul inst->DstReg.Index = fogFactorTemp; 329f5eea0cc7a8c568b00035427294812712c6c6081Brian Paul inst->DstReg.WriteMask = WRITEMASK_X; 330f5eea0cc7a8c568b00035427294812712c6c6081Brian Paul inst->SrcReg[0].File = PROGRAM_STATE_VAR; 331b2d30ca0cb01a80ff440a4a07b293daa16486e12Roland Scheidegger inst->SrcReg[0].Index = fogPRefOpt; 332b2d30ca0cb01a80ff440a4a07b293daa16486e12Roland Scheidegger inst->SrcReg[0].Swizzle 333e0f160663e50d0481afd8a9e1ec90c334be489e1Brian Paul = (fprog->FogOption == GL_EXP) ? SWIZZLE_ZZZZ : SWIZZLE_WWWW; 334f5eea0cc7a8c568b00035427294812712c6c6081Brian Paul inst->SrcReg[1].File = PROGRAM_INPUT; 335f5eea0cc7a8c568b00035427294812712c6c6081Brian Paul inst->SrcReg[1].Index = FRAG_ATTRIB_FOGC; 336e0f160663e50d0481afd8a9e1ec90c334be489e1Brian Paul inst->SrcReg[1].Swizzle = SWIZZLE_XXXX; 337f5eea0cc7a8c568b00035427294812712c6c6081Brian Paul inst++; 338f5eea0cc7a8c568b00035427294812712c6c6081Brian Paul if (fprog->FogOption == GL_EXP2) { 339f5eea0cc7a8c568b00035427294812712c6c6081Brian Paul /* MUL fogFactorTemp.x, fogFactorTemp.x, fogFactorTemp.x; */ 340f5eea0cc7a8c568b00035427294812712c6c6081Brian Paul inst->Opcode = OPCODE_MUL; 341f5eea0cc7a8c568b00035427294812712c6c6081Brian Paul inst->DstReg.File = PROGRAM_TEMPORARY; 342f5eea0cc7a8c568b00035427294812712c6c6081Brian Paul inst->DstReg.Index = fogFactorTemp; 343f5eea0cc7a8c568b00035427294812712c6c6081Brian Paul inst->DstReg.WriteMask = WRITEMASK_X; 344f5eea0cc7a8c568b00035427294812712c6c6081Brian Paul inst->SrcReg[0].File = PROGRAM_TEMPORARY; 345f5eea0cc7a8c568b00035427294812712c6c6081Brian Paul inst->SrcReg[0].Index = fogFactorTemp; 346e0f160663e50d0481afd8a9e1ec90c334be489e1Brian Paul inst->SrcReg[0].Swizzle = SWIZZLE_XXXX; 347f5eea0cc7a8c568b00035427294812712c6c6081Brian Paul inst->SrcReg[1].File = PROGRAM_TEMPORARY; 348f5eea0cc7a8c568b00035427294812712c6c6081Brian Paul inst->SrcReg[1].Index = fogFactorTemp; 349e0f160663e50d0481afd8a9e1ec90c334be489e1Brian Paul inst->SrcReg[1].Swizzle = SWIZZLE_XXXX; 350f5eea0cc7a8c568b00035427294812712c6c6081Brian Paul inst++; 351f5eea0cc7a8c568b00035427294812712c6c6081Brian Paul } 352f5eea0cc7a8c568b00035427294812712c6c6081Brian Paul /* EX2_SAT fogFactorTemp.x, -fogFactorTemp.x; */ 353f5eea0cc7a8c568b00035427294812712c6c6081Brian Paul inst->Opcode = OPCODE_EX2; 354f5eea0cc7a8c568b00035427294812712c6c6081Brian Paul inst->DstReg.File = PROGRAM_TEMPORARY; 355f5eea0cc7a8c568b00035427294812712c6c6081Brian Paul inst->DstReg.Index = fogFactorTemp; 356f5eea0cc7a8c568b00035427294812712c6c6081Brian Paul inst->DstReg.WriteMask = WRITEMASK_X; 357f5eea0cc7a8c568b00035427294812712c6c6081Brian Paul inst->SrcReg[0].File = PROGRAM_TEMPORARY; 358f5eea0cc7a8c568b00035427294812712c6c6081Brian Paul inst->SrcReg[0].Index = fogFactorTemp; 3597db7ff878d3e5a6b345228e6eaee4797bb68b360Brian Paul inst->SrcReg[0].Negate = NEGATE_XYZW; 360e0f160663e50d0481afd8a9e1ec90c334be489e1Brian Paul inst->SrcReg[0].Swizzle = SWIZZLE_XXXX; 361f5eea0cc7a8c568b00035427294812712c6c6081Brian Paul inst->SaturateMode = SATURATE_ZERO_ONE; 362f5eea0cc7a8c568b00035427294812712c6c6081Brian Paul inst++; 363f5eea0cc7a8c568b00035427294812712c6c6081Brian Paul } 364f5eea0cc7a8c568b00035427294812712c6c6081Brian Paul /* LRP result.color.xyz, fogFactorTemp.xxxx, colorTemp, fogColorRef; */ 365f5eea0cc7a8c568b00035427294812712c6c6081Brian Paul inst->Opcode = OPCODE_LRP; 366f5eea0cc7a8c568b00035427294812712c6c6081Brian Paul inst->DstReg.File = PROGRAM_OUTPUT; 3678d475822e6e19fa79719c856a2db5b6a205db1b9Brian Paul inst->DstReg.Index = FRAG_RESULT_COLOR; 368f5eea0cc7a8c568b00035427294812712c6c6081Brian Paul inst->DstReg.WriteMask = WRITEMASK_XYZ; 369f5eea0cc7a8c568b00035427294812712c6c6081Brian Paul inst->SrcReg[0].File = PROGRAM_TEMPORARY; 370f5eea0cc7a8c568b00035427294812712c6c6081Brian Paul inst->SrcReg[0].Index = fogFactorTemp; 371e0f160663e50d0481afd8a9e1ec90c334be489e1Brian Paul inst->SrcReg[0].Swizzle = SWIZZLE_XXXX; 372f5eea0cc7a8c568b00035427294812712c6c6081Brian Paul inst->SrcReg[1].File = PROGRAM_TEMPORARY; 373f5eea0cc7a8c568b00035427294812712c6c6081Brian Paul inst->SrcReg[1].Index = colorTemp; 374b2d30ca0cb01a80ff440a4a07b293daa16486e12Roland Scheidegger inst->SrcReg[1].Swizzle = SWIZZLE_NOOP; 375f5eea0cc7a8c568b00035427294812712c6c6081Brian Paul inst->SrcReg[2].File = PROGRAM_STATE_VAR; 376f5eea0cc7a8c568b00035427294812712c6c6081Brian Paul inst->SrcReg[2].Index = fogColorRef; 377b2d30ca0cb01a80ff440a4a07b293daa16486e12Roland Scheidegger inst->SrcReg[2].Swizzle = SWIZZLE_NOOP; 378f5eea0cc7a8c568b00035427294812712c6c6081Brian Paul inst++; 379f5eea0cc7a8c568b00035427294812712c6c6081Brian Paul /* MOV result.color.w, colorTemp.x; # copy alpha */ 380f5eea0cc7a8c568b00035427294812712c6c6081Brian Paul inst->Opcode = OPCODE_MOV; 381f5eea0cc7a8c568b00035427294812712c6c6081Brian Paul inst->DstReg.File = PROGRAM_OUTPUT; 3828d475822e6e19fa79719c856a2db5b6a205db1b9Brian Paul inst->DstReg.Index = FRAG_RESULT_COLOR; 383f5eea0cc7a8c568b00035427294812712c6c6081Brian Paul inst->DstReg.WriteMask = WRITEMASK_W; 384f5eea0cc7a8c568b00035427294812712c6c6081Brian Paul inst->SrcReg[0].File = PROGRAM_TEMPORARY; 385f5eea0cc7a8c568b00035427294812712c6c6081Brian Paul inst->SrcReg[0].Index = colorTemp; 386b2d30ca0cb01a80ff440a4a07b293daa16486e12Roland Scheidegger inst->SrcReg[0].Swizzle = SWIZZLE_NOOP; 387f5eea0cc7a8c568b00035427294812712c6c6081Brian Paul inst++; 388f5eea0cc7a8c568b00035427294812712c6c6081Brian Paul /* END; */ 389f5eea0cc7a8c568b00035427294812712c6c6081Brian Paul inst->Opcode = OPCODE_END; 390f5eea0cc7a8c568b00035427294812712c6c6081Brian Paul inst++; 391f5eea0cc7a8c568b00035427294812712c6c6081Brian Paul 392f5eea0cc7a8c568b00035427294812712c6c6081Brian Paul /* free old instructions */ 3936ca948a303e1af7ae66ea7082af741f6880887f2Brian Paul _mesa_free_instructions(fprog->Base.Instructions, origLen); 394f5eea0cc7a8c568b00035427294812712c6c6081Brian Paul 395f5eea0cc7a8c568b00035427294812712c6c6081Brian Paul /* install new instructions */ 396f5eea0cc7a8c568b00035427294812712c6c6081Brian Paul fprog->Base.Instructions = newInst; 397f5eea0cc7a8c568b00035427294812712c6c6081Brian Paul fprog->Base.NumInstructions = inst - newInst; 398f5eea0cc7a8c568b00035427294812712c6c6081Brian Paul fprog->Base.InputsRead |= FRAG_BIT_FOGC; 399f5eea0cc7a8c568b00035427294812712c6c6081Brian Paul /* XXX do this? fprog->FogOption = GL_NONE; */ 400c6511ab950e2865e606ff13ce87f0ffc782c57adBrian Paul} 401048412473bda3db3e58b9840de5ef82d2ecce3c0Brian 402048412473bda3db3e58b9840de5ef82d2ecce3c0Brian 403048412473bda3db3e58b9840de5ef82d2ecce3c0Brian 404048412473bda3db3e58b9840de5ef82d2ecce3c0Brianstatic GLboolean 405048412473bda3db3e58b9840de5ef82d2ecce3c0Brianis_texture_instruction(const struct prog_instruction *inst) 406048412473bda3db3e58b9840de5ef82d2ecce3c0Brian{ 407048412473bda3db3e58b9840de5ef82d2ecce3c0Brian switch (inst->Opcode) { 408048412473bda3db3e58b9840de5ef82d2ecce3c0Brian case OPCODE_TEX: 409048412473bda3db3e58b9840de5ef82d2ecce3c0Brian case OPCODE_TXB: 410048412473bda3db3e58b9840de5ef82d2ecce3c0Brian case OPCODE_TXD: 411048412473bda3db3e58b9840de5ef82d2ecce3c0Brian case OPCODE_TXL: 412048412473bda3db3e58b9840de5ef82d2ecce3c0Brian case OPCODE_TXP: 413048412473bda3db3e58b9840de5ef82d2ecce3c0Brian case OPCODE_TXP_NV: 414048412473bda3db3e58b9840de5ef82d2ecce3c0Brian return GL_TRUE; 415048412473bda3db3e58b9840de5ef82d2ecce3c0Brian default: 416048412473bda3db3e58b9840de5ef82d2ecce3c0Brian return GL_FALSE; 417048412473bda3db3e58b9840de5ef82d2ecce3c0Brian } 418048412473bda3db3e58b9840de5ef82d2ecce3c0Brian} 419048412473bda3db3e58b9840de5ef82d2ecce3c0Brian 420048412473bda3db3e58b9840de5ef82d2ecce3c0Brian 421048412473bda3db3e58b9840de5ef82d2ecce3c0Brian/** 422048412473bda3db3e58b9840de5ef82d2ecce3c0Brian * Count the number of texure indirections in the given program. 423048412473bda3db3e58b9840de5ef82d2ecce3c0Brian * The program's NumTexIndirections field will be updated. 424048412473bda3db3e58b9840de5ef82d2ecce3c0Brian * See the GL_ARB_fragment_program spec (issue 24) for details. 425048412473bda3db3e58b9840de5ef82d2ecce3c0Brian * XXX we count texture indirections in texenvprogram.c (maybe use this code 426048412473bda3db3e58b9840de5ef82d2ecce3c0Brian * instead and elsewhere). 427048412473bda3db3e58b9840de5ef82d2ecce3c0Brian */ 428048412473bda3db3e58b9840de5ef82d2ecce3c0Brianvoid 429048412473bda3db3e58b9840de5ef82d2ecce3c0Brian_mesa_count_texture_indirections(struct gl_program *prog) 430048412473bda3db3e58b9840de5ef82d2ecce3c0Brian{ 431048412473bda3db3e58b9840de5ef82d2ecce3c0Brian GLuint indirections = 1; 432048412473bda3db3e58b9840de5ef82d2ecce3c0Brian GLbitfield tempsOutput = 0x0; 433048412473bda3db3e58b9840de5ef82d2ecce3c0Brian GLbitfield aluTemps = 0x0; 434048412473bda3db3e58b9840de5ef82d2ecce3c0Brian GLuint i; 435048412473bda3db3e58b9840de5ef82d2ecce3c0Brian 436048412473bda3db3e58b9840de5ef82d2ecce3c0Brian for (i = 0; i < prog->NumInstructions; i++) { 437048412473bda3db3e58b9840de5ef82d2ecce3c0Brian const struct prog_instruction *inst = prog->Instructions + i; 438048412473bda3db3e58b9840de5ef82d2ecce3c0Brian 439048412473bda3db3e58b9840de5ef82d2ecce3c0Brian if (is_texture_instruction(inst)) { 440048412473bda3db3e58b9840de5ef82d2ecce3c0Brian if (((inst->SrcReg[0].File == PROGRAM_TEMPORARY) && 441048412473bda3db3e58b9840de5ef82d2ecce3c0Brian (tempsOutput & (1 << inst->SrcReg[0].Index))) || 442048412473bda3db3e58b9840de5ef82d2ecce3c0Brian ((inst->Opcode != OPCODE_KIL) && 443048412473bda3db3e58b9840de5ef82d2ecce3c0Brian (inst->DstReg.File == PROGRAM_TEMPORARY) && 444048412473bda3db3e58b9840de5ef82d2ecce3c0Brian (aluTemps & (1 << inst->DstReg.Index)))) 445048412473bda3db3e58b9840de5ef82d2ecce3c0Brian { 446048412473bda3db3e58b9840de5ef82d2ecce3c0Brian indirections++; 447048412473bda3db3e58b9840de5ef82d2ecce3c0Brian tempsOutput = 0x0; 448048412473bda3db3e58b9840de5ef82d2ecce3c0Brian aluTemps = 0x0; 449048412473bda3db3e58b9840de5ef82d2ecce3c0Brian } 450048412473bda3db3e58b9840de5ef82d2ecce3c0Brian } 451048412473bda3db3e58b9840de5ef82d2ecce3c0Brian else { 452048412473bda3db3e58b9840de5ef82d2ecce3c0Brian GLuint j; 453048412473bda3db3e58b9840de5ef82d2ecce3c0Brian for (j = 0; j < 3; j++) { 454048412473bda3db3e58b9840de5ef82d2ecce3c0Brian if (inst->SrcReg[j].File == PROGRAM_TEMPORARY) 455048412473bda3db3e58b9840de5ef82d2ecce3c0Brian aluTemps |= (1 << inst->SrcReg[j].Index); 456048412473bda3db3e58b9840de5ef82d2ecce3c0Brian } 457048412473bda3db3e58b9840de5ef82d2ecce3c0Brian if (inst->DstReg.File == PROGRAM_TEMPORARY) 458048412473bda3db3e58b9840de5ef82d2ecce3c0Brian aluTemps |= (1 << inst->DstReg.Index); 459048412473bda3db3e58b9840de5ef82d2ecce3c0Brian } 460048412473bda3db3e58b9840de5ef82d2ecce3c0Brian 461048412473bda3db3e58b9840de5ef82d2ecce3c0Brian if ((inst->Opcode != OPCODE_KIL) && (inst->DstReg.File == PROGRAM_TEMPORARY)) 462048412473bda3db3e58b9840de5ef82d2ecce3c0Brian tempsOutput |= (1 << inst->DstReg.Index); 463048412473bda3db3e58b9840de5ef82d2ecce3c0Brian } 464048412473bda3db3e58b9840de5ef82d2ecce3c0Brian 465048412473bda3db3e58b9840de5ef82d2ecce3c0Brian prog->NumTexIndirections = indirections; 466048412473bda3db3e58b9840de5ef82d2ecce3c0Brian} 467048412473bda3db3e58b9840de5ef82d2ecce3c0Brian 468048412473bda3db3e58b9840de5ef82d2ecce3c0Brian 469048412473bda3db3e58b9840de5ef82d2ecce3c0Brian/** 470048412473bda3db3e58b9840de5ef82d2ecce3c0Brian * Count number of texture instructions in given program and update the 471048412473bda3db3e58b9840de5ef82d2ecce3c0Brian * program's NumTexInstructions field. 472048412473bda3db3e58b9840de5ef82d2ecce3c0Brian */ 473048412473bda3db3e58b9840de5ef82d2ecce3c0Brianvoid 474048412473bda3db3e58b9840de5ef82d2ecce3c0Brian_mesa_count_texture_instructions(struct gl_program *prog) 475048412473bda3db3e58b9840de5ef82d2ecce3c0Brian{ 476048412473bda3db3e58b9840de5ef82d2ecce3c0Brian GLuint i; 477048412473bda3db3e58b9840de5ef82d2ecce3c0Brian prog->NumTexInstructions = 0; 478048412473bda3db3e58b9840de5ef82d2ecce3c0Brian for (i = 0; i < prog->NumInstructions; i++) { 479048412473bda3db3e58b9840de5ef82d2ecce3c0Brian prog->NumTexInstructions += is_texture_instruction(prog->Instructions + i); 480048412473bda3db3e58b9840de5ef82d2ecce3c0Brian } 481048412473bda3db3e58b9840de5ef82d2ecce3c0Brian} 482048412473bda3db3e58b9840de5ef82d2ecce3c0Brian 4836ca948a303e1af7ae66ea7082af741f6880887f2Brian Paul 4846ca948a303e1af7ae66ea7082af741f6880887f2Brian Paul/** 485928ec5cd3be5c7d6f3d9df0ace18371b1ec8c68cZack Rusin * Scan/rewrite program to remove reads of custom (output) registers. 4861f4997c2aaf424c8a12cc6fdb1dd994f66074a1dBrian Paul * The passed type has to be either PROGRAM_OUTPUT or PROGRAM_VARYING 4871f4997c2aaf424c8a12cc6fdb1dd994f66074a1dBrian Paul * (for vertex shaders). 4881f4997c2aaf424c8a12cc6fdb1dd994f66074a1dBrian Paul * In GLSL shaders, varying vars can be read and written. 4896ca948a303e1af7ae66ea7082af741f6880887f2Brian Paul * On some hardware, trying to read an output register causes trouble. 4906ca948a303e1af7ae66ea7082af741f6880887f2Brian Paul * So, rewrite the program to use a temporary register in this case. 4916ca948a303e1af7ae66ea7082af741f6880887f2Brian Paul */ 4926ca948a303e1af7ae66ea7082af741f6880887f2Brian Paulvoid 493b4026d9be828bd0b6f60158456edf24994efb053Brian Paul_mesa_remove_output_reads(struct gl_program *prog, gl_register_file type) 4946ca948a303e1af7ae66ea7082af741f6880887f2Brian Paul{ 4956ca948a303e1af7ae66ea7082af741f6880887f2Brian Paul GLuint i; 4966ca948a303e1af7ae66ea7082af741f6880887f2Brian Paul GLint outputMap[VERT_RESULT_MAX]; 4976ca948a303e1af7ae66ea7082af741f6880887f2Brian Paul GLuint numVaryingReads = 0; 4986ca948a303e1af7ae66ea7082af741f6880887f2Brian Paul 49995b34baa8f981b08e21a36f9163d98a426559839Zack Rusin assert(type == PROGRAM_VARYING || type == PROGRAM_OUTPUT); 5001f4997c2aaf424c8a12cc6fdb1dd994f66074a1dBrian Paul assert(prog->Target == GL_VERTEX_PROGRAM_ARB || type != PROGRAM_VARYING); 5016ca948a303e1af7ae66ea7082af741f6880887f2Brian Paul 5026ca948a303e1af7ae66ea7082af741f6880887f2Brian Paul for (i = 0; i < VERT_RESULT_MAX; i++) 5036ca948a303e1af7ae66ea7082af741f6880887f2Brian Paul outputMap[i] = -1; 5046ca948a303e1af7ae66ea7082af741f6880887f2Brian Paul 5056ca948a303e1af7ae66ea7082af741f6880887f2Brian Paul /* look for instructions which read from varying vars */ 5066ca948a303e1af7ae66ea7082af741f6880887f2Brian Paul for (i = 0; i < prog->NumInstructions; i++) { 5076ca948a303e1af7ae66ea7082af741f6880887f2Brian Paul struct prog_instruction *inst = prog->Instructions + i; 5086ca948a303e1af7ae66ea7082af741f6880887f2Brian Paul const GLuint numSrc = _mesa_num_inst_src_regs(inst->Opcode); 5096ca948a303e1af7ae66ea7082af741f6880887f2Brian Paul GLuint j; 5106ca948a303e1af7ae66ea7082af741f6880887f2Brian Paul for (j = 0; j < numSrc; j++) { 511928ec5cd3be5c7d6f3d9df0ace18371b1ec8c68cZack Rusin if (inst->SrcReg[j].File == type) { 5126ca948a303e1af7ae66ea7082af741f6880887f2Brian Paul /* replace the read with a temp reg */ 5136ca948a303e1af7ae66ea7082af741f6880887f2Brian Paul const GLuint var = inst->SrcReg[j].Index; 5146ca948a303e1af7ae66ea7082af741f6880887f2Brian Paul if (outputMap[var] == -1) { 5156ca948a303e1af7ae66ea7082af741f6880887f2Brian Paul numVaryingReads++; 5166ca948a303e1af7ae66ea7082af741f6880887f2Brian Paul outputMap[var] = _mesa_find_free_register(prog, 5176ca948a303e1af7ae66ea7082af741f6880887f2Brian Paul PROGRAM_TEMPORARY); 5186ca948a303e1af7ae66ea7082af741f6880887f2Brian Paul } 5196ca948a303e1af7ae66ea7082af741f6880887f2Brian Paul inst->SrcReg[j].File = PROGRAM_TEMPORARY; 5206ca948a303e1af7ae66ea7082af741f6880887f2Brian Paul inst->SrcReg[j].Index = outputMap[var]; 5216ca948a303e1af7ae66ea7082af741f6880887f2Brian Paul } 5226ca948a303e1af7ae66ea7082af741f6880887f2Brian Paul } 5236ca948a303e1af7ae66ea7082af741f6880887f2Brian Paul } 5246ca948a303e1af7ae66ea7082af741f6880887f2Brian Paul 5256ca948a303e1af7ae66ea7082af741f6880887f2Brian Paul if (numVaryingReads == 0) 5266ca948a303e1af7ae66ea7082af741f6880887f2Brian Paul return; /* nothing to be done */ 5276ca948a303e1af7ae66ea7082af741f6880887f2Brian Paul 5286ca948a303e1af7ae66ea7082af741f6880887f2Brian Paul /* look for instructions which write to the varying vars identified above */ 5296ca948a303e1af7ae66ea7082af741f6880887f2Brian Paul for (i = 0; i < prog->NumInstructions; i++) { 5306ca948a303e1af7ae66ea7082af741f6880887f2Brian Paul struct prog_instruction *inst = prog->Instructions + i; 5316ca948a303e1af7ae66ea7082af741f6880887f2Brian Paul const GLuint numSrc = _mesa_num_inst_src_regs(inst->Opcode); 5326ca948a303e1af7ae66ea7082af741f6880887f2Brian Paul GLuint j; 5336ca948a303e1af7ae66ea7082af741f6880887f2Brian Paul for (j = 0; j < numSrc; j++) { 534928ec5cd3be5c7d6f3d9df0ace18371b1ec8c68cZack Rusin if (inst->DstReg.File == type && 5356ca948a303e1af7ae66ea7082af741f6880887f2Brian Paul outputMap[inst->DstReg.Index] >= 0) { 5366ca948a303e1af7ae66ea7082af741f6880887f2Brian Paul /* change inst to write to the temp reg, instead of the varying */ 5376ca948a303e1af7ae66ea7082af741f6880887f2Brian Paul inst->DstReg.File = PROGRAM_TEMPORARY; 5386ca948a303e1af7ae66ea7082af741f6880887f2Brian Paul inst->DstReg.Index = outputMap[inst->DstReg.Index]; 5396ca948a303e1af7ae66ea7082af741f6880887f2Brian Paul } 5406ca948a303e1af7ae66ea7082af741f6880887f2Brian Paul } 5416ca948a303e1af7ae66ea7082af741f6880887f2Brian Paul } 5426ca948a303e1af7ae66ea7082af741f6880887f2Brian Paul 5436ca948a303e1af7ae66ea7082af741f6880887f2Brian Paul /* insert new instructions to copy the temp vars to the varying vars */ 5446ca948a303e1af7ae66ea7082af741f6880887f2Brian Paul { 5456ca948a303e1af7ae66ea7082af741f6880887f2Brian Paul struct prog_instruction *inst; 5466ca948a303e1af7ae66ea7082af741f6880887f2Brian Paul GLint endPos, var; 5476ca948a303e1af7ae66ea7082af741f6880887f2Brian Paul 5486ca948a303e1af7ae66ea7082af741f6880887f2Brian Paul /* Look for END instruction and insert the new varying writes */ 5496ca948a303e1af7ae66ea7082af741f6880887f2Brian Paul endPos = -1; 5506ca948a303e1af7ae66ea7082af741f6880887f2Brian Paul for (i = 0; i < prog->NumInstructions; i++) { 5516ca948a303e1af7ae66ea7082af741f6880887f2Brian Paul struct prog_instruction *inst = prog->Instructions + i; 5526ca948a303e1af7ae66ea7082af741f6880887f2Brian Paul if (inst->Opcode == OPCODE_END) { 5536ca948a303e1af7ae66ea7082af741f6880887f2Brian Paul endPos = i; 5546ca948a303e1af7ae66ea7082af741f6880887f2Brian Paul _mesa_insert_instructions(prog, i, numVaryingReads); 5556ca948a303e1af7ae66ea7082af741f6880887f2Brian Paul break; 5566ca948a303e1af7ae66ea7082af741f6880887f2Brian Paul } 5576ca948a303e1af7ae66ea7082af741f6880887f2Brian Paul } 5586ca948a303e1af7ae66ea7082af741f6880887f2Brian Paul 5596ca948a303e1af7ae66ea7082af741f6880887f2Brian Paul assert(endPos >= 0); 5606ca948a303e1af7ae66ea7082af741f6880887f2Brian Paul 5616ca948a303e1af7ae66ea7082af741f6880887f2Brian Paul /* insert new MOV instructions here */ 5626ca948a303e1af7ae66ea7082af741f6880887f2Brian Paul inst = prog->Instructions + endPos; 5636ca948a303e1af7ae66ea7082af741f6880887f2Brian Paul for (var = 0; var < VERT_RESULT_MAX; var++) { 5646ca948a303e1af7ae66ea7082af741f6880887f2Brian Paul if (outputMap[var] >= 0) { 5656ca948a303e1af7ae66ea7082af741f6880887f2Brian Paul /* MOV VAR[var], TEMP[tmp]; */ 5666ca948a303e1af7ae66ea7082af741f6880887f2Brian Paul inst->Opcode = OPCODE_MOV; 567928ec5cd3be5c7d6f3d9df0ace18371b1ec8c68cZack Rusin inst->DstReg.File = type; 5686ca948a303e1af7ae66ea7082af741f6880887f2Brian Paul inst->DstReg.Index = var; 5696ca948a303e1af7ae66ea7082af741f6880887f2Brian Paul inst->SrcReg[0].File = PROGRAM_TEMPORARY; 5706ca948a303e1af7ae66ea7082af741f6880887f2Brian Paul inst->SrcReg[0].Index = outputMap[var]; 5716ca948a303e1af7ae66ea7082af741f6880887f2Brian Paul inst++; 5726ca948a303e1af7ae66ea7082af741f6880887f2Brian Paul } 5736ca948a303e1af7ae66ea7082af741f6880887f2Brian Paul } 5746ca948a303e1af7ae66ea7082af741f6880887f2Brian Paul } 5756ca948a303e1af7ae66ea7082af741f6880887f2Brian Paul} 576