vl_idct.c revision 19bcd21ed151cf1716f2f87dff0f712231aa2ce7
/**************************************************************************
 *
 * Copyright 2010 Christian König
 * All Rights Reserved.
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the
 * "Software"), to deal in the Software without restriction, including
 * without limitation the rights to use, copy, modify, merge, publish,
 * distribute, sub license, and/or sell copies of the Software, and to
 * permit persons to whom the Software is furnished to do so, subject to
 * the following conditions:
 *
 * The above copyright notice and this permission notice (including the
 * next paragraph) shall be included in all copies or substantial portions
 * of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
 * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT.
 * IN NO EVENT SHALL TUNGSTEN GRAPHICS AND/OR ITS SUPPLIERS BE LIABLE FOR
 * ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
 * TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
 * SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
 *
 **************************************************************************/

#include <assert.h>

#include "pipe/p_context.h"
#include "pipe/p_screen.h"

#include "util/u_draw.h"
#include "util/u_sampler.h"
#include "util/u_memory.h"

#include "tgsi/tgsi_ureg.h"
385ed848129cb57269e80caf2c1ca522ae41f4500bChristian König 395ed848129cb57269e80caf2c1ca522ae41f4500bChristian König#include "vl_defines.h" 40508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König#include "vl_types.h" 415ed848129cb57269e80caf2c1ca522ae41f4500bChristian König#include "vl_vertex_buffers.h" 425ed848129cb57269e80caf2c1ca522ae41f4500bChristian König#include "vl_idct.h" 43508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König 44508a4a056c3140dc1f90b93acd46c06c30f7094eChristian Königenum VS_OUTPUT 45508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König{ 46508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König VS_O_VPOS, 47be4de05c1093db27b3fca12b782055ab8a1eba13Christian König VS_O_L_ADDR0, 48be4de05c1093db27b3fca12b782055ab8a1eba13Christian König VS_O_L_ADDR1, 49be4de05c1093db27b3fca12b782055ab8a1eba13Christian König VS_O_R_ADDR0, 50be4de05c1093db27b3fca12b782055ab8a1eba13Christian König VS_O_R_ADDR1 51508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König}; 52508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König 533e976ef31a27ca9a23372f4364955f0f0a5c4ef4Christian König/** 543e976ef31a27ca9a23372f4364955f0f0a5c4ef4Christian König * The DCT matrix stored as hex representation of floats. 
Equal to the following equation: 553e976ef31a27ca9a23372f4364955f0f0a5c4ef4Christian König * for (i = 0; i < 8; ++i) 563e976ef31a27ca9a23372f4364955f0f0a5c4ef4Christian König * for (j = 0; j < 8; ++j) 573e976ef31a27ca9a23372f4364955f0f0a5c4ef4Christian König * if (i == 0) const_matrix[i][j] = 1.0f / sqrtf(8.0f); 583e976ef31a27ca9a23372f4364955f0f0a5c4ef4Christian König * else const_matrix[i][j] = sqrtf(2.0f / 8.0f) * cosf((2 * j + 1) * i * M_PI / (2.0f * 8.0f)); 593e976ef31a27ca9a23372f4364955f0f0a5c4ef4Christian König */ 603e976ef31a27ca9a23372f4364955f0f0a5c4ef4Christian Königstatic const uint32_t const_matrix[8][8] = { 613e976ef31a27ca9a23372f4364955f0f0a5c4ef4Christian König { 0x3eb504f3, 0x3eb504f3, 0x3eb504f3, 0x3eb504f3, 0x3eb504f3, 0x3eb504f3, 0x3eb504f3, 0x3eb504f3 }, 623e976ef31a27ca9a23372f4364955f0f0a5c4ef4Christian König { 0x3efb14be, 0x3ed4db31, 0x3e8e39da, 0x3dc7c5c4, 0xbdc7c5c2, 0xbe8e39d9, 0xbed4db32, 0xbefb14bf }, 633e976ef31a27ca9a23372f4364955f0f0a5c4ef4Christian König { 0x3eec835f, 0x3e43ef15, 0xbe43ef14, 0xbeec835e, 0xbeec835f, 0xbe43ef1a, 0x3e43ef1b, 0x3eec835f }, 643e976ef31a27ca9a23372f4364955f0f0a5c4ef4Christian König { 0x3ed4db31, 0xbdc7c5c2, 0xbefb14bf, 0xbe8e39dd, 0x3e8e39d7, 0x3efb14bf, 0x3dc7c5d0, 0xbed4db34 }, 653e976ef31a27ca9a23372f4364955f0f0a5c4ef4Christian König { 0x3eb504f3, 0xbeb504f3, 0xbeb504f4, 0x3eb504f1, 0x3eb504f3, 0xbeb504f0, 0xbeb504ef, 0x3eb504f4 }, 663e976ef31a27ca9a23372f4364955f0f0a5c4ef4Christian König { 0x3e8e39da, 0xbefb14bf, 0x3dc7c5c8, 0x3ed4db32, 0xbed4db34, 0xbdc7c5bb, 0x3efb14bf, 0xbe8e39d7 }, 673e976ef31a27ca9a23372f4364955f0f0a5c4ef4Christian König { 0x3e43ef15, 0xbeec835f, 0x3eec835f, 0xbe43ef07, 0xbe43ef23, 0x3eec8361, 0xbeec835c, 0x3e43ef25 }, 683e976ef31a27ca9a23372f4364955f0f0a5c4ef4Christian König { 0x3dc7c5c4, 0xbe8e39dd, 0x3ed4db32, 0xbefb14c0, 0x3efb14be, 0xbed4db31, 0x3e8e39ce, 0xbdc7c596 }, 69508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König}; 
70508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König 71be4de05c1093db27b3fca12b782055ab8a1eba13Christian Königstatic void 72be4de05c1093db27b3fca12b782055ab8a1eba13Christian Königcalc_addr(struct ureg_program *shader, struct ureg_dst addr[2], 73be4de05c1093db27b3fca12b782055ab8a1eba13Christian König struct ureg_src tc, struct ureg_src start, bool right_side, 74be4de05c1093db27b3fca12b782055ab8a1eba13Christian König bool transposed, float size) 75be4de05c1093db27b3fca12b782055ab8a1eba13Christian König{ 76be4de05c1093db27b3fca12b782055ab8a1eba13Christian König unsigned wm_start = (right_side == transposed) ? TGSI_WRITEMASK_X : TGSI_WRITEMASK_Y; 77be4de05c1093db27b3fca12b782055ab8a1eba13Christian König unsigned sw_start = right_side ? TGSI_SWIZZLE_Y : TGSI_SWIZZLE_X; 78be4de05c1093db27b3fca12b782055ab8a1eba13Christian König 79be4de05c1093db27b3fca12b782055ab8a1eba13Christian König unsigned wm_tc = (right_side == transposed) ? TGSI_WRITEMASK_Y : TGSI_WRITEMASK_X; 80be4de05c1093db27b3fca12b782055ab8a1eba13Christian König unsigned sw_tc = right_side ? TGSI_SWIZZLE_X : TGSI_SWIZZLE_Y; 81be4de05c1093db27b3fca12b782055ab8a1eba13Christian König 82be4de05c1093db27b3fca12b782055ab8a1eba13Christian König /* 83be4de05c1093db27b3fca12b782055ab8a1eba13Christian König * addr[0..1].(start) = right_side ? start.x : tc.x 84be4de05c1093db27b3fca12b782055ab8a1eba13Christian König * addr[0..1].(tc) = right_side ? 
tc.y : start.y 85be4de05c1093db27b3fca12b782055ab8a1eba13Christian König * addr[0..1].z = tc.z 86be4de05c1093db27b3fca12b782055ab8a1eba13Christian König * addr[1].(start) += 1.0f / scale 87be4de05c1093db27b3fca12b782055ab8a1eba13Christian König */ 88be4de05c1093db27b3fca12b782055ab8a1eba13Christian König ureg_MOV(shader, ureg_writemask(addr[0], wm_start), ureg_scalar(start, sw_start)); 89be4de05c1093db27b3fca12b782055ab8a1eba13Christian König ureg_MOV(shader, ureg_writemask(addr[0], wm_tc), ureg_scalar(tc, sw_tc)); 90be4de05c1093db27b3fca12b782055ab8a1eba13Christian König 91be4de05c1093db27b3fca12b782055ab8a1eba13Christian König ureg_ADD(shader, ureg_writemask(addr[1], wm_start), ureg_scalar(start, sw_start), ureg_imm1f(shader, 1.0f / size)); 92be4de05c1093db27b3fca12b782055ab8a1eba13Christian König ureg_MOV(shader, ureg_writemask(addr[1], wm_tc), ureg_scalar(tc, sw_tc)); 93be4de05c1093db27b3fca12b782055ab8a1eba13Christian König} 94be4de05c1093db27b3fca12b782055ab8a1eba13Christian König 957f04fe5338d0846ec9a6003033da5357d2785c8bChristian Königstatic void 967f04fe5338d0846ec9a6003033da5357d2785c8bChristian Königincrement_addr(struct ureg_program *shader, struct ureg_dst daddr[2], 977f04fe5338d0846ec9a6003033da5357d2785c8bChristian König struct ureg_src saddr[2], bool right_side, bool transposed, 987f04fe5338d0846ec9a6003033da5357d2785c8bChristian König int pos, float size) 997f04fe5338d0846ec9a6003033da5357d2785c8bChristian König{ 1007f04fe5338d0846ec9a6003033da5357d2785c8bChristian König unsigned wm_start = (right_side == transposed) ? TGSI_WRITEMASK_X : TGSI_WRITEMASK_Y; 1017f04fe5338d0846ec9a6003033da5357d2785c8bChristian König unsigned wm_tc = (right_side == transposed) ? 
TGSI_WRITEMASK_Y : TGSI_WRITEMASK_X; 1027f04fe5338d0846ec9a6003033da5357d2785c8bChristian König 1037f04fe5338d0846ec9a6003033da5357d2785c8bChristian König /* 1047f04fe5338d0846ec9a6003033da5357d2785c8bChristian König * daddr[0..1].(start) = saddr[0..1].(start) 1057f04fe5338d0846ec9a6003033da5357d2785c8bChristian König * daddr[0..1].(tc) = saddr[0..1].(tc) 1067f04fe5338d0846ec9a6003033da5357d2785c8bChristian König */ 1077f04fe5338d0846ec9a6003033da5357d2785c8bChristian König 1087f04fe5338d0846ec9a6003033da5357d2785c8bChristian König ureg_MOV(shader, ureg_writemask(daddr[0], wm_start), saddr[0]); 1097f04fe5338d0846ec9a6003033da5357d2785c8bChristian König ureg_ADD(shader, ureg_writemask(daddr[0], wm_tc), saddr[0], ureg_imm1f(shader, pos / size)); 1107f04fe5338d0846ec9a6003033da5357d2785c8bChristian König ureg_MOV(shader, ureg_writemask(daddr[1], wm_start), saddr[1]); 1117f04fe5338d0846ec9a6003033da5357d2785c8bChristian König ureg_ADD(shader, ureg_writemask(daddr[1], wm_tc), saddr[1], ureg_imm1f(shader, pos / size)); 1127f04fe5338d0846ec9a6003033da5357d2785c8bChristian König} 1137f04fe5338d0846ec9a6003033da5357d2785c8bChristian König 1147f04fe5338d0846ec9a6003033da5357d2785c8bChristian Königstatic void 115b4837a53d365bd1bd5f50b3fb40910eeaac869a5Christian Königfetch_four(struct ureg_program *shader, struct ureg_dst m[2], struct ureg_src addr[2], 116b4837a53d365bd1bd5f50b3fb40910eeaac869a5Christian König struct ureg_src sampler, bool resource3d) 1177f04fe5338d0846ec9a6003033da5357d2785c8bChristian König{ 118b4837a53d365bd1bd5f50b3fb40910eeaac869a5Christian König ureg_TEX(shader, m[0], resource3d ? TGSI_TEXTURE_3D : TGSI_TEXTURE_2D, addr[0], sampler); 119b4837a53d365bd1bd5f50b3fb40910eeaac869a5Christian König ureg_TEX(shader, m[1], resource3d ? 
TGSI_TEXTURE_3D : TGSI_TEXTURE_2D, addr[1], sampler); 1207f04fe5338d0846ec9a6003033da5357d2785c8bChristian König} 1217f04fe5338d0846ec9a6003033da5357d2785c8bChristian König 1227f04fe5338d0846ec9a6003033da5357d2785c8bChristian Königstatic void 1237f04fe5338d0846ec9a6003033da5357d2785c8bChristian Königmatrix_mul(struct ureg_program *shader, struct ureg_dst dst, struct ureg_dst l[2], struct ureg_dst r[2]) 1247f04fe5338d0846ec9a6003033da5357d2785c8bChristian König{ 1257f04fe5338d0846ec9a6003033da5357d2785c8bChristian König struct ureg_dst tmp; 1267f04fe5338d0846ec9a6003033da5357d2785c8bChristian König 1277f04fe5338d0846ec9a6003033da5357d2785c8bChristian König tmp = ureg_DECL_temporary(shader); 1287f04fe5338d0846ec9a6003033da5357d2785c8bChristian König 1297f04fe5338d0846ec9a6003033da5357d2785c8bChristian König /* 1307f04fe5338d0846ec9a6003033da5357d2785c8bChristian König * tmp.xy = dot4(m[0][0..1], m[1][0..1]) 1317f04fe5338d0846ec9a6003033da5357d2785c8bChristian König * dst = tmp.x + tmp.y 1327f04fe5338d0846ec9a6003033da5357d2785c8bChristian König */ 1337f04fe5338d0846ec9a6003033da5357d2785c8bChristian König ureg_DP4(shader, ureg_writemask(tmp, TGSI_WRITEMASK_X), ureg_src(l[0]), ureg_src(r[0])); 1347f04fe5338d0846ec9a6003033da5357d2785c8bChristian König ureg_DP4(shader, ureg_writemask(tmp, TGSI_WRITEMASK_Y), ureg_src(l[1]), ureg_src(r[1])); 1357f04fe5338d0846ec9a6003033da5357d2785c8bChristian König ureg_ADD(shader, dst, 1367f04fe5338d0846ec9a6003033da5357d2785c8bChristian König ureg_scalar(ureg_src(tmp), TGSI_SWIZZLE_X), 1377f04fe5338d0846ec9a6003033da5357d2785c8bChristian König ureg_scalar(ureg_src(tmp), TGSI_SWIZZLE_Y)); 1387f04fe5338d0846ec9a6003033da5357d2785c8bChristian König 1397f04fe5338d0846ec9a6003033da5357d2785c8bChristian König ureg_release_temporary(shader, tmp); 1407f04fe5338d0846ec9a6003033da5357d2785c8bChristian König} 1417f04fe5338d0846ec9a6003033da5357d2785c8bChristian König 142508a4a056c3140dc1f90b93acd46c06c30f7094eChristian Königstatic void * 
143ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian Königcreate_mismatch_vert_shader(struct vl_idct *idct) 144ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König{ 145ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König struct ureg_program *shader; 1462d960d3f4e8fcf7819bb94ba4913ec0a2a723daaMarek Olšák struct ureg_src vpos; 147ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König struct ureg_src scale; 148ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König struct ureg_dst t_tex; 149ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König struct ureg_dst o_vpos, o_addr[2]; 150ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König 151ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König shader = ureg_create(TGSI_PROCESSOR_VERTEX); 152ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König if (!shader) 153ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König return NULL; 154ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König 155ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König vpos = ureg_DECL_vs_input(shader, VS_I_VPOS); 156ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König 157ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König t_tex = ureg_DECL_temporary(shader); 158ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König 159ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König o_vpos = ureg_DECL_output(shader, TGSI_SEMANTIC_POSITION, VS_O_VPOS); 160ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König 161ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König o_addr[0] = ureg_DECL_output(shader, TGSI_SEMANTIC_GENERIC, VS_O_L_ADDR0); 162ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König o_addr[1] = ureg_DECL_output(shader, TGSI_SEMANTIC_GENERIC, VS_O_L_ADDR1); 163ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König 164ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König /* 165ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König * scale = (BLOCK_WIDTH, BLOCK_HEIGHT) / (dst.width, dst.height) 
166ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König * 167ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König * t_vpos = vpos + 7 / BLOCK_WIDTH 168ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König * o_vpos.xy = t_vpos * scale 169ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König * 170ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König * o_addr = calc_addr(...) 171ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König * 172ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König */ 173ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König 174ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König scale = ureg_imm2f(shader, 175ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König (float)BLOCK_WIDTH / idct->buffer_width, 176ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König (float)BLOCK_HEIGHT / idct->buffer_height); 177ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König 178ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König ureg_MAD(shader, ureg_writemask(o_vpos, TGSI_WRITEMASK_XY), vpos, scale, scale); 179ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König ureg_MOV(shader, ureg_writemask(o_vpos, TGSI_WRITEMASK_ZW), ureg_imm1f(shader, 1.0f)); 180ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König 181ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König ureg_MUL(shader, ureg_writemask(t_tex, TGSI_WRITEMASK_XY), vpos, scale); 182ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König calc_addr(shader, o_addr, ureg_src(t_tex), ureg_src(t_tex), false, false, idct->buffer_width / 4); 183ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König 184ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König ureg_release_temporary(shader, t_tex); 185ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König 186ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König ureg_END(shader); 187ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König 188ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König return 
ureg_create_shader_and_destroy(shader, idct->pipe); 189ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König} 190ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König 191ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian Königstatic void * 192ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian Königcreate_mismatch_frag_shader(struct vl_idct *idct) 193ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König{ 194ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König struct ureg_program *shader; 195ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König 196ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König struct ureg_src addr[2]; 197ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König 198ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König struct ureg_dst m[8][2]; 199ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König struct ureg_dst fragment; 200ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König 201ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König unsigned i; 202ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König 203ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König shader = ureg_create(TGSI_PROCESSOR_FRAGMENT); 204ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König if (!shader) 205ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König return NULL; 206ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König 207ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König addr[0] = ureg_DECL_fs_input(shader, TGSI_SEMANTIC_GENERIC, VS_O_L_ADDR0, TGSI_INTERPOLATE_LINEAR); 208ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König addr[1] = ureg_DECL_fs_input(shader, TGSI_SEMANTIC_GENERIC, VS_O_L_ADDR1, TGSI_INTERPOLATE_LINEAR); 209ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König 210ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König fragment = ureg_DECL_output(shader, TGSI_SEMANTIC_COLOR, 0); 211ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König 212ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König for (i = 0; i < 
8; ++i) { 213ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König m[i][0] = ureg_DECL_temporary(shader); 214ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König m[i][1] = ureg_DECL_temporary(shader); 215ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König } 216ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König 217ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König for (i = 0; i < 8; ++i) { 218ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König increment_addr(shader, m[i], addr, false, false, i, idct->buffer_height); 219ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König } 220ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König 221ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König for (i = 0; i < 8; ++i) { 2223cf22a0c6e215535266e7a7fac5ddd2404d4345dVinson Lee struct ureg_src s_addr[2]; 2233cf22a0c6e215535266e7a7fac5ddd2404d4345dVinson Lee s_addr[0] = ureg_src(m[i][0]); 2243cf22a0c6e215535266e7a7fac5ddd2404d4345dVinson Lee s_addr[1] = ureg_src(m[i][1]); 225ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König fetch_four(shader, m[i], s_addr, ureg_DECL_sampler(shader, 0), false); 226ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König } 227ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König 228ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König for (i = 1; i < 8; ++i) { 229ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König ureg_ADD(shader, m[0][0], ureg_src(m[0][0]), ureg_src(m[i][0])); 230ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König ureg_ADD(shader, m[0][1], ureg_src(m[0][1]), ureg_src(m[i][1])); 231ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König } 232ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König 233ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König ureg_ADD(shader, m[0][0], ureg_src(m[0][0]), ureg_src(m[0][1])); 234ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König ureg_DP4(shader, m[0][0], ureg_abs(ureg_src(m[0][0])), ureg_imm1f(shader, 1 << 14)); 
235ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König 236ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König ureg_MUL(shader, ureg_writemask(m[0][0], TGSI_WRITEMASK_W), ureg_abs(ureg_src(m[7][1])), ureg_imm1f(shader, 1 << 14)); 237ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König ureg_FRC(shader, m[0][0], ureg_src(m[0][0])); 238ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König ureg_SGT(shader, m[0][0], ureg_imm1f(shader, 0.5f), ureg_abs(ureg_src(m[0][0]))); 239ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König 240ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König ureg_CMP(shader, ureg_writemask(m[0][0], TGSI_WRITEMASK_W), ureg_negate(ureg_src(m[0][0])), 241ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König ureg_imm1f(shader, 1.0f / (1 << 15)), ureg_imm1f(shader, -1.0f / (1 << 15))); 242ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König ureg_MUL(shader, ureg_writemask(m[0][0], TGSI_WRITEMASK_W), ureg_src(m[0][0]), 243ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König ureg_scalar(ureg_src(m[0][0]), TGSI_SWIZZLE_X)); 244ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König 245ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König ureg_MOV(shader, ureg_writemask(fragment, TGSI_WRITEMASK_XYZ), ureg_src(m[7][1])); 246ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König ureg_ADD(shader, ureg_writemask(fragment, TGSI_WRITEMASK_W), ureg_src(m[0][0]), ureg_src(m[7][1])); 247ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König 248ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König for (i = 0; i < 8; ++i) { 249ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König ureg_release_temporary(shader, m[i][0]); 250ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König ureg_release_temporary(shader, m[i][1]); 251ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König } 252ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König 253ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König ureg_END(shader); 
254ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König 255ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König return ureg_create_shader_and_destroy(shader, idct->pipe); 256ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König} 257ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König 258ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian Königstatic void * 2597f04fe5338d0846ec9a6003033da5357d2785c8bChristian Königcreate_stage1_vert_shader(struct vl_idct *idct) 260508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König{ 261508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König struct ureg_program *shader; 2623511780a43077d1359bd491eadb4ab9b3b86795aChristian König struct ureg_src vrect, vpos; 2633511780a43077d1359bd491eadb4ab9b3b86795aChristian König struct ureg_src scale; 264be4de05c1093db27b3fca12b782055ab8a1eba13Christian König struct ureg_dst t_tex, t_start; 265be4de05c1093db27b3fca12b782055ab8a1eba13Christian König struct ureg_dst o_vpos, o_l_addr[2], o_r_addr[2]; 266508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König 267508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König shader = ureg_create(TGSI_PROCESSOR_VERTEX); 268508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König if (!shader) 269508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König return NULL; 270508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König 271508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König vrect = ureg_DECL_vs_input(shader, VS_I_RECT); 272508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König vpos = ureg_DECL_vs_input(shader, VS_I_VPOS); 273508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König 2747f04fe5338d0846ec9a6003033da5357d2785c8bChristian König t_tex = ureg_DECL_temporary(shader); 2757f04fe5338d0846ec9a6003033da5357d2785c8bChristian König t_start = ureg_DECL_temporary(shader); 2767f04fe5338d0846ec9a6003033da5357d2785c8bChristian König 277508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König o_vpos = ureg_DECL_output(shader, TGSI_SEMANTIC_POSITION, 
VS_O_VPOS); 278be4de05c1093db27b3fca12b782055ab8a1eba13Christian König 279be4de05c1093db27b3fca12b782055ab8a1eba13Christian König o_l_addr[0] = ureg_DECL_output(shader, TGSI_SEMANTIC_GENERIC, VS_O_L_ADDR0); 280be4de05c1093db27b3fca12b782055ab8a1eba13Christian König o_l_addr[1] = ureg_DECL_output(shader, TGSI_SEMANTIC_GENERIC, VS_O_L_ADDR1); 281be4de05c1093db27b3fca12b782055ab8a1eba13Christian König 282be4de05c1093db27b3fca12b782055ab8a1eba13Christian König o_r_addr[0] = ureg_DECL_output(shader, TGSI_SEMANTIC_GENERIC, VS_O_R_ADDR0); 283be4de05c1093db27b3fca12b782055ab8a1eba13Christian König o_r_addr[1] = ureg_DECL_output(shader, TGSI_SEMANTIC_GENERIC, VS_O_R_ADDR1); 284508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König 285508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König /* 28612836fbcfad7f317b1f5aa5e46f9946894bf040cChristian König * scale = (BLOCK_WIDTH, BLOCK_HEIGHT) / (dst.width, dst.height) 287508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König * 2883511780a43077d1359bd491eadb4ab9b3b86795aChristian König * t_vpos = vpos + vrect 2893511780a43077d1359bd491eadb4ab9b3b86795aChristian König * o_vpos.xy = t_vpos * scale 290310eea52ca1e997295c84163066cc5d0fd4f8cf6Christian König * o_vpos.zw = vpos 291508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König * 2923511780a43077d1359bd491eadb4ab9b3b86795aChristian König * o_l_addr = calc_addr(...) 2933511780a43077d1359bd491eadb4ab9b3b86795aChristian König * o_r_addr = calc_addr(...) 
2943511780a43077d1359bd491eadb4ab9b3b86795aChristian König * 295508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König */ 296310eea52ca1e997295c84163066cc5d0fd4f8cf6Christian König 29712836fbcfad7f317b1f5aa5e46f9946894bf040cChristian König scale = ureg_imm2f(shader, 29822b4acb2069a368e986805d3b43395172ebf9146Christian König (float)BLOCK_WIDTH / idct->buffer_width, 29922b4acb2069a368e986805d3b43395172ebf9146Christian König (float)BLOCK_HEIGHT / idct->buffer_height); 30012836fbcfad7f317b1f5aa5e46f9946894bf040cChristian König 3013511780a43077d1359bd491eadb4ab9b3b86795aChristian König ureg_ADD(shader, ureg_writemask(t_tex, TGSI_WRITEMASK_XY), vpos, vrect); 3023511780a43077d1359bd491eadb4ab9b3b86795aChristian König ureg_MUL(shader, ureg_writemask(t_tex, TGSI_WRITEMASK_XY), ureg_src(t_tex), scale); 303ab130400cf91ab471e265e58193c95f04c7aeedaChristian König 3043511780a43077d1359bd491eadb4ab9b3b86795aChristian König ureg_MOV(shader, ureg_writemask(o_vpos, TGSI_WRITEMASK_XY), ureg_src(t_tex)); 3053511780a43077d1359bd491eadb4ab9b3b86795aChristian König ureg_MOV(shader, ureg_writemask(o_vpos, TGSI_WRITEMASK_ZW), ureg_imm1f(shader, 1.0f)); 306f853ea007816cdad4395b42388e12cd65bb8eb43Christian König 3073511780a43077d1359bd491eadb4ab9b3b86795aChristian König ureg_MUL(shader, ureg_writemask(t_start, TGSI_WRITEMASK_XY), vpos, scale); 308508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König 3097f04fe5338d0846ec9a6003033da5357d2785c8bChristian König calc_addr(shader, o_l_addr, ureg_src(t_tex), ureg_src(t_start), false, false, idct->buffer_width / 4); 3107f04fe5338d0846ec9a6003033da5357d2785c8bChristian König calc_addr(shader, o_r_addr, vrect, ureg_imm1f(shader, 0.0f), true, true, BLOCK_WIDTH / 4); 311be4de05c1093db27b3fca12b782055ab8a1eba13Christian König 312be4de05c1093db27b3fca12b782055ab8a1eba13Christian König ureg_release_temporary(shader, t_tex); 313be4de05c1093db27b3fca12b782055ab8a1eba13Christian König ureg_release_temporary(shader, t_start); 
314508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König 315508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König ureg_END(shader); 316508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König 317508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König return ureg_create_shader_and_destroy(shader, idct->pipe); 318508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König} 319508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König 320508a4a056c3140dc1f90b93acd46c06c30f7094eChristian Königstatic void * 3217f04fe5338d0846ec9a6003033da5357d2785c8bChristian Königcreate_stage1_frag_shader(struct vl_idct *idct) 322508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König{ 323508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König struct ureg_program *shader; 324cfe489b89723117e56674c2be7761c201f8d78ffChristian König 325f780626c35c7c3cac2e9aa7c2ec77ca587d6ab95Christian König struct ureg_src l_addr[2], r_addr[2]; 326cfe489b89723117e56674c2be7761c201f8d78ffChristian König 327f780626c35c7c3cac2e9aa7c2ec77ca587d6ab95Christian König struct ureg_dst l[4][2], r[2]; 3283cf22a0c6e215535266e7a7fac5ddd2404d4345dVinson Lee struct ureg_dst *fragment; 32912836fbcfad7f317b1f5aa5e46f9946894bf040cChristian König 3303db6514357a7c634045ae7bc7bba7d7dbf9d58c5Christian König int i, j; 331508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König 332508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König shader = ureg_create(TGSI_PROCESSOR_FRAGMENT); 333508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König if (!shader) 334508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König return NULL; 335508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König 3363cf22a0c6e215535266e7a7fac5ddd2404d4345dVinson Lee fragment = MALLOC(idct->nr_of_render_targets * sizeof(struct ureg_dst)); 3373cf22a0c6e215535266e7a7fac5ddd2404d4345dVinson Lee 338be4de05c1093db27b3fca12b782055ab8a1eba13Christian König l_addr[0] = ureg_DECL_fs_input(shader, TGSI_SEMANTIC_GENERIC, VS_O_L_ADDR0, TGSI_INTERPOLATE_LINEAR); 
339be4de05c1093db27b3fca12b782055ab8a1eba13Christian König l_addr[1] = ureg_DECL_fs_input(shader, TGSI_SEMANTIC_GENERIC, VS_O_L_ADDR1, TGSI_INTERPOLATE_LINEAR); 340be4de05c1093db27b3fca12b782055ab8a1eba13Christian König 341be4de05c1093db27b3fca12b782055ab8a1eba13Christian König r_addr[0] = ureg_DECL_fs_input(shader, TGSI_SEMANTIC_GENERIC, VS_O_R_ADDR0, TGSI_INTERPOLATE_LINEAR); 342be4de05c1093db27b3fca12b782055ab8a1eba13Christian König r_addr[1] = ureg_DECL_fs_input(shader, TGSI_SEMANTIC_GENERIC, VS_O_R_ADDR1, TGSI_INTERPOLATE_LINEAR); 343cfe489b89723117e56674c2be7761c201f8d78ffChristian König 344fcf765620d803b376582afb618b1f643242b641bChristian König for (i = 0; i < idct->nr_of_render_targets; ++i) 345e742a1043dbd56fe11f0490cb74b7a738bab2238Christian König fragment[i] = ureg_DECL_output(shader, TGSI_SEMANTIC_COLOR, i); 346e742a1043dbd56fe11f0490cb74b7a738bab2238Christian König 34774c71f09f3d321963b738acfb0bfd30b1e1efaebChristian König for (i = 0; i < 4; ++i) { 348f780626c35c7c3cac2e9aa7c2ec77ca587d6ab95Christian König l[i][0] = ureg_DECL_temporary(shader); 349f780626c35c7c3cac2e9aa7c2ec77ca587d6ab95Christian König l[i][1] = ureg_DECL_temporary(shader); 350f780626c35c7c3cac2e9aa7c2ec77ca587d6ab95Christian König } 3514a8420513d653cd2fccf93a51315120a1a5d0fccChristian König 352f780626c35c7c3cac2e9aa7c2ec77ca587d6ab95Christian König r[0] = ureg_DECL_temporary(shader); 353f780626c35c7c3cac2e9aa7c2ec77ca587d6ab95Christian König r[1] = ureg_DECL_temporary(shader); 354f780626c35c7c3cac2e9aa7c2ec77ca587d6ab95Christian König 3553db6514357a7c634045ae7bc7bba7d7dbf9d58c5Christian König for (i = 0; i < 4; ++i) { 3563db6514357a7c634045ae7bc7bba7d7dbf9d58c5Christian König increment_addr(shader, l[i], l_addr, false, false, i - 2, idct->buffer_height); 357f780626c35c7c3cac2e9aa7c2ec77ca587d6ab95Christian König } 358f780626c35c7c3cac2e9aa7c2ec77ca587d6ab95Christian König 359f780626c35c7c3cac2e9aa7c2ec77ca587d6ab95Christian König for (i = 0; i < 4; ++i) { 
3603cf22a0c6e215535266e7a7fac5ddd2404d4345dVinson Lee struct ureg_src s_addr[2]; 3613cf22a0c6e215535266e7a7fac5ddd2404d4345dVinson Lee s_addr[0] = ureg_src(l[i][0]); 3623cf22a0c6e215535266e7a7fac5ddd2404d4345dVinson Lee s_addr[1] = ureg_src(l[i][1]); 363ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König fetch_four(shader, l[i], s_addr, ureg_DECL_sampler(shader, 0), false); 36474c71f09f3d321963b738acfb0bfd30b1e1efaebChristian König } 365c8236aaf7056bd8645804e71596d2d6460e62d15Christian König 366fcf765620d803b376582afb618b1f643242b641bChristian König for (i = 0; i < idct->nr_of_render_targets; ++i) { 3673cf22a0c6e215535266e7a7fac5ddd2404d4345dVinson Lee struct ureg_src s_addr[2]; 3683cf22a0c6e215535266e7a7fac5ddd2404d4345dVinson Lee 3693db6514357a7c634045ae7bc7bba7d7dbf9d58c5Christian König increment_addr(shader, r, r_addr, true, true, i - (signed)idct->nr_of_render_targets / 2, BLOCK_HEIGHT); 370a984c67b316ac2ca9aaf6d38a3127cf3d61a249eChristian König 3713cf22a0c6e215535266e7a7fac5ddd2404d4345dVinson Lee s_addr[0] = ureg_src(r[0]); 3723cf22a0c6e215535266e7a7fac5ddd2404d4345dVinson Lee s_addr[1] = ureg_src(r[1]); 373ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König fetch_four(shader, r, s_addr, ureg_DECL_sampler(shader, 1), false); 374a984c67b316ac2ca9aaf6d38a3127cf3d61a249eChristian König 37574c71f09f3d321963b738acfb0bfd30b1e1efaebChristian König for (j = 0; j < 4; ++j) { 37674c71f09f3d321963b738acfb0bfd30b1e1efaebChristian König matrix_mul(shader, ureg_writemask(fragment[i], TGSI_WRITEMASK_X << j), l[j], r); 37774c71f09f3d321963b738acfb0bfd30b1e1efaebChristian König } 378e742a1043dbd56fe11f0490cb74b7a738bab2238Christian König } 37974c71f09f3d321963b738acfb0bfd30b1e1efaebChristian König 38074c71f09f3d321963b738acfb0bfd30b1e1efaebChristian König for (i = 0; i < 4; ++i) { 38174c71f09f3d321963b738acfb0bfd30b1e1efaebChristian König ureg_release_temporary(shader, l[i][0]); 38274c71f09f3d321963b738acfb0bfd30b1e1efaebChristian König ureg_release_temporary(shader, 
l[i][1]); 38374c71f09f3d321963b738acfb0bfd30b1e1efaebChristian König } 384f780626c35c7c3cac2e9aa7c2ec77ca587d6ab95Christian König ureg_release_temporary(shader, r[0]); 385f780626c35c7c3cac2e9aa7c2ec77ca587d6ab95Christian König ureg_release_temporary(shader, r[1]); 386be4de05c1093db27b3fca12b782055ab8a1eba13Christian König 387be4de05c1093db27b3fca12b782055ab8a1eba13Christian König ureg_END(shader); 388be4de05c1093db27b3fca12b782055ab8a1eba13Christian König 3893cf22a0c6e215535266e7a7fac5ddd2404d4345dVinson Lee FREE(fragment); 3903cf22a0c6e215535266e7a7fac5ddd2404d4345dVinson Lee 391be4de05c1093db27b3fca12b782055ab8a1eba13Christian König return ureg_create_shader_and_destroy(shader, idct->pipe); 392be4de05c1093db27b3fca12b782055ab8a1eba13Christian König} 393be4de05c1093db27b3fca12b782055ab8a1eba13Christian König 3947f04fe5338d0846ec9a6003033da5357d2785c8bChristian Königvoid 3957f04fe5338d0846ec9a6003033da5357d2785c8bChristian Königvl_idct_stage2_vert_shader(struct vl_idct *idct, struct ureg_program *shader, 3967f04fe5338d0846ec9a6003033da5357d2785c8bChristian König unsigned first_output, struct ureg_dst tex) 397be4de05c1093db27b3fca12b782055ab8a1eba13Christian König{ 3987f04fe5338d0846ec9a6003033da5357d2785c8bChristian König struct ureg_src vrect, vpos; 3997f04fe5338d0846ec9a6003033da5357d2785c8bChristian König struct ureg_src scale; 4007f04fe5338d0846ec9a6003033da5357d2785c8bChristian König struct ureg_dst t_start; 4017f04fe5338d0846ec9a6003033da5357d2785c8bChristian König struct ureg_dst o_l_addr[2], o_r_addr[2]; 4027f04fe5338d0846ec9a6003033da5357d2785c8bChristian König 4037f04fe5338d0846ec9a6003033da5357d2785c8bChristian König vrect = ureg_DECL_vs_input(shader, VS_I_RECT); 4047f04fe5338d0846ec9a6003033da5357d2785c8bChristian König vpos = ureg_DECL_vs_input(shader, VS_I_VPOS); 405be4de05c1093db27b3fca12b782055ab8a1eba13Christian König 4067f04fe5338d0846ec9a6003033da5357d2785c8bChristian König t_start = ureg_DECL_temporary(shader); 
4077f04fe5338d0846ec9a6003033da5357d2785c8bChristian König 4087f04fe5338d0846ec9a6003033da5357d2785c8bChristian König --first_output; 4097f04fe5338d0846ec9a6003033da5357d2785c8bChristian König 4107f04fe5338d0846ec9a6003033da5357d2785c8bChristian König o_l_addr[0] = ureg_DECL_output(shader, TGSI_SEMANTIC_GENERIC, first_output + VS_O_L_ADDR0); 4117f04fe5338d0846ec9a6003033da5357d2785c8bChristian König o_l_addr[1] = ureg_DECL_output(shader, TGSI_SEMANTIC_GENERIC, first_output + VS_O_L_ADDR1); 4127f04fe5338d0846ec9a6003033da5357d2785c8bChristian König 4137f04fe5338d0846ec9a6003033da5357d2785c8bChristian König o_r_addr[0] = ureg_DECL_output(shader, TGSI_SEMANTIC_GENERIC, first_output + VS_O_R_ADDR0); 4147f04fe5338d0846ec9a6003033da5357d2785c8bChristian König o_r_addr[1] = ureg_DECL_output(shader, TGSI_SEMANTIC_GENERIC, first_output + VS_O_R_ADDR1); 4157f04fe5338d0846ec9a6003033da5357d2785c8bChristian König 4167f04fe5338d0846ec9a6003033da5357d2785c8bChristian König scale = ureg_imm2f(shader, 4177f04fe5338d0846ec9a6003033da5357d2785c8bChristian König (float)BLOCK_WIDTH / idct->buffer_width, 4187f04fe5338d0846ec9a6003033da5357d2785c8bChristian König (float)BLOCK_HEIGHT / idct->buffer_height); 4197f04fe5338d0846ec9a6003033da5357d2785c8bChristian König 4207f04fe5338d0846ec9a6003033da5357d2785c8bChristian König ureg_MUL(shader, ureg_writemask(tex, TGSI_WRITEMASK_Z), 4217f04fe5338d0846ec9a6003033da5357d2785c8bChristian König ureg_scalar(vrect, TGSI_SWIZZLE_X), 4227f04fe5338d0846ec9a6003033da5357d2785c8bChristian König ureg_imm1f(shader, BLOCK_WIDTH / idct->nr_of_render_targets)); 4237f04fe5338d0846ec9a6003033da5357d2785c8bChristian König ureg_MUL(shader, ureg_writemask(t_start, TGSI_WRITEMASK_XY), vpos, scale); 4247f04fe5338d0846ec9a6003033da5357d2785c8bChristian König 4257f04fe5338d0846ec9a6003033da5357d2785c8bChristian König calc_addr(shader, o_l_addr, vrect, ureg_imm1f(shader, 0.0f), false, false, BLOCK_WIDTH / 4); 4267f04fe5338d0846ec9a6003033da5357d2785c8bChristian König 
calc_addr(shader, o_r_addr, ureg_src(tex), ureg_src(t_start), true, false, idct->buffer_height / 4); 427b4837a53d365bd1bd5f50b3fb40910eeaac869a5Christian König 428b4837a53d365bd1bd5f50b3fb40910eeaac869a5Christian König ureg_MOV(shader, ureg_writemask(o_r_addr[0], TGSI_WRITEMASK_Z), ureg_src(tex)); 429b4837a53d365bd1bd5f50b3fb40910eeaac869a5Christian König ureg_MOV(shader, ureg_writemask(o_r_addr[1], TGSI_WRITEMASK_Z), ureg_src(tex)); 4307f04fe5338d0846ec9a6003033da5357d2785c8bChristian König} 4317f04fe5338d0846ec9a6003033da5357d2785c8bChristian König 4327f04fe5338d0846ec9a6003033da5357d2785c8bChristian Königvoid 4337f04fe5338d0846ec9a6003033da5357d2785c8bChristian Königvl_idct_stage2_frag_shader(struct vl_idct *idct, struct ureg_program *shader, 4347f04fe5338d0846ec9a6003033da5357d2785c8bChristian König unsigned first_input, struct ureg_dst fragment) 4357f04fe5338d0846ec9a6003033da5357d2785c8bChristian König{ 436be4de05c1093db27b3fca12b782055ab8a1eba13Christian König struct ureg_src l_addr[2], r_addr[2]; 437be4de05c1093db27b3fca12b782055ab8a1eba13Christian König 438be4de05c1093db27b3fca12b782055ab8a1eba13Christian König struct ureg_dst l[2], r[2]; 439be4de05c1093db27b3fca12b782055ab8a1eba13Christian König 4407f04fe5338d0846ec9a6003033da5357d2785c8bChristian König --first_input; 441be4de05c1093db27b3fca12b782055ab8a1eba13Christian König 4427f04fe5338d0846ec9a6003033da5357d2785c8bChristian König l_addr[0] = ureg_DECL_fs_input(shader, TGSI_SEMANTIC_GENERIC, first_input + VS_O_L_ADDR0, TGSI_INTERPOLATE_LINEAR); 4437f04fe5338d0846ec9a6003033da5357d2785c8bChristian König l_addr[1] = ureg_DECL_fs_input(shader, TGSI_SEMANTIC_GENERIC, first_input + VS_O_L_ADDR1, TGSI_INTERPOLATE_LINEAR); 444be4de05c1093db27b3fca12b782055ab8a1eba13Christian König 4457f04fe5338d0846ec9a6003033da5357d2785c8bChristian König r_addr[0] = ureg_DECL_fs_input(shader, TGSI_SEMANTIC_GENERIC, first_input + VS_O_R_ADDR0, TGSI_INTERPOLATE_LINEAR); 4467f04fe5338d0846ec9a6003033da5357d2785c8bChristian 
König r_addr[1] = ureg_DECL_fs_input(shader, TGSI_SEMANTIC_GENERIC, first_input + VS_O_R_ADDR1, TGSI_INTERPOLATE_LINEAR); 447be4de05c1093db27b3fca12b782055ab8a1eba13Christian König 448f780626c35c7c3cac2e9aa7c2ec77ca587d6ab95Christian König l[0] = ureg_DECL_temporary(shader); 449f780626c35c7c3cac2e9aa7c2ec77ca587d6ab95Christian König l[1] = ureg_DECL_temporary(shader); 450f780626c35c7c3cac2e9aa7c2ec77ca587d6ab95Christian König r[0] = ureg_DECL_temporary(shader); 451f780626c35c7c3cac2e9aa7c2ec77ca587d6ab95Christian König r[1] = ureg_DECL_temporary(shader); 452f780626c35c7c3cac2e9aa7c2ec77ca587d6ab95Christian König 453ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König fetch_four(shader, l, l_addr, ureg_DECL_sampler(shader, 1), false); 454ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König fetch_four(shader, r, r_addr, ureg_DECL_sampler(shader, 0), true); 455be4de05c1093db27b3fca12b782055ab8a1eba13Christian König 4567f04fe5338d0846ec9a6003033da5357d2785c8bChristian König matrix_mul(shader, fragment, l, r); 457be4de05c1093db27b3fca12b782055ab8a1eba13Christian König 458be4de05c1093db27b3fca12b782055ab8a1eba13Christian König ureg_release_temporary(shader, l[0]); 459be4de05c1093db27b3fca12b782055ab8a1eba13Christian König ureg_release_temporary(shader, l[1]); 460be4de05c1093db27b3fca12b782055ab8a1eba13Christian König ureg_release_temporary(shader, r[0]); 461be4de05c1093db27b3fca12b782055ab8a1eba13Christian König ureg_release_temporary(shader, r[1]); 462508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König} 463508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König 464508a4a056c3140dc1f90b93acd46c06c30f7094eChristian Königstatic bool 46559774e5c7a2756c5c430fc74bc80ea75d54f594dChristian Königinit_shaders(struct vl_idct *idct) 466508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König{ 467ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König idct->vs_mismatch = create_mismatch_vert_shader(idct); 468ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König if 
(!idct->vs_mismatch) 469ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König goto error_vs_mismatch; 470ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König 471ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König idct->fs_mismatch = create_mismatch_frag_shader(idct); 472ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König if (!idct->fs_mismatch) 473ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König goto error_fs_mismatch; 474ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König 4757f04fe5338d0846ec9a6003033da5357d2785c8bChristian König idct->vs = create_stage1_vert_shader(idct); 4767f04fe5338d0846ec9a6003033da5357d2785c8bChristian König if (!idct->vs) 4777f04fe5338d0846ec9a6003033da5357d2785c8bChristian König goto error_vs; 478be4de05c1093db27b3fca12b782055ab8a1eba13Christian König 4797f04fe5338d0846ec9a6003033da5357d2785c8bChristian König idct->fs = create_stage1_frag_shader(idct); 4807f04fe5338d0846ec9a6003033da5357d2785c8bChristian König if (!idct->fs) 4817f04fe5338d0846ec9a6003033da5357d2785c8bChristian König goto error_fs; 4828330bc29dda71c41c56b3c1989334823ae8779d4Christian König 4838330bc29dda71c41c56b3c1989334823ae8779d4Christian König return true; 4848330bc29dda71c41c56b3c1989334823ae8779d4Christian König 4857f04fe5338d0846ec9a6003033da5357d2785c8bChristian Königerror_fs: 4867f04fe5338d0846ec9a6003033da5357d2785c8bChristian König idct->pipe->delete_vs_state(idct->pipe, idct->vs); 4878330bc29dda71c41c56b3c1989334823ae8779d4Christian König 4887f04fe5338d0846ec9a6003033da5357d2785c8bChristian Königerror_vs: 489ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König idct->pipe->delete_vs_state(idct->pipe, idct->vs_mismatch); 490ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König 491ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian Königerror_fs_mismatch: 492ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König idct->pipe->delete_vs_state(idct->pipe, idct->fs); 493ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König 
494ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian Königerror_vs_mismatch: 4958330bc29dda71c41c56b3c1989334823ae8779d4Christian König return false; 496508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König} 497508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König 498508a4a056c3140dc1f90b93acd46c06c30f7094eChristian Königstatic void 499508a4a056c3140dc1f90b93acd46c06c30f7094eChristian Königcleanup_shaders(struct vl_idct *idct) 500508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König{ 501ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König idct->pipe->delete_vs_state(idct->pipe, idct->vs_mismatch); 502ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König idct->pipe->delete_fs_state(idct->pipe, idct->fs_mismatch); 5037f04fe5338d0846ec9a6003033da5357d2785c8bChristian König idct->pipe->delete_vs_state(idct->pipe, idct->vs); 5047f04fe5338d0846ec9a6003033da5357d2785c8bChristian König idct->pipe->delete_fs_state(idct->pipe, idct->fs); 505508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König} 506508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König 507508a4a056c3140dc1f90b93acd46c06c30f7094eChristian Königstatic bool 5080b749d6dcb537472771d6fe6e454aafc916ab3feChristian Königinit_state(struct vl_idct *idct) 5090b749d6dcb537472771d6fe6e454aafc916ab3feChristian König{ 5100a2310b375068694d5700395aededc3fe68a0f3aChristian König struct pipe_blend_state blend; 5110b749d6dcb537472771d6fe6e454aafc916ab3feChristian König struct pipe_rasterizer_state rs_state; 5120a2310b375068694d5700395aededc3fe68a0f3aChristian König struct pipe_sampler_state sampler; 5130b749d6dcb537472771d6fe6e454aafc916ab3feChristian König unsigned i; 5140b749d6dcb537472771d6fe6e454aafc916ab3feChristian König 5150b749d6dcb537472771d6fe6e454aafc916ab3feChristian König assert(idct); 5160b749d6dcb537472771d6fe6e454aafc916ab3feChristian König 5178330bc29dda71c41c56b3c1989334823ae8779d4Christian König memset(&rs_state, 0, sizeof(rs_state)); 518ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König 
rs_state.point_size = 1; 5193db6514357a7c634045ae7bc7bba7d7dbf9d58c5Christian König rs_state.gl_rasterization_rules = true; 5208330bc29dda71c41c56b3c1989334823ae8779d4Christian König idct->rs_state = idct->pipe->create_rasterizer_state(idct->pipe, &rs_state); 5218330bc29dda71c41c56b3c1989334823ae8779d4Christian König if (!idct->rs_state) 5228330bc29dda71c41c56b3c1989334823ae8779d4Christian König goto error_rs_state; 5238330bc29dda71c41c56b3c1989334823ae8779d4Christian König 5240a2310b375068694d5700395aededc3fe68a0f3aChristian König memset(&blend, 0, sizeof blend); 5250a2310b375068694d5700395aededc3fe68a0f3aChristian König 5260a2310b375068694d5700395aededc3fe68a0f3aChristian König blend.independent_blend_enable = 0; 5270a2310b375068694d5700395aededc3fe68a0f3aChristian König blend.rt[0].blend_enable = 0; 5280a2310b375068694d5700395aededc3fe68a0f3aChristian König blend.rt[0].rgb_func = PIPE_BLEND_ADD; 5290a2310b375068694d5700395aededc3fe68a0f3aChristian König blend.rt[0].rgb_src_factor = PIPE_BLENDFACTOR_ONE; 5300a2310b375068694d5700395aededc3fe68a0f3aChristian König blend.rt[0].rgb_dst_factor = PIPE_BLENDFACTOR_ONE; 5310a2310b375068694d5700395aededc3fe68a0f3aChristian König blend.rt[0].alpha_func = PIPE_BLEND_ADD; 5320a2310b375068694d5700395aededc3fe68a0f3aChristian König blend.rt[0].alpha_src_factor = PIPE_BLENDFACTOR_ONE; 5330a2310b375068694d5700395aededc3fe68a0f3aChristian König blend.rt[0].alpha_dst_factor = PIPE_BLENDFACTOR_ONE; 5340a2310b375068694d5700395aededc3fe68a0f3aChristian König blend.logicop_enable = 0; 5350a2310b375068694d5700395aededc3fe68a0f3aChristian König blend.logicop_func = PIPE_LOGICOP_CLEAR; 5360a2310b375068694d5700395aededc3fe68a0f3aChristian König /* Needed to allow color writes to FB, even if blending disabled */ 5370a2310b375068694d5700395aededc3fe68a0f3aChristian König blend.rt[0].colormask = PIPE_MASK_RGBA; 5380a2310b375068694d5700395aededc3fe68a0f3aChristian König blend.dither = 0; 5390a2310b375068694d5700395aededc3fe68a0f3aChristian 
König idct->blend = idct->pipe->create_blend_state(idct->pipe, &blend); 5400a2310b375068694d5700395aededc3fe68a0f3aChristian König if (!idct->blend) 5410a2310b375068694d5700395aededc3fe68a0f3aChristian König goto error_blend; 5420a2310b375068694d5700395aededc3fe68a0f3aChristian König 5435a351e51291922aa295926215fdecccc0baeef51Christian König for (i = 0; i < 2; ++i) { 5440b749d6dcb537472771d6fe6e454aafc916ab3feChristian König memset(&sampler, 0, sizeof(sampler)); 545be4de05c1093db27b3fca12b782055ab8a1eba13Christian König sampler.wrap_s = PIPE_TEX_WRAP_REPEAT; 546be4de05c1093db27b3fca12b782055ab8a1eba13Christian König sampler.wrap_t = PIPE_TEX_WRAP_REPEAT; 547be4de05c1093db27b3fca12b782055ab8a1eba13Christian König sampler.wrap_r = PIPE_TEX_WRAP_REPEAT; 5480b749d6dcb537472771d6fe6e454aafc916ab3feChristian König sampler.min_img_filter = PIPE_TEX_FILTER_NEAREST; 5490b749d6dcb537472771d6fe6e454aafc916ab3feChristian König sampler.min_mip_filter = PIPE_TEX_MIPFILTER_NONE; 5500b749d6dcb537472771d6fe6e454aafc916ab3feChristian König sampler.mag_img_filter = PIPE_TEX_FILTER_NEAREST; 5510b749d6dcb537472771d6fe6e454aafc916ab3feChristian König sampler.compare_mode = PIPE_TEX_COMPARE_NONE; 5520b749d6dcb537472771d6fe6e454aafc916ab3feChristian König sampler.compare_func = PIPE_FUNC_ALWAYS; 5530b749d6dcb537472771d6fe6e454aafc916ab3feChristian König sampler.normalized_coords = 1; 5545a351e51291922aa295926215fdecccc0baeef51Christian König idct->samplers[i] = idct->pipe->create_sampler_state(idct->pipe, &sampler); 5555a351e51291922aa295926215fdecccc0baeef51Christian König if (!idct->samplers[i]) 5568330bc29dda71c41c56b3c1989334823ae8779d4Christian König goto error_samplers; 5570b749d6dcb537472771d6fe6e454aafc916ab3feChristian König } 5580b749d6dcb537472771d6fe6e454aafc916ab3feChristian König 5590b749d6dcb537472771d6fe6e454aafc916ab3feChristian König return true; 5608330bc29dda71c41c56b3c1989334823ae8779d4Christian König 5618330bc29dda71c41c56b3c1989334823ae8779d4Christian 
Königerror_samplers: 5625a351e51291922aa295926215fdecccc0baeef51Christian König for (i = 0; i < 2; ++i) 5635a351e51291922aa295926215fdecccc0baeef51Christian König if (idct->samplers[i]) 5645a351e51291922aa295926215fdecccc0baeef51Christian König idct->pipe->delete_sampler_state(idct->pipe, idct->samplers[i]); 5658330bc29dda71c41c56b3c1989334823ae8779d4Christian König 5668330bc29dda71c41c56b3c1989334823ae8779d4Christian König idct->pipe->delete_rasterizer_state(idct->pipe, idct->rs_state); 5678330bc29dda71c41c56b3c1989334823ae8779d4Christian König 5680a2310b375068694d5700395aededc3fe68a0f3aChristian Königerror_blend: 5690a2310b375068694d5700395aededc3fe68a0f3aChristian König idct->pipe->delete_blend_state(idct->pipe, idct->blend); 5700a2310b375068694d5700395aededc3fe68a0f3aChristian König 5718330bc29dda71c41c56b3c1989334823ae8779d4Christian Königerror_rs_state: 5728330bc29dda71c41c56b3c1989334823ae8779d4Christian König return false; 5730b749d6dcb537472771d6fe6e454aafc916ab3feChristian König} 5740b749d6dcb537472771d6fe6e454aafc916ab3feChristian König 5750b749d6dcb537472771d6fe6e454aafc916ab3feChristian Königstatic void 5760b749d6dcb537472771d6fe6e454aafc916ab3feChristian Königcleanup_state(struct vl_idct *idct) 5770b749d6dcb537472771d6fe6e454aafc916ab3feChristian König{ 5780b749d6dcb537472771d6fe6e454aafc916ab3feChristian König unsigned i; 5790b749d6dcb537472771d6fe6e454aafc916ab3feChristian König 5805a351e51291922aa295926215fdecccc0baeef51Christian König for (i = 0; i < 2; ++i) 5815a351e51291922aa295926215fdecccc0baeef51Christian König idct->pipe->delete_sampler_state(idct->pipe, idct->samplers[i]); 5820b749d6dcb537472771d6fe6e454aafc916ab3feChristian König 5830b749d6dcb537472771d6fe6e454aafc916ab3feChristian König idct->pipe->delete_rasterizer_state(idct->pipe, idct->rs_state); 5840a2310b375068694d5700395aededc3fe68a0f3aChristian König idct->pipe->delete_blend_state(idct->pipe, idct->blend); 5850b749d6dcb537472771d6fe6e454aafc916ab3feChristian König} 
5860b749d6dcb537472771d6fe6e454aafc916ab3feChristian König 5870b749d6dcb537472771d6fe6e454aafc916ab3feChristian Königstatic bool 588ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian Königinit_source(struct vl_idct *idct, struct vl_idct_buffer *buffer) 589ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König{ 590ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König struct pipe_resource *tex; 591ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König struct pipe_surface surf_templ; 592ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König 593ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König assert(idct && buffer); 594ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König 595ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König tex = buffer->sampler_views.individual.source->texture; 596ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König 597ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König buffer->fb_state_mismatch.width = tex->width0; 598ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König buffer->fb_state_mismatch.height = tex->height0; 599ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König buffer->fb_state_mismatch.nr_cbufs = 1; 600ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König 601ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König memset(&surf_templ, 0, sizeof(surf_templ)); 602ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König surf_templ.format = tex->format; 603ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König surf_templ.u.tex.first_layer = 0; 604ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König surf_templ.u.tex.last_layer = 0; 605ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König surf_templ.usage = PIPE_BIND_SAMPLER_VIEW | PIPE_BIND_RENDER_TARGET; 606ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König buffer->fb_state_mismatch.cbufs[0] = idct->pipe->create_surface(idct->pipe, tex, &surf_templ); 607ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König 
608ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König buffer->viewport_mismatch.scale[0] = tex->width0; 609ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König buffer->viewport_mismatch.scale[1] = tex->height0; 610ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König buffer->viewport_mismatch.scale[2] = 1; 611ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König buffer->viewport_mismatch.scale[3] = 1; 612ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König 613ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König return true; 614ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König} 615ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König 616ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian Königstatic void 617ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian Königcleanup_source(struct vl_idct *idct, struct vl_idct_buffer *buffer) 618ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König{ 619ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König assert(idct && buffer); 620ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König 621ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König pipe_surface_reference(&buffer->fb_state_mismatch.cbufs[0], NULL); 622ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König 623ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König pipe_sampler_view_reference(&buffer->sampler_views.individual.source, NULL); 624ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König} 625ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König 626ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian Königstatic bool 627020328ca32a3b6548b4c064c4fe115e386752daaChristian Königinit_intermediate(struct vl_idct *idct, struct vl_idct_buffer *buffer) 628508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König{ 62931109e1be20d7c94521879c3221a9f77bacbdb8dChristian König struct pipe_resource *tex; 630020328ca32a3b6548b4c064c4fe115e386752daaChristian König struct pipe_surface surf_templ; 63121efda86875096333dc0412c0edab1e188f551d8Christian König 
unsigned i; 632508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König 6330b749d6dcb537472771d6fe6e454aafc916ab3feChristian König assert(idct && buffer); 6340b749d6dcb537472771d6fe6e454aafc916ab3feChristian König 63531109e1be20d7c94521879c3221a9f77bacbdb8dChristian König tex = buffer->sampler_views.individual.intermediate->texture; 636020328ca32a3b6548b4c064c4fe115e386752daaChristian König 6377f04fe5338d0846ec9a6003033da5357d2785c8bChristian König buffer->fb_state.width = tex->width0; 6387f04fe5338d0846ec9a6003033da5357d2785c8bChristian König buffer->fb_state.height = tex->height0; 6397f04fe5338d0846ec9a6003033da5357d2785c8bChristian König buffer->fb_state.nr_cbufs = idct->nr_of_render_targets; 640fcf765620d803b376582afb618b1f643242b641bChristian König for(i = 0; i < idct->nr_of_render_targets; ++i) { 641020328ca32a3b6548b4c064c4fe115e386752daaChristian König memset(&surf_templ, 0, sizeof(surf_templ)); 642020328ca32a3b6548b4c064c4fe115e386752daaChristian König surf_templ.format = tex->format; 643020328ca32a3b6548b4c064c4fe115e386752daaChristian König surf_templ.u.tex.first_layer = i; 644020328ca32a3b6548b4c064c4fe115e386752daaChristian König surf_templ.u.tex.last_layer = i; 645020328ca32a3b6548b4c064c4fe115e386752daaChristian König surf_templ.usage = PIPE_BIND_SAMPLER_VIEW | PIPE_BIND_RENDER_TARGET; 6467f04fe5338d0846ec9a6003033da5357d2785c8bChristian König buffer->fb_state.cbufs[i] = idct->pipe->create_surface( 647020328ca32a3b6548b4c064c4fe115e386752daaChristian König idct->pipe, tex, &surf_templ); 648508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König 6497f04fe5338d0846ec9a6003033da5357d2785c8bChristian König if (!buffer->fb_state.cbufs[i]) 650020328ca32a3b6548b4c064c4fe115e386752daaChristian König goto error_surfaces; 651508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König } 652508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König 6537f04fe5338d0846ec9a6003033da5357d2785c8bChristian König buffer->viewport.scale[0] = tex->width0; 
6547f04fe5338d0846ec9a6003033da5357d2785c8bChristian König buffer->viewport.scale[1] = tex->height0; 655ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König buffer->viewport.scale[2] = 1; 656ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König buffer->viewport.scale[3] = 1; 6570f07da0a1c87e1c7b53700c33d6b1f8f03c1fe11Christian König 658508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König return true; 6598330bc29dda71c41c56b3c1989334823ae8779d4Christian König 660020328ca32a3b6548b4c064c4fe115e386752daaChristian Königerror_surfaces: 661fcf765620d803b376582afb618b1f643242b641bChristian König for(i = 0; i < idct->nr_of_render_targets; ++i) 6627f04fe5338d0846ec9a6003033da5357d2785c8bChristian König pipe_surface_reference(&buffer->fb_state.cbufs[i], NULL); 663020328ca32a3b6548b4c064c4fe115e386752daaChristian König 6648330bc29dda71c41c56b3c1989334823ae8779d4Christian König return false; 665508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König} 666508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König 667508a4a056c3140dc1f90b93acd46c06c30f7094eChristian Königstatic void 668020328ca32a3b6548b4c064c4fe115e386752daaChristian Königcleanup_intermediate(struct vl_idct *idct, struct vl_idct_buffer *buffer) 669508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König{ 670508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König unsigned i; 671508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König 6720b749d6dcb537472771d6fe6e454aafc916ab3feChristian König assert(idct && buffer); 673508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König 674fcf765620d803b376582afb618b1f643242b641bChristian König for(i = 0; i < idct->nr_of_render_targets; ++i) 6757f04fe5338d0846ec9a6003033da5357d2785c8bChristian König pipe_surface_reference(&buffer->fb_state.cbufs[i], NULL); 676020328ca32a3b6548b4c064c4fe115e386752daaChristian König 677020328ca32a3b6548b4c064c4fe115e386752daaChristian König pipe_sampler_view_reference(&buffer->sampler_views.individual.intermediate, NULL); 
678508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König} 679508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König 680020328ca32a3b6548b4c064c4fe115e386752daaChristian Königstruct pipe_sampler_view * 681fcdf50f74befad8d89eb3f9cdfd88b82d1daa98cChristian Königvl_idct_upload_matrix(struct pipe_context *pipe, float scale) 6823dd7bf7d39781f3ef4c0b53732945674c9924cdfChristian König{ 683020328ca32a3b6548b4c064c4fe115e386752daaChristian König struct pipe_resource tex_templ, *matrix; 684020328ca32a3b6548b4c064c4fe115e386752daaChristian König struct pipe_sampler_view sv_templ, *sv; 6853dd7bf7d39781f3ef4c0b53732945674c9924cdfChristian König struct pipe_transfer *buf_transfer; 6863dd7bf7d39781f3ef4c0b53732945674c9924cdfChristian König unsigned i, j, pitch; 6873dd7bf7d39781f3ef4c0b53732945674c9924cdfChristian König float *f; 6883dd7bf7d39781f3ef4c0b53732945674c9924cdfChristian König 6893dd7bf7d39781f3ef4c0b53732945674c9924cdfChristian König struct pipe_box rect = 6903dd7bf7d39781f3ef4c0b53732945674c9924cdfChristian König { 6913dd7bf7d39781f3ef4c0b53732945674c9924cdfChristian König 0, 0, 0, 6927c4887f5ae642131d7895da5bffda77a6287c6d4Christian König BLOCK_WIDTH / 4, 6933dd7bf7d39781f3ef4c0b53732945674c9924cdfChristian König BLOCK_HEIGHT, 6943dd7bf7d39781f3ef4c0b53732945674c9924cdfChristian König 1 6953dd7bf7d39781f3ef4c0b53732945674c9924cdfChristian König }; 6963dd7bf7d39781f3ef4c0b53732945674c9924cdfChristian König 6978330bc29dda71c41c56b3c1989334823ae8779d4Christian König assert(pipe); 6988330bc29dda71c41c56b3c1989334823ae8779d4Christian König 699020328ca32a3b6548b4c064c4fe115e386752daaChristian König memset(&tex_templ, 0, sizeof(tex_templ)); 700020328ca32a3b6548b4c064c4fe115e386752daaChristian König tex_templ.target = PIPE_TEXTURE_2D; 701020328ca32a3b6548b4c064c4fe115e386752daaChristian König tex_templ.format = PIPE_FORMAT_R32G32B32A32_FLOAT; 702020328ca32a3b6548b4c064c4fe115e386752daaChristian König tex_templ.last_level = 0; 
703020328ca32a3b6548b4c064c4fe115e386752daaChristian König tex_templ.width0 = 2; 704020328ca32a3b6548b4c064c4fe115e386752daaChristian König tex_templ.height0 = 8; 705020328ca32a3b6548b4c064c4fe115e386752daaChristian König tex_templ.depth0 = 1; 706020328ca32a3b6548b4c064c4fe115e386752daaChristian König tex_templ.array_size = 1; 707020328ca32a3b6548b4c064c4fe115e386752daaChristian König tex_templ.usage = PIPE_USAGE_IMMUTABLE; 708020328ca32a3b6548b4c064c4fe115e386752daaChristian König tex_templ.bind = PIPE_BIND_SAMPLER_VIEW; 709020328ca32a3b6548b4c064c4fe115e386752daaChristian König tex_templ.flags = 0; 710020328ca32a3b6548b4c064c4fe115e386752daaChristian König 711020328ca32a3b6548b4c064c4fe115e386752daaChristian König matrix = pipe->screen->resource_create(pipe->screen, &tex_templ); 7128330bc29dda71c41c56b3c1989334823ae8779d4Christian König if (!matrix) 7138330bc29dda71c41c56b3c1989334823ae8779d4Christian König goto error_matrix; 7143dd7bf7d39781f3ef4c0b53732945674c9924cdfChristian König 7153dd7bf7d39781f3ef4c0b53732945674c9924cdfChristian König buf_transfer = pipe->get_transfer 7163dd7bf7d39781f3ef4c0b53732945674c9924cdfChristian König ( 7173dd7bf7d39781f3ef4c0b53732945674c9924cdfChristian König pipe, matrix, 718772b25e1f366edc857e77b8c1ccdc5297d82cc41Christian König 0, PIPE_TRANSFER_WRITE | PIPE_TRANSFER_DISCARD, 7193dd7bf7d39781f3ef4c0b53732945674c9924cdfChristian König &rect 7203dd7bf7d39781f3ef4c0b53732945674c9924cdfChristian König ); 7218330bc29dda71c41c56b3c1989334823ae8779d4Christian König if (!buf_transfer) 7228330bc29dda71c41c56b3c1989334823ae8779d4Christian König goto error_transfer; 7238330bc29dda71c41c56b3c1989334823ae8779d4Christian König 7243fd53e6c2a05e65872de4292557d7839cbcf7395Christian König pitch = buf_transfer->stride / sizeof(float); 7253dd7bf7d39781f3ef4c0b53732945674c9924cdfChristian König 7263dd7bf7d39781f3ef4c0b53732945674c9924cdfChristian König f = pipe->transfer_map(pipe, buf_transfer); 7278330bc29dda71c41c56b3c1989334823ae8779d4Christian 
König if (!f) 7288330bc29dda71c41c56b3c1989334823ae8779d4Christian König goto error_map; 7298330bc29dda71c41c56b3c1989334823ae8779d4Christian König 7303dd7bf7d39781f3ef4c0b53732945674c9924cdfChristian König for(i = 0; i < BLOCK_HEIGHT; ++i) 7313dd7bf7d39781f3ef4c0b53732945674c9924cdfChristian König for(j = 0; j < BLOCK_WIDTH; ++j) 7324a8420513d653cd2fccf93a51315120a1a5d0fccChristian König // transpose and scale 7333e976ef31a27ca9a23372f4364955f0f0a5c4ef4Christian König f[i * pitch + j] = ((const float (*)[8])const_matrix)[j][i] * scale; 7343dd7bf7d39781f3ef4c0b53732945674c9924cdfChristian König 7353dd7bf7d39781f3ef4c0b53732945674c9924cdfChristian König pipe->transfer_unmap(pipe, buf_transfer); 7363dd7bf7d39781f3ef4c0b53732945674c9924cdfChristian König pipe->transfer_destroy(pipe, buf_transfer); 7373dd7bf7d39781f3ef4c0b53732945674c9924cdfChristian König 738020328ca32a3b6548b4c064c4fe115e386752daaChristian König memset(&sv_templ, 0, sizeof(sv_templ)); 739020328ca32a3b6548b4c064c4fe115e386752daaChristian König u_sampler_view_default_template(&sv_templ, matrix, matrix->format); 740020328ca32a3b6548b4c064c4fe115e386752daaChristian König sv = pipe->create_sampler_view(pipe, matrix, &sv_templ); 741020328ca32a3b6548b4c064c4fe115e386752daaChristian König pipe_resource_reference(&matrix, NULL); 742020328ca32a3b6548b4c064c4fe115e386752daaChristian König if (!sv) 743020328ca32a3b6548b4c064c4fe115e386752daaChristian König goto error_map; 744020328ca32a3b6548b4c064c4fe115e386752daaChristian König 745020328ca32a3b6548b4c064c4fe115e386752daaChristian König return sv; 7468330bc29dda71c41c56b3c1989334823ae8779d4Christian König 7478330bc29dda71c41c56b3c1989334823ae8779d4Christian Königerror_map: 7488330bc29dda71c41c56b3c1989334823ae8779d4Christian König pipe->transfer_destroy(pipe, buf_transfer); 7498330bc29dda71c41c56b3c1989334823ae8779d4Christian König 7508330bc29dda71c41c56b3c1989334823ae8779d4Christian Königerror_transfer: 7518330bc29dda71c41c56b3c1989334823ae8779d4Christian 
König pipe_resource_reference(&matrix, NULL); 7528330bc29dda71c41c56b3c1989334823ae8779d4Christian König 7538330bc29dda71c41c56b3c1989334823ae8779d4Christian Königerror_matrix: 7548330bc29dda71c41c56b3c1989334823ae8779d4Christian König return NULL; 7553dd7bf7d39781f3ef4c0b53732945674c9924cdfChristian König} 7563dd7bf7d39781f3ef4c0b53732945674c9924cdfChristian König 757c8236aaf7056bd8645804e71596d2d6460e62d15Christian Königbool vl_idct_init(struct vl_idct *idct, struct pipe_context *pipe, 7580b749d6dcb537472771d6fe6e454aafc916ab3feChristian König unsigned buffer_width, unsigned buffer_height, 759fcf765620d803b376582afb618b1f643242b641bChristian König unsigned nr_of_render_targets, 760ccc80d2c09ad35f867c0c0a85f7e1cadd73941bbChristian König struct pipe_sampler_view *matrix, 761ccc80d2c09ad35f867c0c0a85f7e1cadd73941bbChristian König struct pipe_sampler_view *transpose) 762e639e1b83ea65985cd84d12dc120d77cab80ba9eChristian König{ 763df5e0b9435c869f88234a69db9bfe97342b027d4Christian König assert(idct && pipe); 764df5e0b9435c869f88234a69db9bfe97342b027d4Christian König assert(matrix && transpose); 765e639e1b83ea65985cd84d12dc120d77cab80ba9eChristian König 766e639e1b83ea65985cd84d12dc120d77cab80ba9eChristian König idct->pipe = pipe; 7670b749d6dcb537472771d6fe6e454aafc916ab3feChristian König idct->buffer_width = buffer_width; 7680b749d6dcb537472771d6fe6e454aafc916ab3feChristian König idct->buffer_height = buffer_height; 769fcf765620d803b376582afb618b1f643242b641bChristian König idct->nr_of_render_targets = nr_of_render_targets; 770ccc80d2c09ad35f867c0c0a85f7e1cadd73941bbChristian König 771020328ca32a3b6548b4c064c4fe115e386752daaChristian König pipe_sampler_view_reference(&idct->matrix, matrix); 772ccc80d2c09ad35f867c0c0a85f7e1cadd73941bbChristian König pipe_sampler_view_reference(&idct->transpose, transpose); 773508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König 77459774e5c7a2756c5c430fc74bc80ea75d54f594dChristian König if(!init_shaders(idct)) 
775508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König return false; 776508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König 7770b749d6dcb537472771d6fe6e454aafc916ab3feChristian König if(!init_state(idct)) { 7780b749d6dcb537472771d6fe6e454aafc916ab3feChristian König cleanup_shaders(idct); 779508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König return false; 780508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König } 781508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König 7820b749d6dcb537472771d6fe6e454aafc916ab3feChristian König return true; 7830b749d6dcb537472771d6fe6e454aafc916ab3feChristian König} 7840b749d6dcb537472771d6fe6e454aafc916ab3feChristian König 7850b749d6dcb537472771d6fe6e454aafc916ab3feChristian Königvoid 7860b749d6dcb537472771d6fe6e454aafc916ab3feChristian Königvl_idct_cleanup(struct vl_idct *idct) 7870b749d6dcb537472771d6fe6e454aafc916ab3feChristian König{ 7880b749d6dcb537472771d6fe6e454aafc916ab3feChristian König cleanup_shaders(idct); 7890b749d6dcb537472771d6fe6e454aafc916ab3feChristian König cleanup_state(idct); 7900b749d6dcb537472771d6fe6e454aafc916ab3feChristian König 791020328ca32a3b6548b4c064c4fe115e386752daaChristian König pipe_sampler_view_reference(&idct->matrix, NULL); 792df5e0b9435c869f88234a69db9bfe97342b027d4Christian König pipe_sampler_view_reference(&idct->transpose, NULL); 7930b749d6dcb537472771d6fe6e454aafc916ab3feChristian König} 7940b749d6dcb537472771d6fe6e454aafc916ab3feChristian König 795020328ca32a3b6548b4c064c4fe115e386752daaChristian Königbool 796020328ca32a3b6548b4c064c4fe115e386752daaChristian Königvl_idct_init_buffer(struct vl_idct *idct, struct vl_idct_buffer *buffer, 79731109e1be20d7c94521879c3221a9f77bacbdb8dChristian König struct pipe_sampler_view *source, 798ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König struct pipe_sampler_view *intermediate) 7990b749d6dcb537472771d6fe6e454aafc916ab3feChristian König{ 800df5e0b9435c869f88234a69db9bfe97342b027d4Christian König assert(buffer && idct); 
801df5e0b9435c869f88234a69db9bfe97342b027d4Christian König assert(source && intermediate); 8020b749d6dcb537472771d6fe6e454aafc916ab3feChristian König 8037f04fe5338d0846ec9a6003033da5357d2785c8bChristian König memset(buffer, 0, sizeof(struct vl_idct_buffer)); 8047f04fe5338d0846ec9a6003033da5357d2785c8bChristian König 8057c48575402e8c384db2fab24e4dd0fc72bef0451Christian König buffer->idct = idct; 8067c48575402e8c384db2fab24e4dd0fc72bef0451Christian König 807020328ca32a3b6548b4c064c4fe115e386752daaChristian König pipe_sampler_view_reference(&buffer->sampler_views.individual.matrix, idct->matrix); 808020328ca32a3b6548b4c064c4fe115e386752daaChristian König pipe_sampler_view_reference(&buffer->sampler_views.individual.source, source); 809ccc80d2c09ad35f867c0c0a85f7e1cadd73941bbChristian König pipe_sampler_view_reference(&buffer->sampler_views.individual.transpose, idct->transpose); 81031109e1be20d7c94521879c3221a9f77bacbdb8dChristian König pipe_sampler_view_reference(&buffer->sampler_views.individual.intermediate, intermediate); 8110b749d6dcb537472771d6fe6e454aafc916ab3feChristian König 812ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König if (!init_source(idct, buffer)) 813020328ca32a3b6548b4c064c4fe115e386752daaChristian König return false; 8140b749d6dcb537472771d6fe6e454aafc916ab3feChristian König 815ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König if (!init_intermediate(idct, buffer)) 816ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König return false; 817508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König 818020328ca32a3b6548b4c064c4fe115e386752daaChristian König return true; 819508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König} 820508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König 82103c5a0ea5cd5b3e5931d6784749f87789a016b98Christian Königvoid 8227c48575402e8c384db2fab24e4dd0fc72bef0451Christian Königvl_idct_cleanup_buffer(struct vl_idct_buffer *buffer) 823508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König{ 
8247c48575402e8c384db2fab24e4dd0fc72bef0451Christian König assert(buffer); 825e639e1b83ea65985cd84d12dc120d77cab80ba9eChristian König 8267c48575402e8c384db2fab24e4dd0fc72bef0451Christian König cleanup_source(buffer->idct, buffer); 8277c48575402e8c384db2fab24e4dd0fc72bef0451Christian König cleanup_intermediate(buffer->idct, buffer); 828df5e0b9435c869f88234a69db9bfe97342b027d4Christian König 829df5e0b9435c869f88234a69db9bfe97342b027d4Christian König pipe_sampler_view_reference(&buffer->sampler_views.individual.matrix, NULL); 830df5e0b9435c869f88234a69db9bfe97342b027d4Christian König pipe_sampler_view_reference(&buffer->sampler_views.individual.transpose, NULL); 831508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König} 832508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König 83303c5a0ea5cd5b3e5931d6784749f87789a016b98Christian Königvoid 8347c48575402e8c384db2fab24e4dd0fc72bef0451Christian Königvl_idct_flush(struct vl_idct_buffer *buffer, unsigned num_instances) 835508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König{ 8367c48575402e8c384db2fab24e4dd0fc72bef0451Christian König struct vl_idct *idct; 837310eea52ca1e997295c84163066cc5d0fd4f8cf6Christian König assert(buffer); 8387c48575402e8c384db2fab24e4dd0fc72bef0451Christian König 8397c48575402e8c384db2fab24e4dd0fc72bef0451Christian König idct = buffer->idct; 8404abe7382882a451a7750ccc451b8568768d122cbChristian König 8417f04fe5338d0846ec9a6003033da5357d2785c8bChristian König idct->pipe->bind_rasterizer_state(idct->pipe, idct->rs_state); 8427f04fe5338d0846ec9a6003033da5357d2785c8bChristian König idct->pipe->bind_blend_state(idct->pipe, idct->blend); 8437f04fe5338d0846ec9a6003033da5357d2785c8bChristian König idct->pipe->bind_fragment_sampler_states(idct->pipe, 2, idct->samplers); 844ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König idct->pipe->set_fragment_sampler_views(idct->pipe, 2, buffer->sampler_views.stage[0]); 845ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König 
846ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König /* mismatch control */ 847ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König idct->pipe->set_framebuffer_state(idct->pipe, &buffer->fb_state_mismatch); 848ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König idct->pipe->set_viewport_state(idct->pipe, &buffer->viewport_mismatch); 849ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König idct->pipe->bind_vs_state(idct->pipe, idct->vs_mismatch); 850ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König idct->pipe->bind_fs_state(idct->pipe, idct->fs_mismatch); 851ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König util_draw_arrays_instanced(idct->pipe, PIPE_PRIM_POINTS, 0, 1, 0, num_instances); 8527f04fe5338d0846ec9a6003033da5357d2785c8bChristian König 8537f04fe5338d0846ec9a6003033da5357d2785c8bChristian König /* first stage */ 8547f04fe5338d0846ec9a6003033da5357d2785c8bChristian König idct->pipe->set_framebuffer_state(idct->pipe, &buffer->fb_state); 8557f04fe5338d0846ec9a6003033da5357d2785c8bChristian König idct->pipe->set_viewport_state(idct->pipe, &buffer->viewport); 8567f04fe5338d0846ec9a6003033da5357d2785c8bChristian König idct->pipe->bind_vs_state(idct->pipe, idct->vs); 8577f04fe5338d0846ec9a6003033da5357d2785c8bChristian König idct->pipe->bind_fs_state(idct->pipe, idct->fs); 8587f04fe5338d0846ec9a6003033da5357d2785c8bChristian König util_draw_arrays_instanced(idct->pipe, PIPE_PRIM_QUADS, 0, 4, 0, num_instances); 8597f04fe5338d0846ec9a6003033da5357d2785c8bChristian König} 8607f04fe5338d0846ec9a6003033da5357d2785c8bChristian König 8617f04fe5338d0846ec9a6003033da5357d2785c8bChristian Königvoid 8627c48575402e8c384db2fab24e4dd0fc72bef0451Christian Königvl_idct_prepare_stage2(struct vl_idct_buffer *buffer) 8637f04fe5338d0846ec9a6003033da5357d2785c8bChristian König{ 8647f04fe5338d0846ec9a6003033da5357d2785c8bChristian König assert(buffer); 8657f04fe5338d0846ec9a6003033da5357d2785c8bChristian König 
8667f04fe5338d0846ec9a6003033da5357d2785c8bChristian König /* second stage */ 8677c48575402e8c384db2fab24e4dd0fc72bef0451Christian König buffer->idct->pipe->bind_rasterizer_state(buffer->idct->pipe, buffer->idct->rs_state); 8687c48575402e8c384db2fab24e4dd0fc72bef0451Christian König buffer->idct->pipe->bind_fragment_sampler_states(buffer->idct->pipe, 2, buffer->idct->samplers); 8697c48575402e8c384db2fab24e4dd0fc72bef0451Christian König buffer->idct->pipe->set_fragment_sampler_views(buffer->idct->pipe, 2, buffer->sampler_views.stage[1]); 870508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König} 8717f04fe5338d0846ec9a6003033da5357d2785c8bChristian König 872