vl_idct.c revision df5e0b9435c869f88234a69db9bfe97342b027d4
1508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König/************************************************************************** 2508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König * 3508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König * Copyright 2010 Christian König 4508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König * All Rights Reserved. 5508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König * 6508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König * Permission is hereby granted, free of charge, to any person obtaining a 7508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König * copy of this software and associated documentation files (the 8508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König * "Software"), to deal in the Software without restriction, including 9508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König * without limitation the rights to use, copy, modify, merge, publish, 10508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König * distribute, sub license, and/or sell copies of the Software, and to 11508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König * permit persons to whom the Software is furnished to do so, subject to 12508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König * the following conditions: 13508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König * 14508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König * The above copyright notice and this permission notice (including the 15508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König * next paragraph) shall be included in all copies or substantial portions 16508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König * of the Software. 17508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König * 18508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS 19508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF 20508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. 21508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König * IN NO EVENT SHALL TUNGSTEN GRAPHICS AND/OR ITS SUPPLIERS BE LIABLE FOR 22508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König * ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, 23508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König * TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE 24508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König * SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE. 25508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König * 26508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König **************************************************************************/ 27508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König 28508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König#include <assert.h> 295ed848129cb57269e80caf2c1ca522ae41f4500bChristian König 30508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König#include <pipe/p_context.h> 31508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König#include <pipe/p_screen.h> 325ed848129cb57269e80caf2c1ca522ae41f4500bChristian König 335ed848129cb57269e80caf2c1ca522ae41f4500bChristian König#include <util/u_draw.h> 34508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König#include <util/u_sampler.h> 355ed848129cb57269e80caf2c1ca522ae41f4500bChristian König 36508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König#include <tgsi/tgsi_ureg.h> 375ed848129cb57269e80caf2c1ca522ae41f4500bChristian König 385ed848129cb57269e80caf2c1ca522ae41f4500bChristian König#include "vl_defines.h" 39508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König#include "vl_types.h" 405ed848129cb57269e80caf2c1ca522ae41f4500bChristian König#include "vl_vertex_buffers.h" 415ed848129cb57269e80caf2c1ca522ae41f4500bChristian König#include "vl_idct.h" 42508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König 43508a4a056c3140dc1f90b93acd46c06c30f7094eChristian Königenum VS_OUTPUT 44508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König{ 45508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König VS_O_VPOS, 46be4de05c1093db27b3fca12b782055ab8a1eba13Christian König VS_O_L_ADDR0, 47be4de05c1093db27b3fca12b782055ab8a1eba13Christian König VS_O_L_ADDR1, 48be4de05c1093db27b3fca12b782055ab8a1eba13Christian König VS_O_R_ADDR0, 49be4de05c1093db27b3fca12b782055ab8a1eba13Christian König VS_O_R_ADDR1 50508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König}; 51508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König 523e976ef31a27ca9a23372f4364955f0f0a5c4ef4Christian König/** 533e976ef31a27ca9a23372f4364955f0f0a5c4ef4Christian König * The DCT matrix stored as hex representation of floats. Equal to the following equation: 543e976ef31a27ca9a23372f4364955f0f0a5c4ef4Christian König * for (i = 0; i < 8; ++i) 553e976ef31a27ca9a23372f4364955f0f0a5c4ef4Christian König * for (j = 0; j < 8; ++j) 563e976ef31a27ca9a23372f4364955f0f0a5c4ef4Christian König * if (i == 0) const_matrix[i][j] = 1.0f / sqrtf(8.0f); 573e976ef31a27ca9a23372f4364955f0f0a5c4ef4Christian König * else const_matrix[i][j] = sqrtf(2.0f / 8.0f) * cosf((2 * j + 1) * i * M_PI / (2.0f * 8.0f)); 583e976ef31a27ca9a23372f4364955f0f0a5c4ef4Christian König */ 593e976ef31a27ca9a23372f4364955f0f0a5c4ef4Christian Königstatic const uint32_t const_matrix[8][8] = { 603e976ef31a27ca9a23372f4364955f0f0a5c4ef4Christian König { 0x3eb504f3, 0x3eb504f3, 0x3eb504f3, 0x3eb504f3, 0x3eb504f3, 0x3eb504f3, 0x3eb504f3, 0x3eb504f3 }, 613e976ef31a27ca9a23372f4364955f0f0a5c4ef4Christian König { 0x3efb14be, 0x3ed4db31, 0x3e8e39da, 0x3dc7c5c4, 0xbdc7c5c2, 0xbe8e39d9, 0xbed4db32, 0xbefb14bf }, 623e976ef31a27ca9a23372f4364955f0f0a5c4ef4Christian König { 0x3eec835f, 0x3e43ef15, 0xbe43ef14, 0xbeec835e, 0xbeec835f, 0xbe43ef1a, 0x3e43ef1b, 0x3eec835f }, 633e976ef31a27ca9a23372f4364955f0f0a5c4ef4Christian König { 0x3ed4db31, 0xbdc7c5c2, 0xbefb14bf, 0xbe8e39dd, 0x3e8e39d7, 0x3efb14bf, 0x3dc7c5d0, 0xbed4db34 }, 643e976ef31a27ca9a23372f4364955f0f0a5c4ef4Christian König { 0x3eb504f3, 0xbeb504f3, 0xbeb504f4, 0x3eb504f1, 0x3eb504f3, 0xbeb504f0, 0xbeb504ef, 0x3eb504f4 }, 653e976ef31a27ca9a23372f4364955f0f0a5c4ef4Christian König { 0x3e8e39da, 0xbefb14bf, 0x3dc7c5c8, 0x3ed4db32, 0xbed4db34, 0xbdc7c5bb, 0x3efb14bf, 0xbe8e39d7 }, 663e976ef31a27ca9a23372f4364955f0f0a5c4ef4Christian König { 0x3e43ef15, 0xbeec835f, 0x3eec835f, 0xbe43ef07, 0xbe43ef23, 0x3eec8361, 0xbeec835c, 0x3e43ef25 }, 673e976ef31a27ca9a23372f4364955f0f0a5c4ef4Christian König { 0x3dc7c5c4, 0xbe8e39dd, 0x3ed4db32, 0xbefb14c0, 0x3efb14be, 0xbed4db31, 0x3e8e39ce, 0xbdc7c596 }, 68508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König}; 69508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König 70be4de05c1093db27b3fca12b782055ab8a1eba13Christian Königstatic void 71be4de05c1093db27b3fca12b782055ab8a1eba13Christian Königcalc_addr(struct ureg_program *shader, struct ureg_dst addr[2], 72be4de05c1093db27b3fca12b782055ab8a1eba13Christian König struct ureg_src tc, struct ureg_src start, bool right_side, 73be4de05c1093db27b3fca12b782055ab8a1eba13Christian König bool transposed, float size) 74be4de05c1093db27b3fca12b782055ab8a1eba13Christian König{ 75be4de05c1093db27b3fca12b782055ab8a1eba13Christian König unsigned wm_start = (right_side == transposed) ? TGSI_WRITEMASK_X : TGSI_WRITEMASK_Y; 76be4de05c1093db27b3fca12b782055ab8a1eba13Christian König unsigned sw_start = right_side ? TGSI_SWIZZLE_Y : TGSI_SWIZZLE_X; 77be4de05c1093db27b3fca12b782055ab8a1eba13Christian König 78be4de05c1093db27b3fca12b782055ab8a1eba13Christian König unsigned wm_tc = (right_side == transposed) ? TGSI_WRITEMASK_Y : TGSI_WRITEMASK_X; 79be4de05c1093db27b3fca12b782055ab8a1eba13Christian König unsigned sw_tc = right_side ? TGSI_SWIZZLE_X : TGSI_SWIZZLE_Y; 80be4de05c1093db27b3fca12b782055ab8a1eba13Christian König 81be4de05c1093db27b3fca12b782055ab8a1eba13Christian König /* 82be4de05c1093db27b3fca12b782055ab8a1eba13Christian König * addr[0..1].(start) = right_side ? start.x : tc.x 83be4de05c1093db27b3fca12b782055ab8a1eba13Christian König * addr[0..1].(tc) = right_side ? tc.y : start.y 84be4de05c1093db27b3fca12b782055ab8a1eba13Christian König * addr[0..1].z = tc.z 85be4de05c1093db27b3fca12b782055ab8a1eba13Christian König * addr[1].(start) += 1.0f / scale 86be4de05c1093db27b3fca12b782055ab8a1eba13Christian König */ 87be4de05c1093db27b3fca12b782055ab8a1eba13Christian König ureg_MOV(shader, ureg_writemask(addr[0], wm_start), ureg_scalar(start, sw_start)); 88be4de05c1093db27b3fca12b782055ab8a1eba13Christian König ureg_MOV(shader, ureg_writemask(addr[0], wm_tc), ureg_scalar(tc, sw_tc)); 89be4de05c1093db27b3fca12b782055ab8a1eba13Christian König 90be4de05c1093db27b3fca12b782055ab8a1eba13Christian König ureg_ADD(shader, ureg_writemask(addr[1], wm_start), ureg_scalar(start, sw_start), ureg_imm1f(shader, 1.0f / size)); 91be4de05c1093db27b3fca12b782055ab8a1eba13Christian König ureg_MOV(shader, ureg_writemask(addr[1], wm_tc), ureg_scalar(tc, sw_tc)); 92be4de05c1093db27b3fca12b782055ab8a1eba13Christian König} 93be4de05c1093db27b3fca12b782055ab8a1eba13Christian König 947f04fe5338d0846ec9a6003033da5357d2785c8bChristian Königstatic void 957f04fe5338d0846ec9a6003033da5357d2785c8bChristian Königincrement_addr(struct ureg_program *shader, struct ureg_dst daddr[2], 967f04fe5338d0846ec9a6003033da5357d2785c8bChristian König struct ureg_src saddr[2], bool right_side, bool transposed, 977f04fe5338d0846ec9a6003033da5357d2785c8bChristian König int pos, float size) 987f04fe5338d0846ec9a6003033da5357d2785c8bChristian König{ 997f04fe5338d0846ec9a6003033da5357d2785c8bChristian König unsigned wm_start = (right_side == transposed) ? TGSI_WRITEMASK_X : TGSI_WRITEMASK_Y; 1007f04fe5338d0846ec9a6003033da5357d2785c8bChristian König unsigned wm_tc = (right_side == transposed) ? TGSI_WRITEMASK_Y : TGSI_WRITEMASK_X; 1017f04fe5338d0846ec9a6003033da5357d2785c8bChristian König 1027f04fe5338d0846ec9a6003033da5357d2785c8bChristian König /* 1037f04fe5338d0846ec9a6003033da5357d2785c8bChristian König * daddr[0..1].(start) = saddr[0..1].(start) 1047f04fe5338d0846ec9a6003033da5357d2785c8bChristian König * daddr[0..1].(tc) = saddr[0..1].(tc) 1057f04fe5338d0846ec9a6003033da5357d2785c8bChristian König */ 1067f04fe5338d0846ec9a6003033da5357d2785c8bChristian König 1077f04fe5338d0846ec9a6003033da5357d2785c8bChristian König ureg_MOV(shader, ureg_writemask(daddr[0], wm_start), saddr[0]); 1087f04fe5338d0846ec9a6003033da5357d2785c8bChristian König ureg_ADD(shader, ureg_writemask(daddr[0], wm_tc), saddr[0], ureg_imm1f(shader, pos / size)); 1097f04fe5338d0846ec9a6003033da5357d2785c8bChristian König ureg_MOV(shader, ureg_writemask(daddr[1], wm_start), saddr[1]); 1107f04fe5338d0846ec9a6003033da5357d2785c8bChristian König ureg_ADD(shader, ureg_writemask(daddr[1], wm_tc), saddr[1], ureg_imm1f(shader, pos / size)); 1117f04fe5338d0846ec9a6003033da5357d2785c8bChristian König} 1127f04fe5338d0846ec9a6003033da5357d2785c8bChristian König 1137f04fe5338d0846ec9a6003033da5357d2785c8bChristian Königstatic void 114b4837a53d365bd1bd5f50b3fb40910eeaac869a5Christian Königfetch_four(struct ureg_program *shader, struct ureg_dst m[2], struct ureg_src addr[2], 115b4837a53d365bd1bd5f50b3fb40910eeaac869a5Christian König struct ureg_src sampler, bool resource3d) 1167f04fe5338d0846ec9a6003033da5357d2785c8bChristian König{ 117b4837a53d365bd1bd5f50b3fb40910eeaac869a5Christian König ureg_TEX(shader, m[0], resource3d ? TGSI_TEXTURE_3D : TGSI_TEXTURE_2D, addr[0], sampler); 118b4837a53d365bd1bd5f50b3fb40910eeaac869a5Christian König ureg_TEX(shader, m[1], resource3d ? TGSI_TEXTURE_3D : TGSI_TEXTURE_2D, addr[1], sampler); 1197f04fe5338d0846ec9a6003033da5357d2785c8bChristian König} 1207f04fe5338d0846ec9a6003033da5357d2785c8bChristian König 1217f04fe5338d0846ec9a6003033da5357d2785c8bChristian Königstatic void 1227f04fe5338d0846ec9a6003033da5357d2785c8bChristian Königmatrix_mul(struct ureg_program *shader, struct ureg_dst dst, struct ureg_dst l[2], struct ureg_dst r[2]) 1237f04fe5338d0846ec9a6003033da5357d2785c8bChristian König{ 1247f04fe5338d0846ec9a6003033da5357d2785c8bChristian König struct ureg_dst tmp; 1257f04fe5338d0846ec9a6003033da5357d2785c8bChristian König 1267f04fe5338d0846ec9a6003033da5357d2785c8bChristian König tmp = ureg_DECL_temporary(shader); 1277f04fe5338d0846ec9a6003033da5357d2785c8bChristian König 1287f04fe5338d0846ec9a6003033da5357d2785c8bChristian König /* 1297f04fe5338d0846ec9a6003033da5357d2785c8bChristian König * tmp.xy = dot4(m[0][0..1], m[1][0..1]) 1307f04fe5338d0846ec9a6003033da5357d2785c8bChristian König * dst = tmp.x + tmp.y 1317f04fe5338d0846ec9a6003033da5357d2785c8bChristian König */ 1327f04fe5338d0846ec9a6003033da5357d2785c8bChristian König ureg_DP4(shader, ureg_writemask(tmp, TGSI_WRITEMASK_X), ureg_src(l[0]), ureg_src(r[0])); 1337f04fe5338d0846ec9a6003033da5357d2785c8bChristian König ureg_DP4(shader, ureg_writemask(tmp, TGSI_WRITEMASK_Y), ureg_src(l[1]), ureg_src(r[1])); 1347f04fe5338d0846ec9a6003033da5357d2785c8bChristian König ureg_ADD(shader, dst, 1357f04fe5338d0846ec9a6003033da5357d2785c8bChristian König ureg_scalar(ureg_src(tmp), TGSI_SWIZZLE_X), 1367f04fe5338d0846ec9a6003033da5357d2785c8bChristian König ureg_scalar(ureg_src(tmp), TGSI_SWIZZLE_Y)); 1377f04fe5338d0846ec9a6003033da5357d2785c8bChristian König 1387f04fe5338d0846ec9a6003033da5357d2785c8bChristian König ureg_release_temporary(shader, tmp); 1397f04fe5338d0846ec9a6003033da5357d2785c8bChristian König} 1407f04fe5338d0846ec9a6003033da5357d2785c8bChristian König 141508a4a056c3140dc1f90b93acd46c06c30f7094eChristian Königstatic void * 142ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian Königcreate_mismatch_vert_shader(struct vl_idct *idct) 143ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König{ 144ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König struct ureg_program *shader; 145ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König struct ureg_src vrect, vpos; 146ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König struct ureg_src scale; 147ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König struct ureg_dst t_tex; 148ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König struct ureg_dst o_vpos, o_addr[2]; 149ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König 150ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König shader = ureg_create(TGSI_PROCESSOR_VERTEX); 151ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König if (!shader) 152ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König return NULL; 153ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König 154ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König vrect = ureg_DECL_vs_input(shader, VS_I_RECT); 155ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König vpos = ureg_DECL_vs_input(shader, VS_I_VPOS); 156ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König 157ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König t_tex = ureg_DECL_temporary(shader); 158ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König 159ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König o_vpos = ureg_DECL_output(shader, TGSI_SEMANTIC_POSITION, VS_O_VPOS); 160ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König 161ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König o_addr[0] = ureg_DECL_output(shader, TGSI_SEMANTIC_GENERIC, VS_O_L_ADDR0); 162ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König o_addr[1] = ureg_DECL_output(shader, TGSI_SEMANTIC_GENERIC, VS_O_L_ADDR1); 163ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König 164ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König /* 165ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König * scale = (BLOCK_WIDTH, BLOCK_HEIGHT) / (dst.width, dst.height) 166ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König * 167ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König * t_vpos = vpos + 7 / BLOCK_WIDTH 168ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König * o_vpos.xy = t_vpos * scale 169ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König * 170ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König * o_addr = calc_addr(...) 171ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König * 172ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König */ 173ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König 174ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König scale = ureg_imm2f(shader, 175ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König (float)BLOCK_WIDTH / idct->buffer_width, 176ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König (float)BLOCK_HEIGHT / idct->buffer_height); 177ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König 178ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König ureg_MAD(shader, ureg_writemask(o_vpos, TGSI_WRITEMASK_XY), vpos, scale, scale); 179ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König ureg_MOV(shader, ureg_writemask(o_vpos, TGSI_WRITEMASK_ZW), ureg_imm1f(shader, 1.0f)); 180ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König 181ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König ureg_MUL(shader, ureg_writemask(t_tex, TGSI_WRITEMASK_XY), vpos, scale); 182ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König calc_addr(shader, o_addr, ureg_src(t_tex), ureg_src(t_tex), false, false, idct->buffer_width / 4); 183ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König 184ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König ureg_release_temporary(shader, t_tex); 185ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König 186ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König ureg_END(shader); 187ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König 188ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König return ureg_create_shader_and_destroy(shader, idct->pipe); 189ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König} 190ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König 191ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian Königstatic void * 192ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian Königcreate_mismatch_frag_shader(struct vl_idct *idct) 193ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König{ 194ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König struct ureg_program *shader; 195ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König 196ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König struct ureg_src addr[2]; 197ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König 198ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König struct ureg_dst m[8][2]; 199ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König struct ureg_dst fragment; 200ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König 201ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König unsigned i; 202ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König 203ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König shader = ureg_create(TGSI_PROCESSOR_FRAGMENT); 204ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König if (!shader) 205ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König return NULL; 206ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König 207ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König addr[0] = ureg_DECL_fs_input(shader, TGSI_SEMANTIC_GENERIC, VS_O_L_ADDR0, TGSI_INTERPOLATE_LINEAR); 208ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König addr[1] = ureg_DECL_fs_input(shader, TGSI_SEMANTIC_GENERIC, VS_O_L_ADDR1, TGSI_INTERPOLATE_LINEAR); 209ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König 210ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König fragment = ureg_DECL_output(shader, TGSI_SEMANTIC_COLOR, 0); 211ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König 212ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König for (i = 0; i < 8; ++i) { 213ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König m[i][0] = ureg_DECL_temporary(shader); 214ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König m[i][1] = ureg_DECL_temporary(shader); 215ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König } 216ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König 217ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König for (i = 0; i < 8; ++i) { 218ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König increment_addr(shader, m[i], addr, false, false, i, idct->buffer_height); 219ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König } 220ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König 221ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König for (i = 0; i < 8; ++i) { 222ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König struct ureg_src s_addr[2] = { ureg_src(m[i][0]), ureg_src(m[i][1]) }; 223ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König fetch_four(shader, m[i], s_addr, ureg_DECL_sampler(shader, 0), false); 224ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König } 225ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König 226ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König for (i = 1; i < 8; ++i) { 227ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König ureg_ADD(shader, m[0][0], ureg_src(m[0][0]), ureg_src(m[i][0])); 228ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König ureg_ADD(shader, m[0][1], ureg_src(m[0][1]), ureg_src(m[i][1])); 229ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König } 230ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König 231ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König ureg_ADD(shader, m[0][0], ureg_src(m[0][0]), ureg_src(m[0][1])); 232ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König ureg_DP4(shader, m[0][0], ureg_abs(ureg_src(m[0][0])), ureg_imm1f(shader, 1 << 14)); 233ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König 234ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König ureg_MUL(shader, ureg_writemask(m[0][0], TGSI_WRITEMASK_W), ureg_abs(ureg_src(m[7][1])), ureg_imm1f(shader, 1 << 14)); 235ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König ureg_FRC(shader, m[0][0], ureg_src(m[0][0])); 236ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König ureg_SGT(shader, m[0][0], ureg_imm1f(shader, 0.5f), ureg_abs(ureg_src(m[0][0]))); 237ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König 238ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König ureg_CMP(shader, ureg_writemask(m[0][0], TGSI_WRITEMASK_W), ureg_negate(ureg_src(m[0][0])), 239ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König ureg_imm1f(shader, 1.0f / (1 << 15)), ureg_imm1f(shader, -1.0f / (1 << 15))); 240ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König ureg_MUL(shader, ureg_writemask(m[0][0], TGSI_WRITEMASK_W), ureg_src(m[0][0]), 241ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König ureg_scalar(ureg_src(m[0][0]), TGSI_SWIZZLE_X)); 242ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König 243ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König ureg_MOV(shader, ureg_writemask(fragment, TGSI_WRITEMASK_XYZ), ureg_src(m[7][1])); 244ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König ureg_ADD(shader, ureg_writemask(fragment, TGSI_WRITEMASK_W), ureg_src(m[0][0]), ureg_src(m[7][1])); 245ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König 246ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König for (i = 0; i < 8; ++i) { 247ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König ureg_release_temporary(shader, m[i][0]); 248ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König ureg_release_temporary(shader, m[i][1]); 249ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König } 250ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König 251ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König ureg_END(shader); 252ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König 253ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König return ureg_create_shader_and_destroy(shader, idct->pipe); 254ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König} 255ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König 256ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian Königstatic void * 2577f04fe5338d0846ec9a6003033da5357d2785c8bChristian Königcreate_stage1_vert_shader(struct vl_idct *idct) 258508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König{ 259508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König struct ureg_program *shader; 2603511780a43077d1359bd491eadb4ab9b3b86795aChristian König struct ureg_src vrect, vpos; 2613511780a43077d1359bd491eadb4ab9b3b86795aChristian König struct ureg_src scale; 262be4de05c1093db27b3fca12b782055ab8a1eba13Christian König struct ureg_dst t_tex, t_start; 263be4de05c1093db27b3fca12b782055ab8a1eba13Christian König struct ureg_dst o_vpos, o_l_addr[2], o_r_addr[2]; 264508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König 265508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König shader = ureg_create(TGSI_PROCESSOR_VERTEX); 266508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König if (!shader) 267508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König return NULL; 268508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König 269508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König vrect = ureg_DECL_vs_input(shader, VS_I_RECT); 270508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König vpos = ureg_DECL_vs_input(shader, VS_I_VPOS); 271508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König 2727f04fe5338d0846ec9a6003033da5357d2785c8bChristian König t_tex = ureg_DECL_temporary(shader); 2737f04fe5338d0846ec9a6003033da5357d2785c8bChristian König t_start = ureg_DECL_temporary(shader); 2747f04fe5338d0846ec9a6003033da5357d2785c8bChristian König 275508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König o_vpos = ureg_DECL_output(shader, TGSI_SEMANTIC_POSITION, VS_O_VPOS); 276be4de05c1093db27b3fca12b782055ab8a1eba13Christian König 277be4de05c1093db27b3fca12b782055ab8a1eba13Christian König o_l_addr[0] = ureg_DECL_output(shader, TGSI_SEMANTIC_GENERIC, VS_O_L_ADDR0); 278be4de05c1093db27b3fca12b782055ab8a1eba13Christian König o_l_addr[1] = ureg_DECL_output(shader, TGSI_SEMANTIC_GENERIC, VS_O_L_ADDR1); 279be4de05c1093db27b3fca12b782055ab8a1eba13Christian König 280be4de05c1093db27b3fca12b782055ab8a1eba13Christian König o_r_addr[0] = ureg_DECL_output(shader, TGSI_SEMANTIC_GENERIC, VS_O_R_ADDR0); 281be4de05c1093db27b3fca12b782055ab8a1eba13Christian König o_r_addr[1] = ureg_DECL_output(shader, TGSI_SEMANTIC_GENERIC, VS_O_R_ADDR1); 282508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König 283508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König /* 28412836fbcfad7f317b1f5aa5e46f9946894bf040cChristian König * scale = (BLOCK_WIDTH, BLOCK_HEIGHT) / (dst.width, dst.height) 285508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König * 2863511780a43077d1359bd491eadb4ab9b3b86795aChristian König * t_vpos = vpos + vrect 2873511780a43077d1359bd491eadb4ab9b3b86795aChristian König * o_vpos.xy = t_vpos * scale 288310eea52ca1e997295c84163066cc5d0fd4f8cf6Christian König * o_vpos.zw = vpos 289508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König * 2903511780a43077d1359bd491eadb4ab9b3b86795aChristian König * o_l_addr = calc_addr(...) 2913511780a43077d1359bd491eadb4ab9b3b86795aChristian König * o_r_addr = calc_addr(...) 2923511780a43077d1359bd491eadb4ab9b3b86795aChristian König * 293508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König */ 294310eea52ca1e997295c84163066cc5d0fd4f8cf6Christian König 29512836fbcfad7f317b1f5aa5e46f9946894bf040cChristian König scale = ureg_imm2f(shader, 29622b4acb2069a368e986805d3b43395172ebf9146Christian König (float)BLOCK_WIDTH / idct->buffer_width, 29722b4acb2069a368e986805d3b43395172ebf9146Christian König (float)BLOCK_HEIGHT / idct->buffer_height); 29812836fbcfad7f317b1f5aa5e46f9946894bf040cChristian König 2993511780a43077d1359bd491eadb4ab9b3b86795aChristian König ureg_ADD(shader, ureg_writemask(t_tex, TGSI_WRITEMASK_XY), vpos, vrect); 3003511780a43077d1359bd491eadb4ab9b3b86795aChristian König ureg_MUL(shader, ureg_writemask(t_tex, TGSI_WRITEMASK_XY), ureg_src(t_tex), scale); 301ab130400cf91ab471e265e58193c95f04c7aeedaChristian König 3023511780a43077d1359bd491eadb4ab9b3b86795aChristian König ureg_MOV(shader, ureg_writemask(o_vpos, TGSI_WRITEMASK_XY), ureg_src(t_tex)); 3033511780a43077d1359bd491eadb4ab9b3b86795aChristian König ureg_MOV(shader, ureg_writemask(o_vpos, TGSI_WRITEMASK_ZW), ureg_imm1f(shader, 1.0f)); 304f853ea007816cdad4395b42388e12cd65bb8eb43Christian König 3053511780a43077d1359bd491eadb4ab9b3b86795aChristian König ureg_MUL(shader, ureg_writemask(t_start, TGSI_WRITEMASK_XY), vpos, scale); 306508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König 3077f04fe5338d0846ec9a6003033da5357d2785c8bChristian König calc_addr(shader, o_l_addr, ureg_src(t_tex), ureg_src(t_start), false, false, idct->buffer_width / 4); 3087f04fe5338d0846ec9a6003033da5357d2785c8bChristian König calc_addr(shader, o_r_addr, vrect, ureg_imm1f(shader, 0.0f), true, true, BLOCK_WIDTH / 4); 309be4de05c1093db27b3fca12b782055ab8a1eba13Christian König 310be4de05c1093db27b3fca12b782055ab8a1eba13Christian König ureg_release_temporary(shader, t_tex); 311be4de05c1093db27b3fca12b782055ab8a1eba13Christian König ureg_release_temporary(shader, t_start); 312508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König 313508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König ureg_END(shader); 314508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König 315508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König return ureg_create_shader_and_destroy(shader, idct->pipe); 316508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König} 317508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König 318508a4a056c3140dc1f90b93acd46c06c30f7094eChristian Königstatic void * 3197f04fe5338d0846ec9a6003033da5357d2785c8bChristian Königcreate_stage1_frag_shader(struct vl_idct *idct) 320508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König{ 321508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König struct ureg_program *shader; 322cfe489b89723117e56674c2be7761c201f8d78ffChristian König 323f780626c35c7c3cac2e9aa7c2ec77ca587d6ab95Christian König struct ureg_src l_addr[2], r_addr[2]; 324cfe489b89723117e56674c2be7761c201f8d78ffChristian König 325f780626c35c7c3cac2e9aa7c2ec77ca587d6ab95Christian König struct ureg_dst l[4][2], r[2]; 326fcf765620d803b376582afb618b1f643242b641bChristian König struct ureg_dst fragment[idct->nr_of_render_targets]; 32712836fbcfad7f317b1f5aa5e46f9946894bf040cChristian König 3283db6514357a7c634045ae7bc7bba7d7dbf9d58c5Christian König int i, j; 329508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König 330508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König shader = ureg_create(TGSI_PROCESSOR_FRAGMENT); 331508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König if (!shader) 332508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König return NULL; 333508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König 334be4de05c1093db27b3fca12b782055ab8a1eba13Christian König l_addr[0] = ureg_DECL_fs_input(shader, TGSI_SEMANTIC_GENERIC, VS_O_L_ADDR0, TGSI_INTERPOLATE_LINEAR); 335be4de05c1093db27b3fca12b782055ab8a1eba13Christian König l_addr[1] = ureg_DECL_fs_input(shader, TGSI_SEMANTIC_GENERIC, VS_O_L_ADDR1, TGSI_INTERPOLATE_LINEAR); 336be4de05c1093db27b3fca12b782055ab8a1eba13Christian König 337be4de05c1093db27b3fca12b782055ab8a1eba13Christian König r_addr[0] = ureg_DECL_fs_input(shader, TGSI_SEMANTIC_GENERIC, VS_O_R_ADDR0, TGSI_INTERPOLATE_LINEAR); 338be4de05c1093db27b3fca12b782055ab8a1eba13Christian König r_addr[1] = ureg_DECL_fs_input(shader, TGSI_SEMANTIC_GENERIC, VS_O_R_ADDR1, TGSI_INTERPOLATE_LINEAR); 339cfe489b89723117e56674c2be7761c201f8d78ffChristian König 340fcf765620d803b376582afb618b1f643242b641bChristian König for (i = 0; i < idct->nr_of_render_targets; ++i) 341e742a1043dbd56fe11f0490cb74b7a738bab2238Christian König fragment[i] = ureg_DECL_output(shader, TGSI_SEMANTIC_COLOR, i); 342e742a1043dbd56fe11f0490cb74b7a738bab2238Christian König 34374c71f09f3d321963b738acfb0bfd30b1e1efaebChristian König for (i = 0; i < 4; ++i) { 344f780626c35c7c3cac2e9aa7c2ec77ca587d6ab95Christian König l[i][0] = ureg_DECL_temporary(shader); 345f780626c35c7c3cac2e9aa7c2ec77ca587d6ab95Christian König l[i][1] = ureg_DECL_temporary(shader); 346f780626c35c7c3cac2e9aa7c2ec77ca587d6ab95Christian König } 3474a8420513d653cd2fccf93a51315120a1a5d0fccChristian König 348f780626c35c7c3cac2e9aa7c2ec77ca587d6ab95Christian König r[0] = ureg_DECL_temporary(shader); 349f780626c35c7c3cac2e9aa7c2ec77ca587d6ab95Christian König r[1] = ureg_DECL_temporary(shader); 350f780626c35c7c3cac2e9aa7c2ec77ca587d6ab95Christian König 3513db6514357a7c634045ae7bc7bba7d7dbf9d58c5Christian König for (i = 0; i < 4; ++i) { 3523db6514357a7c634045ae7bc7bba7d7dbf9d58c5Christian König increment_addr(shader, l[i], l_addr, false, false, i - 2, idct->buffer_height); 353f780626c35c7c3cac2e9aa7c2ec77ca587d6ab95Christian König } 354f780626c35c7c3cac2e9aa7c2ec77ca587d6ab95Christian König 355f780626c35c7c3cac2e9aa7c2ec77ca587d6ab95Christian König for (i = 0; i < 4; ++i) { 3563db6514357a7c634045ae7bc7bba7d7dbf9d58c5Christian König struct ureg_src s_addr[2] = { ureg_src(l[i][0]), ureg_src(l[i][1]) }; 357ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König fetch_four(shader, l[i], s_addr, ureg_DECL_sampler(shader, 0), false); 35874c71f09f3d321963b738acfb0bfd30b1e1efaebChristian König } 359c8236aaf7056bd8645804e71596d2d6460e62d15Christian König 360fcf765620d803b376582afb618b1f643242b641bChristian König for (i = 0; i < idct->nr_of_render_targets; ++i) { 3613db6514357a7c634045ae7bc7bba7d7dbf9d58c5Christian König increment_addr(shader, r, r_addr, true, true, i - (signed)idct->nr_of_render_targets / 2, BLOCK_HEIGHT); 362a984c67b316ac2ca9aaf6d38a3127cf3d61a249eChristian König 363f780626c35c7c3cac2e9aa7c2ec77ca587d6ab95Christian König struct ureg_src s_addr[2] = { ureg_src(r[0]), ureg_src(r[1]) }; 364ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König fetch_four(shader, r, s_addr, ureg_DECL_sampler(shader, 1), false); 365a984c67b316ac2ca9aaf6d38a3127cf3d61a249eChristian König 36674c71f09f3d321963b738acfb0bfd30b1e1efaebChristian König for (j = 0; j < 4; ++j) { 36774c71f09f3d321963b738acfb0bfd30b1e1efaebChristian König matrix_mul(shader, ureg_writemask(fragment[i], TGSI_WRITEMASK_X << j), l[j], r); 36874c71f09f3d321963b738acfb0bfd30b1e1efaebChristian König } 369e742a1043dbd56fe11f0490cb74b7a738bab2238Christian König } 37074c71f09f3d321963b738acfb0bfd30b1e1efaebChristian König 37174c71f09f3d321963b738acfb0bfd30b1e1efaebChristian König for (i = 0; i < 4; ++i) { 37274c71f09f3d321963b738acfb0bfd30b1e1efaebChristian König ureg_release_temporary(shader, l[i][0]); 37374c71f09f3d321963b738acfb0bfd30b1e1efaebChristian König ureg_release_temporary(shader, l[i][1]); 37474c71f09f3d321963b738acfb0bfd30b1e1efaebChristian König } 375f780626c35c7c3cac2e9aa7c2ec77ca587d6ab95Christian König ureg_release_temporary(shader, r[0]); 376f780626c35c7c3cac2e9aa7c2ec77ca587d6ab95Christian König ureg_release_temporary(shader, r[1]); 377be4de05c1093db27b3fca12b782055ab8a1eba13Christian König 378be4de05c1093db27b3fca12b782055ab8a1eba13Christian König ureg_END(shader); 379be4de05c1093db27b3fca12b782055ab8a1eba13Christian König 380be4de05c1093db27b3fca12b782055ab8a1eba13Christian König return ureg_create_shader_and_destroy(shader, idct->pipe); 381be4de05c1093db27b3fca12b782055ab8a1eba13Christian König} 382be4de05c1093db27b3fca12b782055ab8a1eba13Christian König 3837f04fe5338d0846ec9a6003033da5357d2785c8bChristian Königvoid 3847f04fe5338d0846ec9a6003033da5357d2785c8bChristian Königvl_idct_stage2_vert_shader(struct vl_idct *idct, struct ureg_program *shader, 3857f04fe5338d0846ec9a6003033da5357d2785c8bChristian König unsigned first_output, struct ureg_dst tex) 386be4de05c1093db27b3fca12b782055ab8a1eba13Christian König{ 3877f04fe5338d0846ec9a6003033da5357d2785c8bChristian König struct ureg_src vrect, vpos; 3887f04fe5338d0846ec9a6003033da5357d2785c8bChristian König struct ureg_src scale; 3897f04fe5338d0846ec9a6003033da5357d2785c8bChristian König struct ureg_dst t_start; 3907f04fe5338d0846ec9a6003033da5357d2785c8bChristian König struct ureg_dst o_l_addr[2], o_r_addr[2]; 3917f04fe5338d0846ec9a6003033da5357d2785c8bChristian König 3927f04fe5338d0846ec9a6003033da5357d2785c8bChristian König vrect = ureg_DECL_vs_input(shader, VS_I_RECT); 3937f04fe5338d0846ec9a6003033da5357d2785c8bChristian König vpos = ureg_DECL_vs_input(shader, VS_I_VPOS); 394be4de05c1093db27b3fca12b782055ab8a1eba13Christian König 3957f04fe5338d0846ec9a6003033da5357d2785c8bChristian König t_start = ureg_DECL_temporary(shader); 3967f04fe5338d0846ec9a6003033da5357d2785c8bChristian König 3977f04fe5338d0846ec9a6003033da5357d2785c8bChristian König --first_output; 3987f04fe5338d0846ec9a6003033da5357d2785c8bChristian König 3997f04fe5338d0846ec9a6003033da5357d2785c8bChristian König o_l_addr[0] = ureg_DECL_output(shader, TGSI_SEMANTIC_GENERIC, first_output + VS_O_L_ADDR0); 4007f04fe5338d0846ec9a6003033da5357d2785c8bChristian König o_l_addr[1] = ureg_DECL_output(shader, TGSI_SEMANTIC_GENERIC, first_output + VS_O_L_ADDR1); 4017f04fe5338d0846ec9a6003033da5357d2785c8bChristian König 4027f04fe5338d0846ec9a6003033da5357d2785c8bChristian König o_r_addr[0] = ureg_DECL_output(shader, TGSI_SEMANTIC_GENERIC, first_output + VS_O_R_ADDR0); 4037f04fe5338d0846ec9a6003033da5357d2785c8bChristian König o_r_addr[1] = ureg_DECL_output(shader, TGSI_SEMANTIC_GENERIC, first_output + VS_O_R_ADDR1); 4047f04fe5338d0846ec9a6003033da5357d2785c8bChristian König 4057f04fe5338d0846ec9a6003033da5357d2785c8bChristian König scale = ureg_imm2f(shader, 4067f04fe5338d0846ec9a6003033da5357d2785c8bChristian König (float)BLOCK_WIDTH / idct->buffer_width, 4077f04fe5338d0846ec9a6003033da5357d2785c8bChristian König (float)BLOCK_HEIGHT / idct->buffer_height); 4087f04fe5338d0846ec9a6003033da5357d2785c8bChristian König 4097f04fe5338d0846ec9a6003033da5357d2785c8bChristian König ureg_MUL(shader, ureg_writemask(tex, TGSI_WRITEMASK_Z), 4107f04fe5338d0846ec9a6003033da5357d2785c8bChristian König ureg_scalar(vrect, TGSI_SWIZZLE_X), 4117f04fe5338d0846ec9a6003033da5357d2785c8bChristian König ureg_imm1f(shader, BLOCK_WIDTH / idct->nr_of_render_targets)); 4127f04fe5338d0846ec9a6003033da5357d2785c8bChristian König ureg_MUL(shader, ureg_writemask(t_start, TGSI_WRITEMASK_XY), vpos, scale); 4137f04fe5338d0846ec9a6003033da5357d2785c8bChristian König 4147f04fe5338d0846ec9a6003033da5357d2785c8bChristian König calc_addr(shader, o_l_addr, vrect, ureg_imm1f(shader, 0.0f), false, false, BLOCK_WIDTH / 4); 4157f04fe5338d0846ec9a6003033da5357d2785c8bChristian König calc_addr(shader, o_r_addr, ureg_src(tex), ureg_src(t_start), true, false, idct->buffer_height / 4); 416b4837a53d365bd1bd5f50b3fb40910eeaac869a5Christian König 417b4837a53d365bd1bd5f50b3fb40910eeaac869a5Christian König ureg_MOV(shader, ureg_writemask(o_r_addr[0], TGSI_WRITEMASK_Z), ureg_src(tex)); 418b4837a53d365bd1bd5f50b3fb40910eeaac869a5Christian König ureg_MOV(shader, ureg_writemask(o_r_addr[1], TGSI_WRITEMASK_Z), ureg_src(tex)); 4197f04fe5338d0846ec9a6003033da5357d2785c8bChristian König} 4207f04fe5338d0846ec9a6003033da5357d2785c8bChristian König 4217f04fe5338d0846ec9a6003033da5357d2785c8bChristian Königvoid 4227f04fe5338d0846ec9a6003033da5357d2785c8bChristian Königvl_idct_stage2_frag_shader(struct vl_idct *idct, struct ureg_program *shader, 4237f04fe5338d0846ec9a6003033da5357d2785c8bChristian König unsigned first_input, struct ureg_dst fragment) 4247f04fe5338d0846ec9a6003033da5357d2785c8bChristian König{ 425be4de05c1093db27b3fca12b782055ab8a1eba13Christian König struct ureg_src l_addr[2], r_addr[2]; 426be4de05c1093db27b3fca12b782055ab8a1eba13Christian König 427be4de05c1093db27b3fca12b782055ab8a1eba13Christian König struct ureg_dst l[2], r[2]; 428be4de05c1093db27b3fca12b782055ab8a1eba13Christian König 4297f04fe5338d0846ec9a6003033da5357d2785c8bChristian König --first_input; 430be4de05c1093db27b3fca12b782055ab8a1eba13Christian König 4317f04fe5338d0846ec9a6003033da5357d2785c8bChristian König l_addr[0] = ureg_DECL_fs_input(shader, TGSI_SEMANTIC_GENERIC, first_input + VS_O_L_ADDR0, TGSI_INTERPOLATE_LINEAR); 4327f04fe5338d0846ec9a6003033da5357d2785c8bChristian König l_addr[1] = ureg_DECL_fs_input(shader, TGSI_SEMANTIC_GENERIC, first_input + VS_O_L_ADDR1, TGSI_INTERPOLATE_LINEAR); 433be4de05c1093db27b3fca12b782055ab8a1eba13Christian König 4347f04fe5338d0846ec9a6003033da5357d2785c8bChristian König r_addr[0] = ureg_DECL_fs_input(shader, TGSI_SEMANTIC_GENERIC, first_input + VS_O_R_ADDR0, TGSI_INTERPOLATE_LINEAR); 4357f04fe5338d0846ec9a6003033da5357d2785c8bChristian König r_addr[1] = ureg_DECL_fs_input(shader, TGSI_SEMANTIC_GENERIC, first_input + VS_O_R_ADDR1, TGSI_INTERPOLATE_LINEAR); 436be4de05c1093db27b3fca12b782055ab8a1eba13Christian König 437f780626c35c7c3cac2e9aa7c2ec77ca587d6ab95Christian König l[0] = ureg_DECL_temporary(shader); 438f780626c35c7c3cac2e9aa7c2ec77ca587d6ab95Christian König l[1] = ureg_DECL_temporary(shader); 439f780626c35c7c3cac2e9aa7c2ec77ca587d6ab95Christian König r[0] = ureg_DECL_temporary(shader); 440f780626c35c7c3cac2e9aa7c2ec77ca587d6ab95Christian König r[1] = ureg_DECL_temporary(shader); 441f780626c35c7c3cac2e9aa7c2ec77ca587d6ab95Christian König 442ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König fetch_four(shader, l, l_addr, ureg_DECL_sampler(shader, 1), false); 443ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König fetch_four(shader, r, r_addr, ureg_DECL_sampler(shader, 0), true); 444be4de05c1093db27b3fca12b782055ab8a1eba13Christian König 4457f04fe5338d0846ec9a6003033da5357d2785c8bChristian König matrix_mul(shader, fragment, l, r); 446be4de05c1093db27b3fca12b782055ab8a1eba13Christian König 447be4de05c1093db27b3fca12b782055ab8a1eba13Christian König ureg_release_temporary(shader, l[0]); 448be4de05c1093db27b3fca12b782055ab8a1eba13Christian König ureg_release_temporary(shader, l[1]); 449be4de05c1093db27b3fca12b782055ab8a1eba13Christian König ureg_release_temporary(shader, r[0]); 450be4de05c1093db27b3fca12b782055ab8a1eba13Christian König ureg_release_temporary(shader, r[1]); 451508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König} 452508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König 453508a4a056c3140dc1f90b93acd46c06c30f7094eChristian Königstatic bool 45459774e5c7a2756c5c430fc74bc80ea75d54f594dChristian Königinit_shaders(struct vl_idct *idct) 455508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König{ 456ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König idct->vs_mismatch = create_mismatch_vert_shader(idct); 457ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König if (!idct->vs_mismatch) 458ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König goto error_vs_mismatch; 459ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König 460ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König idct->fs_mismatch = create_mismatch_frag_shader(idct); 461ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König if (!idct->fs_mismatch) 462ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König goto error_fs_mismatch; 463ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König 4647f04fe5338d0846ec9a6003033da5357d2785c8bChristian König idct->vs = create_stage1_vert_shader(idct); 4657f04fe5338d0846ec9a6003033da5357d2785c8bChristian König if (!idct->vs) 4667f04fe5338d0846ec9a6003033da5357d2785c8bChristian König goto error_vs; 467be4de05c1093db27b3fca12b782055ab8a1eba13Christian König 4687f04fe5338d0846ec9a6003033da5357d2785c8bChristian König idct->fs = create_stage1_frag_shader(idct); 4697f04fe5338d0846ec9a6003033da5357d2785c8bChristian König if (!idct->fs) 4707f04fe5338d0846ec9a6003033da5357d2785c8bChristian König goto error_fs; 4718330bc29dda71c41c56b3c1989334823ae8779d4Christian König 4728330bc29dda71c41c56b3c1989334823ae8779d4Christian König return true; 4738330bc29dda71c41c56b3c1989334823ae8779d4Christian König 4747f04fe5338d0846ec9a6003033da5357d2785c8bChristian Königerror_fs: 4757f04fe5338d0846ec9a6003033da5357d2785c8bChristian König idct->pipe->delete_vs_state(idct->pipe, idct->vs); 4768330bc29dda71c41c56b3c1989334823ae8779d4Christian König 4777f04fe5338d0846ec9a6003033da5357d2785c8bChristian Königerror_vs: 478ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König idct->pipe->delete_vs_state(idct->pipe, idct->vs_mismatch); 479ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König 480ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian Königerror_fs_mismatch: 481ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König idct->pipe->delete_vs_state(idct->pipe, idct->fs); 482ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König 483ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian Königerror_vs_mismatch: 4848330bc29dda71c41c56b3c1989334823ae8779d4Christian König return false; 485508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König} 486508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König 487508a4a056c3140dc1f90b93acd46c06c30f7094eChristian Königstatic void 488508a4a056c3140dc1f90b93acd46c06c30f7094eChristian Königcleanup_shaders(struct vl_idct *idct) 489508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König{ 490ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König idct->pipe->delete_vs_state(idct->pipe, idct->vs_mismatch); 491ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König idct->pipe->delete_fs_state(idct->pipe, idct->fs_mismatch); 4927f04fe5338d0846ec9a6003033da5357d2785c8bChristian König idct->pipe->delete_vs_state(idct->pipe, idct->vs); 4937f04fe5338d0846ec9a6003033da5357d2785c8bChristian König idct->pipe->delete_fs_state(idct->pipe, idct->fs); 494508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König} 495508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König 496508a4a056c3140dc1f90b93acd46c06c30f7094eChristian Königstatic bool 4970b749d6dcb537472771d6fe6e454aafc916ab3feChristian Königinit_state(struct vl_idct *idct) 4980b749d6dcb537472771d6fe6e454aafc916ab3feChristian König{ 4990a2310b375068694d5700395aededc3fe68a0f3aChristian König struct pipe_blend_state blend; 5000b749d6dcb537472771d6fe6e454aafc916ab3feChristian König struct pipe_rasterizer_state rs_state; 5010a2310b375068694d5700395aededc3fe68a0f3aChristian König struct pipe_sampler_state sampler; 5020b749d6dcb537472771d6fe6e454aafc916ab3feChristian König unsigned i; 5030b749d6dcb537472771d6fe6e454aafc916ab3feChristian König 5040b749d6dcb537472771d6fe6e454aafc916ab3feChristian König assert(idct); 5050b749d6dcb537472771d6fe6e454aafc916ab3feChristian König 5068330bc29dda71c41c56b3c1989334823ae8779d4Christian König memset(&rs_state, 0, sizeof(rs_state)); 507ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König rs_state.point_size = 1; 5083db6514357a7c634045ae7bc7bba7d7dbf9d58c5Christian König rs_state.gl_rasterization_rules = true; 5098330bc29dda71c41c56b3c1989334823ae8779d4Christian König idct->rs_state = idct->pipe->create_rasterizer_state(idct->pipe, &rs_state); 5108330bc29dda71c41c56b3c1989334823ae8779d4Christian König if (!idct->rs_state) 5118330bc29dda71c41c56b3c1989334823ae8779d4Christian König goto error_rs_state; 5128330bc29dda71c41c56b3c1989334823ae8779d4Christian König 5130a2310b375068694d5700395aededc3fe68a0f3aChristian König memset(&blend, 0, sizeof blend); 5140a2310b375068694d5700395aededc3fe68a0f3aChristian König 5150a2310b375068694d5700395aededc3fe68a0f3aChristian König blend.independent_blend_enable = 0; 5160a2310b375068694d5700395aededc3fe68a0f3aChristian König blend.rt[0].blend_enable = 0; 5170a2310b375068694d5700395aededc3fe68a0f3aChristian König blend.rt[0].rgb_func = PIPE_BLEND_ADD; 5180a2310b375068694d5700395aededc3fe68a0f3aChristian König blend.rt[0].rgb_src_factor = PIPE_BLENDFACTOR_ONE; 5190a2310b375068694d5700395aededc3fe68a0f3aChristian König blend.rt[0].rgb_dst_factor = PIPE_BLENDFACTOR_ONE; 5200a2310b375068694d5700395aededc3fe68a0f3aChristian König blend.rt[0].alpha_func = PIPE_BLEND_ADD; 5210a2310b375068694d5700395aededc3fe68a0f3aChristian König blend.rt[0].alpha_src_factor = PIPE_BLENDFACTOR_ONE; 5220a2310b375068694d5700395aededc3fe68a0f3aChristian König blend.rt[0].alpha_dst_factor = PIPE_BLENDFACTOR_ONE; 5230a2310b375068694d5700395aededc3fe68a0f3aChristian König blend.logicop_enable = 0; 5240a2310b375068694d5700395aededc3fe68a0f3aChristian König blend.logicop_func = PIPE_LOGICOP_CLEAR; 5250a2310b375068694d5700395aededc3fe68a0f3aChristian König /* Needed to allow color writes to FB, even if blending disabled */ 5260a2310b375068694d5700395aededc3fe68a0f3aChristian König blend.rt[0].colormask = PIPE_MASK_RGBA; 5270a2310b375068694d5700395aededc3fe68a0f3aChristian König blend.dither = 0; 5280a2310b375068694d5700395aededc3fe68a0f3aChristian König idct->blend = idct->pipe->create_blend_state(idct->pipe, &blend); 5290a2310b375068694d5700395aededc3fe68a0f3aChristian König if (!idct->blend) 5300a2310b375068694d5700395aededc3fe68a0f3aChristian König goto error_blend; 5310a2310b375068694d5700395aededc3fe68a0f3aChristian König 5325a351e51291922aa295926215fdecccc0baeef51Christian König for (i = 0; i < 2; ++i) { 5330b749d6dcb537472771d6fe6e454aafc916ab3feChristian König memset(&sampler, 0, sizeof(sampler)); 534be4de05c1093db27b3fca12b782055ab8a1eba13Christian König sampler.wrap_s = PIPE_TEX_WRAP_REPEAT; 535be4de05c1093db27b3fca12b782055ab8a1eba13Christian König sampler.wrap_t = PIPE_TEX_WRAP_REPEAT; 536be4de05c1093db27b3fca12b782055ab8a1eba13Christian König sampler.wrap_r = PIPE_TEX_WRAP_REPEAT; 5370b749d6dcb537472771d6fe6e454aafc916ab3feChristian König sampler.min_img_filter = PIPE_TEX_FILTER_NEAREST; 5380b749d6dcb537472771d6fe6e454aafc916ab3feChristian König sampler.min_mip_filter = PIPE_TEX_MIPFILTER_NONE; 5390b749d6dcb537472771d6fe6e454aafc916ab3feChristian König sampler.mag_img_filter = PIPE_TEX_FILTER_NEAREST; 5400b749d6dcb537472771d6fe6e454aafc916ab3feChristian König sampler.compare_mode = PIPE_TEX_COMPARE_NONE; 5410b749d6dcb537472771d6fe6e454aafc916ab3feChristian König sampler.compare_func = PIPE_FUNC_ALWAYS; 5420b749d6dcb537472771d6fe6e454aafc916ab3feChristian König sampler.normalized_coords = 1; 5435a351e51291922aa295926215fdecccc0baeef51Christian König idct->samplers[i] = idct->pipe->create_sampler_state(idct->pipe, &sampler); 5445a351e51291922aa295926215fdecccc0baeef51Christian König if (!idct->samplers[i]) 5458330bc29dda71c41c56b3c1989334823ae8779d4Christian König goto error_samplers; 5460b749d6dcb537472771d6fe6e454aafc916ab3feChristian König } 5470b749d6dcb537472771d6fe6e454aafc916ab3feChristian König 5480b749d6dcb537472771d6fe6e454aafc916ab3feChristian König return true; 5498330bc29dda71c41c56b3c1989334823ae8779d4Christian König 5508330bc29dda71c41c56b3c1989334823ae8779d4Christian Königerror_samplers: 5515a351e51291922aa295926215fdecccc0baeef51Christian König for (i = 0; i < 2; ++i) 5525a351e51291922aa295926215fdecccc0baeef51Christian König if (idct->samplers[i]) 5535a351e51291922aa295926215fdecccc0baeef51Christian König idct->pipe->delete_sampler_state(idct->pipe, idct->samplers[i]); 5548330bc29dda71c41c56b3c1989334823ae8779d4Christian König 5558330bc29dda71c41c56b3c1989334823ae8779d4Christian König idct->pipe->delete_rasterizer_state(idct->pipe, idct->rs_state); 5568330bc29dda71c41c56b3c1989334823ae8779d4Christian König 5570a2310b375068694d5700395aededc3fe68a0f3aChristian Königerror_blend: 5580a2310b375068694d5700395aededc3fe68a0f3aChristian König idct->pipe->delete_blend_state(idct->pipe, idct->blend); 5590a2310b375068694d5700395aededc3fe68a0f3aChristian König 5608330bc29dda71c41c56b3c1989334823ae8779d4Christian Königerror_rs_state: 5618330bc29dda71c41c56b3c1989334823ae8779d4Christian König return false; 5620b749d6dcb537472771d6fe6e454aafc916ab3feChristian König} 5630b749d6dcb537472771d6fe6e454aafc916ab3feChristian König 5640b749d6dcb537472771d6fe6e454aafc916ab3feChristian Königstatic void 5650b749d6dcb537472771d6fe6e454aafc916ab3feChristian Königcleanup_state(struct vl_idct *idct) 5660b749d6dcb537472771d6fe6e454aafc916ab3feChristian König{ 5670b749d6dcb537472771d6fe6e454aafc916ab3feChristian König unsigned i; 5680b749d6dcb537472771d6fe6e454aafc916ab3feChristian König 5695a351e51291922aa295926215fdecccc0baeef51Christian König for (i = 0; i < 2; ++i) 5705a351e51291922aa295926215fdecccc0baeef51Christian König idct->pipe->delete_sampler_state(idct->pipe, idct->samplers[i]); 5710b749d6dcb537472771d6fe6e454aafc916ab3feChristian König 5720b749d6dcb537472771d6fe6e454aafc916ab3feChristian König idct->pipe->delete_rasterizer_state(idct->pipe, idct->rs_state); 5730a2310b375068694d5700395aededc3fe68a0f3aChristian König idct->pipe->delete_blend_state(idct->pipe, idct->blend); 5740b749d6dcb537472771d6fe6e454aafc916ab3feChristian König} 5750b749d6dcb537472771d6fe6e454aafc916ab3feChristian König 5760b749d6dcb537472771d6fe6e454aafc916ab3feChristian Königstatic bool 577ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian Königinit_source(struct vl_idct *idct, struct vl_idct_buffer *buffer) 578ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König{ 579ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König struct pipe_resource *tex; 580ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König struct pipe_surface surf_templ; 581ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König 582ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König assert(idct && buffer); 583ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König 584ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König tex = buffer->sampler_views.individual.source->texture; 585ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König 586ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König buffer->fb_state_mismatch.width = tex->width0; 587ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König buffer->fb_state_mismatch.height = tex->height0; 588ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König buffer->fb_state_mismatch.nr_cbufs = 1; 589ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König 590ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König memset(&surf_templ, 0, sizeof(surf_templ)); 591ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König surf_templ.format = tex->format; 592ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König surf_templ.u.tex.first_layer = 0; 593ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König surf_templ.u.tex.last_layer = 0; 594ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König surf_templ.usage = PIPE_BIND_SAMPLER_VIEW | PIPE_BIND_RENDER_TARGET; 595ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König buffer->fb_state_mismatch.cbufs[0] = idct->pipe->create_surface(idct->pipe, tex, &surf_templ); 596ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König 597ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König buffer->viewport_mismatch.scale[0] = tex->width0; 598ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König buffer->viewport_mismatch.scale[1] = tex->height0; 599ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König buffer->viewport_mismatch.scale[2] = 1; 600ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König buffer->viewport_mismatch.scale[3] = 1; 601ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König 602ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König return true; 603ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König} 604ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König 605ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian Königstatic void 606ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian Königcleanup_source(struct vl_idct *idct, struct vl_idct_buffer *buffer) 607ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König{ 608ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König assert(idct && buffer); 609ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König 610ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König pipe_surface_reference(&buffer->fb_state_mismatch.cbufs[0], NULL); 611ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König 612ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König pipe_sampler_view_reference(&buffer->sampler_views.individual.source, NULL); 613ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König} 614ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König 615ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian Königstatic bool 616020328ca32a3b6548b4c064c4fe115e386752daaChristian Königinit_intermediate(struct vl_idct *idct, struct vl_idct_buffer *buffer) 617508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König{ 61831109e1be20d7c94521879c3221a9f77bacbdb8dChristian König struct pipe_resource *tex; 619020328ca32a3b6548b4c064c4fe115e386752daaChristian König struct pipe_surface surf_templ; 62021efda86875096333dc0412c0edab1e188f551d8Christian König unsigned i; 621508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König 6220b749d6dcb537472771d6fe6e454aafc916ab3feChristian König assert(idct && buffer); 6230b749d6dcb537472771d6fe6e454aafc916ab3feChristian König 62431109e1be20d7c94521879c3221a9f77bacbdb8dChristian König tex = buffer->sampler_views.individual.intermediate->texture; 625020328ca32a3b6548b4c064c4fe115e386752daaChristian König 6267f04fe5338d0846ec9a6003033da5357d2785c8bChristian König buffer->fb_state.width = tex->width0; 6277f04fe5338d0846ec9a6003033da5357d2785c8bChristian König buffer->fb_state.height = tex->height0; 6287f04fe5338d0846ec9a6003033da5357d2785c8bChristian König buffer->fb_state.nr_cbufs = idct->nr_of_render_targets; 629fcf765620d803b376582afb618b1f643242b641bChristian König for(i = 0; i < idct->nr_of_render_targets; ++i) { 630020328ca32a3b6548b4c064c4fe115e386752daaChristian König memset(&surf_templ, 0, sizeof(surf_templ)); 631020328ca32a3b6548b4c064c4fe115e386752daaChristian König surf_templ.format = tex->format; 632020328ca32a3b6548b4c064c4fe115e386752daaChristian König surf_templ.u.tex.first_layer = i; 633020328ca32a3b6548b4c064c4fe115e386752daaChristian König surf_templ.u.tex.last_layer = i; 634020328ca32a3b6548b4c064c4fe115e386752daaChristian König surf_templ.usage = PIPE_BIND_SAMPLER_VIEW | PIPE_BIND_RENDER_TARGET; 6357f04fe5338d0846ec9a6003033da5357d2785c8bChristian König buffer->fb_state.cbufs[i] = idct->pipe->create_surface( 636020328ca32a3b6548b4c064c4fe115e386752daaChristian König idct->pipe, tex, &surf_templ); 637508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König 6387f04fe5338d0846ec9a6003033da5357d2785c8bChristian König if (!buffer->fb_state.cbufs[i]) 639020328ca32a3b6548b4c064c4fe115e386752daaChristian König goto error_surfaces; 640508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König } 641508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König 6427f04fe5338d0846ec9a6003033da5357d2785c8bChristian König buffer->viewport.scale[0] = tex->width0; 6437f04fe5338d0846ec9a6003033da5357d2785c8bChristian König buffer->viewport.scale[1] = tex->height0; 644ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König buffer->viewport.scale[2] = 1; 645ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König buffer->viewport.scale[3] = 1; 6460f07da0a1c87e1c7b53700c33d6b1f8f03c1fe11Christian König 647508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König return true; 6488330bc29dda71c41c56b3c1989334823ae8779d4Christian König 649020328ca32a3b6548b4c064c4fe115e386752daaChristian Königerror_surfaces: 650fcf765620d803b376582afb618b1f643242b641bChristian König for(i = 0; i < idct->nr_of_render_targets; ++i) 6517f04fe5338d0846ec9a6003033da5357d2785c8bChristian König pipe_surface_reference(&buffer->fb_state.cbufs[i], NULL); 652020328ca32a3b6548b4c064c4fe115e386752daaChristian König 6538330bc29dda71c41c56b3c1989334823ae8779d4Christian König return false; 654508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König} 655508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König 656508a4a056c3140dc1f90b93acd46c06c30f7094eChristian Königstatic void 657020328ca32a3b6548b4c064c4fe115e386752daaChristian Königcleanup_intermediate(struct vl_idct *idct, struct vl_idct_buffer *buffer) 658508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König{ 659508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König unsigned i; 660508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König 6610b749d6dcb537472771d6fe6e454aafc916ab3feChristian König assert(idct && buffer); 662508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König 663fcf765620d803b376582afb618b1f643242b641bChristian König for(i = 0; i < idct->nr_of_render_targets; ++i) 6647f04fe5338d0846ec9a6003033da5357d2785c8bChristian König pipe_surface_reference(&buffer->fb_state.cbufs[i], NULL); 665020328ca32a3b6548b4c064c4fe115e386752daaChristian König 666020328ca32a3b6548b4c064c4fe115e386752daaChristian König pipe_sampler_view_reference(&buffer->sampler_views.individual.intermediate, NULL); 667508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König} 668508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König 669020328ca32a3b6548b4c064c4fe115e386752daaChristian Königstruct pipe_sampler_view * 670fcdf50f74befad8d89eb3f9cdfd88b82d1daa98cChristian Königvl_idct_upload_matrix(struct pipe_context *pipe, float scale) 6713dd7bf7d39781f3ef4c0b53732945674c9924cdfChristian König{ 672020328ca32a3b6548b4c064c4fe115e386752daaChristian König struct pipe_resource tex_templ, *matrix; 673020328ca32a3b6548b4c064c4fe115e386752daaChristian König struct pipe_sampler_view sv_templ, *sv; 6743dd7bf7d39781f3ef4c0b53732945674c9924cdfChristian König struct pipe_transfer *buf_transfer; 6753dd7bf7d39781f3ef4c0b53732945674c9924cdfChristian König unsigned i, j, pitch; 6763dd7bf7d39781f3ef4c0b53732945674c9924cdfChristian König float *f; 6773dd7bf7d39781f3ef4c0b53732945674c9924cdfChristian König 6783dd7bf7d39781f3ef4c0b53732945674c9924cdfChristian König struct pipe_box rect = 6793dd7bf7d39781f3ef4c0b53732945674c9924cdfChristian König { 6803dd7bf7d39781f3ef4c0b53732945674c9924cdfChristian König 0, 0, 0, 6817c4887f5ae642131d7895da5bffda77a6287c6d4Christian König BLOCK_WIDTH / 4, 6823dd7bf7d39781f3ef4c0b53732945674c9924cdfChristian König BLOCK_HEIGHT, 6833dd7bf7d39781f3ef4c0b53732945674c9924cdfChristian König 1 6843dd7bf7d39781f3ef4c0b53732945674c9924cdfChristian König }; 6853dd7bf7d39781f3ef4c0b53732945674c9924cdfChristian König 6868330bc29dda71c41c56b3c1989334823ae8779d4Christian König assert(pipe); 6878330bc29dda71c41c56b3c1989334823ae8779d4Christian König 688020328ca32a3b6548b4c064c4fe115e386752daaChristian König memset(&tex_templ, 0, sizeof(tex_templ)); 689020328ca32a3b6548b4c064c4fe115e386752daaChristian König tex_templ.target = PIPE_TEXTURE_2D; 690020328ca32a3b6548b4c064c4fe115e386752daaChristian König tex_templ.format = PIPE_FORMAT_R32G32B32A32_FLOAT; 691020328ca32a3b6548b4c064c4fe115e386752daaChristian König tex_templ.last_level = 0; 692020328ca32a3b6548b4c064c4fe115e386752daaChristian König tex_templ.width0 = 2; 693020328ca32a3b6548b4c064c4fe115e386752daaChristian König tex_templ.height0 = 8; 694020328ca32a3b6548b4c064c4fe115e386752daaChristian König tex_templ.depth0 = 1; 695020328ca32a3b6548b4c064c4fe115e386752daaChristian König tex_templ.array_size = 1; 696020328ca32a3b6548b4c064c4fe115e386752daaChristian König tex_templ.usage = PIPE_USAGE_IMMUTABLE; 697020328ca32a3b6548b4c064c4fe115e386752daaChristian König tex_templ.bind = PIPE_BIND_SAMPLER_VIEW; 698020328ca32a3b6548b4c064c4fe115e386752daaChristian König tex_templ.flags = 0; 699020328ca32a3b6548b4c064c4fe115e386752daaChristian König 700020328ca32a3b6548b4c064c4fe115e386752daaChristian König matrix = pipe->screen->resource_create(pipe->screen, &tex_templ); 7018330bc29dda71c41c56b3c1989334823ae8779d4Christian König if (!matrix) 7028330bc29dda71c41c56b3c1989334823ae8779d4Christian König goto error_matrix; 7033dd7bf7d39781f3ef4c0b53732945674c9924cdfChristian König 7043dd7bf7d39781f3ef4c0b53732945674c9924cdfChristian König buf_transfer = pipe->get_transfer 7053dd7bf7d39781f3ef4c0b53732945674c9924cdfChristian König ( 7063dd7bf7d39781f3ef4c0b53732945674c9924cdfChristian König pipe, matrix, 707772b25e1f366edc857e77b8c1ccdc5297d82cc41Christian König 0, PIPE_TRANSFER_WRITE | PIPE_TRANSFER_DISCARD, 7083dd7bf7d39781f3ef4c0b53732945674c9924cdfChristian König &rect 7093dd7bf7d39781f3ef4c0b53732945674c9924cdfChristian König ); 7108330bc29dda71c41c56b3c1989334823ae8779d4Christian König if (!buf_transfer) 7118330bc29dda71c41c56b3c1989334823ae8779d4Christian König goto error_transfer; 7128330bc29dda71c41c56b3c1989334823ae8779d4Christian König 7133fd53e6c2a05e65872de4292557d7839cbcf7395Christian König pitch = buf_transfer->stride / sizeof(float); 7143dd7bf7d39781f3ef4c0b53732945674c9924cdfChristian König 7153dd7bf7d39781f3ef4c0b53732945674c9924cdfChristian König f = pipe->transfer_map(pipe, buf_transfer); 7168330bc29dda71c41c56b3c1989334823ae8779d4Christian König if (!f) 7178330bc29dda71c41c56b3c1989334823ae8779d4Christian König goto error_map; 7188330bc29dda71c41c56b3c1989334823ae8779d4Christian König 7193dd7bf7d39781f3ef4c0b53732945674c9924cdfChristian König for(i = 0; i < BLOCK_HEIGHT; ++i) 7203dd7bf7d39781f3ef4c0b53732945674c9924cdfChristian König for(j = 0; j < BLOCK_WIDTH; ++j) 7214a8420513d653cd2fccf93a51315120a1a5d0fccChristian König // transpose and scale 7223e976ef31a27ca9a23372f4364955f0f0a5c4ef4Christian König f[i * pitch + j] = ((const float (*)[8])const_matrix)[j][i] * scale; 7233dd7bf7d39781f3ef4c0b53732945674c9924cdfChristian König 7243dd7bf7d39781f3ef4c0b53732945674c9924cdfChristian König pipe->transfer_unmap(pipe, buf_transfer); 7253dd7bf7d39781f3ef4c0b53732945674c9924cdfChristian König pipe->transfer_destroy(pipe, buf_transfer); 7263dd7bf7d39781f3ef4c0b53732945674c9924cdfChristian König 727020328ca32a3b6548b4c064c4fe115e386752daaChristian König memset(&sv_templ, 0, sizeof(sv_templ)); 728020328ca32a3b6548b4c064c4fe115e386752daaChristian König u_sampler_view_default_template(&sv_templ, matrix, matrix->format); 729020328ca32a3b6548b4c064c4fe115e386752daaChristian König sv = pipe->create_sampler_view(pipe, matrix, &sv_templ); 730020328ca32a3b6548b4c064c4fe115e386752daaChristian König pipe_resource_reference(&matrix, NULL); 731020328ca32a3b6548b4c064c4fe115e386752daaChristian König if (!sv) 732020328ca32a3b6548b4c064c4fe115e386752daaChristian König goto error_map; 733020328ca32a3b6548b4c064c4fe115e386752daaChristian König 734020328ca32a3b6548b4c064c4fe115e386752daaChristian König return sv; 7358330bc29dda71c41c56b3c1989334823ae8779d4Christian König 7368330bc29dda71c41c56b3c1989334823ae8779d4Christian Königerror_map: 7378330bc29dda71c41c56b3c1989334823ae8779d4Christian König pipe->transfer_destroy(pipe, buf_transfer); 7388330bc29dda71c41c56b3c1989334823ae8779d4Christian König 7398330bc29dda71c41c56b3c1989334823ae8779d4Christian Königerror_transfer: 7408330bc29dda71c41c56b3c1989334823ae8779d4Christian König pipe_resource_reference(&matrix, NULL); 7418330bc29dda71c41c56b3c1989334823ae8779d4Christian König 7428330bc29dda71c41c56b3c1989334823ae8779d4Christian Königerror_matrix: 7438330bc29dda71c41c56b3c1989334823ae8779d4Christian König return NULL; 7443dd7bf7d39781f3ef4c0b53732945674c9924cdfChristian König} 7453dd7bf7d39781f3ef4c0b53732945674c9924cdfChristian König 746c8236aaf7056bd8645804e71596d2d6460e62d15Christian Königbool vl_idct_init(struct vl_idct *idct, struct pipe_context *pipe, 7470b749d6dcb537472771d6fe6e454aafc916ab3feChristian König unsigned buffer_width, unsigned buffer_height, 748fcf765620d803b376582afb618b1f643242b641bChristian König unsigned nr_of_render_targets, 749ccc80d2c09ad35f867c0c0a85f7e1cadd73941bbChristian König struct pipe_sampler_view *matrix, 750ccc80d2c09ad35f867c0c0a85f7e1cadd73941bbChristian König struct pipe_sampler_view *transpose) 751e639e1b83ea65985cd84d12dc120d77cab80ba9eChristian König{ 752df5e0b9435c869f88234a69db9bfe97342b027d4Christian König assert(idct && pipe); 753df5e0b9435c869f88234a69db9bfe97342b027d4Christian König assert(matrix && transpose); 754e639e1b83ea65985cd84d12dc120d77cab80ba9eChristian König 755e639e1b83ea65985cd84d12dc120d77cab80ba9eChristian König idct->pipe = pipe; 7560b749d6dcb537472771d6fe6e454aafc916ab3feChristian König idct->buffer_width = buffer_width; 7570b749d6dcb537472771d6fe6e454aafc916ab3feChristian König idct->buffer_height = buffer_height; 758fcf765620d803b376582afb618b1f643242b641bChristian König idct->nr_of_render_targets = nr_of_render_targets; 759ccc80d2c09ad35f867c0c0a85f7e1cadd73941bbChristian König 760020328ca32a3b6548b4c064c4fe115e386752daaChristian König pipe_sampler_view_reference(&idct->matrix, matrix); 761ccc80d2c09ad35f867c0c0a85f7e1cadd73941bbChristian König pipe_sampler_view_reference(&idct->transpose, transpose); 762508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König 76359774e5c7a2756c5c430fc74bc80ea75d54f594dChristian König if(!init_shaders(idct)) 764508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König return false; 765508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König 7660b749d6dcb537472771d6fe6e454aafc916ab3feChristian König if(!init_state(idct)) { 7670b749d6dcb537472771d6fe6e454aafc916ab3feChristian König cleanup_shaders(idct); 768508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König return false; 769508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König } 770508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König 7710b749d6dcb537472771d6fe6e454aafc916ab3feChristian König return true; 7720b749d6dcb537472771d6fe6e454aafc916ab3feChristian König} 7730b749d6dcb537472771d6fe6e454aafc916ab3feChristian König 7740b749d6dcb537472771d6fe6e454aafc916ab3feChristian Königvoid 7750b749d6dcb537472771d6fe6e454aafc916ab3feChristian Königvl_idct_cleanup(struct vl_idct *idct) 7760b749d6dcb537472771d6fe6e454aafc916ab3feChristian König{ 7770b749d6dcb537472771d6fe6e454aafc916ab3feChristian König cleanup_shaders(idct); 7780b749d6dcb537472771d6fe6e454aafc916ab3feChristian König cleanup_state(idct); 7790b749d6dcb537472771d6fe6e454aafc916ab3feChristian König 780020328ca32a3b6548b4c064c4fe115e386752daaChristian König pipe_sampler_view_reference(&idct->matrix, NULL); 781df5e0b9435c869f88234a69db9bfe97342b027d4Christian König pipe_sampler_view_reference(&idct->transpose, NULL); 7820b749d6dcb537472771d6fe6e454aafc916ab3feChristian König} 7830b749d6dcb537472771d6fe6e454aafc916ab3feChristian König 784020328ca32a3b6548b4c064c4fe115e386752daaChristian Königbool 785020328ca32a3b6548b4c064c4fe115e386752daaChristian Königvl_idct_init_buffer(struct vl_idct *idct, struct vl_idct_buffer *buffer, 78631109e1be20d7c94521879c3221a9f77bacbdb8dChristian König struct pipe_sampler_view *source, 787ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König struct pipe_sampler_view *intermediate) 7880b749d6dcb537472771d6fe6e454aafc916ab3feChristian König{ 789df5e0b9435c869f88234a69db9bfe97342b027d4Christian König assert(buffer && idct); 790df5e0b9435c869f88234a69db9bfe97342b027d4Christian König assert(source && intermediate); 7910b749d6dcb537472771d6fe6e454aafc916ab3feChristian König 7927f04fe5338d0846ec9a6003033da5357d2785c8bChristian König memset(buffer, 0, sizeof(struct vl_idct_buffer)); 7937f04fe5338d0846ec9a6003033da5357d2785c8bChristian König 794020328ca32a3b6548b4c064c4fe115e386752daaChristian König pipe_sampler_view_reference(&buffer->sampler_views.individual.matrix, idct->matrix); 795020328ca32a3b6548b4c064c4fe115e386752daaChristian König pipe_sampler_view_reference(&buffer->sampler_views.individual.source, source); 796ccc80d2c09ad35f867c0c0a85f7e1cadd73941bbChristian König pipe_sampler_view_reference(&buffer->sampler_views.individual.transpose, idct->transpose); 79731109e1be20d7c94521879c3221a9f77bacbdb8dChristian König pipe_sampler_view_reference(&buffer->sampler_views.individual.intermediate, intermediate); 7980b749d6dcb537472771d6fe6e454aafc916ab3feChristian König 799ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König if (!init_source(idct, buffer)) 800020328ca32a3b6548b4c064c4fe115e386752daaChristian König return false; 8010b749d6dcb537472771d6fe6e454aafc916ab3feChristian König 802ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König if (!init_intermediate(idct, buffer)) 803ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König return false; 804508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König 805020328ca32a3b6548b4c064c4fe115e386752daaChristian König return true; 806508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König} 807508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König 80803c5a0ea5cd5b3e5931d6784749f87789a016b98Christian Königvoid 8090b749d6dcb537472771d6fe6e454aafc916ab3feChristian Königvl_idct_cleanup_buffer(struct vl_idct *idct, struct vl_idct_buffer *buffer) 810508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König{ 8118330bc29dda71c41c56b3c1989334823ae8779d4Christian König assert(idct && buffer); 812e639e1b83ea65985cd84d12dc120d77cab80ba9eChristian König 813ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König cleanup_source(idct, buffer); 814020328ca32a3b6548b4c064c4fe115e386752daaChristian König cleanup_intermediate(idct, buffer); 815df5e0b9435c869f88234a69db9bfe97342b027d4Christian König 816df5e0b9435c869f88234a69db9bfe97342b027d4Christian König pipe_sampler_view_reference(&buffer->sampler_views.individual.matrix, NULL); 817df5e0b9435c869f88234a69db9bfe97342b027d4Christian König pipe_sampler_view_reference(&buffer->sampler_views.individual.transpose, NULL); 818508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König} 819508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König 82003c5a0ea5cd5b3e5931d6784749f87789a016b98Christian Königvoid 821310eea52ca1e997295c84163066cc5d0fd4f8cf6Christian Königvl_idct_flush(struct vl_idct *idct, struct vl_idct_buffer *buffer, unsigned num_instances) 822508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König{ 8234abe7382882a451a7750ccc451b8568768d122cbChristian König assert(idct); 824310eea52ca1e997295c84163066cc5d0fd4f8cf6Christian König assert(buffer); 8254abe7382882a451a7750ccc451b8568768d122cbChristian König 8267f04fe5338d0846ec9a6003033da5357d2785c8bChristian König idct->pipe->bind_rasterizer_state(idct->pipe, idct->rs_state); 8277f04fe5338d0846ec9a6003033da5357d2785c8bChristian König idct->pipe->bind_blend_state(idct->pipe, idct->blend); 8287f04fe5338d0846ec9a6003033da5357d2785c8bChristian König idct->pipe->bind_fragment_sampler_states(idct->pipe, 2, idct->samplers); 829ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König idct->pipe->set_fragment_sampler_views(idct->pipe, 2, buffer->sampler_views.stage[0]); 830ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König 831ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König /* mismatch control */ 832ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König idct->pipe->set_framebuffer_state(idct->pipe, &buffer->fb_state_mismatch); 833ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König idct->pipe->set_viewport_state(idct->pipe, &buffer->viewport_mismatch); 834ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König idct->pipe->bind_vs_state(idct->pipe, idct->vs_mismatch); 835ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König idct->pipe->bind_fs_state(idct->pipe, idct->fs_mismatch); 836ae56a1dd67040dc5d53f4a1622f775462f0fec05Christian König util_draw_arrays_instanced(idct->pipe, PIPE_PRIM_POINTS, 0, 1, 0, num_instances); 8377f04fe5338d0846ec9a6003033da5357d2785c8bChristian König 8387f04fe5338d0846ec9a6003033da5357d2785c8bChristian König /* first stage */ 8397f04fe5338d0846ec9a6003033da5357d2785c8bChristian König idct->pipe->set_framebuffer_state(idct->pipe, &buffer->fb_state); 8407f04fe5338d0846ec9a6003033da5357d2785c8bChristian König idct->pipe->set_viewport_state(idct->pipe, &buffer->viewport); 8417f04fe5338d0846ec9a6003033da5357d2785c8bChristian König idct->pipe->bind_vs_state(idct->pipe, idct->vs); 8427f04fe5338d0846ec9a6003033da5357d2785c8bChristian König idct->pipe->bind_fs_state(idct->pipe, idct->fs); 8437f04fe5338d0846ec9a6003033da5357d2785c8bChristian König util_draw_arrays_instanced(idct->pipe, PIPE_PRIM_QUADS, 0, 4, 0, num_instances); 8447f04fe5338d0846ec9a6003033da5357d2785c8bChristian König} 8457f04fe5338d0846ec9a6003033da5357d2785c8bChristian König 8467f04fe5338d0846ec9a6003033da5357d2785c8bChristian Königvoid 8477f04fe5338d0846ec9a6003033da5357d2785c8bChristian Königvl_idct_prepare_stage2(struct vl_idct *idct, struct vl_idct_buffer *buffer) 8487f04fe5338d0846ec9a6003033da5357d2785c8bChristian König{ 8497f04fe5338d0846ec9a6003033da5357d2785c8bChristian König assert(idct); 8507f04fe5338d0846ec9a6003033da5357d2785c8bChristian König assert(buffer); 8517f04fe5338d0846ec9a6003033da5357d2785c8bChristian König 8527f04fe5338d0846ec9a6003033da5357d2785c8bChristian König /* second stage */ 8537f04fe5338d0846ec9a6003033da5357d2785c8bChristian König idct->pipe->bind_rasterizer_state(idct->pipe, idct->rs_state); 8547f04fe5338d0846ec9a6003033da5357d2785c8bChristian König idct->pipe->bind_fragment_sampler_states(idct->pipe, 2, idct->samplers); 8557f04fe5338d0846ec9a6003033da5357d2785c8bChristian König idct->pipe->set_fragment_sampler_views(idct->pipe, 2, buffer->sampler_views.stage[1]); 856508a4a056c3140dc1f90b93acd46c06c30f7094eChristian König} 8577f04fe5338d0846ec9a6003033da5357d2785c8bChristian König 858