r600_shader.c revision 5555cd776b970bce020be59193054474a2a63317
172128962d640846472c1b0dc22cf4ac6ce875dc9Jerome Glisse/* 272128962d640846472c1b0dc22cf4ac6ce875dc9Jerome Glisse * Copyright 2010 Jerome Glisse <glisse@freedesktop.org> 372128962d640846472c1b0dc22cf4ac6ce875dc9Jerome Glisse * 472128962d640846472c1b0dc22cf4ac6ce875dc9Jerome Glisse * Permission is hereby granted, free of charge, to any person obtaining a 572128962d640846472c1b0dc22cf4ac6ce875dc9Jerome Glisse * copy of this software and associated documentation files (the "Software"), 672128962d640846472c1b0dc22cf4ac6ce875dc9Jerome Glisse * to deal in the Software without restriction, including without limitation 772128962d640846472c1b0dc22cf4ac6ce875dc9Jerome Glisse * on the rights to use, copy, modify, merge, publish, distribute, sub 872128962d640846472c1b0dc22cf4ac6ce875dc9Jerome Glisse * license, and/or sell copies of the Software, and to permit persons to whom 972128962d640846472c1b0dc22cf4ac6ce875dc9Jerome Glisse * the Software is furnished to do so, subject to the following conditions: 1072128962d640846472c1b0dc22cf4ac6ce875dc9Jerome Glisse * 1172128962d640846472c1b0dc22cf4ac6ce875dc9Jerome Glisse * The above copyright notice and this permission notice (including the next 1272128962d640846472c1b0dc22cf4ac6ce875dc9Jerome Glisse * paragraph) shall be included in all copies or substantial portions of the 1372128962d640846472c1b0dc22cf4ac6ce875dc9Jerome Glisse * Software. 1472128962d640846472c1b0dc22cf4ac6ce875dc9Jerome Glisse * 1572128962d640846472c1b0dc22cf4ac6ce875dc9Jerome Glisse * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR 1672128962d640846472c1b0dc22cf4ac6ce875dc9Jerome Glisse * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, 1772128962d640846472c1b0dc22cf4ac6ce875dc9Jerome Glisse * FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. 
IN NO EVENT SHALL 1872128962d640846472c1b0dc22cf4ac6ce875dc9Jerome Glisse * THE AUTHOR(S) AND/OR THEIR SUPPLIERS BE LIABLE FOR ANY CLAIM, 1972128962d640846472c1b0dc22cf4ac6ce875dc9Jerome Glisse * DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR 2072128962d640846472c1b0dc22cf4ac6ce875dc9Jerome Glisse * OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE 2172128962d640846472c1b0dc22cf4ac6ce875dc9Jerome Glisse * USE OR OTHER DEALINGS IN THE SOFTWARE. 2272128962d640846472c1b0dc22cf4ac6ce875dc9Jerome Glisse */ 23de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse#include "pipe/p_shader_tokens.h" 24de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse#include "tgsi/tgsi_parse.h" 25de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse#include "tgsi/tgsi_scan.h" 2633241134e6e3d5bf19141eceff90fd854b23386aJerome Glisse#include "tgsi/tgsi_dump.h" 27de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse#include "util/u_format.h" 289c284b5cae916a083d17d1039d2f2da128b47882Jerome Glisse#include "r600_pipe.h" 29de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse#include "r600_asm.h" 30de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse#include "r600_sq.h" 31a3a94554f5a12f0626d9712ddcdc81b1e21d36c2Dave Airlie#include "r600_opcodes.h" 3272128962d640846472c1b0dc22cf4ac6ce875dc9Jerome Glisse#include "r600d.h" 33de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse#include <stdio.h> 34de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse#include <errno.h> 35de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse 361235becaa1cf7e29f580900592563c3329d326deJerome Glissestatic void r600_pipe_shader_vs(struct pipe_context *ctx, struct r600_pipe_shader *shader) 371235becaa1cf7e29f580900592563c3329d326deJerome Glisse{ 381235becaa1cf7e29f580900592563c3329d326deJerome Glisse struct r600_pipe_state *rstate = &shader->rstate; 391235becaa1cf7e29f580900592563c3329d326deJerome Glisse struct r600_shader *rshader = &shader->shader; 
401235becaa1cf7e29f580900592563c3329d326deJerome Glisse unsigned spi_vs_out_id[10]; 411235becaa1cf7e29f580900592563c3329d326deJerome Glisse unsigned i, tmp; 422b3b76a4a0e21eb4bd4f1a4da5ff6ed26ccbabd1Jerome Glisse 431235becaa1cf7e29f580900592563c3329d326deJerome Glisse /* clear previous register */ 441235becaa1cf7e29f580900592563c3329d326deJerome Glisse rstate->nregs = 0; 451235becaa1cf7e29f580900592563c3329d326deJerome Glisse 461235becaa1cf7e29f580900592563c3329d326deJerome Glisse /* so far never got proper semantic id from tgsi */ 47afc56b1861c1dae4137493af4c0e6dacc6ee41f9Jerome Glisse /* FIXME better to move this in config things so they get emited 48afc56b1861c1dae4137493af4c0e6dacc6ee41f9Jerome Glisse * only one time per cs 49afc56b1861c1dae4137493af4c0e6dacc6ee41f9Jerome Glisse */ 501235becaa1cf7e29f580900592563c3329d326deJerome Glisse for (i = 0; i < 10; i++) { 511235becaa1cf7e29f580900592563c3329d326deJerome Glisse spi_vs_out_id[i] = 0; 521235becaa1cf7e29f580900592563c3329d326deJerome Glisse } 531235becaa1cf7e29f580900592563c3329d326deJerome Glisse for (i = 0; i < 32; i++) { 541235becaa1cf7e29f580900592563c3329d326deJerome Glisse tmp = i << ((i & 3) * 8); 551235becaa1cf7e29f580900592563c3329d326deJerome Glisse spi_vs_out_id[i / 4] |= tmp; 561235becaa1cf7e29f580900592563c3329d326deJerome Glisse } 571235becaa1cf7e29f580900592563c3329d326deJerome Glisse for (i = 0; i < 10; i++) { 581235becaa1cf7e29f580900592563c3329d326deJerome Glisse r600_pipe_state_add_reg(rstate, 591235becaa1cf7e29f580900592563c3329d326deJerome Glisse R_028614_SPI_VS_OUT_ID_0 + i * 4, 601235becaa1cf7e29f580900592563c3329d326deJerome Glisse spi_vs_out_id[i], 0xFFFFFFFF, NULL); 611235becaa1cf7e29f580900592563c3329d326deJerome Glisse } 621235becaa1cf7e29f580900592563c3329d326deJerome Glisse 631235becaa1cf7e29f580900592563c3329d326deJerome Glisse r600_pipe_state_add_reg(rstate, 641235becaa1cf7e29f580900592563c3329d326deJerome Glisse R_0286C4_SPI_VS_OUT_CONFIG, 
651235becaa1cf7e29f580900592563c3329d326deJerome Glisse S_0286C4_VS_EXPORT_COUNT(rshader->noutput - 2), 661235becaa1cf7e29f580900592563c3329d326deJerome Glisse 0xFFFFFFFF, NULL); 671235becaa1cf7e29f580900592563c3329d326deJerome Glisse r600_pipe_state_add_reg(rstate, 681235becaa1cf7e29f580900592563c3329d326deJerome Glisse R_028868_SQ_PGM_RESOURCES_VS, 691235becaa1cf7e29f580900592563c3329d326deJerome Glisse S_028868_NUM_GPRS(rshader->bc.ngpr) | 701235becaa1cf7e29f580900592563c3329d326deJerome Glisse S_028868_STACK_SIZE(rshader->bc.nstack), 711235becaa1cf7e29f580900592563c3329d326deJerome Glisse 0xFFFFFFFF, NULL); 721235becaa1cf7e29f580900592563c3329d326deJerome Glisse r600_pipe_state_add_reg(rstate, 73fa86fc564aea4e40c89f6fc889e6a5bf817634b3Jerome Glisse R_0288D0_SQ_PGM_CF_OFFSET_VS, 741235becaa1cf7e29f580900592563c3329d326deJerome Glisse 0x00000000, 0xFFFFFFFF, NULL); 751235becaa1cf7e29f580900592563c3329d326deJerome Glisse r600_pipe_state_add_reg(rstate, 76fa86fc564aea4e40c89f6fc889e6a5bf817634b3Jerome Glisse R_028858_SQ_PGM_START_VS, 77fa86fc564aea4e40c89f6fc889e6a5bf817634b3Jerome Glisse r600_bo_offset(shader->bo) >> 8, 0xFFFFFFFF, shader->bo); 78fa86fc564aea4e40c89f6fc889e6a5bf817634b3Jerome Glisse 79738aa29289296512959cbb37d8602131dae44dabDave Airlie r600_pipe_state_add_reg(rstate, 80738aa29289296512959cbb37d8602131dae44dabDave Airlie R_03E200_SQ_LOOP_CONST_0 + (32 * 4), 0x01000FFF, 81738aa29289296512959cbb37d8602131dae44dabDave Airlie 0xFFFFFFFF, NULL); 82738aa29289296512959cbb37d8602131dae44dabDave Airlie 831235becaa1cf7e29f580900592563c3329d326deJerome Glisse} 841235becaa1cf7e29f580900592563c3329d326deJerome Glisse 85dbcd6526021c50770c3e5e04b04dc64c70298124Dave Airlieint r600_find_vs_semantic_index(struct r600_shader *vs, 861235becaa1cf7e29f580900592563c3329d326deJerome Glisse struct r600_shader *ps, int id) 871235becaa1cf7e29f580900592563c3329d326deJerome Glisse{ 881235becaa1cf7e29f580900592563c3329d326deJerome Glisse struct r600_shader_io *input = 
&ps->input[id]; 891235becaa1cf7e29f580900592563c3329d326deJerome Glisse 901235becaa1cf7e29f580900592563c3329d326deJerome Glisse for (int i = 0; i < vs->noutput; i++) { 911235becaa1cf7e29f580900592563c3329d326deJerome Glisse if (input->name == vs->output[i].name && 921235becaa1cf7e29f580900592563c3329d326deJerome Glisse input->sid == vs->output[i].sid) { 931235becaa1cf7e29f580900592563c3329d326deJerome Glisse return i - 1; 941235becaa1cf7e29f580900592563c3329d326deJerome Glisse } 951235becaa1cf7e29f580900592563c3329d326deJerome Glisse } 961235becaa1cf7e29f580900592563c3329d326deJerome Glisse return 0; 971235becaa1cf7e29f580900592563c3329d326deJerome Glisse} 981235becaa1cf7e29f580900592563c3329d326deJerome Glisse 991235becaa1cf7e29f580900592563c3329d326deJerome Glissestatic void r600_pipe_shader_ps(struct pipe_context *ctx, struct r600_pipe_shader *shader) 1001235becaa1cf7e29f580900592563c3329d326deJerome Glisse{ 1011235becaa1cf7e29f580900592563c3329d326deJerome Glisse struct r600_pipe_state *rstate = &shader->rstate; 1021235becaa1cf7e29f580900592563c3329d326deJerome Glisse struct r600_shader *rshader = &shader->shader; 10369251fc4cd5f71be403e08398bc43d19052a640dJerome Glisse unsigned i, exports_ps, num_cout, spi_ps_in_control_0, spi_input_z, spi_ps_in_control_1; 1041e82c28fcf76bf79ceb5a1eaf29b3d6d25909dddDave Airlie int pos_index = -1, face_index = -1; 1051235becaa1cf7e29f580900592563c3329d326deJerome Glisse 1061235becaa1cf7e29f580900592563c3329d326deJerome Glisse rstate->nregs = 0; 1071235becaa1cf7e29f580900592563c3329d326deJerome Glisse 1081235becaa1cf7e29f580900592563c3329d326deJerome Glisse for (i = 0; i < rshader->ninput; i++) { 1091235becaa1cf7e29f580900592563c3329d326deJerome Glisse if (rshader->input[i].name == TGSI_SEMANTIC_POSITION) 1101e82c28fcf76bf79ceb5a1eaf29b3d6d25909dddDave Airlie pos_index = i; 1111235becaa1cf7e29f580900592563c3329d326deJerome Glisse if (rshader->input[i].name == TGSI_SEMANTIC_FACE) 1121e82c28fcf76bf79ceb5a1eaf29b3d6d25909dddDave 
Airlie face_index = i; 1131235becaa1cf7e29f580900592563c3329d326deJerome Glisse } 114afc56b1861c1dae4137493af4c0e6dacc6ee41f9Jerome Glisse 1151235becaa1cf7e29f580900592563c3329d326deJerome Glisse for (i = 0; i < rshader->noutput; i++) { 11651f9cc4759c23b74a2e4d9c79b0a5df27d403f54Dave Airlie if (rshader->output[i].name == TGSI_SEMANTIC_POSITION) 1177777c997e0f4cf75ff292f34a5a64ee2834c0f26Dave Airlie r600_pipe_state_add_reg(rstate, 1187777c997e0f4cf75ff292f34a5a64ee2834c0f26Dave Airlie R_02880C_DB_SHADER_CONTROL, 1197777c997e0f4cf75ff292f34a5a64ee2834c0f26Dave Airlie S_02880C_Z_EXPORT_ENABLE(1), 1207777c997e0f4cf75ff292f34a5a64ee2834c0f26Dave Airlie S_02880C_Z_EXPORT_ENABLE(1), NULL); 12139d1feb51e9dac794751e72f48faf26409a84b1cDave Airlie if (rshader->output[i].name == TGSI_SEMANTIC_STENCIL) 12239d1feb51e9dac794751e72f48faf26409a84b1cDave Airlie r600_pipe_state_add_reg(rstate, 12339d1feb51e9dac794751e72f48faf26409a84b1cDave Airlie R_02880C_DB_SHADER_CONTROL, 12439d1feb51e9dac794751e72f48faf26409a84b1cDave Airlie S_02880C_STENCIL_REF_EXPORT_ENABLE(1), 12539d1feb51e9dac794751e72f48faf26409a84b1cDave Airlie S_02880C_STENCIL_REF_EXPORT_ENABLE(1), NULL); 1261235becaa1cf7e29f580900592563c3329d326deJerome Glisse } 1271235becaa1cf7e29f580900592563c3329d326deJerome Glisse 1281235becaa1cf7e29f580900592563c3329d326deJerome Glisse exports_ps = 0; 1291235becaa1cf7e29f580900592563c3329d326deJerome Glisse num_cout = 0; 1301235becaa1cf7e29f580900592563c3329d326deJerome Glisse for (i = 0; i < rshader->noutput; i++) { 13139d1feb51e9dac794751e72f48faf26409a84b1cDave Airlie if (rshader->output[i].name == TGSI_SEMANTIC_POSITION || rshader->output[i].name == TGSI_SEMANTIC_STENCIL) 1321235becaa1cf7e29f580900592563c3329d326deJerome Glisse exports_ps |= 1; 1331235becaa1cf7e29f580900592563c3329d326deJerome Glisse else if (rshader->output[i].name == TGSI_SEMANTIC_COLOR) { 1341235becaa1cf7e29f580900592563c3329d326deJerome Glisse num_cout++; 1351235becaa1cf7e29f580900592563c3329d326deJerome 
Glisse } 1361235becaa1cf7e29f580900592563c3329d326deJerome Glisse } 1371235becaa1cf7e29f580900592563c3329d326deJerome Glisse exports_ps |= S_028854_EXPORT_COLORS(num_cout); 1381235becaa1cf7e29f580900592563c3329d326deJerome Glisse if (!exports_ps) { 1391235becaa1cf7e29f580900592563c3329d326deJerome Glisse /* always at least export 1 component per pixel */ 1401235becaa1cf7e29f580900592563c3329d326deJerome Glisse exports_ps = 2; 1411235becaa1cf7e29f580900592563c3329d326deJerome Glisse } 1421235becaa1cf7e29f580900592563c3329d326deJerome Glisse 1431235becaa1cf7e29f580900592563c3329d326deJerome Glisse spi_ps_in_control_0 = S_0286CC_NUM_INTERP(rshader->ninput) | 1441235becaa1cf7e29f580900592563c3329d326deJerome Glisse S_0286CC_PERSP_GRADIENT_ENA(1); 1451235becaa1cf7e29f580900592563c3329d326deJerome Glisse spi_input_z = 0; 1461e82c28fcf76bf79ceb5a1eaf29b3d6d25909dddDave Airlie if (pos_index != -1) { 1471e82c28fcf76bf79ceb5a1eaf29b3d6d25909dddDave Airlie spi_ps_in_control_0 |= (S_0286CC_POSITION_ENA(1) | 1481e82c28fcf76bf79ceb5a1eaf29b3d6d25909dddDave Airlie S_0286CC_POSITION_CENTROID(rshader->input[pos_index].centroid) | 1491e82c28fcf76bf79ceb5a1eaf29b3d6d25909dddDave Airlie S_0286CC_POSITION_ADDR(rshader->input[pos_index].gpr) | 1501e82c28fcf76bf79ceb5a1eaf29b3d6d25909dddDave Airlie S_0286CC_BARYC_SAMPLE_CNTL(1)); 1511235becaa1cf7e29f580900592563c3329d326deJerome Glisse spi_input_z |= 1; 1521235becaa1cf7e29f580900592563c3329d326deJerome Glisse } 1531e82c28fcf76bf79ceb5a1eaf29b3d6d25909dddDave Airlie 1541e82c28fcf76bf79ceb5a1eaf29b3d6d25909dddDave Airlie spi_ps_in_control_1 = 0; 1551e82c28fcf76bf79ceb5a1eaf29b3d6d25909dddDave Airlie if (face_index != -1) { 1561e82c28fcf76bf79ceb5a1eaf29b3d6d25909dddDave Airlie spi_ps_in_control_1 |= S_0286D0_FRONT_FACE_ENA(1) | 1570637044add50b3a4aee8e915b84c18813c9130f3Dave Airlie S_0286D0_FRONT_FACE_ADDR(rshader->input[face_index].gpr); 1581e82c28fcf76bf79ceb5a1eaf29b3d6d25909dddDave Airlie } 
1591e82c28fcf76bf79ceb5a1eaf29b3d6d25909dddDave Airlie 1601235becaa1cf7e29f580900592563c3329d326deJerome Glisse r600_pipe_state_add_reg(rstate, R_0286CC_SPI_PS_IN_CONTROL_0, spi_ps_in_control_0, 0xFFFFFFFF, NULL); 1611e82c28fcf76bf79ceb5a1eaf29b3d6d25909dddDave Airlie r600_pipe_state_add_reg(rstate, R_0286D0_SPI_PS_IN_CONTROL_1, spi_ps_in_control_1, 0xFFFFFFFF, NULL); 1621235becaa1cf7e29f580900592563c3329d326deJerome Glisse r600_pipe_state_add_reg(rstate, R_0286D8_SPI_INPUT_Z, spi_input_z, 0xFFFFFFFF, NULL); 1631235becaa1cf7e29f580900592563c3329d326deJerome Glisse r600_pipe_state_add_reg(rstate, 1641235becaa1cf7e29f580900592563c3329d326deJerome Glisse R_028840_SQ_PGM_START_PS, 165d22a1247d8a709cf433a6dd99b2f87a224c27d88Jerome Glisse r600_bo_offset(shader->bo) >> 8, 0xFFFFFFFF, shader->bo); 1661235becaa1cf7e29f580900592563c3329d326deJerome Glisse r600_pipe_state_add_reg(rstate, 1671235becaa1cf7e29f580900592563c3329d326deJerome Glisse R_028850_SQ_PGM_RESOURCES_PS, 1681235becaa1cf7e29f580900592563c3329d326deJerome Glisse S_028868_NUM_GPRS(rshader->bc.ngpr) | 1691235becaa1cf7e29f580900592563c3329d326deJerome Glisse S_028868_STACK_SIZE(rshader->bc.nstack), 1701235becaa1cf7e29f580900592563c3329d326deJerome Glisse 0xFFFFFFFF, NULL); 1711235becaa1cf7e29f580900592563c3329d326deJerome Glisse r600_pipe_state_add_reg(rstate, 1721235becaa1cf7e29f580900592563c3329d326deJerome Glisse R_028854_SQ_PGM_EXPORTS_PS, 1731235becaa1cf7e29f580900592563c3329d326deJerome Glisse exports_ps, 0xFFFFFFFF, NULL); 1741235becaa1cf7e29f580900592563c3329d326deJerome Glisse r600_pipe_state_add_reg(rstate, 1751235becaa1cf7e29f580900592563c3329d326deJerome Glisse R_0288CC_SQ_PGM_CF_OFFSET_PS, 1761235becaa1cf7e29f580900592563c3329d326deJerome Glisse 0x00000000, 0xFFFFFFFF, NULL); 1771235becaa1cf7e29f580900592563c3329d326deJerome Glisse 1785555cd776b970bce020be59193054474a2a63317Dave Airlie if (rshader->fs_write_all) { 1795555cd776b970bce020be59193054474a2a63317Dave Airlie r600_pipe_state_add_reg(rstate, 
R_028808_CB_COLOR_CONTROL, 1805555cd776b970bce020be59193054474a2a63317Dave Airlie S_028808_MULTIWRITE_ENABLE(1), 1815555cd776b970bce020be59193054474a2a63317Dave Airlie S_028808_MULTIWRITE_ENABLE(1), 1825555cd776b970bce020be59193054474a2a63317Dave Airlie NULL); 1835555cd776b970bce020be59193054474a2a63317Dave Airlie } 1845555cd776b970bce020be59193054474a2a63317Dave Airlie 1851235becaa1cf7e29f580900592563c3329d326deJerome Glisse if (rshader->uses_kill) { 1861235becaa1cf7e29f580900592563c3329d326deJerome Glisse /* only set some bits here, the other bits are set in the dsa state */ 1871235becaa1cf7e29f580900592563c3329d326deJerome Glisse r600_pipe_state_add_reg(rstate, 1881235becaa1cf7e29f580900592563c3329d326deJerome Glisse R_02880C_DB_SHADER_CONTROL, 1891235becaa1cf7e29f580900592563c3329d326deJerome Glisse S_02880C_KILL_ENABLE(1), 1901235becaa1cf7e29f580900592563c3329d326deJerome Glisse S_02880C_KILL_ENABLE(1), NULL); 1911235becaa1cf7e29f580900592563c3329d326deJerome Glisse } 192738aa29289296512959cbb37d8602131dae44dabDave Airlie r600_pipe_state_add_reg(rstate, 193738aa29289296512959cbb37d8602131dae44dabDave Airlie R_03E200_SQ_LOOP_CONST_0, 0x01000FFF, 194738aa29289296512959cbb37d8602131dae44dabDave Airlie 0xFFFFFFFF, NULL); 1951235becaa1cf7e29f580900592563c3329d326deJerome Glisse} 1961235becaa1cf7e29f580900592563c3329d326deJerome Glisse 19769251fc4cd5f71be403e08398bc43d19052a640dJerome Glisseint r600_pipe_shader(struct pipe_context *ctx, struct r600_pipe_shader *shader) 1981235becaa1cf7e29f580900592563c3329d326deJerome Glisse{ 1991235becaa1cf7e29f580900592563c3329d326deJerome Glisse struct r600_pipe_context *rctx = (struct r600_pipe_context *)ctx; 2001235becaa1cf7e29f580900592563c3329d326deJerome Glisse struct r600_shader *rshader = &shader->shader; 2011235becaa1cf7e29f580900592563c3329d326deJerome Glisse void *ptr; 2021235becaa1cf7e29f580900592563c3329d326deJerome Glisse 2031235becaa1cf7e29f580900592563c3329d326deJerome Glisse /* copy new shader */ 
2041235becaa1cf7e29f580900592563c3329d326deJerome Glisse if (shader->bo == NULL) { 20529c4a15bf61a76cd71ffa5b8f09706d0eab84281Keith Whitwell shader->bo = r600_bo(rctx->radeon, rshader->bc.ndw * 4, 4096, 0, 0); 2061235becaa1cf7e29f580900592563c3329d326deJerome Glisse if (shader->bo == NULL) { 2071235becaa1cf7e29f580900592563c3329d326deJerome Glisse return -ENOMEM; 2081235becaa1cf7e29f580900592563c3329d326deJerome Glisse } 209294c9fce1b924beddf198a3cce738b88eabb5537Jerome Glisse ptr = r600_bo_map(rctx->radeon, shader->bo, 0, NULL); 2101235becaa1cf7e29f580900592563c3329d326deJerome Glisse memcpy(ptr, rshader->bc.bytecode, rshader->bc.ndw * 4); 211294c9fce1b924beddf198a3cce738b88eabb5537Jerome Glisse r600_bo_unmap(rctx->radeon, shader->bo); 2121235becaa1cf7e29f580900592563c3329d326deJerome Glisse } 2131235becaa1cf7e29f580900592563c3329d326deJerome Glisse /* build state */ 2141235becaa1cf7e29f580900592563c3329d326deJerome Glisse switch (rshader->processor_type) { 2151235becaa1cf7e29f580900592563c3329d326deJerome Glisse case TGSI_PROCESSOR_VERTEX: 2161235becaa1cf7e29f580900592563c3329d326deJerome Glisse if (rshader->family >= CHIP_CEDAR) { 2171235becaa1cf7e29f580900592563c3329d326deJerome Glisse evergreen_pipe_shader_vs(ctx, shader); 2181235becaa1cf7e29f580900592563c3329d326deJerome Glisse } else { 2191235becaa1cf7e29f580900592563c3329d326deJerome Glisse r600_pipe_shader_vs(ctx, shader); 2201235becaa1cf7e29f580900592563c3329d326deJerome Glisse } 2211235becaa1cf7e29f580900592563c3329d326deJerome Glisse break; 2221235becaa1cf7e29f580900592563c3329d326deJerome Glisse case TGSI_PROCESSOR_FRAGMENT: 2231235becaa1cf7e29f580900592563c3329d326deJerome Glisse if (rshader->family >= CHIP_CEDAR) { 2241235becaa1cf7e29f580900592563c3329d326deJerome Glisse evergreen_pipe_shader_ps(ctx, shader); 2251235becaa1cf7e29f580900592563c3329d326deJerome Glisse } else { 2261235becaa1cf7e29f580900592563c3329d326deJerome Glisse r600_pipe_shader_ps(ctx, shader); 
2271235becaa1cf7e29f580900592563c3329d326deJerome Glisse } 2281235becaa1cf7e29f580900592563c3329d326deJerome Glisse break; 2291235becaa1cf7e29f580900592563c3329d326deJerome Glisse default: 2301235becaa1cf7e29f580900592563c3329d326deJerome Glisse return -EINVAL; 2311235becaa1cf7e29f580900592563c3329d326deJerome Glisse } 2321235becaa1cf7e29f580900592563c3329d326deJerome Glisse return 0; 2331235becaa1cf7e29f580900592563c3329d326deJerome Glisse} 2341235becaa1cf7e29f580900592563c3329d326deJerome Glisse 23596f8f8db7bcddec7ef0fce62cf0e23f1c2fb8c8dChristian Königint r600_shader_from_tgsi(const struct tgsi_token *tokens, struct r600_shader *shader, u32 **literals); 236dbcd6526021c50770c3e5e04b04dc64c70298124Dave Airlieint r600_pipe_shader_create(struct pipe_context *ctx, struct r600_pipe_shader *shader, const struct tgsi_token *tokens) 2371235becaa1cf7e29f580900592563c3329d326deJerome Glisse{ 238052b9e8fab2e7deddf7f287d63c45aa938e5ec67Christian König static int dump_shaders = -1; 2391235becaa1cf7e29f580900592563c3329d326deJerome Glisse struct r600_pipe_context *rctx = (struct r600_pipe_context *)ctx; 24096f8f8db7bcddec7ef0fce62cf0e23f1c2fb8c8dChristian König u32 *literals; 2411235becaa1cf7e29f580900592563c3329d326deJerome Glisse int r; 2421235becaa1cf7e29f580900592563c3329d326deJerome Glisse 243052b9e8fab2e7deddf7f287d63c45aa938e5ec67Christian König /* Would like some magic "get_bool_option_once" routine. 
244052b9e8fab2e7deddf7f287d63c45aa938e5ec67Christian König */ 245052b9e8fab2e7deddf7f287d63c45aa938e5ec67Christian König if (dump_shaders == -1) 246052b9e8fab2e7deddf7f287d63c45aa938e5ec67Christian König dump_shaders = debug_get_bool_option("R600_DUMP_SHADERS", FALSE); 247052b9e8fab2e7deddf7f287d63c45aa938e5ec67Christian König 248052b9e8fab2e7deddf7f287d63c45aa938e5ec67Christian König if (dump_shaders) { 249052b9e8fab2e7deddf7f287d63c45aa938e5ec67Christian König fprintf(stderr, "--------------------------------------------------------------\n"); 250052b9e8fab2e7deddf7f287d63c45aa938e5ec67Christian König tgsi_dump(tokens, 0); 251052b9e8fab2e7deddf7f287d63c45aa938e5ec67Christian König } 2521235becaa1cf7e29f580900592563c3329d326deJerome Glisse shader->shader.family = r600_get_family(rctx->radeon); 25396f8f8db7bcddec7ef0fce62cf0e23f1c2fb8c8dChristian König r = r600_shader_from_tgsi(tokens, &shader->shader, &literals); 2541235becaa1cf7e29f580900592563c3329d326deJerome Glisse if (r) { 2551235becaa1cf7e29f580900592563c3329d326deJerome Glisse R600_ERR("translation from TGSI failed !\n"); 2561235becaa1cf7e29f580900592563c3329d326deJerome Glisse return r; 2571235becaa1cf7e29f580900592563c3329d326deJerome Glisse } 2581235becaa1cf7e29f580900592563c3329d326deJerome Glisse r = r600_bc_build(&shader->shader.bc); 25996f8f8db7bcddec7ef0fce62cf0e23f1c2fb8c8dChristian König free(literals); 2601235becaa1cf7e29f580900592563c3329d326deJerome Glisse if (r) { 2611235becaa1cf7e29f580900592563c3329d326deJerome Glisse R600_ERR("building bytecode failed !\n"); 2621235becaa1cf7e29f580900592563c3329d326deJerome Glisse return r; 2631235becaa1cf7e29f580900592563c3329d326deJerome Glisse } 264052b9e8fab2e7deddf7f287d63c45aa938e5ec67Christian König if (dump_shaders) { 265052b9e8fab2e7deddf7f287d63c45aa938e5ec67Christian König r600_bc_dump(&shader->shader.bc); 266052b9e8fab2e7deddf7f287d63c45aa938e5ec67Christian König fprintf(stderr, 
"______________________________________________________________\n"); 267052b9e8fab2e7deddf7f287d63c45aa938e5ec67Christian König } 268afc56b1861c1dae4137493af4c0e6dacc6ee41f9Jerome Glisse return r600_pipe_shader(ctx, shader); 2691235becaa1cf7e29f580900592563c3329d326deJerome Glisse} 2701235becaa1cf7e29f580900592563c3329d326deJerome Glisse 27169251fc4cd5f71be403e08398bc43d19052a640dJerome Glissevoid r600_pipe_shader_destroy(struct pipe_context *ctx, struct r600_pipe_shader *shader) 272ccb9be105602edaaff196046e324c8cb4a12fe0aTilman Sauerbeck{ 273ccb9be105602edaaff196046e324c8cb4a12fe0aTilman Sauerbeck struct r600_pipe_context *rctx = (struct r600_pipe_context *)ctx; 274ccb9be105602edaaff196046e324c8cb4a12fe0aTilman Sauerbeck 275ccb9be105602edaaff196046e324c8cb4a12fe0aTilman Sauerbeck r600_bo_reference(rctx->radeon, &shader->bo, NULL); 276f4a2c62af56ce10e43688e8283f8defeb05cef1aTilman Sauerbeck r600_bc_clear(&shader->shader.bc); 277ccb9be105602edaaff196046e324c8cb4a12fe0aTilman Sauerbeck} 278ccb9be105602edaaff196046e324c8cb4a12fe0aTilman Sauerbeck 2791235becaa1cf7e29f580900592563c3329d326deJerome Glisse/* 2801235becaa1cf7e29f580900592563c3329d326deJerome Glisse * tgsi -> r600 shader 2811235becaa1cf7e29f580900592563c3329d326deJerome Glisse */ 2822b3b76a4a0e21eb4bd4f1a4da5ff6ed26ccbabd1Jerome Glissestruct r600_shader_tgsi_instruction; 2832b3b76a4a0e21eb4bd4f1a4da5ff6ed26ccbabd1Jerome Glisse 2842b3b76a4a0e21eb4bd4f1a4da5ff6ed26ccbabd1Jerome Glissestruct r600_shader_ctx { 2852b3b76a4a0e21eb4bd4f1a4da5ff6ed26ccbabd1Jerome Glisse struct tgsi_shader_info info; 2862b3b76a4a0e21eb4bd4f1a4da5ff6ed26ccbabd1Jerome Glisse struct tgsi_parse_context parse; 2872b3b76a4a0e21eb4bd4f1a4da5ff6ed26ccbabd1Jerome Glisse const struct tgsi_token *tokens; 2882b3b76a4a0e21eb4bd4f1a4da5ff6ed26ccbabd1Jerome Glisse unsigned type; 2892b3b76a4a0e21eb4bd4f1a4da5ff6ed26ccbabd1Jerome Glisse unsigned file_offset[TGSI_FILE_COUNT]; 2902b3b76a4a0e21eb4bd4f1a4da5ff6ed26ccbabd1Jerome Glisse unsigned temp_reg; 
2912b3b76a4a0e21eb4bd4f1a4da5ff6ed26ccbabd1Jerome Glisse struct r600_shader_tgsi_instruction *inst_info; 2922b3b76a4a0e21eb4bd4f1a4da5ff6ed26ccbabd1Jerome Glisse struct r600_bc *bc; 2932b3b76a4a0e21eb4bd4f1a4da5ff6ed26ccbabd1Jerome Glisse struct r600_shader *shader; 294cd4bd4fb53f82361480f388923ef9e2fa7379d68Bas Nieuwenhuizen u32 *literals; 295cd4bd4fb53f82361480f388923ef9e2fa7379d68Bas Nieuwenhuizen u32 nliterals; 296e0b6df4fcce0964ea7930efeb40cb487b4c53337John Doe u32 max_driver_temp_used; 297fc6caef4cb67fb13642c5ebccee53019d1764df6Dave Airlie /* needed for evergreen interpolation */ 298fc6caef4cb67fb13642c5ebccee53019d1764df6Dave Airlie boolean input_centroid; 299fc6caef4cb67fb13642c5ebccee53019d1764df6Dave Airlie boolean input_linear; 300fc6caef4cb67fb13642c5ebccee53019d1764df6Dave Airlie boolean input_perspective; 301fc6caef4cb67fb13642c5ebccee53019d1764df6Dave Airlie int num_interp_gpr; 3022b3b76a4a0e21eb4bd4f1a4da5ff6ed26ccbabd1Jerome Glisse}; 3032b3b76a4a0e21eb4bd4f1a4da5ff6ed26ccbabd1Jerome Glisse 3042b3b76a4a0e21eb4bd4f1a4da5ff6ed26ccbabd1Jerome Glissestruct r600_shader_tgsi_instruction { 3052b3b76a4a0e21eb4bd4f1a4da5ff6ed26ccbabd1Jerome Glisse unsigned tgsi_opcode; 3062b3b76a4a0e21eb4bd4f1a4da5ff6ed26ccbabd1Jerome Glisse unsigned is_op3; 3072b3b76a4a0e21eb4bd4f1a4da5ff6ed26ccbabd1Jerome Glisse unsigned r600_opcode; 3082b3b76a4a0e21eb4bd4f1a4da5ff6ed26ccbabd1Jerome Glisse int (*process)(struct r600_shader_ctx *ctx); 3092b3b76a4a0e21eb4bd4f1a4da5ff6ed26ccbabd1Jerome Glisse}; 3102b3b76a4a0e21eb4bd4f1a4da5ff6ed26ccbabd1Jerome Glisse 31150526e094f4c66957c7f74c190c35903bc82fb62Dave Airliestatic struct r600_shader_tgsi_instruction r600_shader_tgsi_instruction[], eg_shader_tgsi_instruction[]; 31242c966bc496d4049d98eb1d45dd7bb0b55fa41bdTilman Sauerbeckstatic int tgsi_helper_tempx_replicate(struct r600_shader_ctx *ctx); 313de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse 314de553d906b4a205d811a9e1651f14212ec284e29Jerome Glissestatic int 
tgsi_is_supported(struct r600_shader_ctx *ctx) 315de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse{ 316de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse struct tgsi_full_instruction *i = &ctx->parse.FullToken.FullInstruction; 317de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse int j; 318de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse 319de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse if (i->Instruction.NumDstRegs > 1) { 320de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse R600_ERR("too many dst (%d)\n", i->Instruction.NumDstRegs); 321de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse return -EINVAL; 32272128962d640846472c1b0dc22cf4ac6ce875dc9Jerome Glisse } 323de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse if (i->Instruction.Predicate) { 324de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse R600_ERR("predicate unsupported\n"); 325de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse return -EINVAL; 326c6131879eb7dfdf26cd068109f6680608d608ab4Jerome Glisse } 327a03d456f5a41926e39194de70b2d50776e64b8a2Dave Airlie#if 0 328de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse if (i->Instruction.Label) { 329de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse R600_ERR("label unsupported\n"); 330de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse return -EINVAL; 33172128962d640846472c1b0dc22cf4ac6ce875dc9Jerome Glisse } 332a03d456f5a41926e39194de70b2d50776e64b8a2Dave Airlie#endif 333de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse for (j = 0; j < i->Instruction.NumSrcRegs; j++) { 3348260ab93461eca3e18f9c17a9ca1961a11372071Keith Whitwell if (i->Src[j].Register.Dimension) { 3358260ab93461eca3e18f9c17a9ca1961a11372071Keith Whitwell R600_ERR("unsupported src %d (dimension %d)\n", j, 3368260ab93461eca3e18f9c17a9ca1961a11372071Keith Whitwell i->Src[j].Register.Dimension); 337de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse return -EINVAL; 338de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse } 
339de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse } 340de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse for (j = 0; j < i->Instruction.NumDstRegs; j++) { 34147d5a19df1e7760c4f5f0e340bfc56355c2e428bDave Airlie if (i->Dst[j].Register.Dimension) { 34247d5a19df1e7760c4f5f0e340bfc56355c2e428bDave Airlie R600_ERR("unsupported dst (dimension)\n"); 343de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse return -EINVAL; 344de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse } 345de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse } 346de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse return 0; 34772128962d640846472c1b0dc22cf4ac6ce875dc9Jerome Glisse} 34872128962d640846472c1b0dc22cf4ac6ce875dc9Jerome Glisse 349fc6caef4cb67fb13642c5ebccee53019d1764df6Dave Airliestatic int evergreen_interp_alu(struct r600_shader_ctx *ctx, int input) 35050526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie{ 35150526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie int i, r; 35250526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie struct r600_bc_alu alu; 353fc6caef4cb67fb13642c5ebccee53019d1764df6Dave Airlie int gpr = 0, base_chan = 0; 354fc6caef4cb67fb13642c5ebccee53019d1764df6Dave Airlie int ij_index = 0; 355fc6caef4cb67fb13642c5ebccee53019d1764df6Dave Airlie 356fc6caef4cb67fb13642c5ebccee53019d1764df6Dave Airlie if (ctx->shader->input[input].interpolate == TGSI_INTERPOLATE_PERSPECTIVE) { 357fc6caef4cb67fb13642c5ebccee53019d1764df6Dave Airlie ij_index = 0; 358fc6caef4cb67fb13642c5ebccee53019d1764df6Dave Airlie if (ctx->shader->input[input].centroid) 359fc6caef4cb67fb13642c5ebccee53019d1764df6Dave Airlie ij_index++; 360fc6caef4cb67fb13642c5ebccee53019d1764df6Dave Airlie } else if (ctx->shader->input[input].interpolate == TGSI_INTERPOLATE_LINEAR) { 361fc6caef4cb67fb13642c5ebccee53019d1764df6Dave Airlie ij_index = 0; 362fc6caef4cb67fb13642c5ebccee53019d1764df6Dave Airlie /* if we have perspective add one */ 363fc6caef4cb67fb13642c5ebccee53019d1764df6Dave Airlie if 
(ctx->input_perspective) { 364fc6caef4cb67fb13642c5ebccee53019d1764df6Dave Airlie ij_index++; 365fc6caef4cb67fb13642c5ebccee53019d1764df6Dave Airlie /* if we have perspective centroid */ 366fc6caef4cb67fb13642c5ebccee53019d1764df6Dave Airlie if (ctx->input_centroid) 367fc6caef4cb67fb13642c5ebccee53019d1764df6Dave Airlie ij_index++; 368fc6caef4cb67fb13642c5ebccee53019d1764df6Dave Airlie } 369fc6caef4cb67fb13642c5ebccee53019d1764df6Dave Airlie if (ctx->shader->input[input].centroid) 370fc6caef4cb67fb13642c5ebccee53019d1764df6Dave Airlie ij_index++; 371fc6caef4cb67fb13642c5ebccee53019d1764df6Dave Airlie } 3727ffd4e976fd11b8c083c2927effd25a2f79ac841Jerome Glisse 373fc6caef4cb67fb13642c5ebccee53019d1764df6Dave Airlie /* work out gpr and base_chan from index */ 374fc6caef4cb67fb13642c5ebccee53019d1764df6Dave Airlie gpr = ij_index / 2; 375fc6caef4cb67fb13642c5ebccee53019d1764df6Dave Airlie base_chan = (2 * (ij_index % 2)) + 1; 37650526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie 37750526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie for (i = 0; i < 8; i++) { 37850526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie memset(&alu, 0, sizeof(struct r600_bc_alu)); 37950526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie 38050526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie if (i < 4) 38150526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie alu.inst = EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INTERP_ZW; 38250526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie else 38350526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie alu.inst = EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INTERP_XY; 38450526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie 38550526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie if ((i > 1) && (i < 6)) { 386fc6caef4cb67fb13642c5ebccee53019d1764df6Dave Airlie alu.dst.sel = ctx->shader->input[input].gpr; 38750526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie alu.dst.write = 1; 38850526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie } 38950526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie 
39050526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie alu.dst.chan = i % 4; 391fc6caef4cb67fb13642c5ebccee53019d1764df6Dave Airlie 392fc6caef4cb67fb13642c5ebccee53019d1764df6Dave Airlie alu.src[0].sel = gpr; 393fc6caef4cb67fb13642c5ebccee53019d1764df6Dave Airlie alu.src[0].chan = (base_chan - (i % 2)); 394fc6caef4cb67fb13642c5ebccee53019d1764df6Dave Airlie 395fc6caef4cb67fb13642c5ebccee53019d1764df6Dave Airlie alu.src[1].sel = V_SQ_ALU_SRC_PARAM_BASE + ctx->shader->input[input].lds_pos; 39650526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie 39750526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie alu.bank_swizzle_force = SQ_ALU_VEC_210; 39850526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie if ((i % 4) == 3) 39950526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie alu.last = 1; 40050526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie r = r600_bc_add_alu(ctx->bc, &alu); 40150526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie if (r) 40250526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie return r; 40350526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie } 40450526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie return 0; 4057ffd4e976fd11b8c083c2927effd25a2f79ac841Jerome Glisse} 4067ffd4e976fd11b8c083c2927effd25a2f79ac841Jerome Glisse 4077ffd4e976fd11b8c083c2927effd25a2f79ac841Jerome Glisse 408de553d906b4a205d811a9e1651f14212ec284e29Jerome Glissestatic int tgsi_declaration(struct r600_shader_ctx *ctx) 40972128962d640846472c1b0dc22cf4ac6ce875dc9Jerome Glisse{ 410de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse struct tgsi_full_declaration *d = &ctx->parse.FullToken.FullDeclaration; 411de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse unsigned i; 41272128962d640846472c1b0dc22cf4ac6ce875dc9Jerome Glisse 413de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse switch (d->Declaration.File) { 414de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse case TGSI_FILE_INPUT: 415de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse i = ctx->shader->ninput++; 
416de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse ctx->shader->input[i].name = d->Semantic.Name; 417de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse ctx->shader->input[i].sid = d->Semantic.Index; 41835e044ab562b65aa53f9d9d7b5885e6a887774bbJerome Glisse ctx->shader->input[i].interpolate = d->Declaration.Interpolate; 4198a9f02c5d503089bdcc90ff934f6269e59356d52Dave Airlie ctx->shader->input[i].centroid = d->Declaration.Centroid; 420de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse ctx->shader->input[i].gpr = ctx->file_offset[TGSI_FILE_INPUT] + i; 4214afd0683854ac1cfbe7118232b5e344c83d4b0c2Alex Deucher if (ctx->type == TGSI_PROCESSOR_FRAGMENT && ctx->bc->chiprev == CHIPREV_EVERGREEN) { 42250526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie /* turn input into interpolate on EG */ 423fc6caef4cb67fb13642c5ebccee53019d1764df6Dave Airlie if (ctx->shader->input[i].name != TGSI_SEMANTIC_POSITION) { 424fc6caef4cb67fb13642c5ebccee53019d1764df6Dave Airlie if (ctx->shader->input[i].interpolate > 0) { 425fc6caef4cb67fb13642c5ebccee53019d1764df6Dave Airlie ctx->shader->input[i].lds_pos = ctx->shader->nlds++; 426fc6caef4cb67fb13642c5ebccee53019d1764df6Dave Airlie evergreen_interp_alu(ctx, i); 427fc6caef4cb67fb13642c5ebccee53019d1764df6Dave Airlie } 428fc6caef4cb67fb13642c5ebccee53019d1764df6Dave Airlie } 42950526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie } 430de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse break; 431de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse case TGSI_FILE_OUTPUT: 432de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse i = ctx->shader->noutput++; 433de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse ctx->shader->output[i].name = d->Semantic.Name; 434de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse ctx->shader->output[i].sid = d->Semantic.Index; 435de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse ctx->shader->output[i].gpr = ctx->file_offset[TGSI_FILE_OUTPUT] + i; 43635e044ab562b65aa53f9d9d7b5885e6a887774bbJerome 
Glisse ctx->shader->output[i].interpolate = d->Declaration.Interpolate; 437de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse break; 438de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse case TGSI_FILE_CONSTANT: 439de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse case TGSI_FILE_TEMPORARY: 44033241134e6e3d5bf19141eceff90fd854b23386aJerome Glisse case TGSI_FILE_SAMPLER: 44147d5a19df1e7760c4f5f0e340bfc56355c2e428bDave Airlie case TGSI_FILE_ADDRESS: 442de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse break; 443de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse default: 444de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse R600_ERR("unsupported file %d declaration\n", d->Declaration.File); 445de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse return -EINVAL; 446de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse } 447de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse return 0; 44872128962d640846472c1b0dc22cf4ac6ce875dc9Jerome Glisse} 44972128962d640846472c1b0dc22cf4ac6ce875dc9Jerome Glisse 450be7816f2b7f0b064a47fb3f101477ad5dba74017Dave Airliestatic int r600_get_temp(struct r600_shader_ctx *ctx) 451be7816f2b7f0b064a47fb3f101477ad5dba74017Dave Airlie{ 452be7816f2b7f0b064a47fb3f101477ad5dba74017Dave Airlie return ctx->temp_reg + ctx->max_driver_temp_used++; 453be7816f2b7f0b064a47fb3f101477ad5dba74017Dave Airlie} 454be7816f2b7f0b064a47fb3f101477ad5dba74017Dave Airlie 4557ffd4e976fd11b8c083c2927effd25a2f79ac841Jerome Glisse/* 456fc6caef4cb67fb13642c5ebccee53019d1764df6Dave Airlie * for evergreen we need to scan the shader to find the number of GPRs we need to 457fc6caef4cb67fb13642c5ebccee53019d1764df6Dave Airlie * reserve for interpolation. 
458fc6caef4cb67fb13642c5ebccee53019d1764df6Dave Airlie * 459fc6caef4cb67fb13642c5ebccee53019d1764df6Dave Airlie * we need to know if we are going to emit 460fc6caef4cb67fb13642c5ebccee53019d1764df6Dave Airlie * any centroid inputs 461fc6caef4cb67fb13642c5ebccee53019d1764df6Dave Airlie * if perspective and linear are required 462fc6caef4cb67fb13642c5ebccee53019d1764df6Dave Airlie*/ 463fc6caef4cb67fb13642c5ebccee53019d1764df6Dave Airliestatic int evergreen_gpr_count(struct r600_shader_ctx *ctx) 464fc6caef4cb67fb13642c5ebccee53019d1764df6Dave Airlie{ 465fc6caef4cb67fb13642c5ebccee53019d1764df6Dave Airlie int i; 466fc6caef4cb67fb13642c5ebccee53019d1764df6Dave Airlie int num_baryc; 467fc6caef4cb67fb13642c5ebccee53019d1764df6Dave Airlie 468fc6caef4cb67fb13642c5ebccee53019d1764df6Dave Airlie ctx->input_linear = FALSE; 469fc6caef4cb67fb13642c5ebccee53019d1764df6Dave Airlie ctx->input_perspective = FALSE; 470fc6caef4cb67fb13642c5ebccee53019d1764df6Dave Airlie ctx->input_centroid = FALSE; 471fc6caef4cb67fb13642c5ebccee53019d1764df6Dave Airlie ctx->num_interp_gpr = 1; 472fc6caef4cb67fb13642c5ebccee53019d1764df6Dave Airlie 473fc6caef4cb67fb13642c5ebccee53019d1764df6Dave Airlie /* any centroid inputs */ 474fc6caef4cb67fb13642c5ebccee53019d1764df6Dave Airlie for (i = 0; i < ctx->info.num_inputs; i++) { 475fc6caef4cb67fb13642c5ebccee53019d1764df6Dave Airlie /* skip position/face */ 476fc6caef4cb67fb13642c5ebccee53019d1764df6Dave Airlie if (ctx->info.input_semantic_name[i] == TGSI_SEMANTIC_POSITION || 477fc6caef4cb67fb13642c5ebccee53019d1764df6Dave Airlie ctx->info.input_semantic_name[i] == TGSI_SEMANTIC_FACE) 478fc6caef4cb67fb13642c5ebccee53019d1764df6Dave Airlie continue; 479fc6caef4cb67fb13642c5ebccee53019d1764df6Dave Airlie if (ctx->info.input_interpolate[i] == TGSI_INTERPOLATE_LINEAR) 480fc6caef4cb67fb13642c5ebccee53019d1764df6Dave Airlie ctx->input_linear = TRUE; 481fc6caef4cb67fb13642c5ebccee53019d1764df6Dave Airlie if (ctx->info.input_interpolate[i] == 
TGSI_INTERPOLATE_PERSPECTIVE) 482fc6caef4cb67fb13642c5ebccee53019d1764df6Dave Airlie ctx->input_perspective = TRUE; 483fc6caef4cb67fb13642c5ebccee53019d1764df6Dave Airlie if (ctx->info.input_centroid[i]) 484fc6caef4cb67fb13642c5ebccee53019d1764df6Dave Airlie ctx->input_centroid = TRUE; 485fc6caef4cb67fb13642c5ebccee53019d1764df6Dave Airlie } 486fc6caef4cb67fb13642c5ebccee53019d1764df6Dave Airlie 487fc6caef4cb67fb13642c5ebccee53019d1764df6Dave Airlie num_baryc = 0; 488fc6caef4cb67fb13642c5ebccee53019d1764df6Dave Airlie /* ignoring sample for now */ 489fc6caef4cb67fb13642c5ebccee53019d1764df6Dave Airlie if (ctx->input_perspective) 490fc6caef4cb67fb13642c5ebccee53019d1764df6Dave Airlie num_baryc++; 491fc6caef4cb67fb13642c5ebccee53019d1764df6Dave Airlie if (ctx->input_linear) 492fc6caef4cb67fb13642c5ebccee53019d1764df6Dave Airlie num_baryc++; 493fc6caef4cb67fb13642c5ebccee53019d1764df6Dave Airlie if (ctx->input_centroid) 494fc6caef4cb67fb13642c5ebccee53019d1764df6Dave Airlie num_baryc *= 2; 495fc6caef4cb67fb13642c5ebccee53019d1764df6Dave Airlie 496fc6caef4cb67fb13642c5ebccee53019d1764df6Dave Airlie ctx->num_interp_gpr += (num_baryc + 1) >> 1; 497fc6caef4cb67fb13642c5ebccee53019d1764df6Dave Airlie 498fc6caef4cb67fb13642c5ebccee53019d1764df6Dave Airlie /* TODO PULL MODEL and LINE STIPPLE, FIXED PT POS */ 499fc6caef4cb67fb13642c5ebccee53019d1764df6Dave Airlie return ctx->num_interp_gpr; 500fc6caef4cb67fb13642c5ebccee53019d1764df6Dave Airlie} 501fc6caef4cb67fb13642c5ebccee53019d1764df6Dave Airlie 50296f8f8db7bcddec7ef0fce62cf0e23f1c2fb8c8dChristian Königint r600_shader_from_tgsi(const struct tgsi_token *tokens, struct r600_shader *shader, u32 **literals) 50372128962d640846472c1b0dc22cf4ac6ce875dc9Jerome Glisse{ 504de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse struct tgsi_full_immediate *immediate; 5055555cd776b970bce020be59193054474a2a63317Dave Airlie struct tgsi_full_property *property; 506de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse struct 
r600_shader_ctx ctx; 507c3ad060488ffd98f1c6dc9127b46324c5201f434Jerome Glisse struct r600_bc_output output[32]; 508457378e031ffb89a2011604c7798a6f5f2142207Jerome Glisse unsigned output_done, noutput; 509de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse unsigned opcode; 510de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse int i, r = 0, pos0; 51172128962d640846472c1b0dc22cf4ac6ce875dc9Jerome Glisse 512de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse ctx.bc = &shader->bc; 513de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse ctx.shader = shader; 514de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse r = r600_bc_init(ctx.bc, shader->family); 515de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse if (r) 516de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse return r; 517de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse ctx.tokens = tokens; 518de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse tgsi_scan_shader(tokens, &ctx.info); 519de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse tgsi_parse_init(&ctx.parse, tokens); 520de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse ctx.type = ctx.parse.FullHeader.Processor.Processor; 521de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse shader->processor_type = ctx.type; 522f609b2ab0342d77a8beca9efb5fbc5b66ff98295Jerome Glisse ctx.bc->type = shader->processor_type; 523de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse 524de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse /* register allocations */ 525076c53879b90855ecf38602584f22e4ab6db7569Alex Deucher /* Values [0,127] correspond to GPR[0..127]. 526076c53879b90855ecf38602584f22e4ab6db7569Alex Deucher * Values [128,159] correspond to constant buffer bank 0 527076c53879b90855ecf38602584f22e4ab6db7569Alex Deucher * Values [160,191] correspond to constant buffer bank 1 528f39dfa0ab08d1328110afb5ed0ed16a8b5e3fbdaHenri Verbeet * Values [256,511] correspond to cfile constants c[0..255]. 
(Gone on EG) 529f39dfa0ab08d1328110afb5ed0ed16a8b5e3fbdaHenri Verbeet * Values [256,287] correspond to constant buffer bank 2 (EG) 530f39dfa0ab08d1328110afb5ed0ed16a8b5e3fbdaHenri Verbeet * Values [288,319] correspond to constant buffer bank 3 (EG) 531de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse * Other special values are shown in the list below. 532076c53879b90855ecf38602584f22e4ab6db7569Alex Deucher * 244 ALU_SRC_1_DBL_L: special constant 1.0 double-float, LSW. (RV670+) 533076c53879b90855ecf38602584f22e4ab6db7569Alex Deucher * 245 ALU_SRC_1_DBL_M: special constant 1.0 double-float, MSW. (RV670+) 534076c53879b90855ecf38602584f22e4ab6db7569Alex Deucher * 246 ALU_SRC_0_5_DBL_L: special constant 0.5 double-float, LSW. (RV670+) 535076c53879b90855ecf38602584f22e4ab6db7569Alex Deucher * 247 ALU_SRC_0_5_DBL_M: special constant 0.5 double-float, MSW. (RV670+) 536de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse * 248 SQ_ALU_SRC_0: special constant 0.0. 537de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse * 249 SQ_ALU_SRC_1: special constant 1.0 float. 538de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse * 250 SQ_ALU_SRC_1_INT: special constant 1 integer. 539de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse * 251 SQ_ALU_SRC_M_1_INT: special constant -1 integer. 540de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse * 252 SQ_ALU_SRC_0_5: special constant 0.5 float. 541de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse * 253 SQ_ALU_SRC_LITERAL: literal constant. 542de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse * 254 SQ_ALU_SRC_PV: previous vector result. 543de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse * 255 SQ_ALU_SRC_PS: previous scalar result. 
544de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse */ 545de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse for (i = 0; i < TGSI_FILE_COUNT; i++) { 546de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse ctx.file_offset[i] = 0; 547de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse } 548de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse if (ctx.type == TGSI_PROCESSOR_VERTEX) { 549de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse ctx.file_offset[TGSI_FILE_INPUT] = 1; 5504afd0683854ac1cfbe7118232b5e344c83d4b0c2Alex Deucher if (ctx.bc->chiprev == CHIPREV_EVERGREEN) { 551f609b2ab0342d77a8beca9efb5fbc5b66ff98295Jerome Glisse r600_bc_add_cfinst(ctx.bc, EG_V_SQ_CF_WORD1_SQ_CF_INST_CALL_FS); 552f609b2ab0342d77a8beca9efb5fbc5b66ff98295Jerome Glisse } else { 553f609b2ab0342d77a8beca9efb5fbc5b66ff98295Jerome Glisse r600_bc_add_cfinst(ctx.bc, V_SQ_CF_WORD1_SQ_CF_INST_CALL_FS); 554f609b2ab0342d77a8beca9efb5fbc5b66ff98295Jerome Glisse } 555de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse } 5564afd0683854ac1cfbe7118232b5e344c83d4b0c2Alex Deucher if (ctx.type == TGSI_PROCESSOR_FRAGMENT && ctx.bc->chiprev == CHIPREV_EVERGREEN) { 557fc6caef4cb67fb13642c5ebccee53019d1764df6Dave Airlie ctx.file_offset[TGSI_FILE_INPUT] = evergreen_gpr_count(&ctx); 55884457701b05ef29126d90c2fe72083278d26bd4fAndre Maasikas } 559de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse ctx.file_offset[TGSI_FILE_OUTPUT] = ctx.file_offset[TGSI_FILE_INPUT] + 560de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse ctx.info.file_count[TGSI_FILE_INPUT]; 561de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse ctx.file_offset[TGSI_FILE_TEMPORARY] = ctx.file_offset[TGSI_FILE_OUTPUT] + 562de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse ctx.info.file_count[TGSI_FILE_OUTPUT]; 563d2c06b5037fe9282cbbc0c7acd84a1b286716507Dave Airlie 56497e2aa31c6e735d5f6bd1d67a4dd8da2605aedc8Henri Verbeet /* Outside the GPR range. 
This will be translated to one of the 56597e2aa31c6e735d5f6bd1d67a4dd8da2605aedc8Henri Verbeet * kcache banks later. */ 56697e2aa31c6e735d5f6bd1d67a4dd8da2605aedc8Henri Verbeet ctx.file_offset[TGSI_FILE_CONSTANT] = 512; 567d42efb9e8df6ef872ab4f142e3daf1b6cb9eff11Dave Airlie 5687728bef29097c8406d35c6dd969544382abdf935Christian König ctx.file_offset[TGSI_FILE_IMMEDIATE] = V_SQ_ALU_SRC_LITERAL; 569de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse ctx.temp_reg = ctx.file_offset[TGSI_FILE_TEMPORARY] + 570de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse ctx.info.file_count[TGSI_FILE_TEMPORARY]; 571de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse 572cd4bd4fb53f82361480f388923ef9e2fa7379d68Bas Nieuwenhuizen ctx.nliterals = 0; 573cd4bd4fb53f82361480f388923ef9e2fa7379d68Bas Nieuwenhuizen ctx.literals = NULL; 5745555cd776b970bce020be59193054474a2a63317Dave Airlie shader->fs_write_all = FALSE; 575de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse while (!tgsi_parse_end_of_tokens(&ctx.parse)) { 576de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse tgsi_parse_token(&ctx.parse); 577de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse switch (ctx.parse.FullToken.Token.Type) { 578de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse case TGSI_TOKEN_TYPE_IMMEDIATE: 579de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse immediate = &ctx.parse.FullToken.FullImmediate; 580cd4bd4fb53f82361480f388923ef9e2fa7379d68Bas Nieuwenhuizen ctx.literals = realloc(ctx.literals, (ctx.nliterals + 1) * 16); 581cd4bd4fb53f82361480f388923ef9e2fa7379d68Bas Nieuwenhuizen if(ctx.literals == NULL) { 582cd4bd4fb53f82361480f388923ef9e2fa7379d68Bas Nieuwenhuizen r = -ENOMEM; 583cd4bd4fb53f82361480f388923ef9e2fa7379d68Bas Nieuwenhuizen goto out_err; 584cd4bd4fb53f82361480f388923ef9e2fa7379d68Bas Nieuwenhuizen } 585cd4bd4fb53f82361480f388923ef9e2fa7379d68Bas Nieuwenhuizen ctx.literals[ctx.nliterals * 4 + 0] = immediate->u[0].Uint; 586cd4bd4fb53f82361480f388923ef9e2fa7379d68Bas 
Nieuwenhuizen ctx.literals[ctx.nliterals * 4 + 1] = immediate->u[1].Uint; 587cd4bd4fb53f82361480f388923ef9e2fa7379d68Bas Nieuwenhuizen ctx.literals[ctx.nliterals * 4 + 2] = immediate->u[2].Uint; 588cd4bd4fb53f82361480f388923ef9e2fa7379d68Bas Nieuwenhuizen ctx.literals[ctx.nliterals * 4 + 3] = immediate->u[3].Uint; 589cd4bd4fb53f82361480f388923ef9e2fa7379d68Bas Nieuwenhuizen ctx.nliterals++; 590de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse break; 591de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse case TGSI_TOKEN_TYPE_DECLARATION: 592de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse r = tgsi_declaration(&ctx); 593de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse if (r) 594de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse goto out_err; 595de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse break; 596de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse case TGSI_TOKEN_TYPE_INSTRUCTION: 597de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse r = tgsi_is_supported(&ctx); 598de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse if (r) 599de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse goto out_err; 600be7816f2b7f0b064a47fb3f101477ad5dba74017Dave Airlie ctx.max_driver_temp_used = 0; 601be7816f2b7f0b064a47fb3f101477ad5dba74017Dave Airlie /* reserve first tmp for everyone */ 602be7816f2b7f0b064a47fb3f101477ad5dba74017Dave Airlie r600_get_temp(&ctx); 603de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse opcode = ctx.parse.FullToken.FullInstruction.Instruction.Opcode; 6044afd0683854ac1cfbe7118232b5e344c83d4b0c2Alex Deucher if (ctx.bc->chiprev == CHIPREV_EVERGREEN) 60550526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie ctx.inst_info = &eg_shader_tgsi_instruction[opcode]; 60650526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie else 60750526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie ctx.inst_info = &r600_shader_tgsi_instruction[opcode]; 608de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse r = ctx.inst_info->process(&ctx); 
609de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse if (r) 610de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse goto out_err; 611de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse break; 612876effb0e717e8e64050662f6ffa286c22065f5cDave Airlie case TGSI_TOKEN_TYPE_PROPERTY: 6135555cd776b970bce020be59193054474a2a63317Dave Airlie property = &ctx.parse.FullToken.FullProperty; 6145555cd776b970bce020be59193054474a2a63317Dave Airlie if (property->Property.PropertyName == TGSI_PROPERTY_FS_COLOR0_WRITES_ALL_CBUFS) { 6155555cd776b970bce020be59193054474a2a63317Dave Airlie if (property->u[0].Data == 1) 6165555cd776b970bce020be59193054474a2a63317Dave Airlie shader->fs_write_all = TRUE; 6175555cd776b970bce020be59193054474a2a63317Dave Airlie } 618876effb0e717e8e64050662f6ffa286c22065f5cDave Airlie break; 619de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse default: 620de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse R600_ERR("unsupported token type %d\n", ctx.parse.FullToken.Token.Type); 621de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse r = -EINVAL; 622de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse goto out_err; 623de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse } 624de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse } 625de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse /* export output */ 626457378e031ffb89a2011604c7798a6f5f2142207Jerome Glisse noutput = shader->noutput; 627457378e031ffb89a2011604c7798a6f5f2142207Jerome Glisse for (i = 0, pos0 = 0; i < noutput; i++) { 628c3ad060488ffd98f1c6dc9127b46324c5201f434Jerome Glisse memset(&output[i], 0, sizeof(struct r600_bc_output)); 629c3ad060488ffd98f1c6dc9127b46324c5201f434Jerome Glisse output[i].gpr = shader->output[i].gpr; 630c3ad060488ffd98f1c6dc9127b46324c5201f434Jerome Glisse output[i].elem_size = 3; 631c3ad060488ffd98f1c6dc9127b46324c5201f434Jerome Glisse output[i].swizzle_x = 0; 632c3ad060488ffd98f1c6dc9127b46324c5201f434Jerome Glisse output[i].swizzle_y = 1; 
633c3ad060488ffd98f1c6dc9127b46324c5201f434Jerome Glisse output[i].swizzle_z = 2; 634c3ad060488ffd98f1c6dc9127b46324c5201f434Jerome Glisse output[i].swizzle_w = 3; 635c3ad060488ffd98f1c6dc9127b46324c5201f434Jerome Glisse output[i].barrier = 1; 636c3ad060488ffd98f1c6dc9127b46324c5201f434Jerome Glisse output[i].type = V_SQ_CF_ALLOC_EXPORT_WORD0_SQ_EXPORT_PARAM; 637c3ad060488ffd98f1c6dc9127b46324c5201f434Jerome Glisse output[i].array_base = i - pos0; 638a3a94554f5a12f0626d9712ddcdc81b1e21d36c2Dave Airlie output[i].inst = BC_INST(ctx.bc, V_SQ_CF_ALLOC_EXPORT_WORD1_SQ_CF_INST_EXPORT); 639457378e031ffb89a2011604c7798a6f5f2142207Jerome Glisse switch (ctx.type) { 640de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse case TGSI_PROCESSOR_VERTEX: 641de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse if (shader->output[i].name == TGSI_SEMANTIC_POSITION) { 642c3ad060488ffd98f1c6dc9127b46324c5201f434Jerome Glisse output[i].array_base = 60; 643c3ad060488ffd98f1c6dc9127b46324c5201f434Jerome Glisse output[i].type = V_SQ_CF_ALLOC_EXPORT_WORD0_SQ_EXPORT_POS; 644de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse /* position doesn't count in array_base */ 645457378e031ffb89a2011604c7798a6f5f2142207Jerome Glisse pos0++; 646457378e031ffb89a2011604c7798a6f5f2142207Jerome Glisse } 647457378e031ffb89a2011604c7798a6f5f2142207Jerome Glisse if (shader->output[i].name == TGSI_SEMANTIC_PSIZE) { 648457378e031ffb89a2011604c7798a6f5f2142207Jerome Glisse output[i].array_base = 61; 649457378e031ffb89a2011604c7798a6f5f2142207Jerome Glisse output[i].type = V_SQ_CF_ALLOC_EXPORT_WORD0_SQ_EXPORT_POS; 650457378e031ffb89a2011604c7798a6f5f2142207Jerome Glisse /* position doesn't count in array_base */ 651457378e031ffb89a2011604c7798a6f5f2142207Jerome Glisse pos0++; 652de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse } 653de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse break; 654de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse case TGSI_PROCESSOR_FRAGMENT: 
655de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse if (shader->output[i].name == TGSI_SEMANTIC_COLOR) { 656b474478f206c6d81af78696d3d5ce156d4d413d7Jerome Glisse output[i].array_base = shader->output[i].sid; 657c3ad060488ffd98f1c6dc9127b46324c5201f434Jerome Glisse output[i].type = V_SQ_CF_ALLOC_EXPORT_WORD0_SQ_EXPORT_PIXEL; 6585f6ab5e259de826bb3795d90fdb0235c8997acb9Dave Airlie } else if (shader->output[i].name == TGSI_SEMANTIC_POSITION) { 659c3ad060488ffd98f1c6dc9127b46324c5201f434Jerome Glisse output[i].array_base = 61; 660b87b6e5bf798fcfa486e8082a09b4425a40cf3c4Dave Airlie output[i].swizzle_x = 2; 66139d1feb51e9dac794751e72f48faf26409a84b1cDave Airlie output[i].swizzle_y = 7; 66239d1feb51e9dac794751e72f48faf26409a84b1cDave Airlie output[i].swizzle_z = output[i].swizzle_w = 7; 66339d1feb51e9dac794751e72f48faf26409a84b1cDave Airlie output[i].type = V_SQ_CF_ALLOC_EXPORT_WORD0_SQ_EXPORT_PIXEL; 66439d1feb51e9dac794751e72f48faf26409a84b1cDave Airlie } else if (shader->output[i].name == TGSI_SEMANTIC_STENCIL) { 66539d1feb51e9dac794751e72f48faf26409a84b1cDave Airlie output[i].array_base = 61; 66639d1feb51e9dac794751e72f48faf26409a84b1cDave Airlie output[i].swizzle_x = 7; 66739d1feb51e9dac794751e72f48faf26409a84b1cDave Airlie output[i].swizzle_y = 1; 66839d1feb51e9dac794751e72f48faf26409a84b1cDave Airlie output[i].swizzle_z = output[i].swizzle_w = 7; 669c3ad060488ffd98f1c6dc9127b46324c5201f434Jerome Glisse output[i].type = V_SQ_CF_ALLOC_EXPORT_WORD0_SQ_EXPORT_PIXEL; 670de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse } else { 671de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse R600_ERR("unsupported fragment output name %d\n", shader->output[i].name); 672de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse r = -EINVAL; 673de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse goto out_err; 674de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse } 675de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse break; 
676de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse default: 677de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse R600_ERR("unsupported processor type %d\n", ctx.type); 678de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse r = -EINVAL; 679de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse goto out_err; 68072128962d640846472c1b0dc22cf4ac6ce875dc9Jerome Glisse } 681457378e031ffb89a2011604c7798a6f5f2142207Jerome Glisse } 682457378e031ffb89a2011604c7798a6f5f2142207Jerome Glisse /* add fake param output for vertex shader if no param is exported */ 683457378e031ffb89a2011604c7798a6f5f2142207Jerome Glisse if (ctx.type == TGSI_PROCESSOR_VERTEX) { 684457378e031ffb89a2011604c7798a6f5f2142207Jerome Glisse for (i = 0, pos0 = 0; i < noutput; i++) { 685457378e031ffb89a2011604c7798a6f5f2142207Jerome Glisse if (output[i].type == V_SQ_CF_ALLOC_EXPORT_WORD0_SQ_EXPORT_PARAM) { 686457378e031ffb89a2011604c7798a6f5f2142207Jerome Glisse pos0 = 1; 687457378e031ffb89a2011604c7798a6f5f2142207Jerome Glisse break; 688457378e031ffb89a2011604c7798a6f5f2142207Jerome Glisse } 689457378e031ffb89a2011604c7798a6f5f2142207Jerome Glisse } 690457378e031ffb89a2011604c7798a6f5f2142207Jerome Glisse if (!pos0) { 691457378e031ffb89a2011604c7798a6f5f2142207Jerome Glisse memset(&output[i], 0, sizeof(struct r600_bc_output)); 692457378e031ffb89a2011604c7798a6f5f2142207Jerome Glisse output[i].gpr = 0; 693457378e031ffb89a2011604c7798a6f5f2142207Jerome Glisse output[i].elem_size = 3; 694457378e031ffb89a2011604c7798a6f5f2142207Jerome Glisse output[i].swizzle_x = 0; 695457378e031ffb89a2011604c7798a6f5f2142207Jerome Glisse output[i].swizzle_y = 1; 696457378e031ffb89a2011604c7798a6f5f2142207Jerome Glisse output[i].swizzle_z = 2; 697457378e031ffb89a2011604c7798a6f5f2142207Jerome Glisse output[i].swizzle_w = 3; 698457378e031ffb89a2011604c7798a6f5f2142207Jerome Glisse output[i].barrier = 1; 699457378e031ffb89a2011604c7798a6f5f2142207Jerome Glisse output[i].type = V_SQ_CF_ALLOC_EXPORT_WORD0_SQ_EXPORT_PARAM; 
700457378e031ffb89a2011604c7798a6f5f2142207Jerome Glisse output[i].array_base = 0; 7017e5173d065f0da450cf553e3e3084a0f774919a3Dave Airlie output[i].inst = BC_INST(ctx.bc, V_SQ_CF_ALLOC_EXPORT_WORD1_SQ_CF_INST_EXPORT); 702457378e031ffb89a2011604c7798a6f5f2142207Jerome Glisse noutput++; 703de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse } 704c3ad060488ffd98f1c6dc9127b46324c5201f434Jerome Glisse } 705481b65abaedb271d0da24c75b8c60f7bcf6d8ce9Jerome Glisse /* add fake pixel export */ 706481b65abaedb271d0da24c75b8c60f7bcf6d8ce9Jerome Glisse if (ctx.type == TGSI_PROCESSOR_FRAGMENT && !noutput) { 707481b65abaedb271d0da24c75b8c60f7bcf6d8ce9Jerome Glisse memset(&output[0], 0, sizeof(struct r600_bc_output)); 708481b65abaedb271d0da24c75b8c60f7bcf6d8ce9Jerome Glisse output[0].gpr = 0; 709481b65abaedb271d0da24c75b8c60f7bcf6d8ce9Jerome Glisse output[0].elem_size = 3; 710481b65abaedb271d0da24c75b8c60f7bcf6d8ce9Jerome Glisse output[0].swizzle_x = 7; 711481b65abaedb271d0da24c75b8c60f7bcf6d8ce9Jerome Glisse output[0].swizzle_y = 7; 712481b65abaedb271d0da24c75b8c60f7bcf6d8ce9Jerome Glisse output[0].swizzle_z = 7; 713481b65abaedb271d0da24c75b8c60f7bcf6d8ce9Jerome Glisse output[0].swizzle_w = 7; 714481b65abaedb271d0da24c75b8c60f7bcf6d8ce9Jerome Glisse output[0].barrier = 1; 715608f749ec3fc655d3e67e572fa2e256a42c16878Jerome Glisse output[0].type = V_SQ_CF_ALLOC_EXPORT_WORD0_SQ_EXPORT_PIXEL; 716481b65abaedb271d0da24c75b8c60f7bcf6d8ce9Jerome Glisse output[0].array_base = 0; 717a3a94554f5a12f0626d9712ddcdc81b1e21d36c2Dave Airlie output[0].inst = BC_INST(ctx.bc, V_SQ_CF_ALLOC_EXPORT_WORD1_SQ_CF_INST_EXPORT); 718481b65abaedb271d0da24c75b8c60f7bcf6d8ce9Jerome Glisse noutput++; 719481b65abaedb271d0da24c75b8c60f7bcf6d8ce9Jerome Glisse } 720457378e031ffb89a2011604c7798a6f5f2142207Jerome Glisse /* set export done on last export of each type */ 721457378e031ffb89a2011604c7798a6f5f2142207Jerome Glisse for (i = noutput - 1, output_done = 0; i >= 0; i--) { 
722457378e031ffb89a2011604c7798a6f5f2142207Jerome Glisse if (i == (noutput - 1)) { 723457378e031ffb89a2011604c7798a6f5f2142207Jerome Glisse output[i].end_of_program = 1; 724457378e031ffb89a2011604c7798a6f5f2142207Jerome Glisse } 725b474478f206c6d81af78696d3d5ce156d4d413d7Jerome Glisse if (!(output_done & (1 << output[i].type))) { 726b474478f206c6d81af78696d3d5ce156d4d413d7Jerome Glisse output_done |= (1 << output[i].type); 727a3a94554f5a12f0626d9712ddcdc81b1e21d36c2Dave Airlie output[i].inst = BC_INST(ctx.bc, V_SQ_CF_ALLOC_EXPORT_WORD1_SQ_CF_INST_EXPORT_DONE); 728c3ad060488ffd98f1c6dc9127b46324c5201f434Jerome Glisse } 729c3ad060488ffd98f1c6dc9127b46324c5201f434Jerome Glisse } 730457378e031ffb89a2011604c7798a6f5f2142207Jerome Glisse /* add output to bytecode */ 731457378e031ffb89a2011604c7798a6f5f2142207Jerome Glisse for (i = 0; i < noutput; i++) { 732c3ad060488ffd98f1c6dc9127b46324c5201f434Jerome Glisse r = r600_bc_add_output(ctx.bc, &output[i]); 733de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse if (r) 734de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse goto out_err; 735de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse } 73696f8f8db7bcddec7ef0fce62cf0e23f1c2fb8c8dChristian König *literals = ctx.literals; 737de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse tgsi_parse_free(&ctx.parse); 738de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse return 0; 739de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisseout_err: 740cd4bd4fb53f82361480f388923ef9e2fa7379d68Bas Nieuwenhuizen free(ctx.literals); 741de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse tgsi_parse_free(&ctx.parse); 742de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse return r; 743de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse} 744de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse 745de553d906b4a205d811a9e1651f14212ec284e29Jerome Glissestatic int tgsi_unsupported(struct r600_shader_ctx *ctx) 746de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse{ 
747de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse R600_ERR("%d tgsi opcode unsupported\n", ctx->inst_info->tgsi_opcode); 748de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse return -EINVAL; 749de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse} 750de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse 751de553d906b4a205d811a9e1651f14212ec284e29Jerome Glissestatic int tgsi_end(struct r600_shader_ctx *ctx) 752de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse{ 753de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse return 0; 754de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse} 755de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse 756de553d906b4a205d811a9e1651f14212ec284e29Jerome Glissestatic int tgsi_src(struct r600_shader_ctx *ctx, 757de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse const struct tgsi_full_src_register *tgsi_src, 758de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse struct r600_bc_alu_src *r600_src) 759de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse{ 7607e42b7e5d2aebcda0e6bf081b6661411731e6df2Jerome Glisse memset(r600_src, 0, sizeof(struct r600_bc_alu_src)); 7617728bef29097c8406d35c6dd969544382abdf935Christian König r600_src->neg = tgsi_src->Register.Negate; 7627728bef29097c8406d35c6dd969544382abdf935Christian König r600_src->abs = tgsi_src->Register.Absolute; 7639e964baaf34fedec385a750b97fd6684fc52584aHenri Verbeet if (tgsi_src->Register.File == TGSI_FILE_IMMEDIATE) { 7647728bef29097c8406d35c6dd969544382abdf935Christian König int index; 7657728bef29097c8406d35c6dd969544382abdf935Christian König if((tgsi_src->Register.SwizzleX == tgsi_src->Register.SwizzleY) && 7667728bef29097c8406d35c6dd969544382abdf935Christian König (tgsi_src->Register.SwizzleX == tgsi_src->Register.SwizzleZ) && 7677728bef29097c8406d35c6dd969544382abdf935Christian König (tgsi_src->Register.SwizzleX == tgsi_src->Register.SwizzleW)) { 7687728bef29097c8406d35c6dd969544382abdf935Christian König 7697728bef29097c8406d35c6dd969544382abdf935Christian 
König index = tgsi_src->Register.Index * 4 + tgsi_src->Register.SwizzleX; 77096f8f8db7bcddec7ef0fce62cf0e23f1c2fb8c8dChristian König r600_bc_special_constants(ctx->literals[index], &r600_src->sel, &r600_src->neg); 77196f8f8db7bcddec7ef0fce62cf0e23f1c2fb8c8dChristian König if (r600_src->sel != V_SQ_ALU_SRC_LITERAL) 7727728bef29097c8406d35c6dd969544382abdf935Christian König return 0; 7737728bef29097c8406d35c6dd969544382abdf935Christian König } 774cd4bd4fb53f82361480f388923ef9e2fa7379d68Bas Nieuwenhuizen index = tgsi_src->Register.Index; 7757728bef29097c8406d35c6dd969544382abdf935Christian König r600_src->sel = V_SQ_ALU_SRC_LITERAL; 77696f8f8db7bcddec7ef0fce62cf0e23f1c2fb8c8dChristian König r600_src->value = ctx->literals + index * 4; 7777728bef29097c8406d35c6dd969544382abdf935Christian König } else { 7787728bef29097c8406d35c6dd969544382abdf935Christian König if (tgsi_src->Register.Indirect) 7797728bef29097c8406d35c6dd969544382abdf935Christian König r600_src->rel = V_SQ_REL_RELATIVE; 7807728bef29097c8406d35c6dd969544382abdf935Christian König r600_src->sel = tgsi_src->Register.Index; 7817728bef29097c8406d35c6dd969544382abdf935Christian König r600_src->sel += ctx->file_offset[tgsi_src->Register.File]; 782de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse } 783de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse return 0; 784de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse} 785de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse 786de553d906b4a205d811a9e1651f14212ec284e29Jerome Glissestatic int tgsi_dst(struct r600_shader_ctx *ctx, 787de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse const struct tgsi_full_dst_register *tgsi_dst, 788de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse unsigned swizzle, 789de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse struct r600_bc_alu_dst *r600_dst) 790de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse{ 7917a73390f9126fd270d9891cd9d2bf38ef56d9b80Jerome Glisse struct tgsi_full_instruction *inst = 
&ctx->parse.FullToken.FullInstruction; 7927a73390f9126fd270d9891cd9d2bf38ef56d9b80Jerome Glisse 793de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse r600_dst->sel = tgsi_dst->Register.Index; 794de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse r600_dst->sel += ctx->file_offset[tgsi_dst->Register.File]; 795de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse r600_dst->chan = swizzle; 796de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse r600_dst->write = 1; 79747d5a19df1e7760c4f5f0e340bfc56355c2e428bDave Airlie if (tgsi_dst->Register.Indirect) 79847d5a19df1e7760c4f5f0e340bfc56355c2e428bDave Airlie r600_dst->rel = V_SQ_REL_RELATIVE; 7997a73390f9126fd270d9891cd9d2bf38ef56d9b80Jerome Glisse if (inst->Instruction.Saturate) { 8007a73390f9126fd270d9891cd9d2bf38ef56d9b80Jerome Glisse r600_dst->clamp = 1; 8017a73390f9126fd270d9891cd9d2bf38ef56d9b80Jerome Glisse } 802de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse return 0; 803de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse} 804de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse 8057e42b7e5d2aebcda0e6bf081b6661411731e6df2Jerome Glissestatic unsigned tgsi_chan(const struct tgsi_full_src_register *tgsi_src, unsigned swizzle) 8067e42b7e5d2aebcda0e6bf081b6661411731e6df2Jerome Glisse{ 8077e42b7e5d2aebcda0e6bf081b6661411731e6df2Jerome Glisse switch (swizzle) { 8087e42b7e5d2aebcda0e6bf081b6661411731e6df2Jerome Glisse case 0: 8097e42b7e5d2aebcda0e6bf081b6661411731e6df2Jerome Glisse return tgsi_src->Register.SwizzleX; 8107e42b7e5d2aebcda0e6bf081b6661411731e6df2Jerome Glisse case 1: 8117e42b7e5d2aebcda0e6bf081b6661411731e6df2Jerome Glisse return tgsi_src->Register.SwizzleY; 8127e42b7e5d2aebcda0e6bf081b6661411731e6df2Jerome Glisse case 2: 8137e42b7e5d2aebcda0e6bf081b6661411731e6df2Jerome Glisse return tgsi_src->Register.SwizzleZ; 8147e42b7e5d2aebcda0e6bf081b6661411731e6df2Jerome Glisse case 3: 8157e42b7e5d2aebcda0e6bf081b6661411731e6df2Jerome Glisse return tgsi_src->Register.SwizzleW; 
8167e42b7e5d2aebcda0e6bf081b6661411731e6df2Jerome Glisse default: 8177e42b7e5d2aebcda0e6bf081b6661411731e6df2Jerome Glisse return 0; 8187e42b7e5d2aebcda0e6bf081b6661411731e6df2Jerome Glisse } 8197e42b7e5d2aebcda0e6bf081b6661411731e6df2Jerome Glisse} 8207e42b7e5d2aebcda0e6bf081b6661411731e6df2Jerome Glisse 8217e42b7e5d2aebcda0e6bf081b6661411731e6df2Jerome Glissestatic int tgsi_split_constant(struct r600_shader_ctx *ctx, struct r600_bc_alu_src r600_src[3]) 8227e42b7e5d2aebcda0e6bf081b6661411731e6df2Jerome Glisse{ 8237e42b7e5d2aebcda0e6bf081b6661411731e6df2Jerome Glisse struct tgsi_full_instruction *inst = &ctx->parse.FullToken.FullInstruction; 8247e42b7e5d2aebcda0e6bf081b6661411731e6df2Jerome Glisse struct r600_bc_alu alu; 8257e42b7e5d2aebcda0e6bf081b6661411731e6df2Jerome Glisse int i, j, k, nconst, r; 8267e42b7e5d2aebcda0e6bf081b6661411731e6df2Jerome Glisse 8277e42b7e5d2aebcda0e6bf081b6661411731e6df2Jerome Glisse for (i = 0, nconst = 0; i < inst->Instruction.NumSrcRegs; i++) { 8287e42b7e5d2aebcda0e6bf081b6661411731e6df2Jerome Glisse if (inst->Src[i].Register.File == TGSI_FILE_CONSTANT) { 8297e42b7e5d2aebcda0e6bf081b6661411731e6df2Jerome Glisse nconst++; 8307e42b7e5d2aebcda0e6bf081b6661411731e6df2Jerome Glisse } 8317e42b7e5d2aebcda0e6bf081b6661411731e6df2Jerome Glisse r = tgsi_src(ctx, &inst->Src[i], &r600_src[i]); 8327e42b7e5d2aebcda0e6bf081b6661411731e6df2Jerome Glisse if (r) { 8337e42b7e5d2aebcda0e6bf081b6661411731e6df2Jerome Glisse return r; 8347e42b7e5d2aebcda0e6bf081b6661411731e6df2Jerome Glisse } 8357e42b7e5d2aebcda0e6bf081b6661411731e6df2Jerome Glisse } 8367e42b7e5d2aebcda0e6bf081b6661411731e6df2Jerome Glisse for (i = 0, j = nconst - 1; i < inst->Instruction.NumSrcRegs; i++) { 8379d4ae914e28ac7857a32a88ba27aecc182f697c6Jerome Glisse if (j > 0 && inst->Src[i].Register.File == TGSI_FILE_CONSTANT) { 838be7816f2b7f0b064a47fb3f101477ad5dba74017Dave Airlie int treg = r600_get_temp(ctx); 8397e42b7e5d2aebcda0e6bf081b6661411731e6df2Jerome Glisse for (k = 0; k < 4; 
k++) { 8407e42b7e5d2aebcda0e6bf081b6661411731e6df2Jerome Glisse memset(&alu, 0, sizeof(struct r600_bc_alu)); 841a3a94554f5a12f0626d9712ddcdc81b1e21d36c2Dave Airlie alu.inst = CTX_INST(V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_MOV); 8429d4ae914e28ac7857a32a88ba27aecc182f697c6Jerome Glisse alu.src[0].sel = r600_src[i].sel; 8437e42b7e5d2aebcda0e6bf081b6661411731e6df2Jerome Glisse alu.src[0].chan = k; 84440cc5bfcd70e412289dbb32a1ebca91bf109e1bdStephan Schmid alu.src[0].rel = r600_src[i].rel; 845be7816f2b7f0b064a47fb3f101477ad5dba74017Dave Airlie alu.dst.sel = treg; 8467e42b7e5d2aebcda0e6bf081b6661411731e6df2Jerome Glisse alu.dst.chan = k; 8477e42b7e5d2aebcda0e6bf081b6661411731e6df2Jerome Glisse alu.dst.write = 1; 8487e42b7e5d2aebcda0e6bf081b6661411731e6df2Jerome Glisse if (k == 3) 8497e42b7e5d2aebcda0e6bf081b6661411731e6df2Jerome Glisse alu.last = 1; 8507e42b7e5d2aebcda0e6bf081b6661411731e6df2Jerome Glisse r = r600_bc_add_alu(ctx->bc, &alu); 8517e42b7e5d2aebcda0e6bf081b6661411731e6df2Jerome Glisse if (r) 8527e42b7e5d2aebcda0e6bf081b6661411731e6df2Jerome Glisse return r; 8537e42b7e5d2aebcda0e6bf081b6661411731e6df2Jerome Glisse } 8549d4ae914e28ac7857a32a88ba27aecc182f697c6Jerome Glisse r600_src[i].sel = treg; 85540cc5bfcd70e412289dbb32a1ebca91bf109e1bdStephan Schmid r600_src[i].rel =0; 8567e42b7e5d2aebcda0e6bf081b6661411731e6df2Jerome Glisse j--; 8577e42b7e5d2aebcda0e6bf081b6661411731e6df2Jerome Glisse } 8587e42b7e5d2aebcda0e6bf081b6661411731e6df2Jerome Glisse } 8597e42b7e5d2aebcda0e6bf081b6661411731e6df2Jerome Glisse return 0; 8607e42b7e5d2aebcda0e6bf081b6661411731e6df2Jerome Glisse} 8617e42b7e5d2aebcda0e6bf081b6661411731e6df2Jerome Glisse 862be7816f2b7f0b064a47fb3f101477ad5dba74017Dave Airlie/* need to move any immediate into a temp - for trig functions which use literal for PI stuff */ 863be7816f2b7f0b064a47fb3f101477ad5dba74017Dave Airliestatic int tgsi_split_literal_constant(struct r600_shader_ctx *ctx, struct r600_bc_alu_src r600_src[3]) 
864be7816f2b7f0b064a47fb3f101477ad5dba74017Dave Airlie{ 865be7816f2b7f0b064a47fb3f101477ad5dba74017Dave Airlie struct tgsi_full_instruction *inst = &ctx->parse.FullToken.FullInstruction; 866be7816f2b7f0b064a47fb3f101477ad5dba74017Dave Airlie struct r600_bc_alu alu; 86720846a8ce102aa2bc6d3f1e907d490940c0d0a69Vinson Lee int i, j, k, nliteral, r; 868be7816f2b7f0b064a47fb3f101477ad5dba74017Dave Airlie 869be7816f2b7f0b064a47fb3f101477ad5dba74017Dave Airlie for (i = 0, nliteral = 0; i < inst->Instruction.NumSrcRegs; i++) { 8707728bef29097c8406d35c6dd969544382abdf935Christian König if (r600_src[i].sel == V_SQ_ALU_SRC_LITERAL) { 871be7816f2b7f0b064a47fb3f101477ad5dba74017Dave Airlie nliteral++; 872be7816f2b7f0b064a47fb3f101477ad5dba74017Dave Airlie } 873be7816f2b7f0b064a47fb3f101477ad5dba74017Dave Airlie } 8749d4ae914e28ac7857a32a88ba27aecc182f697c6Jerome Glisse for (i = 0, j = nliteral - 1; i < inst->Instruction.NumSrcRegs; i++) { 8757728bef29097c8406d35c6dd969544382abdf935Christian König if (j > 0 && r600_src[i].sel == V_SQ_ALU_SRC_LITERAL) { 876be7816f2b7f0b064a47fb3f101477ad5dba74017Dave Airlie int treg = r600_get_temp(ctx); 877be7816f2b7f0b064a47fb3f101477ad5dba74017Dave Airlie for (k = 0; k < 4; k++) { 878be7816f2b7f0b064a47fb3f101477ad5dba74017Dave Airlie memset(&alu, 0, sizeof(struct r600_bc_alu)); 879a3a94554f5a12f0626d9712ddcdc81b1e21d36c2Dave Airlie alu.inst = CTX_INST(V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_MOV); 8809d4ae914e28ac7857a32a88ba27aecc182f697c6Jerome Glisse alu.src[0].sel = r600_src[i].sel; 881be7816f2b7f0b064a47fb3f101477ad5dba74017Dave Airlie alu.src[0].chan = k; 88296f8f8db7bcddec7ef0fce62cf0e23f1c2fb8c8dChristian König alu.src[0].value = r600_src[i].value; 883be7816f2b7f0b064a47fb3f101477ad5dba74017Dave Airlie alu.dst.sel = treg; 884be7816f2b7f0b064a47fb3f101477ad5dba74017Dave Airlie alu.dst.chan = k; 885be7816f2b7f0b064a47fb3f101477ad5dba74017Dave Airlie alu.dst.write = 1; 886be7816f2b7f0b064a47fb3f101477ad5dba74017Dave Airlie if (k == 3) 
887be7816f2b7f0b064a47fb3f101477ad5dba74017Dave Airlie alu.last = 1; 888be7816f2b7f0b064a47fb3f101477ad5dba74017Dave Airlie r = r600_bc_add_alu(ctx->bc, &alu); 889be7816f2b7f0b064a47fb3f101477ad5dba74017Dave Airlie if (r) 890be7816f2b7f0b064a47fb3f101477ad5dba74017Dave Airlie return r; 891be7816f2b7f0b064a47fb3f101477ad5dba74017Dave Airlie } 8929d4ae914e28ac7857a32a88ba27aecc182f697c6Jerome Glisse r600_src[i].sel = treg; 8939d4ae914e28ac7857a32a88ba27aecc182f697c6Jerome Glisse j--; 894be7816f2b7f0b064a47fb3f101477ad5dba74017Dave Airlie } 895be7816f2b7f0b064a47fb3f101477ad5dba74017Dave Airlie } 896be7816f2b7f0b064a47fb3f101477ad5dba74017Dave Airlie return 0; 897be7816f2b7f0b064a47fb3f101477ad5dba74017Dave Airlie} 898be7816f2b7f0b064a47fb3f101477ad5dba74017Dave Airlie 899dffad730df17983cfaef0808555a8c26cad0aa15Christian Königstatic int tgsi_last_instruction(unsigned writemask) 900de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse{ 901dffad730df17983cfaef0808555a8c26cad0aa15Christian König int i, lasti = 0; 902d8fb13bae30b6ff214c5d5158b9bcaf430f56b43Dave Airlie 903d8fb13bae30b6ff214c5d5158b9bcaf430f56b43Dave Airlie for (i = 0; i < 4; i++) { 904dffad730df17983cfaef0808555a8c26cad0aa15Christian König if (writemask & (1 << i)) { 905d8fb13bae30b6ff214c5d5158b9bcaf430f56b43Dave Airlie lasti = i; 906d8fb13bae30b6ff214c5d5158b9bcaf430f56b43Dave Airlie } 907d8fb13bae30b6ff214c5d5158b9bcaf430f56b43Dave Airlie } 908dffad730df17983cfaef0808555a8c26cad0aa15Christian König return lasti; 909dffad730df17983cfaef0808555a8c26cad0aa15Christian König} 910dffad730df17983cfaef0808555a8c26cad0aa15Christian König 911dffad730df17983cfaef0808555a8c26cad0aa15Christian Königstatic int tgsi_op2_s(struct r600_shader_ctx *ctx, int swap) 912dffad730df17983cfaef0808555a8c26cad0aa15Christian König{ 913dffad730df17983cfaef0808555a8c26cad0aa15Christian König struct tgsi_full_instruction *inst = &ctx->parse.FullToken.FullInstruction; 914dffad730df17983cfaef0808555a8c26cad0aa15Christian König struct 
r600_bc_alu_src r600_src[3]; 915dffad730df17983cfaef0808555a8c26cad0aa15Christian König struct r600_bc_alu alu; 916dffad730df17983cfaef0808555a8c26cad0aa15Christian König int i, j, r; 917dffad730df17983cfaef0808555a8c26cad0aa15Christian König int lasti = tgsi_last_instruction(inst->Dst[0].Register.WriteMask); 918de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse 9197e42b7e5d2aebcda0e6bf081b6661411731e6df2Jerome Glisse r = tgsi_split_constant(ctx, r600_src); 9207e42b7e5d2aebcda0e6bf081b6661411731e6df2Jerome Glisse if (r) 9217e42b7e5d2aebcda0e6bf081b6661411731e6df2Jerome Glisse return r; 9229d4ae914e28ac7857a32a88ba27aecc182f697c6Jerome Glisse r = tgsi_split_literal_constant(ctx, r600_src); 9239d4ae914e28ac7857a32a88ba27aecc182f697c6Jerome Glisse if (r) 9249d4ae914e28ac7857a32a88ba27aecc182f697c6Jerome Glisse return r; 925d8fb13bae30b6ff214c5d5158b9bcaf430f56b43Dave Airlie for (i = 0; i < lasti + 1; i++) { 926d8fb13bae30b6ff214c5d5158b9bcaf430f56b43Dave Airlie if (!(inst->Dst[0].Register.WriteMask & (1 << i))) 927d8fb13bae30b6ff214c5d5158b9bcaf430f56b43Dave Airlie continue; 928d8fb13bae30b6ff214c5d5158b9bcaf430f56b43Dave Airlie 929de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse memset(&alu, 0, sizeof(struct r600_bc_alu)); 930d8fb13bae30b6ff214c5d5158b9bcaf430f56b43Dave Airlie r = tgsi_dst(ctx, &inst->Dst[0], i, &alu.dst); 931d8fb13bae30b6ff214c5d5158b9bcaf430f56b43Dave Airlie if (r) 932d8fb13bae30b6ff214c5d5158b9bcaf430f56b43Dave Airlie return r; 9337ffd4e976fd11b8c083c2927effd25a2f79ac841Jerome Glisse 934d8fb13bae30b6ff214c5d5158b9bcaf430f56b43Dave Airlie alu.inst = ctx->inst_info->r600_opcode; 935d8fb13bae30b6ff214c5d5158b9bcaf430f56b43Dave Airlie if (!swap) { 936de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse for (j = 0; j < inst->Instruction.NumSrcRegs; j++) { 9377e42b7e5d2aebcda0e6bf081b6661411731e6df2Jerome Glisse alu.src[j] = r600_src[j]; 9387e42b7e5d2aebcda0e6bf081b6661411731e6df2Jerome Glisse alu.src[j].chan = tgsi_chan(&inst->Src[j], i); 
939de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse } 940d8fb13bae30b6ff214c5d5158b9bcaf430f56b43Dave Airlie } else { 941d8fb13bae30b6ff214c5d5158b9bcaf430f56b43Dave Airlie alu.src[0] = r600_src[1]; 942d8fb13bae30b6ff214c5d5158b9bcaf430f56b43Dave Airlie alu.src[0].chan = tgsi_chan(&inst->Src[1], i); 943d8fb13bae30b6ff214c5d5158b9bcaf430f56b43Dave Airlie 944d8fb13bae30b6ff214c5d5158b9bcaf430f56b43Dave Airlie alu.src[1] = r600_src[0]; 945d8fb13bae30b6ff214c5d5158b9bcaf430f56b43Dave Airlie alu.src[1].chan = tgsi_chan(&inst->Src[0], i); 946de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse } 947de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse /* handle some special cases */ 948de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse switch (ctx->inst_info->tgsi_opcode) { 949de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse case TGSI_OPCODE_SUB: 950de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse alu.src[1].neg = 1; 951de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse break; 9527a73390f9126fd270d9891cd9d2bf38ef56d9b80Jerome Glisse case TGSI_OPCODE_ABS: 9537a73390f9126fd270d9891cd9d2bf38ef56d9b80Jerome Glisse alu.src[0].abs = 1; 9547a73390f9126fd270d9891cd9d2bf38ef56d9b80Jerome Glisse break; 955de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse default: 956de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse break; 957de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse } 958d8fb13bae30b6ff214c5d5158b9bcaf430f56b43Dave Airlie if (i == lasti) { 959de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse alu.last = 1; 960de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse } 961de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse r = r600_bc_add_alu(ctx->bc, &alu); 962de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse if (r) 963de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse return r; 964de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse } 965de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse return 0; 
966de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse} 967de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse 968d8fb13bae30b6ff214c5d5158b9bcaf430f56b43Dave Airliestatic int tgsi_op2(struct r600_shader_ctx *ctx) 969d8fb13bae30b6ff214c5d5158b9bcaf430f56b43Dave Airlie{ 970d8fb13bae30b6ff214c5d5158b9bcaf430f56b43Dave Airlie return tgsi_op2_s(ctx, 0); 971d8fb13bae30b6ff214c5d5158b9bcaf430f56b43Dave Airlie} 972d8fb13bae30b6ff214c5d5158b9bcaf430f56b43Dave Airlie 973d8fb13bae30b6ff214c5d5158b9bcaf430f56b43Dave Airliestatic int tgsi_op2_swap(struct r600_shader_ctx *ctx) 974d8fb13bae30b6ff214c5d5158b9bcaf430f56b43Dave Airlie{ 975d8fb13bae30b6ff214c5d5158b9bcaf430f56b43Dave Airlie return tgsi_op2_s(ctx, 1); 976d8fb13bae30b6ff214c5d5158b9bcaf430f56b43Dave Airlie} 977d8fb13bae30b6ff214c5d5158b9bcaf430f56b43Dave Airlie 9787ffd4e976fd11b8c083c2927effd25a2f79ac841Jerome Glisse/* 97988f5976484842671ecb2cefcfa91838a43032359Dave Airlie * r600 - trunc to -PI..PI range 98088f5976484842671ecb2cefcfa91838a43032359Dave Airlie * r700 - normalize by dividing by 2PI 98188f5976484842671ecb2cefcfa91838a43032359Dave Airlie * see fdo bug 27901 98288f5976484842671ecb2cefcfa91838a43032359Dave Airlie */ 98392f5c7a597aaf098f4e6b4793e4b89ae539e328aDave Airliestatic int tgsi_setup_trig(struct r600_shader_ctx *ctx, 98492f5c7a597aaf098f4e6b4793e4b89ae539e328aDave Airlie struct r600_bc_alu_src r600_src[3]) 98588f5976484842671ecb2cefcfa91838a43032359Dave Airlie{ 98696f8f8db7bcddec7ef0fce62cf0e23f1c2fb8c8dChristian König static float half_inv_pi = 1.0 /(3.1415926535 * 2); 98796f8f8db7bcddec7ef0fce62cf0e23f1c2fb8c8dChristian König static float double_pi = 3.1415926535 * 2; 98896f8f8db7bcddec7ef0fce62cf0e23f1c2fb8c8dChristian König static float neg_pi = -3.1415926535; 98996f8f8db7bcddec7ef0fce62cf0e23f1c2fb8c8dChristian König 99088f5976484842671ecb2cefcfa91838a43032359Dave Airlie struct tgsi_full_instruction *inst = &ctx->parse.FullToken.FullInstruction; 
99196f8f8db7bcddec7ef0fce62cf0e23f1c2fb8c8dChristian König int r; 99292f5c7a597aaf098f4e6b4793e4b89ae539e328aDave Airlie struct r600_bc_alu alu; 9937ffd4e976fd11b8c083c2927effd25a2f79ac841Jerome Glisse 99488f5976484842671ecb2cefcfa91838a43032359Dave Airlie r = tgsi_split_constant(ctx, r600_src); 99588f5976484842671ecb2cefcfa91838a43032359Dave Airlie if (r) 99688f5976484842671ecb2cefcfa91838a43032359Dave Airlie return r; 9979d4ae914e28ac7857a32a88ba27aecc182f697c6Jerome Glisse r = tgsi_split_literal_constant(ctx, r600_src); 9989d4ae914e28ac7857a32a88ba27aecc182f697c6Jerome Glisse if (r) 9999d4ae914e28ac7857a32a88ba27aecc182f697c6Jerome Glisse return r; 1000be7816f2b7f0b064a47fb3f101477ad5dba74017Dave Airlie 100188f5976484842671ecb2cefcfa91838a43032359Dave Airlie memset(&alu, 0, sizeof(struct r600_bc_alu)); 1002a3a94554f5a12f0626d9712ddcdc81b1e21d36c2Dave Airlie alu.inst = CTX_INST(V_SQ_ALU_WORD1_OP3_SQ_OP3_INST_MULADD); 100388f5976484842671ecb2cefcfa91838a43032359Dave Airlie alu.is_op3 = 1; 100488f5976484842671ecb2cefcfa91838a43032359Dave Airlie 100588f5976484842671ecb2cefcfa91838a43032359Dave Airlie alu.dst.chan = 0; 100688f5976484842671ecb2cefcfa91838a43032359Dave Airlie alu.dst.sel = ctx->temp_reg; 100788f5976484842671ecb2cefcfa91838a43032359Dave Airlie alu.dst.write = 1; 100888f5976484842671ecb2cefcfa91838a43032359Dave Airlie 100988f5976484842671ecb2cefcfa91838a43032359Dave Airlie alu.src[0] = r600_src[0]; 101096f8f8db7bcddec7ef0fce62cf0e23f1c2fb8c8dChristian König alu.src[0].chan = tgsi_chan(&inst->Src[0], 0); 10117ffd4e976fd11b8c083c2927effd25a2f79ac841Jerome Glisse 1012921c987c6f43b4d63a98b61013d43bac97baff21Jerome Glisse alu.src[1].sel = V_SQ_ALU_SRC_LITERAL; 101388f5976484842671ecb2cefcfa91838a43032359Dave Airlie alu.src[1].chan = 0; 101496f8f8db7bcddec7ef0fce62cf0e23f1c2fb8c8dChristian König alu.src[1].value = (uint32_t *)&half_inv_pi; 101596f8f8db7bcddec7ef0fce62cf0e23f1c2fb8c8dChristian König alu.src[2].sel = V_SQ_ALU_SRC_0_5; 
1016ac6334145ec8eef42505cdd727aed7fae0831e12Christian König alu.src[2].chan = 0; 101788f5976484842671ecb2cefcfa91838a43032359Dave Airlie alu.last = 1; 101888f5976484842671ecb2cefcfa91838a43032359Dave Airlie r = r600_bc_add_alu(ctx->bc, &alu); 101988f5976484842671ecb2cefcfa91838a43032359Dave Airlie if (r) 102088f5976484842671ecb2cefcfa91838a43032359Dave Airlie return r; 102188f5976484842671ecb2cefcfa91838a43032359Dave Airlie 102288f5976484842671ecb2cefcfa91838a43032359Dave Airlie memset(&alu, 0, sizeof(struct r600_bc_alu)); 1023a3a94554f5a12f0626d9712ddcdc81b1e21d36c2Dave Airlie alu.inst = CTX_INST(V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_FRACT); 10247ffd4e976fd11b8c083c2927effd25a2f79ac841Jerome Glisse 102588f5976484842671ecb2cefcfa91838a43032359Dave Airlie alu.dst.chan = 0; 102688f5976484842671ecb2cefcfa91838a43032359Dave Airlie alu.dst.sel = ctx->temp_reg; 102788f5976484842671ecb2cefcfa91838a43032359Dave Airlie alu.dst.write = 1; 102888f5976484842671ecb2cefcfa91838a43032359Dave Airlie 102988f5976484842671ecb2cefcfa91838a43032359Dave Airlie alu.src[0].sel = ctx->temp_reg; 103088f5976484842671ecb2cefcfa91838a43032359Dave Airlie alu.src[0].chan = 0; 103188f5976484842671ecb2cefcfa91838a43032359Dave Airlie alu.last = 1; 103288f5976484842671ecb2cefcfa91838a43032359Dave Airlie r = r600_bc_add_alu(ctx->bc, &alu); 103388f5976484842671ecb2cefcfa91838a43032359Dave Airlie if (r) 103488f5976484842671ecb2cefcfa91838a43032359Dave Airlie return r; 103588f5976484842671ecb2cefcfa91838a43032359Dave Airlie 103688f5976484842671ecb2cefcfa91838a43032359Dave Airlie memset(&alu, 0, sizeof(struct r600_bc_alu)); 1037a3a94554f5a12f0626d9712ddcdc81b1e21d36c2Dave Airlie alu.inst = CTX_INST(V_SQ_ALU_WORD1_OP3_SQ_OP3_INST_MULADD); 103888f5976484842671ecb2cefcfa91838a43032359Dave Airlie alu.is_op3 = 1; 103988f5976484842671ecb2cefcfa91838a43032359Dave Airlie 104088f5976484842671ecb2cefcfa91838a43032359Dave Airlie alu.dst.chan = 0; 104188f5976484842671ecb2cefcfa91838a43032359Dave Airlie alu.dst.sel = 
ctx->temp_reg; 104288f5976484842671ecb2cefcfa91838a43032359Dave Airlie alu.dst.write = 1; 104388f5976484842671ecb2cefcfa91838a43032359Dave Airlie 104488f5976484842671ecb2cefcfa91838a43032359Dave Airlie alu.src[0].sel = ctx->temp_reg; 104588f5976484842671ecb2cefcfa91838a43032359Dave Airlie alu.src[0].chan = 0; 10467ffd4e976fd11b8c083c2927effd25a2f79ac841Jerome Glisse 1047921c987c6f43b4d63a98b61013d43bac97baff21Jerome Glisse alu.src[1].sel = V_SQ_ALU_SRC_LITERAL; 104888f5976484842671ecb2cefcfa91838a43032359Dave Airlie alu.src[1].chan = 0; 1049921c987c6f43b4d63a98b61013d43bac97baff21Jerome Glisse alu.src[2].sel = V_SQ_ALU_SRC_LITERAL; 1050ac6334145ec8eef42505cdd727aed7fae0831e12Christian König alu.src[2].chan = 0; 105196f8f8db7bcddec7ef0fce62cf0e23f1c2fb8c8dChristian König 105296f8f8db7bcddec7ef0fce62cf0e23f1c2fb8c8dChristian König if (ctx->bc->chiprev == CHIPREV_R600) { 105396f8f8db7bcddec7ef0fce62cf0e23f1c2fb8c8dChristian König alu.src[1].value = (uint32_t *)&double_pi; 105496f8f8db7bcddec7ef0fce62cf0e23f1c2fb8c8dChristian König alu.src[2].value = (uint32_t *)&neg_pi; 105596f8f8db7bcddec7ef0fce62cf0e23f1c2fb8c8dChristian König } else { 105696f8f8db7bcddec7ef0fce62cf0e23f1c2fb8c8dChristian König alu.src[1].sel = V_SQ_ALU_SRC_1; 105796f8f8db7bcddec7ef0fce62cf0e23f1c2fb8c8dChristian König alu.src[2].sel = V_SQ_ALU_SRC_0_5; 105896f8f8db7bcddec7ef0fce62cf0e23f1c2fb8c8dChristian König alu.src[2].neg = 1; 105996f8f8db7bcddec7ef0fce62cf0e23f1c2fb8c8dChristian König } 106096f8f8db7bcddec7ef0fce62cf0e23f1c2fb8c8dChristian König 106188f5976484842671ecb2cefcfa91838a43032359Dave Airlie alu.last = 1; 106288f5976484842671ecb2cefcfa91838a43032359Dave Airlie r = r600_bc_add_alu(ctx->bc, &alu); 106388f5976484842671ecb2cefcfa91838a43032359Dave Airlie if (r) 106488f5976484842671ecb2cefcfa91838a43032359Dave Airlie return r; 106592f5c7a597aaf098f4e6b4793e4b89ae539e328aDave Airlie return 0; 106692f5c7a597aaf098f4e6b4793e4b89ae539e328aDave Airlie} 
106792f5c7a597aaf098f4e6b4793e4b89ae539e328aDave Airlie 106892f5c7a597aaf098f4e6b4793e4b89ae539e328aDave Airliestatic int tgsi_trig(struct r600_shader_ctx *ctx) 106992f5c7a597aaf098f4e6b4793e4b89ae539e328aDave Airlie{ 107092f5c7a597aaf098f4e6b4793e4b89ae539e328aDave Airlie struct tgsi_full_instruction *inst = &ctx->parse.FullToken.FullInstruction; 107192f5c7a597aaf098f4e6b4793e4b89ae539e328aDave Airlie struct r600_bc_alu_src r600_src[3]; 107292f5c7a597aaf098f4e6b4793e4b89ae539e328aDave Airlie struct r600_bc_alu alu; 107392f5c7a597aaf098f4e6b4793e4b89ae539e328aDave Airlie int i, r; 1074dffad730df17983cfaef0808555a8c26cad0aa15Christian König int lasti = tgsi_last_instruction(inst->Dst[0].Register.WriteMask); 107592f5c7a597aaf098f4e6b4793e4b89ae539e328aDave Airlie 107692f5c7a597aaf098f4e6b4793e4b89ae539e328aDave Airlie r = tgsi_setup_trig(ctx, r600_src); 107792f5c7a597aaf098f4e6b4793e4b89ae539e328aDave Airlie if (r) 107892f5c7a597aaf098f4e6b4793e4b89ae539e328aDave Airlie return r; 107988f5976484842671ecb2cefcfa91838a43032359Dave Airlie 108088f5976484842671ecb2cefcfa91838a43032359Dave Airlie memset(&alu, 0, sizeof(struct r600_bc_alu)); 108188f5976484842671ecb2cefcfa91838a43032359Dave Airlie alu.inst = ctx->inst_info->r600_opcode; 108288f5976484842671ecb2cefcfa91838a43032359Dave Airlie alu.dst.chan = 0; 108388f5976484842671ecb2cefcfa91838a43032359Dave Airlie alu.dst.sel = ctx->temp_reg; 108488f5976484842671ecb2cefcfa91838a43032359Dave Airlie alu.dst.write = 1; 108588f5976484842671ecb2cefcfa91838a43032359Dave Airlie 108688f5976484842671ecb2cefcfa91838a43032359Dave Airlie alu.src[0].sel = ctx->temp_reg; 108788f5976484842671ecb2cefcfa91838a43032359Dave Airlie alu.src[0].chan = 0; 108888f5976484842671ecb2cefcfa91838a43032359Dave Airlie alu.last = 1; 108988f5976484842671ecb2cefcfa91838a43032359Dave Airlie r = r600_bc_add_alu(ctx->bc, &alu); 109088f5976484842671ecb2cefcfa91838a43032359Dave Airlie if (r) 109188f5976484842671ecb2cefcfa91838a43032359Dave Airlie return r; 
109288f5976484842671ecb2cefcfa91838a43032359Dave Airlie 109388f5976484842671ecb2cefcfa91838a43032359Dave Airlie /* replicate result */ 1094be7816f2b7f0b064a47fb3f101477ad5dba74017Dave Airlie for (i = 0; i < lasti + 1; i++) { 1095be7816f2b7f0b064a47fb3f101477ad5dba74017Dave Airlie if (!(inst->Dst[0].Register.WriteMask & (1 << i))) 1096be7816f2b7f0b064a47fb3f101477ad5dba74017Dave Airlie continue; 1097be7816f2b7f0b064a47fb3f101477ad5dba74017Dave Airlie 109888f5976484842671ecb2cefcfa91838a43032359Dave Airlie memset(&alu, 0, sizeof(struct r600_bc_alu)); 1099a3a94554f5a12f0626d9712ddcdc81b1e21d36c2Dave Airlie alu.inst = CTX_INST(V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_MOV); 1100be7816f2b7f0b064a47fb3f101477ad5dba74017Dave Airlie 1101be7816f2b7f0b064a47fb3f101477ad5dba74017Dave Airlie alu.src[0].sel = ctx->temp_reg; 110288f5976484842671ecb2cefcfa91838a43032359Dave Airlie r = tgsi_dst(ctx, &inst->Dst[0], i, &alu.dst); 110388f5976484842671ecb2cefcfa91838a43032359Dave Airlie if (r) 110488f5976484842671ecb2cefcfa91838a43032359Dave Airlie return r; 1105be7816f2b7f0b064a47fb3f101477ad5dba74017Dave Airlie if (i == lasti) 110688f5976484842671ecb2cefcfa91838a43032359Dave Airlie alu.last = 1; 110788f5976484842671ecb2cefcfa91838a43032359Dave Airlie r = r600_bc_add_alu(ctx->bc, &alu); 110888f5976484842671ecb2cefcfa91838a43032359Dave Airlie if (r) 110988f5976484842671ecb2cefcfa91838a43032359Dave Airlie return r; 111088f5976484842671ecb2cefcfa91838a43032359Dave Airlie } 111188f5976484842671ecb2cefcfa91838a43032359Dave Airlie return 0; 111288f5976484842671ecb2cefcfa91838a43032359Dave Airlie} 111388f5976484842671ecb2cefcfa91838a43032359Dave Airlie 111492f5c7a597aaf098f4e6b4793e4b89ae539e328aDave Airliestatic int tgsi_scs(struct r600_shader_ctx *ctx) 111592f5c7a597aaf098f4e6b4793e4b89ae539e328aDave Airlie{ 111692f5c7a597aaf098f4e6b4793e4b89ae539e328aDave Airlie struct tgsi_full_instruction *inst = &ctx->parse.FullToken.FullInstruction; 111792f5c7a597aaf098f4e6b4793e4b89ae539e328aDave Airlie struct 
r600_bc_alu_src r600_src[3]; 111892f5c7a597aaf098f4e6b4793e4b89ae539e328aDave Airlie struct r600_bc_alu alu; 111992f5c7a597aaf098f4e6b4793e4b89ae539e328aDave Airlie int r; 112092f5c7a597aaf098f4e6b4793e4b89ae539e328aDave Airlie 112157bf96b43be2abcbadc387d7b5466b772125a093Tilman Sauerbeck /* We'll only need the trig stuff if we are going to write to the 112257bf96b43be2abcbadc387d7b5466b772125a093Tilman Sauerbeck * X or Y components of the destination vector. 112357bf96b43be2abcbadc387d7b5466b772125a093Tilman Sauerbeck */ 112457bf96b43be2abcbadc387d7b5466b772125a093Tilman Sauerbeck if (likely(inst->Dst[0].Register.WriteMask & TGSI_WRITEMASK_XY)) { 112557bf96b43be2abcbadc387d7b5466b772125a093Tilman Sauerbeck r = tgsi_setup_trig(ctx, r600_src); 112657bf96b43be2abcbadc387d7b5466b772125a093Tilman Sauerbeck if (r) 112757bf96b43be2abcbadc387d7b5466b772125a093Tilman Sauerbeck return r; 112857bf96b43be2abcbadc387d7b5466b772125a093Tilman Sauerbeck } 112992f5c7a597aaf098f4e6b4793e4b89ae539e328aDave Airlie 113092f5c7a597aaf098f4e6b4793e4b89ae539e328aDave Airlie /* dst.x = COS */ 113157bf96b43be2abcbadc387d7b5466b772125a093Tilman Sauerbeck if (inst->Dst[0].Register.WriteMask & TGSI_WRITEMASK_X) { 113257bf96b43be2abcbadc387d7b5466b772125a093Tilman Sauerbeck memset(&alu, 0, sizeof(struct r600_bc_alu)); 113357bf96b43be2abcbadc387d7b5466b772125a093Tilman Sauerbeck alu.inst = CTX_INST(V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_COS); 113457bf96b43be2abcbadc387d7b5466b772125a093Tilman Sauerbeck r = tgsi_dst(ctx, &inst->Dst[0], 0, &alu.dst); 113557bf96b43be2abcbadc387d7b5466b772125a093Tilman Sauerbeck if (r) 113657bf96b43be2abcbadc387d7b5466b772125a093Tilman Sauerbeck return r; 113792f5c7a597aaf098f4e6b4793e4b89ae539e328aDave Airlie 113857bf96b43be2abcbadc387d7b5466b772125a093Tilman Sauerbeck alu.src[0].sel = ctx->temp_reg; 113957bf96b43be2abcbadc387d7b5466b772125a093Tilman Sauerbeck alu.src[0].chan = 0; 114057bf96b43be2abcbadc387d7b5466b772125a093Tilman Sauerbeck alu.last = 1; 
114157bf96b43be2abcbadc387d7b5466b772125a093Tilman Sauerbeck r = r600_bc_add_alu(ctx->bc, &alu); 114257bf96b43be2abcbadc387d7b5466b772125a093Tilman Sauerbeck if (r) 114357bf96b43be2abcbadc387d7b5466b772125a093Tilman Sauerbeck return r; 114457bf96b43be2abcbadc387d7b5466b772125a093Tilman Sauerbeck } 114592f5c7a597aaf098f4e6b4793e4b89ae539e328aDave Airlie 114692f5c7a597aaf098f4e6b4793e4b89ae539e328aDave Airlie /* dst.y = SIN */ 114757bf96b43be2abcbadc387d7b5466b772125a093Tilman Sauerbeck if (inst->Dst[0].Register.WriteMask & TGSI_WRITEMASK_Y) { 114857bf96b43be2abcbadc387d7b5466b772125a093Tilman Sauerbeck memset(&alu, 0, sizeof(struct r600_bc_alu)); 114957bf96b43be2abcbadc387d7b5466b772125a093Tilman Sauerbeck alu.inst = CTX_INST(V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_SIN); 115057bf96b43be2abcbadc387d7b5466b772125a093Tilman Sauerbeck r = tgsi_dst(ctx, &inst->Dst[0], 1, &alu.dst); 115157bf96b43be2abcbadc387d7b5466b772125a093Tilman Sauerbeck if (r) 115257bf96b43be2abcbadc387d7b5466b772125a093Tilman Sauerbeck return r; 115357bf96b43be2abcbadc387d7b5466b772125a093Tilman Sauerbeck 115457bf96b43be2abcbadc387d7b5466b772125a093Tilman Sauerbeck alu.src[0].sel = ctx->temp_reg; 115557bf96b43be2abcbadc387d7b5466b772125a093Tilman Sauerbeck alu.src[0].chan = 0; 115657bf96b43be2abcbadc387d7b5466b772125a093Tilman Sauerbeck alu.last = 1; 115757bf96b43be2abcbadc387d7b5466b772125a093Tilman Sauerbeck r = r600_bc_add_alu(ctx->bc, &alu); 115857bf96b43be2abcbadc387d7b5466b772125a093Tilman Sauerbeck if (r) 115957bf96b43be2abcbadc387d7b5466b772125a093Tilman Sauerbeck return r; 116057bf96b43be2abcbadc387d7b5466b772125a093Tilman Sauerbeck } 116192f5c7a597aaf098f4e6b4793e4b89ae539e328aDave Airlie 1162ef419599d9b18de2a9077c5f0a7f02bfc11d1762Tilman Sauerbeck /* dst.z = 0.0; */ 1163ef419599d9b18de2a9077c5f0a7f02bfc11d1762Tilman Sauerbeck if (inst->Dst[0].Register.WriteMask & TGSI_WRITEMASK_Z) { 1164ef419599d9b18de2a9077c5f0a7f02bfc11d1762Tilman Sauerbeck memset(&alu, 0, sizeof(struct r600_bc_alu)); 
1165ef419599d9b18de2a9077c5f0a7f02bfc11d1762Tilman Sauerbeck 1166ef419599d9b18de2a9077c5f0a7f02bfc11d1762Tilman Sauerbeck alu.inst = CTX_INST(V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_MOV); 1167ef419599d9b18de2a9077c5f0a7f02bfc11d1762Tilman Sauerbeck 1168ef419599d9b18de2a9077c5f0a7f02bfc11d1762Tilman Sauerbeck r = tgsi_dst(ctx, &inst->Dst[0], 2, &alu.dst); 1169ef419599d9b18de2a9077c5f0a7f02bfc11d1762Tilman Sauerbeck if (r) 1170ef419599d9b18de2a9077c5f0a7f02bfc11d1762Tilman Sauerbeck return r; 1171ef419599d9b18de2a9077c5f0a7f02bfc11d1762Tilman Sauerbeck 1172ef419599d9b18de2a9077c5f0a7f02bfc11d1762Tilman Sauerbeck alu.src[0].sel = V_SQ_ALU_SRC_0; 1173ef419599d9b18de2a9077c5f0a7f02bfc11d1762Tilman Sauerbeck alu.src[0].chan = 0; 1174ef419599d9b18de2a9077c5f0a7f02bfc11d1762Tilman Sauerbeck 1175ef419599d9b18de2a9077c5f0a7f02bfc11d1762Tilman Sauerbeck alu.last = 1; 1176ef419599d9b18de2a9077c5f0a7f02bfc11d1762Tilman Sauerbeck 1177ef419599d9b18de2a9077c5f0a7f02bfc11d1762Tilman Sauerbeck r = r600_bc_add_alu(ctx->bc, &alu); 1178ef419599d9b18de2a9077c5f0a7f02bfc11d1762Tilman Sauerbeck if (r) 1179ef419599d9b18de2a9077c5f0a7f02bfc11d1762Tilman Sauerbeck return r; 1180ef419599d9b18de2a9077c5f0a7f02bfc11d1762Tilman Sauerbeck } 1181ef419599d9b18de2a9077c5f0a7f02bfc11d1762Tilman Sauerbeck 1182ef419599d9b18de2a9077c5f0a7f02bfc11d1762Tilman Sauerbeck /* dst.w = 1.0; */ 1183ef419599d9b18de2a9077c5f0a7f02bfc11d1762Tilman Sauerbeck if (inst->Dst[0].Register.WriteMask & TGSI_WRITEMASK_W) { 1184ef419599d9b18de2a9077c5f0a7f02bfc11d1762Tilman Sauerbeck memset(&alu, 0, sizeof(struct r600_bc_alu)); 1185ef419599d9b18de2a9077c5f0a7f02bfc11d1762Tilman Sauerbeck 1186ef419599d9b18de2a9077c5f0a7f02bfc11d1762Tilman Sauerbeck alu.inst = CTX_INST(V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_MOV); 1187ef419599d9b18de2a9077c5f0a7f02bfc11d1762Tilman Sauerbeck 1188ef419599d9b18de2a9077c5f0a7f02bfc11d1762Tilman Sauerbeck r = tgsi_dst(ctx, &inst->Dst[0], 3, &alu.dst); 1189ef419599d9b18de2a9077c5f0a7f02bfc11d1762Tilman Sauerbeck if 
(r) 1190ef419599d9b18de2a9077c5f0a7f02bfc11d1762Tilman Sauerbeck return r; 1191ef419599d9b18de2a9077c5f0a7f02bfc11d1762Tilman Sauerbeck 1192ef419599d9b18de2a9077c5f0a7f02bfc11d1762Tilman Sauerbeck alu.src[0].sel = V_SQ_ALU_SRC_1; 1193ef419599d9b18de2a9077c5f0a7f02bfc11d1762Tilman Sauerbeck alu.src[0].chan = 0; 1194ef419599d9b18de2a9077c5f0a7f02bfc11d1762Tilman Sauerbeck 1195ef419599d9b18de2a9077c5f0a7f02bfc11d1762Tilman Sauerbeck alu.last = 1; 1196ef419599d9b18de2a9077c5f0a7f02bfc11d1762Tilman Sauerbeck 1197ef419599d9b18de2a9077c5f0a7f02bfc11d1762Tilman Sauerbeck r = r600_bc_add_alu(ctx->bc, &alu); 1198ef419599d9b18de2a9077c5f0a7f02bfc11d1762Tilman Sauerbeck if (r) 1199ef419599d9b18de2a9077c5f0a7f02bfc11d1762Tilman Sauerbeck return r; 1200ef419599d9b18de2a9077c5f0a7f02bfc11d1762Tilman Sauerbeck } 1201ef419599d9b18de2a9077c5f0a7f02bfc11d1762Tilman Sauerbeck 120292f5c7a597aaf098f4e6b4793e4b89ae539e328aDave Airlie return 0; 120392f5c7a597aaf098f4e6b4793e4b89ae539e328aDave Airlie} 120492f5c7a597aaf098f4e6b4793e4b89ae539e328aDave Airlie 1205094d66f45992830929d620782c70836b4b9b4a37Jerome Glissestatic int tgsi_kill(struct r600_shader_ctx *ctx) 1206094d66f45992830929d620782c70836b4b9b4a37Jerome Glisse{ 1207094d66f45992830929d620782c70836b4b9b4a37Jerome Glisse struct tgsi_full_instruction *inst = &ctx->parse.FullToken.FullInstruction; 1208094d66f45992830929d620782c70836b4b9b4a37Jerome Glisse struct r600_bc_alu alu; 1209094d66f45992830929d620782c70836b4b9b4a37Jerome Glisse int i, r; 1210094d66f45992830929d620782c70836b4b9b4a37Jerome Glisse 1211094d66f45992830929d620782c70836b4b9b4a37Jerome Glisse for (i = 0; i < 4; i++) { 1212094d66f45992830929d620782c70836b4b9b4a37Jerome Glisse memset(&alu, 0, sizeof(struct r600_bc_alu)); 1213094d66f45992830929d620782c70836b4b9b4a37Jerome Glisse alu.inst = ctx->inst_info->r600_opcode; 12144502b17901ad491e0598ee59a12d372c008ae03bDave Airlie 1215094d66f45992830929d620782c70836b4b9b4a37Jerome Glisse alu.dst.chan = i; 
12164502b17901ad491e0598ee59a12d372c008ae03bDave Airlie 1217921c987c6f43b4d63a98b61013d43bac97baff21Jerome Glisse alu.src[0].sel = V_SQ_ALU_SRC_0; 12184502b17901ad491e0598ee59a12d372c008ae03bDave Airlie 12194502b17901ad491e0598ee59a12d372c008ae03bDave Airlie if (ctx->inst_info->tgsi_opcode == TGSI_OPCODE_KILP) { 12204502b17901ad491e0598ee59a12d372c008ae03bDave Airlie alu.src[1].sel = V_SQ_ALU_SRC_1; 12214502b17901ad491e0598ee59a12d372c008ae03bDave Airlie alu.src[1].neg = 1; 12224502b17901ad491e0598ee59a12d372c008ae03bDave Airlie } else { 12234502b17901ad491e0598ee59a12d372c008ae03bDave Airlie r = tgsi_src(ctx, &inst->Src[0], &alu.src[1]); 12244502b17901ad491e0598ee59a12d372c008ae03bDave Airlie if (r) 12254502b17901ad491e0598ee59a12d372c008ae03bDave Airlie return r; 12264502b17901ad491e0598ee59a12d372c008ae03bDave Airlie alu.src[1].chan = tgsi_chan(&inst->Src[0], i); 12274502b17901ad491e0598ee59a12d372c008ae03bDave Airlie } 1228094d66f45992830929d620782c70836b4b9b4a37Jerome Glisse if (i == 3) { 1229094d66f45992830929d620782c70836b4b9b4a37Jerome Glisse alu.last = 1; 1230094d66f45992830929d620782c70836b4b9b4a37Jerome Glisse } 1231094d66f45992830929d620782c70836b4b9b4a37Jerome Glisse r = r600_bc_add_alu(ctx->bc, &alu); 1232094d66f45992830929d620782c70836b4b9b4a37Jerome Glisse if (r) 1233094d66f45992830929d620782c70836b4b9b4a37Jerome Glisse return r; 1234094d66f45992830929d620782c70836b4b9b4a37Jerome Glisse } 12354502b17901ad491e0598ee59a12d372c008ae03bDave Airlie 12364502b17901ad491e0598ee59a12d372c008ae03bDave Airlie /* kill must be last in ALU */ 12374502b17901ad491e0598ee59a12d372c008ae03bDave Airlie ctx->bc->force_add_cf = 1; 12384502b17901ad491e0598ee59a12d372c008ae03bDave Airlie ctx->shader->uses_kill = TRUE; 1239094d66f45992830929d620782c70836b4b9b4a37Jerome Glisse return 0; 1240094d66f45992830929d620782c70836b4b9b4a37Jerome Glisse} 1241094d66f45992830929d620782c70836b4b9b4a37Jerome Glisse 12420bebdc230ff09f191cfa269c2cbcbb257fd2e0fcStephan Schmidstatic int 
tgsi_lit(struct r600_shader_ctx *ctx) 12430bebdc230ff09f191cfa269c2cbcbb257fd2e0fcStephan Schmid{ 12440bebdc230ff09f191cfa269c2cbcbb257fd2e0fcStephan Schmid struct tgsi_full_instruction *inst = &ctx->parse.FullToken.FullInstruction; 12450bebdc230ff09f191cfa269c2cbcbb257fd2e0fcStephan Schmid struct r600_bc_alu alu; 1246ee0153f891bb75ee14db579e6628d592032d6801Dave Airlie struct r600_bc_alu_src r600_src[3]; 12470bebdc230ff09f191cfa269c2cbcbb257fd2e0fcStephan Schmid int r; 12480bebdc230ff09f191cfa269c2cbcbb257fd2e0fcStephan Schmid 1249ee0153f891bb75ee14db579e6628d592032d6801Dave Airlie r = tgsi_split_constant(ctx, r600_src); 1250ee0153f891bb75ee14db579e6628d592032d6801Dave Airlie if (r) 1251ee0153f891bb75ee14db579e6628d592032d6801Dave Airlie return r; 1252d3fa92584b109bf59dce32501eec73f8de74f42bDave Airlie r = tgsi_split_literal_constant(ctx, r600_src); 1253d3fa92584b109bf59dce32501eec73f8de74f42bDave Airlie if (r) 1254d3fa92584b109bf59dce32501eec73f8de74f42bDave Airlie return r; 1255ee0153f891bb75ee14db579e6628d592032d6801Dave Airlie 12567e42b7e5d2aebcda0e6bf081b6661411731e6df2Jerome Glisse /* dst.x, <- 1.0 */ 12577e42b7e5d2aebcda0e6bf081b6661411731e6df2Jerome Glisse memset(&alu, 0, sizeof(struct r600_bc_alu)); 1258a3a94554f5a12f0626d9712ddcdc81b1e21d36c2Dave Airlie alu.inst = CTX_INST(V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_MOV); 1259921c987c6f43b4d63a98b61013d43bac97baff21Jerome Glisse alu.src[0].sel = V_SQ_ALU_SRC_1; /*1.0*/ 12607e42b7e5d2aebcda0e6bf081b6661411731e6df2Jerome Glisse alu.src[0].chan = 0; 12617e42b7e5d2aebcda0e6bf081b6661411731e6df2Jerome Glisse r = tgsi_dst(ctx, &inst->Dst[0], 0, &alu.dst); 12627e42b7e5d2aebcda0e6bf081b6661411731e6df2Jerome Glisse if (r) 12637e42b7e5d2aebcda0e6bf081b6661411731e6df2Jerome Glisse return r; 12647e42b7e5d2aebcda0e6bf081b6661411731e6df2Jerome Glisse alu.dst.write = (inst->Dst[0].Register.WriteMask >> 0) & 1; 12657e42b7e5d2aebcda0e6bf081b6661411731e6df2Jerome Glisse r = r600_bc_add_alu(ctx->bc, &alu); 
12667e42b7e5d2aebcda0e6bf081b6661411731e6df2Jerome Glisse if (r) 12677e42b7e5d2aebcda0e6bf081b6661411731e6df2Jerome Glisse return r; 12680bebdc230ff09f191cfa269c2cbcbb257fd2e0fcStephan Schmid 12697e42b7e5d2aebcda0e6bf081b6661411731e6df2Jerome Glisse /* dst.y = max(src.x, 0.0) */ 12707e42b7e5d2aebcda0e6bf081b6661411731e6df2Jerome Glisse memset(&alu, 0, sizeof(struct r600_bc_alu)); 1271a3a94554f5a12f0626d9712ddcdc81b1e21d36c2Dave Airlie alu.inst = CTX_INST(V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_MAX); 1272ee0153f891bb75ee14db579e6628d592032d6801Dave Airlie alu.src[0] = r600_src[0]; 1273921c987c6f43b4d63a98b61013d43bac97baff21Jerome Glisse alu.src[1].sel = V_SQ_ALU_SRC_0; /*0.0*/ 127485e401d8bfd80450a31eac234e13008e33e64227Dave Airlie alu.src[1].chan = 0; 12757e42b7e5d2aebcda0e6bf081b6661411731e6df2Jerome Glisse r = tgsi_dst(ctx, &inst->Dst[0], 1, &alu.dst); 12767e42b7e5d2aebcda0e6bf081b6661411731e6df2Jerome Glisse if (r) 12777e42b7e5d2aebcda0e6bf081b6661411731e6df2Jerome Glisse return r; 12787e42b7e5d2aebcda0e6bf081b6661411731e6df2Jerome Glisse alu.dst.write = (inst->Dst[0].Register.WriteMask >> 1) & 1; 12797e42b7e5d2aebcda0e6bf081b6661411731e6df2Jerome Glisse r = r600_bc_add_alu(ctx->bc, &alu); 12807e42b7e5d2aebcda0e6bf081b6661411731e6df2Jerome Glisse if (r) 12817e42b7e5d2aebcda0e6bf081b6661411731e6df2Jerome Glisse return r; 12820bebdc230ff09f191cfa269c2cbcbb257fd2e0fcStephan Schmid 12837e42b7e5d2aebcda0e6bf081b6661411731e6df2Jerome Glisse /* dst.w, <- 1.0 */ 12847e42b7e5d2aebcda0e6bf081b6661411731e6df2Jerome Glisse memset(&alu, 0, sizeof(struct r600_bc_alu)); 1285a3a94554f5a12f0626d9712ddcdc81b1e21d36c2Dave Airlie alu.inst = CTX_INST(V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_MOV); 1286921c987c6f43b4d63a98b61013d43bac97baff21Jerome Glisse alu.src[0].sel = V_SQ_ALU_SRC_1; 12877e42b7e5d2aebcda0e6bf081b6661411731e6df2Jerome Glisse alu.src[0].chan = 0; 12887e42b7e5d2aebcda0e6bf081b6661411731e6df2Jerome Glisse r = tgsi_dst(ctx, &inst->Dst[0], 3, &alu.dst); 
12897e42b7e5d2aebcda0e6bf081b6661411731e6df2Jerome Glisse if (r) 12907e42b7e5d2aebcda0e6bf081b6661411731e6df2Jerome Glisse return r; 12917e42b7e5d2aebcda0e6bf081b6661411731e6df2Jerome Glisse alu.dst.write = (inst->Dst[0].Register.WriteMask >> 3) & 1; 12927e42b7e5d2aebcda0e6bf081b6661411731e6df2Jerome Glisse alu.last = 1; 12937e42b7e5d2aebcda0e6bf081b6661411731e6df2Jerome Glisse r = r600_bc_add_alu(ctx->bc, &alu); 12947e42b7e5d2aebcda0e6bf081b6661411731e6df2Jerome Glisse if (r) 12957e42b7e5d2aebcda0e6bf081b6661411731e6df2Jerome Glisse return r; 12960bebdc230ff09f191cfa269c2cbcbb257fd2e0fcStephan Schmid 12970bebdc230ff09f191cfa269c2cbcbb257fd2e0fcStephan Schmid if (inst->Dst[0].Register.WriteMask & (1 << 2)) 12980bebdc230ff09f191cfa269c2cbcbb257fd2e0fcStephan Schmid { 12996a20539580e1b7ae921d497fbf66a8fd545efea4Vinson Lee int chan; 13006a20539580e1b7ae921d497fbf66a8fd545efea4Vinson Lee int sel; 13016a20539580e1b7ae921d497fbf66a8fd545efea4Vinson Lee 13020bebdc230ff09f191cfa269c2cbcbb257fd2e0fcStephan Schmid /* dst.z = log(src.y) */ 13030bebdc230ff09f191cfa269c2cbcbb257fd2e0fcStephan Schmid memset(&alu, 0, sizeof(struct r600_bc_alu)); 1304a3a94554f5a12f0626d9712ddcdc81b1e21d36c2Dave Airlie alu.inst = CTX_INST(V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_LOG_CLAMPED); 1305ee0153f891bb75ee14db579e6628d592032d6801Dave Airlie alu.src[0] = r600_src[0]; 1306ee0153f891bb75ee14db579e6628d592032d6801Dave Airlie alu.src[0].chan = tgsi_chan(&inst->Src[0], 1); 13070bebdc230ff09f191cfa269c2cbcbb257fd2e0fcStephan Schmid r = tgsi_dst(ctx, &inst->Dst[0], 2, &alu.dst); 13080bebdc230ff09f191cfa269c2cbcbb257fd2e0fcStephan Schmid if (r) 13090bebdc230ff09f191cfa269c2cbcbb257fd2e0fcStephan Schmid return r; 13100bebdc230ff09f191cfa269c2cbcbb257fd2e0fcStephan Schmid alu.last = 1; 13110bebdc230ff09f191cfa269c2cbcbb257fd2e0fcStephan Schmid r = r600_bc_add_alu(ctx->bc, &alu); 13120bebdc230ff09f191cfa269c2cbcbb257fd2e0fcStephan Schmid if (r) 13130bebdc230ff09f191cfa269c2cbcbb257fd2e0fcStephan Schmid return r; 
13140bebdc230ff09f191cfa269c2cbcbb257fd2e0fcStephan Schmid 13156a20539580e1b7ae921d497fbf66a8fd545efea4Vinson Lee chan = alu.dst.chan; 13166a20539580e1b7ae921d497fbf66a8fd545efea4Vinson Lee sel = alu.dst.sel; 13170bebdc230ff09f191cfa269c2cbcbb257fd2e0fcStephan Schmid 13180bebdc230ff09f191cfa269c2cbcbb257fd2e0fcStephan Schmid /* tmp.x = amd MUL_LIT(src.w, dst.z, src.x ) */ 13190bebdc230ff09f191cfa269c2cbcbb257fd2e0fcStephan Schmid memset(&alu, 0, sizeof(struct r600_bc_alu)); 1320a3a94554f5a12f0626d9712ddcdc81b1e21d36c2Dave Airlie alu.inst = CTX_INST(V_SQ_ALU_WORD1_OP3_SQ_OP3_INST_MUL_LIT); 1321ee0153f891bb75ee14db579e6628d592032d6801Dave Airlie alu.src[0] = r600_src[0]; 13227e42b7e5d2aebcda0e6bf081b6661411731e6df2Jerome Glisse alu.src[0].chan = tgsi_chan(&inst->Src[0], 3); 13230bebdc230ff09f191cfa269c2cbcbb257fd2e0fcStephan Schmid alu.src[1].sel = sel; 13240bebdc230ff09f191cfa269c2cbcbb257fd2e0fcStephan Schmid alu.src[1].chan = chan; 1325ee0153f891bb75ee14db579e6628d592032d6801Dave Airlie 1326ee0153f891bb75ee14db579e6628d592032d6801Dave Airlie alu.src[2] = r600_src[0]; 13277e42b7e5d2aebcda0e6bf081b6661411731e6df2Jerome Glisse alu.src[2].chan = tgsi_chan(&inst->Src[0], 0); 13280bebdc230ff09f191cfa269c2cbcbb257fd2e0fcStephan Schmid alu.dst.sel = ctx->temp_reg; 13290bebdc230ff09f191cfa269c2cbcbb257fd2e0fcStephan Schmid alu.dst.chan = 0; 13300bebdc230ff09f191cfa269c2cbcbb257fd2e0fcStephan Schmid alu.dst.write = 1; 13310bebdc230ff09f191cfa269c2cbcbb257fd2e0fcStephan Schmid alu.is_op3 = 1; 13320bebdc230ff09f191cfa269c2cbcbb257fd2e0fcStephan Schmid alu.last = 1; 13330bebdc230ff09f191cfa269c2cbcbb257fd2e0fcStephan Schmid r = r600_bc_add_alu(ctx->bc, &alu); 13340bebdc230ff09f191cfa269c2cbcbb257fd2e0fcStephan Schmid if (r) 13350bebdc230ff09f191cfa269c2cbcbb257fd2e0fcStephan Schmid return r; 13360bebdc230ff09f191cfa269c2cbcbb257fd2e0fcStephan Schmid 13370bebdc230ff09f191cfa269c2cbcbb257fd2e0fcStephan Schmid /* dst.z = exp(tmp.x) */ 
13380bebdc230ff09f191cfa269c2cbcbb257fd2e0fcStephan Schmid memset(&alu, 0, sizeof(struct r600_bc_alu)); 1339a3a94554f5a12f0626d9712ddcdc81b1e21d36c2Dave Airlie alu.inst = CTX_INST(V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_EXP_IEEE); 13400bebdc230ff09f191cfa269c2cbcbb257fd2e0fcStephan Schmid alu.src[0].sel = ctx->temp_reg; 13410bebdc230ff09f191cfa269c2cbcbb257fd2e0fcStephan Schmid alu.src[0].chan = 0; 13420bebdc230ff09f191cfa269c2cbcbb257fd2e0fcStephan Schmid r = tgsi_dst(ctx, &inst->Dst[0], 2, &alu.dst); 13430bebdc230ff09f191cfa269c2cbcbb257fd2e0fcStephan Schmid if (r) 13440bebdc230ff09f191cfa269c2cbcbb257fd2e0fcStephan Schmid return r; 13450bebdc230ff09f191cfa269c2cbcbb257fd2e0fcStephan Schmid alu.last = 1; 13460bebdc230ff09f191cfa269c2cbcbb257fd2e0fcStephan Schmid r = r600_bc_add_alu(ctx->bc, &alu); 13470bebdc230ff09f191cfa269c2cbcbb257fd2e0fcStephan Schmid if (r) 13480bebdc230ff09f191cfa269c2cbcbb257fd2e0fcStephan Schmid return r; 13490bebdc230ff09f191cfa269c2cbcbb257fd2e0fcStephan Schmid } 13500bebdc230ff09f191cfa269c2cbcbb257fd2e0fcStephan Schmid return 0; 13510bebdc230ff09f191cfa269c2cbcbb257fd2e0fcStephan Schmid} 13520bebdc230ff09f191cfa269c2cbcbb257fd2e0fcStephan Schmid 135342c966bc496d4049d98eb1d45dd7bb0b55fa41bdTilman Sauerbeckstatic int tgsi_rsq(struct r600_shader_ctx *ctx) 135442c966bc496d4049d98eb1d45dd7bb0b55fa41bdTilman Sauerbeck{ 135542c966bc496d4049d98eb1d45dd7bb0b55fa41bdTilman Sauerbeck struct tgsi_full_instruction *inst = &ctx->parse.FullToken.FullInstruction; 135642c966bc496d4049d98eb1d45dd7bb0b55fa41bdTilman Sauerbeck struct r600_bc_alu alu; 135742c966bc496d4049d98eb1d45dd7bb0b55fa41bdTilman Sauerbeck int i, r; 135842c966bc496d4049d98eb1d45dd7bb0b55fa41bdTilman Sauerbeck 135942c966bc496d4049d98eb1d45dd7bb0b55fa41bdTilman Sauerbeck memset(&alu, 0, sizeof(struct r600_bc_alu)); 1360df62338c491f2cace1a48f99de78e83b5edd82fdTilman Sauerbeck 1361df62338c491f2cace1a48f99de78e83b5edd82fdTilman Sauerbeck /* FIXME: 1362df62338c491f2cace1a48f99de78e83b5edd82fdTilman 
Sauerbeck * For state trackers other than OpenGL, we'll want to use 1363df62338c491f2cace1a48f99de78e83b5edd82fdTilman Sauerbeck * _RECIPSQRT_IEEE instead. 1364df62338c491f2cace1a48f99de78e83b5edd82fdTilman Sauerbeck */ 1365df62338c491f2cace1a48f99de78e83b5edd82fdTilman Sauerbeck alu.inst = CTX_INST(V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_RECIPSQRT_CLAMPED); 1366df62338c491f2cace1a48f99de78e83b5edd82fdTilman Sauerbeck 136742c966bc496d4049d98eb1d45dd7bb0b55fa41bdTilman Sauerbeck for (i = 0; i < inst->Instruction.NumSrcRegs; i++) { 136842c966bc496d4049d98eb1d45dd7bb0b55fa41bdTilman Sauerbeck r = tgsi_src(ctx, &inst->Src[i], &alu.src[i]); 136942c966bc496d4049d98eb1d45dd7bb0b55fa41bdTilman Sauerbeck if (r) 137042c966bc496d4049d98eb1d45dd7bb0b55fa41bdTilman Sauerbeck return r; 137142c966bc496d4049d98eb1d45dd7bb0b55fa41bdTilman Sauerbeck alu.src[i].chan = tgsi_chan(&inst->Src[i], 0); 137242c966bc496d4049d98eb1d45dd7bb0b55fa41bdTilman Sauerbeck alu.src[i].abs = 1; 137342c966bc496d4049d98eb1d45dd7bb0b55fa41bdTilman Sauerbeck } 137442c966bc496d4049d98eb1d45dd7bb0b55fa41bdTilman Sauerbeck alu.dst.sel = ctx->temp_reg; 137542c966bc496d4049d98eb1d45dd7bb0b55fa41bdTilman Sauerbeck alu.dst.write = 1; 137642c966bc496d4049d98eb1d45dd7bb0b55fa41bdTilman Sauerbeck alu.last = 1; 137742c966bc496d4049d98eb1d45dd7bb0b55fa41bdTilman Sauerbeck r = r600_bc_add_alu(ctx->bc, &alu); 137842c966bc496d4049d98eb1d45dd7bb0b55fa41bdTilman Sauerbeck if (r) 137942c966bc496d4049d98eb1d45dd7bb0b55fa41bdTilman Sauerbeck return r; 138042c966bc496d4049d98eb1d45dd7bb0b55fa41bdTilman Sauerbeck /* replicate result */ 138142c966bc496d4049d98eb1d45dd7bb0b55fa41bdTilman Sauerbeck return tgsi_helper_tempx_replicate(ctx); 138242c966bc496d4049d98eb1d45dd7bb0b55fa41bdTilman Sauerbeck} 138342c966bc496d4049d98eb1d45dd7bb0b55fa41bdTilman Sauerbeck 1384a4b10a56145ea253def4cf958410d770d0640bc9Jerome Glissestatic int tgsi_helper_tempx_replicate(struct r600_shader_ctx *ctx) 13857e42b7e5d2aebcda0e6bf081b6661411731e6df2Jerome Glisse{ 
13867e42b7e5d2aebcda0e6bf081b6661411731e6df2Jerome Glisse struct tgsi_full_instruction *inst = &ctx->parse.FullToken.FullInstruction; 13877e42b7e5d2aebcda0e6bf081b6661411731e6df2Jerome Glisse struct r600_bc_alu alu; 1388a4b10a56145ea253def4cf958410d770d0640bc9Jerome Glisse int i, r; 13897e42b7e5d2aebcda0e6bf081b6661411731e6df2Jerome Glisse 13907e42b7e5d2aebcda0e6bf081b6661411731e6df2Jerome Glisse for (i = 0; i < 4; i++) { 13917e42b7e5d2aebcda0e6bf081b6661411731e6df2Jerome Glisse memset(&alu, 0, sizeof(struct r600_bc_alu)); 13927e42b7e5d2aebcda0e6bf081b6661411731e6df2Jerome Glisse alu.src[0].sel = ctx->temp_reg; 1393a3a94554f5a12f0626d9712ddcdc81b1e21d36c2Dave Airlie alu.inst = CTX_INST(V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_MOV); 13947e42b7e5d2aebcda0e6bf081b6661411731e6df2Jerome Glisse alu.dst.chan = i; 13957e42b7e5d2aebcda0e6bf081b6661411731e6df2Jerome Glisse r = tgsi_dst(ctx, &inst->Dst[0], i, &alu.dst); 13967e42b7e5d2aebcda0e6bf081b6661411731e6df2Jerome Glisse if (r) 13977e42b7e5d2aebcda0e6bf081b6661411731e6df2Jerome Glisse return r; 13987e42b7e5d2aebcda0e6bf081b6661411731e6df2Jerome Glisse alu.dst.write = (inst->Dst[0].Register.WriteMask >> i) & 1; 13997e42b7e5d2aebcda0e6bf081b6661411731e6df2Jerome Glisse if (i == 3) 14007e42b7e5d2aebcda0e6bf081b6661411731e6df2Jerome Glisse alu.last = 1; 14017e42b7e5d2aebcda0e6bf081b6661411731e6df2Jerome Glisse r = r600_bc_add_alu(ctx->bc, &alu); 14027e42b7e5d2aebcda0e6bf081b6661411731e6df2Jerome Glisse if (r) 14037e42b7e5d2aebcda0e6bf081b6661411731e6df2Jerome Glisse return r; 14047e42b7e5d2aebcda0e6bf081b6661411731e6df2Jerome Glisse } 14057e42b7e5d2aebcda0e6bf081b6661411731e6df2Jerome Glisse return 0; 14067e42b7e5d2aebcda0e6bf081b6661411731e6df2Jerome Glisse} 14077e42b7e5d2aebcda0e6bf081b6661411731e6df2Jerome Glisse 1408a4b10a56145ea253def4cf958410d770d0640bc9Jerome Glissestatic int tgsi_trans_srcx_replicate(struct r600_shader_ctx *ctx) 1409a4b10a56145ea253def4cf958410d770d0640bc9Jerome Glisse{ 
1410a4b10a56145ea253def4cf958410d770d0640bc9Jerome Glisse struct tgsi_full_instruction *inst = &ctx->parse.FullToken.FullInstruction; 1411a4b10a56145ea253def4cf958410d770d0640bc9Jerome Glisse struct r600_bc_alu alu; 1412a4b10a56145ea253def4cf958410d770d0640bc9Jerome Glisse int i, r; 1413a4b10a56145ea253def4cf958410d770d0640bc9Jerome Glisse 1414a4b10a56145ea253def4cf958410d770d0640bc9Jerome Glisse memset(&alu, 0, sizeof(struct r600_bc_alu)); 1415a4b10a56145ea253def4cf958410d770d0640bc9Jerome Glisse alu.inst = ctx->inst_info->r600_opcode; 1416a4b10a56145ea253def4cf958410d770d0640bc9Jerome Glisse for (i = 0; i < inst->Instruction.NumSrcRegs; i++) { 1417a4b10a56145ea253def4cf958410d770d0640bc9Jerome Glisse r = tgsi_src(ctx, &inst->Src[i], &alu.src[i]); 1418a4b10a56145ea253def4cf958410d770d0640bc9Jerome Glisse if (r) 1419a4b10a56145ea253def4cf958410d770d0640bc9Jerome Glisse return r; 1420a4b10a56145ea253def4cf958410d770d0640bc9Jerome Glisse alu.src[i].chan = tgsi_chan(&inst->Src[i], 0); 1421a4b10a56145ea253def4cf958410d770d0640bc9Jerome Glisse } 1422a4b10a56145ea253def4cf958410d770d0640bc9Jerome Glisse alu.dst.sel = ctx->temp_reg; 1423a4b10a56145ea253def4cf958410d770d0640bc9Jerome Glisse alu.dst.write = 1; 1424a4b10a56145ea253def4cf958410d770d0640bc9Jerome Glisse alu.last = 1; 1425a4b10a56145ea253def4cf958410d770d0640bc9Jerome Glisse r = r600_bc_add_alu(ctx->bc, &alu); 1426a4b10a56145ea253def4cf958410d770d0640bc9Jerome Glisse if (r) 1427a4b10a56145ea253def4cf958410d770d0640bc9Jerome Glisse return r; 1428a4b10a56145ea253def4cf958410d770d0640bc9Jerome Glisse /* replicate result */ 1429a4b10a56145ea253def4cf958410d770d0640bc9Jerome Glisse return tgsi_helper_tempx_replicate(ctx); 1430a4b10a56145ea253def4cf958410d770d0640bc9Jerome Glisse} 1431a4b10a56145ea253def4cf958410d770d0640bc9Jerome Glisse 1432a4b10a56145ea253def4cf958410d770d0640bc9Jerome Glissestatic int tgsi_pow(struct r600_shader_ctx *ctx) 1433a4b10a56145ea253def4cf958410d770d0640bc9Jerome Glisse{ 
1434a4b10a56145ea253def4cf958410d770d0640bc9Jerome Glisse struct tgsi_full_instruction *inst = &ctx->parse.FullToken.FullInstruction; 1435a4b10a56145ea253def4cf958410d770d0640bc9Jerome Glisse struct r600_bc_alu alu; 1436a4b10a56145ea253def4cf958410d770d0640bc9Jerome Glisse int r; 1437a4b10a56145ea253def4cf958410d770d0640bc9Jerome Glisse 1438a4b10a56145ea253def4cf958410d770d0640bc9Jerome Glisse /* LOG2(a) */ 1439a4b10a56145ea253def4cf958410d770d0640bc9Jerome Glisse memset(&alu, 0, sizeof(struct r600_bc_alu)); 1440a3a94554f5a12f0626d9712ddcdc81b1e21d36c2Dave Airlie alu.inst = CTX_INST(V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_LOG_IEEE); 1441a4b10a56145ea253def4cf958410d770d0640bc9Jerome Glisse r = tgsi_src(ctx, &inst->Src[0], &alu.src[0]); 1442a4b10a56145ea253def4cf958410d770d0640bc9Jerome Glisse if (r) 1443a4b10a56145ea253def4cf958410d770d0640bc9Jerome Glisse return r; 1444a4b10a56145ea253def4cf958410d770d0640bc9Jerome Glisse alu.src[0].chan = tgsi_chan(&inst->Src[0], 0); 1445a4b10a56145ea253def4cf958410d770d0640bc9Jerome Glisse alu.dst.sel = ctx->temp_reg; 1446a4b10a56145ea253def4cf958410d770d0640bc9Jerome Glisse alu.dst.write = 1; 1447a4b10a56145ea253def4cf958410d770d0640bc9Jerome Glisse alu.last = 1; 1448a4b10a56145ea253def4cf958410d770d0640bc9Jerome Glisse r = r600_bc_add_alu(ctx->bc, &alu); 1449a4b10a56145ea253def4cf958410d770d0640bc9Jerome Glisse if (r) 1450a4b10a56145ea253def4cf958410d770d0640bc9Jerome Glisse return r; 1451a4b10a56145ea253def4cf958410d770d0640bc9Jerome Glisse /* b * LOG2(a) */ 1452a4b10a56145ea253def4cf958410d770d0640bc9Jerome Glisse memset(&alu, 0, sizeof(struct r600_bc_alu)); 145366f55de31e15f97ad1d16c573756738218c02109Fredrik Höglund alu.inst = CTX_INST(V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_MUL); 1454a4b10a56145ea253def4cf958410d770d0640bc9Jerome Glisse r = tgsi_src(ctx, &inst->Src[1], &alu.src[0]); 1455a4b10a56145ea253def4cf958410d770d0640bc9Jerome Glisse if (r) 1456a4b10a56145ea253def4cf958410d770d0640bc9Jerome Glisse return r; 
1457a4b10a56145ea253def4cf958410d770d0640bc9Jerome Glisse alu.src[0].chan = tgsi_chan(&inst->Src[1], 0); 1458a4b10a56145ea253def4cf958410d770d0640bc9Jerome Glisse alu.src[1].sel = ctx->temp_reg; 1459a4b10a56145ea253def4cf958410d770d0640bc9Jerome Glisse alu.dst.sel = ctx->temp_reg; 1460a4b10a56145ea253def4cf958410d770d0640bc9Jerome Glisse alu.dst.write = 1; 1461a4b10a56145ea253def4cf958410d770d0640bc9Jerome Glisse alu.last = 1; 1462a4b10a56145ea253def4cf958410d770d0640bc9Jerome Glisse r = r600_bc_add_alu(ctx->bc, &alu); 1463a4b10a56145ea253def4cf958410d770d0640bc9Jerome Glisse if (r) 1464a4b10a56145ea253def4cf958410d770d0640bc9Jerome Glisse return r; 1465a4b10a56145ea253def4cf958410d770d0640bc9Jerome Glisse /* POW(a,b) = EXP2(b * LOG2(a))*/ 1466a4b10a56145ea253def4cf958410d770d0640bc9Jerome Glisse memset(&alu, 0, sizeof(struct r600_bc_alu)); 1467a3a94554f5a12f0626d9712ddcdc81b1e21d36c2Dave Airlie alu.inst = CTX_INST(V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_EXP_IEEE); 1468a4b10a56145ea253def4cf958410d770d0640bc9Jerome Glisse alu.src[0].sel = ctx->temp_reg; 1469a4b10a56145ea253def4cf958410d770d0640bc9Jerome Glisse alu.dst.sel = ctx->temp_reg; 1470a4b10a56145ea253def4cf958410d770d0640bc9Jerome Glisse alu.dst.write = 1; 1471a4b10a56145ea253def4cf958410d770d0640bc9Jerome Glisse alu.last = 1; 1472a4b10a56145ea253def4cf958410d770d0640bc9Jerome Glisse r = r600_bc_add_alu(ctx->bc, &alu); 1473a4b10a56145ea253def4cf958410d770d0640bc9Jerome Glisse if (r) 1474a4b10a56145ea253def4cf958410d770d0640bc9Jerome Glisse return r; 1475a4b10a56145ea253def4cf958410d770d0640bc9Jerome Glisse return tgsi_helper_tempx_replicate(ctx); 1476a4b10a56145ea253def4cf958410d770d0640bc9Jerome Glisse} 1477a4b10a56145ea253def4cf958410d770d0640bc9Jerome Glisse 14780d48925a56ad4fb253386110b545abda82a25464Dave Airliestatic int tgsi_ssg(struct r600_shader_ctx *ctx) 14790d48925a56ad4fb253386110b545abda82a25464Dave Airlie{ 14800d48925a56ad4fb253386110b545abda82a25464Dave Airlie struct tgsi_full_instruction *inst = 
&ctx->parse.FullToken.FullInstruction; 14810d48925a56ad4fb253386110b545abda82a25464Dave Airlie struct r600_bc_alu alu; 14820d48925a56ad4fb253386110b545abda82a25464Dave Airlie struct r600_bc_alu_src r600_src[3]; 1483921c987c6f43b4d63a98b61013d43bac97baff21Jerome Glisse int i, r; 14840d48925a56ad4fb253386110b545abda82a25464Dave Airlie 14850d48925a56ad4fb253386110b545abda82a25464Dave Airlie r = tgsi_split_constant(ctx, r600_src); 14860d48925a56ad4fb253386110b545abda82a25464Dave Airlie if (r) 14870d48925a56ad4fb253386110b545abda82a25464Dave Airlie return r; 14889d4ae914e28ac7857a32a88ba27aecc182f697c6Jerome Glisse r = tgsi_split_literal_constant(ctx, r600_src); 14899d4ae914e28ac7857a32a88ba27aecc182f697c6Jerome Glisse if (r) 14909d4ae914e28ac7857a32a88ba27aecc182f697c6Jerome Glisse return r; 14910d48925a56ad4fb253386110b545abda82a25464Dave Airlie 14920d48925a56ad4fb253386110b545abda82a25464Dave Airlie /* tmp = (src > 0 ? 1 : src) */ 14930d48925a56ad4fb253386110b545abda82a25464Dave Airlie for (i = 0; i < 4; i++) { 14940d48925a56ad4fb253386110b545abda82a25464Dave Airlie memset(&alu, 0, sizeof(struct r600_bc_alu)); 1495a3a94554f5a12f0626d9712ddcdc81b1e21d36c2Dave Airlie alu.inst = CTX_INST(V_SQ_ALU_WORD1_OP3_SQ_OP3_INST_CNDGT); 14960d48925a56ad4fb253386110b545abda82a25464Dave Airlie alu.is_op3 = 1; 1497cb08b9fa84bf432dcca2e685daadd2df651b3025Dave Airlie 14980d48925a56ad4fb253386110b545abda82a25464Dave Airlie alu.dst.sel = ctx->temp_reg; 1499cb08b9fa84bf432dcca2e685daadd2df651b3025Dave Airlie alu.dst.chan = i; 15000d48925a56ad4fb253386110b545abda82a25464Dave Airlie 15010d48925a56ad4fb253386110b545abda82a25464Dave Airlie alu.src[0] = r600_src[0]; 15020d48925a56ad4fb253386110b545abda82a25464Dave Airlie alu.src[0].chan = tgsi_chan(&inst->Src[0], i); 15030d48925a56ad4fb253386110b545abda82a25464Dave Airlie 1504921c987c6f43b4d63a98b61013d43bac97baff21Jerome Glisse alu.src[1].sel = V_SQ_ALU_SRC_1; 15050d48925a56ad4fb253386110b545abda82a25464Dave Airlie 
15060d48925a56ad4fb253386110b545abda82a25464Dave Airlie alu.src[2] = r600_src[0]; 15070d48925a56ad4fb253386110b545abda82a25464Dave Airlie alu.src[2].chan = tgsi_chan(&inst->Src[0], i); 15080d48925a56ad4fb253386110b545abda82a25464Dave Airlie if (i == 3) 15090d48925a56ad4fb253386110b545abda82a25464Dave Airlie alu.last = 1; 15100d48925a56ad4fb253386110b545abda82a25464Dave Airlie r = r600_bc_add_alu(ctx->bc, &alu); 15110d48925a56ad4fb253386110b545abda82a25464Dave Airlie if (r) 15120d48925a56ad4fb253386110b545abda82a25464Dave Airlie return r; 15130d48925a56ad4fb253386110b545abda82a25464Dave Airlie } 15140d48925a56ad4fb253386110b545abda82a25464Dave Airlie 15150d48925a56ad4fb253386110b545abda82a25464Dave Airlie /* dst = (-tmp > 0 ? -1 : tmp) */ 15160d48925a56ad4fb253386110b545abda82a25464Dave Airlie for (i = 0; i < 4; i++) { 15170d48925a56ad4fb253386110b545abda82a25464Dave Airlie memset(&alu, 0, sizeof(struct r600_bc_alu)); 1518a3a94554f5a12f0626d9712ddcdc81b1e21d36c2Dave Airlie alu.inst = CTX_INST(V_SQ_ALU_WORD1_OP3_SQ_OP3_INST_CNDGT); 15190d48925a56ad4fb253386110b545abda82a25464Dave Airlie alu.is_op3 = 1; 15200d48925a56ad4fb253386110b545abda82a25464Dave Airlie r = tgsi_dst(ctx, &inst->Dst[0], i, &alu.dst); 15210d48925a56ad4fb253386110b545abda82a25464Dave Airlie if (r) 15220d48925a56ad4fb253386110b545abda82a25464Dave Airlie return r; 15230d48925a56ad4fb253386110b545abda82a25464Dave Airlie 15240d48925a56ad4fb253386110b545abda82a25464Dave Airlie alu.src[0].sel = ctx->temp_reg; 1525cb08b9fa84bf432dcca2e685daadd2df651b3025Dave Airlie alu.src[0].chan = i; 15260d48925a56ad4fb253386110b545abda82a25464Dave Airlie alu.src[0].neg = 1; 15270d48925a56ad4fb253386110b545abda82a25464Dave Airlie 1528921c987c6f43b4d63a98b61013d43bac97baff21Jerome Glisse alu.src[1].sel = V_SQ_ALU_SRC_1; 15290d48925a56ad4fb253386110b545abda82a25464Dave Airlie alu.src[1].neg = 1; 15300d48925a56ad4fb253386110b545abda82a25464Dave Airlie 15310d48925a56ad4fb253386110b545abda82a25464Dave Airlie alu.src[2].sel = 
ctx->temp_reg; 1532cb08b9fa84bf432dcca2e685daadd2df651b3025Dave Airlie alu.src[2].chan = i; 15330d48925a56ad4fb253386110b545abda82a25464Dave Airlie 15340d48925a56ad4fb253386110b545abda82a25464Dave Airlie if (i == 3) 15350d48925a56ad4fb253386110b545abda82a25464Dave Airlie alu.last = 1; 15360d48925a56ad4fb253386110b545abda82a25464Dave Airlie r = r600_bc_add_alu(ctx->bc, &alu); 15370d48925a56ad4fb253386110b545abda82a25464Dave Airlie if (r) 15380d48925a56ad4fb253386110b545abda82a25464Dave Airlie return r; 15390d48925a56ad4fb253386110b545abda82a25464Dave Airlie } 15400d48925a56ad4fb253386110b545abda82a25464Dave Airlie return 0; 15410d48925a56ad4fb253386110b545abda82a25464Dave Airlie} 15420d48925a56ad4fb253386110b545abda82a25464Dave Airlie 1543cf864fd58b2a4780482a108cd3ff86779e8fa965Jerome Glissestatic int tgsi_helper_copy(struct r600_shader_ctx *ctx, struct tgsi_full_instruction *inst) 1544cf864fd58b2a4780482a108cd3ff86779e8fa965Jerome Glisse{ 1545cf864fd58b2a4780482a108cd3ff86779e8fa965Jerome Glisse struct r600_bc_alu alu; 1546cf864fd58b2a4780482a108cd3ff86779e8fa965Jerome Glisse int i, r; 1547cf864fd58b2a4780482a108cd3ff86779e8fa965Jerome Glisse 1548cf864fd58b2a4780482a108cd3ff86779e8fa965Jerome Glisse for (i = 0; i < 4; i++) { 1549cf864fd58b2a4780482a108cd3ff86779e8fa965Jerome Glisse memset(&alu, 0, sizeof(struct r600_bc_alu)); 1550cf864fd58b2a4780482a108cd3ff86779e8fa965Jerome Glisse if (!(inst->Dst[0].Register.WriteMask & (1 << i))) { 1551a3a94554f5a12f0626d9712ddcdc81b1e21d36c2Dave Airlie alu.inst = CTX_INST(V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP); 15526c288d06ac512be6eb7f19a9005389dd46d5a26aJerome Glisse alu.dst.chan = i; 1553cf864fd58b2a4780482a108cd3ff86779e8fa965Jerome Glisse } else { 1554a3a94554f5a12f0626d9712ddcdc81b1e21d36c2Dave Airlie alu.inst = CTX_INST(V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_MOV); 1555cf864fd58b2a4780482a108cd3ff86779e8fa965Jerome Glisse r = tgsi_dst(ctx, &inst->Dst[0], i, &alu.dst); 1556cf864fd58b2a4780482a108cd3ff86779e8fa965Jerome Glisse if (r) 
1557cf864fd58b2a4780482a108cd3ff86779e8fa965Jerome Glisse return r; 1558cf864fd58b2a4780482a108cd3ff86779e8fa965Jerome Glisse alu.src[0].sel = ctx->temp_reg; 1559cf864fd58b2a4780482a108cd3ff86779e8fa965Jerome Glisse alu.src[0].chan = i; 1560cf864fd58b2a4780482a108cd3ff86779e8fa965Jerome Glisse } 1561cf864fd58b2a4780482a108cd3ff86779e8fa965Jerome Glisse if (i == 3) { 1562cf864fd58b2a4780482a108cd3ff86779e8fa965Jerome Glisse alu.last = 1; 1563cf864fd58b2a4780482a108cd3ff86779e8fa965Jerome Glisse } 1564cf864fd58b2a4780482a108cd3ff86779e8fa965Jerome Glisse r = r600_bc_add_alu(ctx->bc, &alu); 1565cf864fd58b2a4780482a108cd3ff86779e8fa965Jerome Glisse if (r) 1566cf864fd58b2a4780482a108cd3ff86779e8fa965Jerome Glisse return r; 1567cf864fd58b2a4780482a108cd3ff86779e8fa965Jerome Glisse } 1568cf864fd58b2a4780482a108cd3ff86779e8fa965Jerome Glisse return 0; 1569cf864fd58b2a4780482a108cd3ff86779e8fa965Jerome Glisse} 1570cf864fd58b2a4780482a108cd3ff86779e8fa965Jerome Glisse
/*
 * Translate a TGSI instruction that maps onto a three-operand (OP3) ALU
 * instruction.
 *
 * The hardware opcode is taken from ctx->inst_info->r600_opcode.  One ALU
 * instruction is added for every channel enabled in the destination write
 * mask; channels that are not enabled are skipped entirely.  The instruction
 * emitted for channel `lasti` (the value tgsi_last_instruction() returns for
 * the write mask - presumably the highest enabled channel) is flagged with
 * alu.last.
 *
 * Returns 0 on success, otherwise the first non-zero code reported by one of
 * the helpers.
 */
static int tgsi_op3(struct r600_shader_ctx *ctx)
{
	struct tgsi_full_instruction *inst = &ctx->parse.FullToken.FullInstruction;
	struct r600_bc_alu_src r600_src[3];
	struct r600_bc_alu alu;
	int i, j, r;
	int lasti = tgsi_last_instruction(inst->Dst[0].Register.WriteMask);

	/* Resolve the source operands once; only the channel differs per ALU. */
	r = tgsi_split_constant(ctx, r600_src);
	if (r)
		return r;
	r = tgsi_split_literal_constant(ctx, r600_src);
	if (r)
		return r;

	for (i = 0; i < lasti + 1; i++) {
		if (!(inst->Dst[0].Register.WriteMask & (1 << i)))
			continue;

		memset(&alu, 0, sizeof(struct r600_bc_alu));
		alu.inst = ctx->inst_info->r600_opcode;
		for (j = 0; j < inst->Instruction.NumSrcRegs; j++) {
			alu.src[j] = r600_src[j];
			alu.src[j].chan = tgsi_chan(&inst->Src[j], i);
		}

		r = tgsi_dst(ctx, &inst->Dst[0], i, &alu.dst);
		if (r)
			return r;

		alu.dst.chan = i;
		alu.dst.write = 1;
		alu.is_op3 = 1;
		if (i == lasti) {
			alu.last = 1;
		}
		r = r600_bc_add_alu(ctx->bc, &alu);
		if (r)
			return r;
	}
	return 0;
}

/*
 * Translate the TGSI dot-product family (the opcode is read from
 * ctx->inst_info; DP2, DP3 and DPH get special treatment below).
 *
 * Four ALU instructions are always added, one per channel, regardless of the
 * destination write mask; the mask only decides alu.dst.write for each
 * channel.  The instruction for channel 3 is flagged with alu.last.
 *
 * Returns 0 on success, otherwise the first non-zero code reported by one of
 * the helpers.
 */
static int tgsi_dp(struct r600_shader_ctx *ctx)
{
	struct tgsi_full_instruction *inst = &ctx->parse.FullToken.FullInstruction;
	struct r600_bc_alu_src r600_src[3];
	struct r600_bc_alu alu;
	int i, j, r;

	r = tgsi_split_constant(ctx, r600_src);
	if (r)
		return r;
	r = tgsi_split_literal_constant(ctx, r600_src);
	if (r)
		return r;

	for (i = 0; i < 4; i++) {
		memset(&alu, 0, sizeof(struct r600_bc_alu));
		alu.inst = ctx->inst_info->r600_opcode;
		for (j = 0; j < inst->Instruction.NumSrcRegs; j++) {
			alu.src[j] = r600_src[j];
			alu.src[j].chan = tgsi_chan(&inst->Src[j], i);
		}

		r = tgsi_dst(ctx, &inst->Dst[0], i, &alu.dst);
		if (r)
			return r;

		alu.dst.chan = i;
		alu.dst.write = (inst->Dst[0].Register.WriteMask >> i) & 1;

		/*
		 * Handle some special cases: channels that do not take part in
		 * the shorter dot products get both operands replaced by
		 * V_SQ_ALU_SRC_0, and DPH replaces src0 of channel 3 by
		 * V_SQ_ALU_SRC_1 (presumably the inline constants 0.0 and 1.0).
		 */
		switch (ctx->inst_info->tgsi_opcode) {
		case TGSI_OPCODE_DP2:
			if (i > 1) {
				alu.src[0].sel = alu.src[1].sel = V_SQ_ALU_SRC_0;
				alu.src[0].chan = alu.src[1].chan = 0;
			}
			break;
		case TGSI_OPCODE_DP3:
			if (i > 2) {
				alu.src[0].sel = alu.src[1].sel = V_SQ_ALU_SRC_0;
				alu.src[0].chan = alu.src[1].chan = 0;
			}
			break;
		case TGSI_OPCODE_DPH:
			if (i == 3) {
				alu.src[0].sel = V_SQ_ALU_SRC_1;
				alu.src[0].chan = 0;
				/* drop any negate inherited from the real src0 */
				alu.src[0].neg = 0;
			}
			break;
		default:
			break;
		}
		if (i == 3) {
			alu.last = 1;
		}
		r = r600_bc_add_alu(ctx->bc, &alu);
		if (r)
			return r;
	}
	return 0;
}

/*
 * Translate a TGSI texture instruction into an optional ALU prologue that
 * prepares the coordinates in ctx->temp_reg, followed by one texture fetch.
 *
 * Prologue stages, in emission order:
 *  - TXP: temp.xyz = src.xyz * (1 / src.w), temp.w = V_SQ_ALU_SRC_1.
 *  - TGSI_TEXTURE_CUBE: CUBE on the swizzled source, reciprocal of |temp.z|,
 *    then two MULADDs with the literal 1.5.  Note that this stage reads
 *    inst->Src[0] again, not the result of the TXP stage.
 *  - Source operand in a file other than TEMPORARY/INPUT and neither stage
 *    above ran: the four channels are copied into ctx->temp_reg with MOVs.
 *
 * The fetch uses ctx->inst_info->r600_opcode, upgraded from
 * SQ_TEX_INST_SAMPLE to SQ_TEX_INST_SAMPLE_C for SHADOW1D/SHADOW2D targets.
 *
 * Returns 0 on success, otherwise the first non-zero code reported by one of
 * the helpers.
 */
static int tgsi_tex(struct r600_shader_ctx *ctx)
{
	/* static: its address is stored in alu.src[2].value below */
	static float one_point_five = 1.5f;
	/* per output channel: channel of Src[0] fed to CUBE src0 / src1 */
	static const int cube_src0_chan[4] = { 2, 2, 0, 1 };
	static const int cube_src1_chan[4] = { 1, 0, 2, 2 };
	struct tgsi_full_instruction *inst = &ctx->parse.FullToken.FullInstruction;
	struct r600_bc_tex tex;
	struct r600_bc_alu alu;
	unsigned src_gpr;
	int r, i;
	int opcode;
	boolean src_not_temp =
		inst->Src[0].Register.File != TGSI_FILE_TEMPORARY &&
		inst->Src[0].Register.File != TGSI_FILE_INPUT;
	boolean is_shadow =
		inst->Texture.Texture == TGSI_TEXTURE_SHADOW1D ||
		inst->Texture.Texture == TGSI_TEXTURE_SHADOW2D;

	src_gpr = ctx->file_offset[inst->Src[0].Register.File] + inst->Src[0].Register.Index;

	if (inst->Instruction.Opcode == TGSI_OPCODE_TXP) {
		/* Add perspective divide: temp.w = 1 / src.w */
		memset(&alu, 0, sizeof(struct r600_bc_alu));
		alu.inst = CTX_INST(V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_RECIP_IEEE);
		r = tgsi_src(ctx, &inst->Src[0], &alu.src[0]);
		if (r)
			return r;

		alu.src[0].chan = tgsi_chan(&inst->Src[0], 3);
		alu.dst.sel = ctx->temp_reg;
		alu.dst.chan = 3;
		alu.last = 1;
		alu.dst.write = 1;
		r = r600_bc_add_alu(ctx->bc, &alu);
		if (r)
			return r;

		/* temp.xyz = temp.w * src.xyz */
		for (i = 0; i < 3; i++) {
			memset(&alu, 0, sizeof(struct r600_bc_alu));
			alu.inst = CTX_INST(V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_MUL);
			alu.src[0].sel = ctx->temp_reg;
			alu.src[0].chan = 3;
			r = tgsi_src(ctx, &inst->Src[0], &alu.src[1]);
			if (r)
				return r;
			alu.src[1].chan = tgsi_chan(&inst->Src[0], i);
			alu.dst.sel = ctx->temp_reg;
			alu.dst.chan = i;
			alu.dst.write = 1;
			r = r600_bc_add_alu(ctx->bc, &alu);
			if (r)
				return r;
		}

		/* temp.w = V_SQ_ALU_SRC_1; carries the `last` flag for the MULs above */
		memset(&alu, 0, sizeof(struct r600_bc_alu));
		alu.inst = CTX_INST(V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_MOV);
		alu.src[0].sel = V_SQ_ALU_SRC_1;
		alu.src[0].chan = 0;
		alu.dst.sel = ctx->temp_reg;
		alu.dst.chan = 3;
		alu.last = 1;
		alu.dst.write = 1;
		r = r600_bc_add_alu(ctx->bc, &alu);
		if (r)
			return r;
		src_not_temp = FALSE;
		src_gpr = ctx->temp_reg;
	}

	if (inst->Texture.Texture == TGSI_TEXTURE_CUBE) {
		/* tmp1.xyzw = CUBE(R0.zzxy, R0.yxzz) */
		for (i = 0; i < 4; i++) {
			memset(&alu, 0, sizeof(struct r600_bc_alu));
			alu.inst = CTX_INST(V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_CUBE);
			r = tgsi_src(ctx, &inst->Src[0], &alu.src[0]);
			if (r)
				return r;
			alu.src[0].chan = tgsi_chan(&inst->Src[0], cube_src0_chan[i]);
			r = tgsi_src(ctx, &inst->Src[0], &alu.src[1]);
			if (r)
				return r;
			alu.src[1].chan = tgsi_chan(&inst->Src[0], cube_src1_chan[i]);
			alu.dst.sel = ctx->temp_reg;
			alu.dst.chan = i;
			if (i == 3)
				alu.last = 1;
			alu.dst.write = 1;
			r = r600_bc_add_alu(ctx->bc, &alu);
			if (r)
				return r;
		}

		/* tmp1.z = RCP_e(|tmp1.z|) */
		memset(&alu, 0, sizeof(struct r600_bc_alu));
		alu.inst = CTX_INST(V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_RECIP_IEEE);
		alu.src[0].sel = ctx->temp_reg;
		alu.src[0].chan = 2;
		alu.src[0].abs = 1;
		alu.dst.sel = ctx->temp_reg;
		alu.dst.chan = 2;
		alu.dst.write = 1;
		alu.last = 1;
		r = r600_bc_add_alu(ctx->bc, &alu);
		if (r)
			return r;

		/* MULADD R0.x,  R0.x,  PS1,  (0x3FC00000, 1.5f).x
		 * MULADD R0.y,  R0.y,  PS1,  (0x3FC00000, 1.5f).x
		 * muladd has no writemask, have to use another temp
		 */
		for (i = 0; i < 2; i++) {
			memset(&alu, 0, sizeof(struct r600_bc_alu));
			alu.inst = CTX_INST(V_SQ_ALU_WORD1_OP3_SQ_OP3_INST_MULADD);
			alu.is_op3 = 1;

			alu.src[0].sel = ctx->temp_reg;
			alu.src[0].chan = i;
			alu.src[1].sel = ctx->temp_reg;
			alu.src[1].chan = 2;

			alu.src[2].sel = V_SQ_ALU_SRC_LITERAL;
			alu.src[2].chan = 0;
			alu.src[2].value = (u32*)&one_point_five;

			alu.dst.sel = ctx->temp_reg;
			alu.dst.chan = i;
			alu.dst.write = 1;

			/* only the second (y) MULADD is flagged as last */
			if (i == 1)
				alu.last = 1;
			r = r600_bc_add_alu(ctx->bc, &alu);
			if (r)
				return r;
		}

		src_not_temp = FALSE;
		src_gpr = ctx->temp_reg;
	}

	if (src_not_temp) {
		/* copy the coordinates into the temporary register */
		for (i = 0; i < 4; i++) {
			memset(&alu, 0, sizeof(struct r600_bc_alu));
			alu.inst = CTX_INST(V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_MOV);
			r = tgsi_src(ctx, &inst->Src[0], &alu.src[0]);
			if (r)
				return r;
			alu.src[0].chan = tgsi_chan(&inst->Src[0], i);
			alu.dst.sel = ctx->temp_reg;
			alu.dst.chan = i;
			if (i == 3)
				alu.last = 1;
			alu.dst.write = 1;
			r = r600_bc_add_alu(ctx->bc, &alu);
			if (r)
				return r;
		}
		src_gpr = ctx->temp_reg;
	}

	opcode = ctx->inst_info->r600_opcode;
	if (opcode == SQ_TEX_INST_SAMPLE && is_shadow)
		opcode = SQ_TEX_INST_SAMPLE_C;

	memset(&tex, 0, sizeof(struct r600_bc_tex));
	tex.inst = opcode;
	tex.sampler_id = ctx->file_offset[inst->Src[1].Register.File] + inst->Src[1].Register.Index;
	tex.resource_id = tex.sampler_id;
	tex.src_gpr = src_gpr;
	tex.dst_gpr = ctx->file_offset[inst->Dst[0].Register.File] + inst->Dst[0].Register.Index;
	/* enabled channels select themselves, disabled ones get selector 7 */
	tex.dst_sel_x = (inst->Dst[0].Register.WriteMask & 1) ? 0 : 7;
	tex.dst_sel_y = (inst->Dst[0].Register.WriteMask & 2) ? 1 : 7;
	tex.dst_sel_z = (inst->Dst[0].Register.WriteMask & 4) ? 2 : 7;
	tex.dst_sel_w = (inst->Dst[0].Register.WriteMask & 8) ? 3 : 7;
	tex.src_sel_x = 0;
	tex.src_sel_y = 1;
	tex.src_sel_z = 2;
	tex.src_sel_w = 3;

	if (inst->Texture.Texture == TGSI_TEXTURE_CUBE) {
		tex.src_sel_x = 1;
		tex.src_sel_y = 0;
		tex.src_sel_z = 3;
		tex.src_sel_w = 1;
	}

	if (inst->Texture.Texture != TGSI_TEXTURE_RECT) {
		tex.coord_type_x = 1;
		tex.coord_type_y = 1;
		tex.coord_type_z = 1;
		tex.coord_type_w = 1;
	}

	if (is_shadow)
		tex.src_sel_w = 2;

	r = r600_bc_add_tex(ctx->bc, &tex);
	if (r)
		return r;

	/* add shadow ambient support - gallium doesn't do it yet */
	return 0;
}

/*
 * Translate TGSI LRP: dst = src0 * src1 + (1 - src0) * src2.
 *
 * Only channels enabled in the destination write mask are processed.  When
 * src0 resolved to V_SQ_ALU_SRC_0_5 a single ADD of src1 and src2 with
 * alu.omod = 3 is emitted per channel instead of the general sequence.
 * Otherwise three passes are emitted, using ctx->temp_reg for the
 * intermediate (1 - src0) * src2.
 *
 * Returns 0 on success, otherwise the first non-zero code reported by one of
 * the helpers.
 */
static int tgsi_lrp(struct r600_shader_ctx *ctx)
{
	struct tgsi_full_instruction *inst = &ctx->parse.FullToken.FullInstruction;
	struct r600_bc_alu_src r600_src[3];
	struct r600_bc_alu alu;
	int lasti = tgsi_last_instruction(inst->Dst[0].Register.WriteMask);
	/* signed, like lasti, so the loop bounds compare int against int */
	int i;
	int r;

	r = tgsi_split_constant(ctx, r600_src);
	if (r)
		return r;
	r = tgsi_split_literal_constant(ctx, r600_src);
	if (r)
		return r;

	/* optimize if it's just an equal balance */
	if (r600_src[0].sel == V_SQ_ALU_SRC_0_5) {
		for (i = 0; i < lasti + 1; i++) {
			if (!(inst->Dst[0].Register.WriteMask & (1 << i)))
				continue;

			memset(&alu, 0, sizeof(struct r600_bc_alu));
			alu.inst = CTX_INST(V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_ADD);
			alu.src[0] = r600_src[1];
			alu.src[0].chan = tgsi_chan(&inst->Src[1], i);
			alu.src[1] = r600_src[2];
			alu.src[1].chan = tgsi_chan(&inst->Src[2], i);
			/* NOTE(review): presumably the divide-by-two output
			 * modifier, giving (src1 + src2) / 2 - confirm against
			 * the ISA documentation */
			alu.omod = 3;
			r = tgsi_dst(ctx, &inst->Dst[0], i, &alu.dst);
			if (r)
				return r;

			alu.dst.chan = i;
			if (i == lasti) {
				alu.last = 1;
			}
			r = r600_bc_add_alu(ctx->bc, &alu);
			if (r)
				return r;
		}
		return 0;
	}

	/* 1 - src0 */
	for (i = 0; i < lasti + 1; i++) {
		if (!(inst->Dst[0].Register.WriteMask & (1 << i)))
			continue;

		memset(&alu, 0, sizeof(struct r600_bc_alu));
		alu.inst = CTX_INST(V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_ADD);
		alu.src[0].sel = V_SQ_ALU_SRC_1;
		alu.src[0].chan = 0;
		alu.src[1] = r600_src[0];
		alu.src[1].chan = tgsi_chan(&inst->Src[0], i);
		alu.src[1].neg = 1;
		alu.dst.sel = ctx->temp_reg;
		alu.dst.chan = i;
		if (i == lasti) {
			alu.last = 1;
		}
		alu.dst.write = 1;
		r = r600_bc_add_alu(ctx->bc, &alu);
		if (r)
			return r;
	}

	/* (1 - src0) * src2 */
	for (i = 0; i < lasti + 1; i++) {
		if (!(inst->Dst[0].Register.WriteMask & (1 << i)))
			continue;

		memset(&alu, 0, sizeof(struct r600_bc_alu));
		alu.inst = CTX_INST(V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_MUL);
		alu.src[0].sel = ctx->temp_reg;
		alu.src[0].chan = i;
		alu.src[1] = r600_src[2];
		alu.src[1].chan = tgsi_chan(&inst->Src[2], i);
		alu.dst.sel = ctx->temp_reg;
		alu.dst.chan = i;
		if (i == lasti) {
			alu.last = 1;
		}
		alu.dst.write = 1;
		r = r600_bc_add_alu(ctx->bc, &alu);
		if (r)
			return r;
	}

	/* src0 * src1 + (1 - src0) * src2 */
	for (i = 0; i < lasti + 1; i++) {
		if (!(inst->Dst[0].Register.WriteMask & (1 << i)))
			continue;

		memset(&alu, 0, sizeof(struct r600_bc_alu));
		alu.inst = CTX_INST(V_SQ_ALU_WORD1_OP3_SQ_OP3_INST_MULADD);
		alu.is_op3 = 1;
		alu.src[0] = r600_src[0];
		alu.src[0].chan = tgsi_chan(&inst->Src[0], i);
		alu.src[1] = r600_src[1];
		alu.src[1].chan = tgsi_chan(&inst->Src[1], i);
		alu.src[2].sel = ctx->temp_reg;
		alu.src[2].chan = i;

		r = tgsi_dst(ctx, &inst->Dst[0], i, &alu.dst);
		if (r)
			return r;

		alu.dst.chan = i;
		if (i == lasti) {
			alu.last = 1;
		}
		r = r600_bc_add_alu(ctx->bc, &alu);
		if (r)
			return r;
	}
	return 0;
}

203487f44d5723ebb3a2efe0dddc1a6edb6536adea4dDave Airliestatic int tgsi_cmp(struct r600_shader_ctx *ctx) 203587f44d5723ebb3a2efe0dddc1a6edb6536adea4dDave Airlie{ 203687f44d5723ebb3a2efe0dddc1a6edb6536adea4dDave Airlie struct tgsi_full_instruction *inst = &ctx->parse.FullToken.FullInstruction; 203787f44d5723ebb3a2efe0dddc1a6edb6536adea4dDave Airlie struct r600_bc_alu_src r600_src[3]; 203887f44d5723ebb3a2efe0dddc1a6edb6536adea4dDave Airlie struct r600_bc_alu alu; 203987f44d5723ebb3a2efe0dddc1a6edb6536adea4dDave Airlie int i, r; 2040dffad730df17983cfaef0808555a8c26cad0aa15Christian König int lasti = tgsi_last_instruction(inst->Dst[0].Register.WriteMask); 204187f44d5723ebb3a2efe0dddc1a6edb6536adea4dDave Airlie 204287f44d5723ebb3a2efe0dddc1a6edb6536adea4dDave Airlie r = tgsi_split_constant(ctx, r600_src); 204387f44d5723ebb3a2efe0dddc1a6edb6536adea4dDave Airlie if (r) 204487f44d5723ebb3a2efe0dddc1a6edb6536adea4dDave Airlie return r; 20459d4ae914e28ac7857a32a88ba27aecc182f697c6Jerome Glisse r = tgsi_split_literal_constant(ctx, r600_src); 20469d4ae914e28ac7857a32a88ba27aecc182f697c6Jerome Glisse if (r) 20479d4ae914e28ac7857a32a88ba27aecc182f697c6Jerome Glisse return r; 204887f44d5723ebb3a2efe0dddc1a6edb6536adea4dDave Airlie 20497be5455796facbe35cf1f1bdbefa83759b2e3b58Christian König for (i = 0; i < lasti + 1; i++) { 20507be5455796facbe35cf1f1bdbefa83759b2e3b58Christian König if (!(inst->Dst[0].Register.WriteMask & (1 << i))) 20517be5455796facbe35cf1f1bdbefa83759b2e3b58Christian König continue;
205287f44d5723ebb3a2efe0dddc1a6edb6536adea4dDave Airlie 205387f44d5723ebb3a2efe0dddc1a6edb6536adea4dDave Airlie memset(&alu, 0, sizeof(struct r600_bc_alu)); 2054a3a94554f5a12f0626d9712ddcdc81b1e21d36c2Dave Airlie alu.inst = CTX_INST(V_SQ_ALU_WORD1_OP3_SQ_OP3_INST_CNDGE); 205587f44d5723ebb3a2efe0dddc1a6edb6536adea4dDave Airlie alu.src[0] = r600_src[0]; 205687f44d5723ebb3a2efe0dddc1a6edb6536adea4dDave Airlie alu.src[0].chan = tgsi_chan(&inst->Src[0], i); 205787f44d5723ebb3a2efe0dddc1a6edb6536adea4dDave Airlie 205887f44d5723ebb3a2efe0dddc1a6edb6536adea4dDave Airlie alu.src[1] = r600_src[2]; 205987f44d5723ebb3a2efe0dddc1a6edb6536adea4dDave Airlie alu.src[1].chan = tgsi_chan(&inst->Src[2], i); 206087f44d5723ebb3a2efe0dddc1a6edb6536adea4dDave Airlie 206187f44d5723ebb3a2efe0dddc1a6edb6536adea4dDave Airlie alu.src[2] = r600_src[1]; 206287f44d5723ebb3a2efe0dddc1a6edb6536adea4dDave Airlie alu.src[2].chan = tgsi_chan(&inst->Src[1], i); 206387f44d5723ebb3a2efe0dddc1a6edb6536adea4dDave Airlie 20647be5455796facbe35cf1f1bdbefa83759b2e3b58Christian König r = tgsi_dst(ctx, &inst->Dst[0], i, &alu.dst); 20657be5455796facbe35cf1f1bdbefa83759b2e3b58Christian König if (r) 20667be5455796facbe35cf1f1bdbefa83759b2e3b58Christian König return r; 20677be5455796facbe35cf1f1bdbefa83759b2e3b58Christian König 206887f44d5723ebb3a2efe0dddc1a6edb6536adea4dDave Airlie alu.dst.chan = i; 206987f44d5723ebb3a2efe0dddc1a6edb6536adea4dDave Airlie alu.dst.write = 1; 207087f44d5723ebb3a2efe0dddc1a6edb6536adea4dDave Airlie alu.is_op3 = 1; 20717be5455796facbe35cf1f1bdbefa83759b2e3b58Christian König if (i == lasti) 207287f44d5723ebb3a2efe0dddc1a6edb6536adea4dDave Airlie alu.last = 1; 207387f44d5723ebb3a2efe0dddc1a6edb6536adea4dDave Airlie r = r600_bc_add_alu(ctx->bc, &alu); 207487f44d5723ebb3a2efe0dddc1a6edb6536adea4dDave Airlie if (r) 207587f44d5723ebb3a2efe0dddc1a6edb6536adea4dDave Airlie return r; 20767ffd4e976fd11b8c083c2927effd25a2f79ac841Jerome Glisse } 207787f44d5723ebb3a2efe0dddc1a6edb6536adea4dDave 
Airlie return 0; 207887f44d5723ebb3a2efe0dddc1a6edb6536adea4dDave Airlie} 207987f44d5723ebb3a2efe0dddc1a6edb6536adea4dDave Airlie 20800e6a02d29915db2ca460206656ab517ddaf0b455Dave Airliestatic int tgsi_xpd(struct r600_shader_ctx *ctx) 20810e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie{ 20820e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie struct tgsi_full_instruction *inst = &ctx->parse.FullToken.FullInstruction; 20830e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie struct r600_bc_alu_src r600_src[3]; 20840e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie struct r600_bc_alu alu; 20850e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie uint32_t use_temp = 0; 20860e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie int i, r; 20870e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie 20880e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie if (inst->Dst[0].Register.WriteMask != 0xf) 20890e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie use_temp = 1; 20900e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie 20910e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie r = tgsi_split_constant(ctx, r600_src); 20920e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie if (r) 20930e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie return r; 20949d4ae914e28ac7857a32a88ba27aecc182f697c6Jerome Glisse r = tgsi_split_literal_constant(ctx, r600_src); 20959d4ae914e28ac7857a32a88ba27aecc182f697c6Jerome Glisse if (r) 20969d4ae914e28ac7857a32a88ba27aecc182f697c6Jerome Glisse return r; 20979d4ae914e28ac7857a32a88ba27aecc182f697c6Jerome Glisse 20980e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie for (i = 0; i < 4; i++) { 20990e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie memset(&alu, 0, sizeof(struct r600_bc_alu)); 2100a3a94554f5a12f0626d9712ddcdc81b1e21d36c2Dave Airlie alu.inst = CTX_INST(V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_MUL); 21010e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie 21020e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie alu.src[0] = r600_src[0]; 
21030e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie switch (i) { 21040e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie case 0: 21050e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie alu.src[0].chan = tgsi_chan(&inst->Src[0], 2); 21060e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie break; 21070e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie case 1: 21080e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie alu.src[0].chan = tgsi_chan(&inst->Src[0], 0); 21090e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie break; 21100e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie case 2: 21110e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie alu.src[0].chan = tgsi_chan(&inst->Src[0], 1); 21120e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie break; 21130e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie case 3: 21140e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie alu.src[0].sel = V_SQ_ALU_SRC_0; 21150e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie alu.src[0].chan = i; 21160e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie } 21170e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie 21180e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie alu.src[1] = r600_src[1]; 21190e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie switch (i) { 21200e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie case 0: 21210e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie alu.src[1].chan = tgsi_chan(&inst->Src[1], 1); 21220e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie break; 21230e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie case 1: 21240e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie alu.src[1].chan = tgsi_chan(&inst->Src[1], 2); 21250e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie break; 21260e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie case 2: 21270e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie alu.src[1].chan = tgsi_chan(&inst->Src[1], 0); 21280e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie break; 21290e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie 
case 3: 21300e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie alu.src[1].sel = V_SQ_ALU_SRC_0; 21310e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie alu.src[1].chan = i; 21320e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie } 21330e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie 21340e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie alu.dst.sel = ctx->temp_reg; 21350e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie alu.dst.chan = i; 21360e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie alu.dst.write = 1; 21370e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie 21380e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie if (i == 3) 21390e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie alu.last = 1; 21400e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie r = r600_bc_add_alu(ctx->bc, &alu); 21410e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie if (r) 21420e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie return r; 21430e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie } 21440e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie 21450e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie for (i = 0; i < 4; i++) { 21460e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie memset(&alu, 0, sizeof(struct r600_bc_alu)); 2147a3a94554f5a12f0626d9712ddcdc81b1e21d36c2Dave Airlie alu.inst = CTX_INST(V_SQ_ALU_WORD1_OP3_SQ_OP3_INST_MULADD); 21480e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie 21490e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie alu.src[0] = r600_src[0]; 21500e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie switch (i) { 21510e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie case 0: 21520e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie alu.src[0].chan = tgsi_chan(&inst->Src[0], 1); 21530e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie break; 21540e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie case 1: 21550e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie alu.src[0].chan = tgsi_chan(&inst->Src[0], 2); 
21560e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie break; 21570e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie case 2: 21580e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie alu.src[0].chan = tgsi_chan(&inst->Src[0], 0); 21590e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie break; 21600e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie case 3: 21610e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie alu.src[0].sel = V_SQ_ALU_SRC_0; 21620e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie alu.src[0].chan = i; 21630e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie } 21640e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie 21650e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie alu.src[1] = r600_src[1]; 21660e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie switch (i) { 21670e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie case 0: 21680e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie alu.src[1].chan = tgsi_chan(&inst->Src[1], 2); 21690e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie break; 21700e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie case 1: 21710e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie alu.src[1].chan = tgsi_chan(&inst->Src[1], 0); 21720e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie break; 21730e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie case 2: 21740e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie alu.src[1].chan = tgsi_chan(&inst->Src[1], 1); 21750e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie break; 21760e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie case 3: 21770e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie alu.src[1].sel = V_SQ_ALU_SRC_0; 21780e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie alu.src[1].chan = i; 21790e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie } 21800e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie 21810e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie alu.src[2].sel = ctx->temp_reg; 21820e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie alu.src[2].neg = 1; 
21830e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie alu.src[2].chan = i; 21840e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie 21850e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie if (use_temp) 21860e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie alu.dst.sel = ctx->temp_reg; 21870e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie else { 21880e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie r = tgsi_dst(ctx, &inst->Dst[0], i, &alu.dst); 21890e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie if (r) 21900e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie return r; 21910e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie } 21920e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie alu.dst.chan = i; 21930e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie alu.dst.write = 1; 21940e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie alu.is_op3 = 1; 21950e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie if (i == 3) 21960e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie alu.last = 1; 21970e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie r = r600_bc_add_alu(ctx->bc, &alu); 21980e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie if (r) 21990e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie return r; 22000e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie } 22010e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie if (use_temp) 22020e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie return tgsi_helper_copy(ctx, inst); 22030e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie return 0; 22040e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie} 22050e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie 220636d91be75ea9b79878fdf4b789ea022d781e87f4Dave Airliestatic int tgsi_exp(struct r600_shader_ctx *ctx) 220736d91be75ea9b79878fdf4b789ea022d781e87f4Dave Airlie{ 220836d91be75ea9b79878fdf4b789ea022d781e87f4Dave Airlie struct tgsi_full_instruction *inst = &ctx->parse.FullToken.FullInstruction; 220989c26866f05dcf8fbb716e38d4780cebcae71653Vinson Lee struct r600_bc_alu_src 
r600_src[3] = { { 0 } }; 221036d91be75ea9b79878fdf4b789ea022d781e87f4Dave Airlie struct r600_bc_alu alu; 221109547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie int r; 221236d91be75ea9b79878fdf4b789ea022d781e87f4Dave Airlie 221336d91be75ea9b79878fdf4b789ea022d781e87f4Dave Airlie /* result.x = 2^floor(src); */ 221436d91be75ea9b79878fdf4b789ea022d781e87f4Dave Airlie if (inst->Dst[0].Register.WriteMask & 1) { 221536d91be75ea9b79878fdf4b789ea022d781e87f4Dave Airlie memset(&alu, 0, sizeof(struct r600_bc_alu)); 221636d91be75ea9b79878fdf4b789ea022d781e87f4Dave Airlie 2217a3a94554f5a12f0626d9712ddcdc81b1e21d36c2Dave Airlie alu.inst = CTX_INST(V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_FLOOR); 221836d91be75ea9b79878fdf4b789ea022d781e87f4Dave Airlie r = tgsi_src(ctx, &inst->Src[0], &alu.src[0]); 221936d91be75ea9b79878fdf4b789ea022d781e87f4Dave Airlie if (r) 222036d91be75ea9b79878fdf4b789ea022d781e87f4Dave Airlie return r; 222136d91be75ea9b79878fdf4b789ea022d781e87f4Dave Airlie 222236d91be75ea9b79878fdf4b789ea022d781e87f4Dave Airlie alu.src[0].chan = tgsi_chan(&inst->Src[0], 0); 222336d91be75ea9b79878fdf4b789ea022d781e87f4Dave Airlie 222436d91be75ea9b79878fdf4b789ea022d781e87f4Dave Airlie alu.dst.sel = ctx->temp_reg; 222536d91be75ea9b79878fdf4b789ea022d781e87f4Dave Airlie alu.dst.chan = 0; 222636d91be75ea9b79878fdf4b789ea022d781e87f4Dave Airlie alu.dst.write = 1; 222736d91be75ea9b79878fdf4b789ea022d781e87f4Dave Airlie alu.last = 1; 222836d91be75ea9b79878fdf4b789ea022d781e87f4Dave Airlie r = r600_bc_add_alu(ctx->bc, &alu); 222936d91be75ea9b79878fdf4b789ea022d781e87f4Dave Airlie if (r) 223036d91be75ea9b79878fdf4b789ea022d781e87f4Dave Airlie return r; 223136d91be75ea9b79878fdf4b789ea022d781e87f4Dave Airlie 2232a3a94554f5a12f0626d9712ddcdc81b1e21d36c2Dave Airlie alu.inst = CTX_INST(V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_EXP_IEEE); 223336d91be75ea9b79878fdf4b789ea022d781e87f4Dave Airlie alu.src[0].sel = ctx->temp_reg; 223436d91be75ea9b79878fdf4b789ea022d781e87f4Dave Airlie alu.src[0].chan = 0; 
223536d91be75ea9b79878fdf4b789ea022d781e87f4Dave Airlie 223636d91be75ea9b79878fdf4b789ea022d781e87f4Dave Airlie alu.dst.sel = ctx->temp_reg; 223736d91be75ea9b79878fdf4b789ea022d781e87f4Dave Airlie alu.dst.chan = 0; 223836d91be75ea9b79878fdf4b789ea022d781e87f4Dave Airlie alu.dst.write = 1; 223936d91be75ea9b79878fdf4b789ea022d781e87f4Dave Airlie alu.last = 1; 224036d91be75ea9b79878fdf4b789ea022d781e87f4Dave Airlie r = r600_bc_add_alu(ctx->bc, &alu); 224136d91be75ea9b79878fdf4b789ea022d781e87f4Dave Airlie if (r) 224236d91be75ea9b79878fdf4b789ea022d781e87f4Dave Airlie return r; 224336d91be75ea9b79878fdf4b789ea022d781e87f4Dave Airlie } 22447ffd4e976fd11b8c083c2927effd25a2f79ac841Jerome Glisse 224536d91be75ea9b79878fdf4b789ea022d781e87f4Dave Airlie /* result.y = tmp - floor(tmp); */ 224636d91be75ea9b79878fdf4b789ea022d781e87f4Dave Airlie if ((inst->Dst[0].Register.WriteMask >> 1) & 1) { 224736d91be75ea9b79878fdf4b789ea022d781e87f4Dave Airlie memset(&alu, 0, sizeof(struct r600_bc_alu)); 224836d91be75ea9b79878fdf4b789ea022d781e87f4Dave Airlie 2249a3a94554f5a12f0626d9712ddcdc81b1e21d36c2Dave Airlie alu.inst = CTX_INST(V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_FRACT); 225036d91be75ea9b79878fdf4b789ea022d781e87f4Dave Airlie alu.src[0] = r600_src[0]; 225136d91be75ea9b79878fdf4b789ea022d781e87f4Dave Airlie r = tgsi_src(ctx, &inst->Src[0], &alu.src[0]); 225236d91be75ea9b79878fdf4b789ea022d781e87f4Dave Airlie if (r) 225336d91be75ea9b79878fdf4b789ea022d781e87f4Dave Airlie return r; 225436d91be75ea9b79878fdf4b789ea022d781e87f4Dave Airlie alu.src[0].chan = tgsi_chan(&inst->Src[0], 0); 225536d91be75ea9b79878fdf4b789ea022d781e87f4Dave Airlie 225636d91be75ea9b79878fdf4b789ea022d781e87f4Dave Airlie alu.dst.sel = ctx->temp_reg; 225736d91be75ea9b79878fdf4b789ea022d781e87f4Dave Airlie// r = tgsi_dst(ctx, &inst->Dst[0], i, &alu.dst); 225836d91be75ea9b79878fdf4b789ea022d781e87f4Dave Airlie// if (r) 225936d91be75ea9b79878fdf4b789ea022d781e87f4Dave Airlie// return r; 
226036d91be75ea9b79878fdf4b789ea022d781e87f4Dave Airlie alu.dst.write = 1; 226136d91be75ea9b79878fdf4b789ea022d781e87f4Dave Airlie alu.dst.chan = 1; 226236d91be75ea9b79878fdf4b789ea022d781e87f4Dave Airlie 226336d91be75ea9b79878fdf4b789ea022d781e87f4Dave Airlie alu.last = 1; 226436d91be75ea9b79878fdf4b789ea022d781e87f4Dave Airlie 226536d91be75ea9b79878fdf4b789ea022d781e87f4Dave Airlie r = r600_bc_add_alu(ctx->bc, &alu); 226636d91be75ea9b79878fdf4b789ea022d781e87f4Dave Airlie if (r) 226736d91be75ea9b79878fdf4b789ea022d781e87f4Dave Airlie return r; 226836d91be75ea9b79878fdf4b789ea022d781e87f4Dave Airlie } 226936d91be75ea9b79878fdf4b789ea022d781e87f4Dave Airlie 227036d91be75ea9b79878fdf4b789ea022d781e87f4Dave Airlie /* result.z = RoughApprox2ToX(tmp);*/ 227136d91be75ea9b79878fdf4b789ea022d781e87f4Dave Airlie if ((inst->Dst[0].Register.WriteMask >> 2) & 0x1) { 227236d91be75ea9b79878fdf4b789ea022d781e87f4Dave Airlie memset(&alu, 0, sizeof(struct r600_bc_alu)); 2273a3a94554f5a12f0626d9712ddcdc81b1e21d36c2Dave Airlie alu.inst = CTX_INST(V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_EXP_IEEE); 227436d91be75ea9b79878fdf4b789ea022d781e87f4Dave Airlie r = tgsi_src(ctx, &inst->Src[0], &alu.src[0]); 227536d91be75ea9b79878fdf4b789ea022d781e87f4Dave Airlie if (r) 227636d91be75ea9b79878fdf4b789ea022d781e87f4Dave Airlie return r; 227736d91be75ea9b79878fdf4b789ea022d781e87f4Dave Airlie alu.src[0].chan = tgsi_chan(&inst->Src[0], 0); 227836d91be75ea9b79878fdf4b789ea022d781e87f4Dave Airlie 227936d91be75ea9b79878fdf4b789ea022d781e87f4Dave Airlie alu.dst.sel = ctx->temp_reg; 228036d91be75ea9b79878fdf4b789ea022d781e87f4Dave Airlie alu.dst.write = 1; 228136d91be75ea9b79878fdf4b789ea022d781e87f4Dave Airlie alu.dst.chan = 2; 228236d91be75ea9b79878fdf4b789ea022d781e87f4Dave Airlie 228336d91be75ea9b79878fdf4b789ea022d781e87f4Dave Airlie alu.last = 1; 228436d91be75ea9b79878fdf4b789ea022d781e87f4Dave Airlie 228536d91be75ea9b79878fdf4b789ea022d781e87f4Dave Airlie r = r600_bc_add_alu(ctx->bc, &alu); 
228636d91be75ea9b79878fdf4b789ea022d781e87f4Dave Airlie if (r) 228736d91be75ea9b79878fdf4b789ea022d781e87f4Dave Airlie return r; 228836d91be75ea9b79878fdf4b789ea022d781e87f4Dave Airlie } 228936d91be75ea9b79878fdf4b789ea022d781e87f4Dave Airlie 229036d91be75ea9b79878fdf4b789ea022d781e87f4Dave Airlie /* result.w = 1.0;*/ 229136d91be75ea9b79878fdf4b789ea022d781e87f4Dave Airlie if ((inst->Dst[0].Register.WriteMask >> 3) & 0x1) { 229236d91be75ea9b79878fdf4b789ea022d781e87f4Dave Airlie memset(&alu, 0, sizeof(struct r600_bc_alu)); 229336d91be75ea9b79878fdf4b789ea022d781e87f4Dave Airlie 2294a3a94554f5a12f0626d9712ddcdc81b1e21d36c2Dave Airlie alu.inst = CTX_INST(V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_MOV); 229536d91be75ea9b79878fdf4b789ea022d781e87f4Dave Airlie alu.src[0].sel = V_SQ_ALU_SRC_1; 229636d91be75ea9b79878fdf4b789ea022d781e87f4Dave Airlie alu.src[0].chan = 0; 229736d91be75ea9b79878fdf4b789ea022d781e87f4Dave Airlie 229836d91be75ea9b79878fdf4b789ea022d781e87f4Dave Airlie alu.dst.sel = ctx->temp_reg; 229936d91be75ea9b79878fdf4b789ea022d781e87f4Dave Airlie alu.dst.chan = 3; 230036d91be75ea9b79878fdf4b789ea022d781e87f4Dave Airlie alu.dst.write = 1; 230136d91be75ea9b79878fdf4b789ea022d781e87f4Dave Airlie alu.last = 1; 230236d91be75ea9b79878fdf4b789ea022d781e87f4Dave Airlie r = r600_bc_add_alu(ctx->bc, &alu); 230336d91be75ea9b79878fdf4b789ea022d781e87f4Dave Airlie if (r) 230436d91be75ea9b79878fdf4b789ea022d781e87f4Dave Airlie return r; 230536d91be75ea9b79878fdf4b789ea022d781e87f4Dave Airlie } 230636d91be75ea9b79878fdf4b789ea022d781e87f4Dave Airlie return tgsi_helper_copy(ctx, inst); 230736d91be75ea9b79878fdf4b789ea022d781e87f4Dave Airlie} 230887f44d5723ebb3a2efe0dddc1a6edb6536adea4dDave Airlie 2309460c5304aba646143938b76d536a6fc13a302ca8Tilman Sauerbeckstatic int tgsi_log(struct r600_shader_ctx *ctx) 2310460c5304aba646143938b76d536a6fc13a302ca8Tilman Sauerbeck{ 2311460c5304aba646143938b76d536a6fc13a302ca8Tilman Sauerbeck struct tgsi_full_instruction *inst = 
&ctx->parse.FullToken.FullInstruction; 2312460c5304aba646143938b76d536a6fc13a302ca8Tilman Sauerbeck struct r600_bc_alu alu; 2313460c5304aba646143938b76d536a6fc13a302ca8Tilman Sauerbeck int r; 2314460c5304aba646143938b76d536a6fc13a302ca8Tilman Sauerbeck 2315460c5304aba646143938b76d536a6fc13a302ca8Tilman Sauerbeck /* result.x = floor(log2(src)); */ 2316460c5304aba646143938b76d536a6fc13a302ca8Tilman Sauerbeck if (inst->Dst[0].Register.WriteMask & 1) { 2317460c5304aba646143938b76d536a6fc13a302ca8Tilman Sauerbeck memset(&alu, 0, sizeof(struct r600_bc_alu)); 2318460c5304aba646143938b76d536a6fc13a302ca8Tilman Sauerbeck 2319460c5304aba646143938b76d536a6fc13a302ca8Tilman Sauerbeck alu.inst = CTX_INST(V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_LOG_IEEE); 2320460c5304aba646143938b76d536a6fc13a302ca8Tilman Sauerbeck r = tgsi_src(ctx, &inst->Src[0], &alu.src[0]); 2321460c5304aba646143938b76d536a6fc13a302ca8Tilman Sauerbeck if (r) 2322460c5304aba646143938b76d536a6fc13a302ca8Tilman Sauerbeck return r; 2323460c5304aba646143938b76d536a6fc13a302ca8Tilman Sauerbeck 2324460c5304aba646143938b76d536a6fc13a302ca8Tilman Sauerbeck alu.src[0].chan = tgsi_chan(&inst->Src[0], 0); 2325460c5304aba646143938b76d536a6fc13a302ca8Tilman Sauerbeck 2326460c5304aba646143938b76d536a6fc13a302ca8Tilman Sauerbeck alu.dst.sel = ctx->temp_reg; 2327460c5304aba646143938b76d536a6fc13a302ca8Tilman Sauerbeck alu.dst.chan = 0; 2328460c5304aba646143938b76d536a6fc13a302ca8Tilman Sauerbeck alu.dst.write = 1; 2329460c5304aba646143938b76d536a6fc13a302ca8Tilman Sauerbeck alu.last = 1; 2330460c5304aba646143938b76d536a6fc13a302ca8Tilman Sauerbeck r = r600_bc_add_alu(ctx->bc, &alu); 2331460c5304aba646143938b76d536a6fc13a302ca8Tilman Sauerbeck if (r) 2332460c5304aba646143938b76d536a6fc13a302ca8Tilman Sauerbeck return r; 2333460c5304aba646143938b76d536a6fc13a302ca8Tilman Sauerbeck 2334460c5304aba646143938b76d536a6fc13a302ca8Tilman Sauerbeck alu.inst = CTX_INST(V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_FLOOR); 
2335460c5304aba646143938b76d536a6fc13a302ca8Tilman Sauerbeck alu.src[0].sel = ctx->temp_reg; 2336460c5304aba646143938b76d536a6fc13a302ca8Tilman Sauerbeck alu.src[0].chan = 0; 2337460c5304aba646143938b76d536a6fc13a302ca8Tilman Sauerbeck 2338460c5304aba646143938b76d536a6fc13a302ca8Tilman Sauerbeck alu.dst.sel = ctx->temp_reg; 2339460c5304aba646143938b76d536a6fc13a302ca8Tilman Sauerbeck alu.dst.chan = 0; 2340460c5304aba646143938b76d536a6fc13a302ca8Tilman Sauerbeck alu.dst.write = 1; 2341460c5304aba646143938b76d536a6fc13a302ca8Tilman Sauerbeck alu.last = 1; 2342460c5304aba646143938b76d536a6fc13a302ca8Tilman Sauerbeck 2343460c5304aba646143938b76d536a6fc13a302ca8Tilman Sauerbeck r = r600_bc_add_alu(ctx->bc, &alu); 2344460c5304aba646143938b76d536a6fc13a302ca8Tilman Sauerbeck if (r) 2345460c5304aba646143938b76d536a6fc13a302ca8Tilman Sauerbeck return r; 2346460c5304aba646143938b76d536a6fc13a302ca8Tilman Sauerbeck } 2347460c5304aba646143938b76d536a6fc13a302ca8Tilman Sauerbeck 234896a4edb8ccb4bc1125918b972e8b3a080f496d0dTilman Sauerbeck /* result.y = src.x / (2 ^ floor(log2(src.x))); */ 2349460c5304aba646143938b76d536a6fc13a302ca8Tilman Sauerbeck if ((inst->Dst[0].Register.WriteMask >> 1) & 1) { 2350460c5304aba646143938b76d536a6fc13a302ca8Tilman Sauerbeck memset(&alu, 0, sizeof(struct r600_bc_alu)); 2351460c5304aba646143938b76d536a6fc13a302ca8Tilman Sauerbeck 235296a4edb8ccb4bc1125918b972e8b3a080f496d0dTilman Sauerbeck alu.inst = CTX_INST(V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_LOG_IEEE); 235396a4edb8ccb4bc1125918b972e8b3a080f496d0dTilman Sauerbeck r = tgsi_src(ctx, &inst->Src[0], &alu.src[0]); 235496a4edb8ccb4bc1125918b972e8b3a080f496d0dTilman Sauerbeck if (r) 235596a4edb8ccb4bc1125918b972e8b3a080f496d0dTilman Sauerbeck return r; 235696a4edb8ccb4bc1125918b972e8b3a080f496d0dTilman Sauerbeck 235796a4edb8ccb4bc1125918b972e8b3a080f496d0dTilman Sauerbeck alu.src[0].chan = tgsi_chan(&inst->Src[0], 0); 235896a4edb8ccb4bc1125918b972e8b3a080f496d0dTilman Sauerbeck 
235996a4edb8ccb4bc1125918b972e8b3a080f496d0dTilman Sauerbeck alu.dst.sel = ctx->temp_reg; 236096a4edb8ccb4bc1125918b972e8b3a080f496d0dTilman Sauerbeck alu.dst.chan = 1; 236196a4edb8ccb4bc1125918b972e8b3a080f496d0dTilman Sauerbeck alu.dst.write = 1; 236296a4edb8ccb4bc1125918b972e8b3a080f496d0dTilman Sauerbeck alu.last = 1; 236396a4edb8ccb4bc1125918b972e8b3a080f496d0dTilman Sauerbeck 236496a4edb8ccb4bc1125918b972e8b3a080f496d0dTilman Sauerbeck r = r600_bc_add_alu(ctx->bc, &alu); 236596a4edb8ccb4bc1125918b972e8b3a080f496d0dTilman Sauerbeck if (r) 236696a4edb8ccb4bc1125918b972e8b3a080f496d0dTilman Sauerbeck return r; 236796a4edb8ccb4bc1125918b972e8b3a080f496d0dTilman Sauerbeck 236896a4edb8ccb4bc1125918b972e8b3a080f496d0dTilman Sauerbeck memset(&alu, 0, sizeof(struct r600_bc_alu)); 236996a4edb8ccb4bc1125918b972e8b3a080f496d0dTilman Sauerbeck 237096a4edb8ccb4bc1125918b972e8b3a080f496d0dTilman Sauerbeck alu.inst = CTX_INST(V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_FLOOR); 237196a4edb8ccb4bc1125918b972e8b3a080f496d0dTilman Sauerbeck alu.src[0].sel = ctx->temp_reg; 237296a4edb8ccb4bc1125918b972e8b3a080f496d0dTilman Sauerbeck alu.src[0].chan = 1; 237396a4edb8ccb4bc1125918b972e8b3a080f496d0dTilman Sauerbeck 237496a4edb8ccb4bc1125918b972e8b3a080f496d0dTilman Sauerbeck alu.dst.sel = ctx->temp_reg; 237596a4edb8ccb4bc1125918b972e8b3a080f496d0dTilman Sauerbeck alu.dst.chan = 1; 237696a4edb8ccb4bc1125918b972e8b3a080f496d0dTilman Sauerbeck alu.dst.write = 1; 237796a4edb8ccb4bc1125918b972e8b3a080f496d0dTilman Sauerbeck alu.last = 1; 237896a4edb8ccb4bc1125918b972e8b3a080f496d0dTilman Sauerbeck 237996a4edb8ccb4bc1125918b972e8b3a080f496d0dTilman Sauerbeck r = r600_bc_add_alu(ctx->bc, &alu); 238096a4edb8ccb4bc1125918b972e8b3a080f496d0dTilman Sauerbeck if (r) 238196a4edb8ccb4bc1125918b972e8b3a080f496d0dTilman Sauerbeck return r; 238296a4edb8ccb4bc1125918b972e8b3a080f496d0dTilman Sauerbeck 238396a4edb8ccb4bc1125918b972e8b3a080f496d0dTilman Sauerbeck memset(&alu, 0, sizeof(struct r600_bc_alu)); 
238496a4edb8ccb4bc1125918b972e8b3a080f496d0dTilman Sauerbeck 238596a4edb8ccb4bc1125918b972e8b3a080f496d0dTilman Sauerbeck alu.inst = CTX_INST(V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_EXP_IEEE); 238696a4edb8ccb4bc1125918b972e8b3a080f496d0dTilman Sauerbeck alu.src[0].sel = ctx->temp_reg; 238796a4edb8ccb4bc1125918b972e8b3a080f496d0dTilman Sauerbeck alu.src[0].chan = 1; 238896a4edb8ccb4bc1125918b972e8b3a080f496d0dTilman Sauerbeck 238996a4edb8ccb4bc1125918b972e8b3a080f496d0dTilman Sauerbeck alu.dst.sel = ctx->temp_reg; 239096a4edb8ccb4bc1125918b972e8b3a080f496d0dTilman Sauerbeck alu.dst.chan = 1; 239196a4edb8ccb4bc1125918b972e8b3a080f496d0dTilman Sauerbeck alu.dst.write = 1; 239296a4edb8ccb4bc1125918b972e8b3a080f496d0dTilman Sauerbeck alu.last = 1; 239396a4edb8ccb4bc1125918b972e8b3a080f496d0dTilman Sauerbeck 239496a4edb8ccb4bc1125918b972e8b3a080f496d0dTilman Sauerbeck r = r600_bc_add_alu(ctx->bc, &alu); 239596a4edb8ccb4bc1125918b972e8b3a080f496d0dTilman Sauerbeck if (r) 239696a4edb8ccb4bc1125918b972e8b3a080f496d0dTilman Sauerbeck return r; 239796a4edb8ccb4bc1125918b972e8b3a080f496d0dTilman Sauerbeck 239896a4edb8ccb4bc1125918b972e8b3a080f496d0dTilman Sauerbeck memset(&alu, 0, sizeof(struct r600_bc_alu)); 239996a4edb8ccb4bc1125918b972e8b3a080f496d0dTilman Sauerbeck 240096a4edb8ccb4bc1125918b972e8b3a080f496d0dTilman Sauerbeck alu.inst = CTX_INST(V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_RECIP_IEEE); 240196a4edb8ccb4bc1125918b972e8b3a080f496d0dTilman Sauerbeck alu.src[0].sel = ctx->temp_reg; 240296a4edb8ccb4bc1125918b972e8b3a080f496d0dTilman Sauerbeck alu.src[0].chan = 1; 240396a4edb8ccb4bc1125918b972e8b3a080f496d0dTilman Sauerbeck 240496a4edb8ccb4bc1125918b972e8b3a080f496d0dTilman Sauerbeck alu.dst.sel = ctx->temp_reg; 240596a4edb8ccb4bc1125918b972e8b3a080f496d0dTilman Sauerbeck alu.dst.chan = 1; 240696a4edb8ccb4bc1125918b972e8b3a080f496d0dTilman Sauerbeck alu.dst.write = 1; 240796a4edb8ccb4bc1125918b972e8b3a080f496d0dTilman Sauerbeck alu.last = 1; 
240896a4edb8ccb4bc1125918b972e8b3a080f496d0dTilman Sauerbeck 240996a4edb8ccb4bc1125918b972e8b3a080f496d0dTilman Sauerbeck r = r600_bc_add_alu(ctx->bc, &alu); 241096a4edb8ccb4bc1125918b972e8b3a080f496d0dTilman Sauerbeck if (r) 241196a4edb8ccb4bc1125918b972e8b3a080f496d0dTilman Sauerbeck return r; 241296a4edb8ccb4bc1125918b972e8b3a080f496d0dTilman Sauerbeck 241396a4edb8ccb4bc1125918b972e8b3a080f496d0dTilman Sauerbeck memset(&alu, 0, sizeof(struct r600_bc_alu)); 241496a4edb8ccb4bc1125918b972e8b3a080f496d0dTilman Sauerbeck 241596a4edb8ccb4bc1125918b972e8b3a080f496d0dTilman Sauerbeck alu.inst = CTX_INST(V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_MUL); 241696a4edb8ccb4bc1125918b972e8b3a080f496d0dTilman Sauerbeck 241796a4edb8ccb4bc1125918b972e8b3a080f496d0dTilman Sauerbeck r = tgsi_src(ctx, &inst->Src[0], &alu.src[0]); 241896a4edb8ccb4bc1125918b972e8b3a080f496d0dTilman Sauerbeck if (r) 241996a4edb8ccb4bc1125918b972e8b3a080f496d0dTilman Sauerbeck return r; 242096a4edb8ccb4bc1125918b972e8b3a080f496d0dTilman Sauerbeck 242196a4edb8ccb4bc1125918b972e8b3a080f496d0dTilman Sauerbeck alu.src[0].chan = tgsi_chan(&inst->Src[0], 0); 242296a4edb8ccb4bc1125918b972e8b3a080f496d0dTilman Sauerbeck 242396a4edb8ccb4bc1125918b972e8b3a080f496d0dTilman Sauerbeck alu.src[1].sel = ctx->temp_reg; 242496a4edb8ccb4bc1125918b972e8b3a080f496d0dTilman Sauerbeck alu.src[1].chan = 1; 2425460c5304aba646143938b76d536a6fc13a302ca8Tilman Sauerbeck 2426460c5304aba646143938b76d536a6fc13a302ca8Tilman Sauerbeck alu.dst.sel = ctx->temp_reg; 2427460c5304aba646143938b76d536a6fc13a302ca8Tilman Sauerbeck alu.dst.chan = 1; 2428460c5304aba646143938b76d536a6fc13a302ca8Tilman Sauerbeck alu.dst.write = 1; 2429460c5304aba646143938b76d536a6fc13a302ca8Tilman Sauerbeck alu.last = 1; 2430460c5304aba646143938b76d536a6fc13a302ca8Tilman Sauerbeck 2431460c5304aba646143938b76d536a6fc13a302ca8Tilman Sauerbeck r = r600_bc_add_alu(ctx->bc, &alu); 2432460c5304aba646143938b76d536a6fc13a302ca8Tilman Sauerbeck if (r) 
2433460c5304aba646143938b76d536a6fc13a302ca8Tilman Sauerbeck return r; 2434460c5304aba646143938b76d536a6fc13a302ca8Tilman Sauerbeck } 2435460c5304aba646143938b76d536a6fc13a302ca8Tilman Sauerbeck 2436460c5304aba646143938b76d536a6fc13a302ca8Tilman Sauerbeck /* result.z = log2(src);*/ 2437460c5304aba646143938b76d536a6fc13a302ca8Tilman Sauerbeck if ((inst->Dst[0].Register.WriteMask >> 2) & 1) { 2438460c5304aba646143938b76d536a6fc13a302ca8Tilman Sauerbeck memset(&alu, 0, sizeof(struct r600_bc_alu)); 2439460c5304aba646143938b76d536a6fc13a302ca8Tilman Sauerbeck 2440460c5304aba646143938b76d536a6fc13a302ca8Tilman Sauerbeck alu.inst = CTX_INST(V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_LOG_IEEE); 2441460c5304aba646143938b76d536a6fc13a302ca8Tilman Sauerbeck r = tgsi_src(ctx, &inst->Src[0], &alu.src[0]); 2442460c5304aba646143938b76d536a6fc13a302ca8Tilman Sauerbeck if (r) 2443460c5304aba646143938b76d536a6fc13a302ca8Tilman Sauerbeck return r; 2444460c5304aba646143938b76d536a6fc13a302ca8Tilman Sauerbeck 2445460c5304aba646143938b76d536a6fc13a302ca8Tilman Sauerbeck alu.src[0].chan = tgsi_chan(&inst->Src[0], 0); 2446460c5304aba646143938b76d536a6fc13a302ca8Tilman Sauerbeck 2447460c5304aba646143938b76d536a6fc13a302ca8Tilman Sauerbeck alu.dst.sel = ctx->temp_reg; 2448460c5304aba646143938b76d536a6fc13a302ca8Tilman Sauerbeck alu.dst.write = 1; 2449460c5304aba646143938b76d536a6fc13a302ca8Tilman Sauerbeck alu.dst.chan = 2; 2450460c5304aba646143938b76d536a6fc13a302ca8Tilman Sauerbeck alu.last = 1; 2451460c5304aba646143938b76d536a6fc13a302ca8Tilman Sauerbeck 2452460c5304aba646143938b76d536a6fc13a302ca8Tilman Sauerbeck r = r600_bc_add_alu(ctx->bc, &alu); 2453460c5304aba646143938b76d536a6fc13a302ca8Tilman Sauerbeck if (r) 2454460c5304aba646143938b76d536a6fc13a302ca8Tilman Sauerbeck return r; 2455460c5304aba646143938b76d536a6fc13a302ca8Tilman Sauerbeck } 2456460c5304aba646143938b76d536a6fc13a302ca8Tilman Sauerbeck 2457460c5304aba646143938b76d536a6fc13a302ca8Tilman Sauerbeck /* result.w = 1.0; */ 
2458460c5304aba646143938b76d536a6fc13a302ca8Tilman Sauerbeck if ((inst->Dst[0].Register.WriteMask >> 3) & 1) { 2459460c5304aba646143938b76d536a6fc13a302ca8Tilman Sauerbeck memset(&alu, 0, sizeof(struct r600_bc_alu)); 2460460c5304aba646143938b76d536a6fc13a302ca8Tilman Sauerbeck 2461460c5304aba646143938b76d536a6fc13a302ca8Tilman Sauerbeck alu.inst = CTX_INST(V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_MOV); 2462460c5304aba646143938b76d536a6fc13a302ca8Tilman Sauerbeck alu.src[0].sel = V_SQ_ALU_SRC_1; 2463460c5304aba646143938b76d536a6fc13a302ca8Tilman Sauerbeck alu.src[0].chan = 0; 2464460c5304aba646143938b76d536a6fc13a302ca8Tilman Sauerbeck 2465460c5304aba646143938b76d536a6fc13a302ca8Tilman Sauerbeck alu.dst.sel = ctx->temp_reg; 2466460c5304aba646143938b76d536a6fc13a302ca8Tilman Sauerbeck alu.dst.chan = 3; 2467460c5304aba646143938b76d536a6fc13a302ca8Tilman Sauerbeck alu.dst.write = 1; 2468460c5304aba646143938b76d536a6fc13a302ca8Tilman Sauerbeck alu.last = 1; 2469460c5304aba646143938b76d536a6fc13a302ca8Tilman Sauerbeck 2470460c5304aba646143938b76d536a6fc13a302ca8Tilman Sauerbeck r = r600_bc_add_alu(ctx->bc, &alu); 2471460c5304aba646143938b76d536a6fc13a302ca8Tilman Sauerbeck if (r) 2472460c5304aba646143938b76d536a6fc13a302ca8Tilman Sauerbeck return r; 2473460c5304aba646143938b76d536a6fc13a302ca8Tilman Sauerbeck } 2474460c5304aba646143938b76d536a6fc13a302ca8Tilman Sauerbeck 2475460c5304aba646143938b76d536a6fc13a302ca8Tilman Sauerbeck return tgsi_helper_copy(ctx, inst); 2476460c5304aba646143938b76d536a6fc13a302ca8Tilman Sauerbeck} 2477460c5304aba646143938b76d536a6fc13a302ca8Tilman Sauerbeck 247898b3f27439ba3a48286ed0d6a4467e5482b41fecDave Airliestatic int tgsi_eg_arl(struct r600_shader_ctx *ctx) 247998b3f27439ba3a48286ed0d6a4467e5482b41fecDave Airlie{ 248098b3f27439ba3a48286ed0d6a4467e5482b41fecDave Airlie struct tgsi_full_instruction *inst = &ctx->parse.FullToken.FullInstruction; 248198b3f27439ba3a48286ed0d6a4467e5482b41fecDave Airlie struct r600_bc_alu alu; 
248298b3f27439ba3a48286ed0d6a4467e5482b41fecDave Airlie int r; 248398b3f27439ba3a48286ed0d6a4467e5482b41fecDave Airlie memset(&alu, 0, sizeof(struct r600_bc_alu)); 248498b3f27439ba3a48286ed0d6a4467e5482b41fecDave Airlie 248552c66120d8c55d29af6af60f75eb1dc54d9b8062Alex Deucher switch (inst->Instruction.Opcode) { 248652c66120d8c55d29af6af60f75eb1dc54d9b8062Alex Deucher case TGSI_OPCODE_ARL: 248752c66120d8c55d29af6af60f75eb1dc54d9b8062Alex Deucher alu.inst = EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_FLT_TO_INT_FLOOR; 248852c66120d8c55d29af6af60f75eb1dc54d9b8062Alex Deucher break; 248952c66120d8c55d29af6af60f75eb1dc54d9b8062Alex Deucher case TGSI_OPCODE_ARR: 249052c66120d8c55d29af6af60f75eb1dc54d9b8062Alex Deucher alu.inst = EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_FLT_TO_INT; 249152c66120d8c55d29af6af60f75eb1dc54d9b8062Alex Deucher break; 249252c66120d8c55d29af6af60f75eb1dc54d9b8062Alex Deucher default: 249352c66120d8c55d29af6af60f75eb1dc54d9b8062Alex Deucher assert(0); 249452c66120d8c55d29af6af60f75eb1dc54d9b8062Alex Deucher return -1; 249552c66120d8c55d29af6af60f75eb1dc54d9b8062Alex Deucher } 249652c66120d8c55d29af6af60f75eb1dc54d9b8062Alex Deucher 249798b3f27439ba3a48286ed0d6a4467e5482b41fecDave Airlie r = tgsi_src(ctx, &inst->Src[0], &alu.src[0]); 249898b3f27439ba3a48286ed0d6a4467e5482b41fecDave Airlie if (r) 249998b3f27439ba3a48286ed0d6a4467e5482b41fecDave Airlie return r; 250098b3f27439ba3a48286ed0d6a4467e5482b41fecDave Airlie alu.src[0].chan = tgsi_chan(&inst->Src[0], 0); 250198b3f27439ba3a48286ed0d6a4467e5482b41fecDave Airlie alu.last = 1; 250298b3f27439ba3a48286ed0d6a4467e5482b41fecDave Airlie alu.dst.chan = 0; 250398b3f27439ba3a48286ed0d6a4467e5482b41fecDave Airlie alu.dst.sel = ctx->temp_reg; 250498b3f27439ba3a48286ed0d6a4467e5482b41fecDave Airlie alu.dst.write = 1; 2505495dec0a2bcdff10f9a4024b892501c54e29ef00Henri Verbeet r = r600_bc_add_alu(ctx->bc, &alu); 250698b3f27439ba3a48286ed0d6a4467e5482b41fecDave Airlie if (r) 250798b3f27439ba3a48286ed0d6a4467e5482b41fecDave 
Airlie return r; 250898b3f27439ba3a48286ed0d6a4467e5482b41fecDave Airlie memset(&alu, 0, sizeof(struct r600_bc_alu)); 250998b3f27439ba3a48286ed0d6a4467e5482b41fecDave Airlie alu.inst = EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_MOVA_INT; 251098b3f27439ba3a48286ed0d6a4467e5482b41fecDave Airlie r = tgsi_src(ctx, &inst->Src[0], &alu.src[0]); 251198b3f27439ba3a48286ed0d6a4467e5482b41fecDave Airlie if (r) 251298b3f27439ba3a48286ed0d6a4467e5482b41fecDave Airlie return r; 251398b3f27439ba3a48286ed0d6a4467e5482b41fecDave Airlie alu.src[0].sel = ctx->temp_reg; 251498b3f27439ba3a48286ed0d6a4467e5482b41fecDave Airlie alu.src[0].chan = 0; 251598b3f27439ba3a48286ed0d6a4467e5482b41fecDave Airlie alu.last = 1; 2516495dec0a2bcdff10f9a4024b892501c54e29ef00Henri Verbeet r = r600_bc_add_alu(ctx->bc, &alu); 251798b3f27439ba3a48286ed0d6a4467e5482b41fecDave Airlie if (r) 251898b3f27439ba3a48286ed0d6a4467e5482b41fecDave Airlie return r; 251998b3f27439ba3a48286ed0d6a4467e5482b41fecDave Airlie return 0; 252098b3f27439ba3a48286ed0d6a4467e5482b41fecDave Airlie} 252198b3f27439ba3a48286ed0d6a4467e5482b41fecDave Airliestatic int tgsi_r600_arl(struct r600_shader_ctx *ctx) 252247d5a19df1e7760c4f5f0e340bfc56355c2e428bDave Airlie{ 252347d5a19df1e7760c4f5f0e340bfc56355c2e428bDave Airlie /* TODO from r600c, ar values don't persist between clauses */ 252447d5a19df1e7760c4f5f0e340bfc56355c2e428bDave Airlie struct tgsi_full_instruction *inst = &ctx->parse.FullToken.FullInstruction; 252547d5a19df1e7760c4f5f0e340bfc56355c2e428bDave Airlie struct r600_bc_alu alu; 252647d5a19df1e7760c4f5f0e340bfc56355c2e428bDave Airlie int r; 252747d5a19df1e7760c4f5f0e340bfc56355c2e428bDave Airlie memset(&alu, 0, sizeof(struct r600_bc_alu)); 252847d5a19df1e7760c4f5f0e340bfc56355c2e428bDave Airlie 25297ffd4e976fd11b8c083c2927effd25a2f79ac841Jerome Glisse switch (inst->Instruction.Opcode) { 25307ffd4e976fd11b8c083c2927effd25a2f79ac841Jerome Glisse case TGSI_OPCODE_ARL: 25317ffd4e976fd11b8c083c2927effd25a2f79ac841Jerome Glisse alu.inst 
= V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_MOVA_FLOOR; 25327ffd4e976fd11b8c083c2927effd25a2f79ac841Jerome Glisse break; 25337ffd4e976fd11b8c083c2927effd25a2f79ac841Jerome Glisse case TGSI_OPCODE_ARR: 25347ffd4e976fd11b8c083c2927effd25a2f79ac841Jerome Glisse alu.inst = V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_MOVA; 25357ffd4e976fd11b8c083c2927effd25a2f79ac841Jerome Glisse break; 25367ffd4e976fd11b8c083c2927effd25a2f79ac841Jerome Glisse default: 25377ffd4e976fd11b8c083c2927effd25a2f79ac841Jerome Glisse assert(0); 25387ffd4e976fd11b8c083c2927effd25a2f79ac841Jerome Glisse return -1; 25397ffd4e976fd11b8c083c2927effd25a2f79ac841Jerome Glisse } 25407ffd4e976fd11b8c083c2927effd25a2f79ac841Jerome Glisse 254147d5a19df1e7760c4f5f0e340bfc56355c2e428bDave Airlie 254247d5a19df1e7760c4f5f0e340bfc56355c2e428bDave Airlie r = tgsi_src(ctx, &inst->Src[0], &alu.src[0]); 254347d5a19df1e7760c4f5f0e340bfc56355c2e428bDave Airlie if (r) 254447d5a19df1e7760c4f5f0e340bfc56355c2e428bDave Airlie return r; 254547d5a19df1e7760c4f5f0e340bfc56355c2e428bDave Airlie alu.src[0].chan = tgsi_chan(&inst->Src[0], 0); 254647d5a19df1e7760c4f5f0e340bfc56355c2e428bDave Airlie 254747d5a19df1e7760c4f5f0e340bfc56355c2e428bDave Airlie alu.last = 1; 254847d5a19df1e7760c4f5f0e340bfc56355c2e428bDave Airlie 2549495dec0a2bcdff10f9a4024b892501c54e29ef00Henri Verbeet r = r600_bc_add_alu(ctx->bc, &alu); 255047d5a19df1e7760c4f5f0e340bfc56355c2e428bDave Airlie if (r) 255147d5a19df1e7760c4f5f0e340bfc56355c2e428bDave Airlie return r; 2552c5edfcc410bdf3dbe4f37418de8f0009746c9578Dave Airlie ctx->bc->cf_last->r6xx_uses_waterfall = 1; 255347d5a19df1e7760c4f5f0e340bfc56355c2e428bDave Airlie return 0; 255447d5a19df1e7760c4f5f0e340bfc56355c2e428bDave Airlie} 255547d5a19df1e7760c4f5f0e340bfc56355c2e428bDave Airlie 255657eecbbf6c57fbf5a46b8b81d8d4fbb6bd78ea12Dave Airliestatic int tgsi_opdst(struct r600_shader_ctx *ctx) 255757eecbbf6c57fbf5a46b8b81d8d4fbb6bd78ea12Dave Airlie{ 255857eecbbf6c57fbf5a46b8b81d8d4fbb6bd78ea12Dave Airlie struct 
tgsi_full_instruction *inst = &ctx->parse.FullToken.FullInstruction; 255957eecbbf6c57fbf5a46b8b81d8d4fbb6bd78ea12Dave Airlie struct r600_bc_alu alu; 256057eecbbf6c57fbf5a46b8b81d8d4fbb6bd78ea12Dave Airlie int i, r = 0; 256157eecbbf6c57fbf5a46b8b81d8d4fbb6bd78ea12Dave Airlie 256257eecbbf6c57fbf5a46b8b81d8d4fbb6bd78ea12Dave Airlie for (i = 0; i < 4; i++) { 256357eecbbf6c57fbf5a46b8b81d8d4fbb6bd78ea12Dave Airlie memset(&alu, 0, sizeof(struct r600_bc_alu)); 256457eecbbf6c57fbf5a46b8b81d8d4fbb6bd78ea12Dave Airlie 2565a3a94554f5a12f0626d9712ddcdc81b1e21d36c2Dave Airlie alu.inst = CTX_INST(V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_MUL); 256657eecbbf6c57fbf5a46b8b81d8d4fbb6bd78ea12Dave Airlie r = tgsi_dst(ctx, &inst->Dst[0], i, &alu.dst); 256757eecbbf6c57fbf5a46b8b81d8d4fbb6bd78ea12Dave Airlie if (r) 256857eecbbf6c57fbf5a46b8b81d8d4fbb6bd78ea12Dave Airlie return r; 25697ffd4e976fd11b8c083c2927effd25a2f79ac841Jerome Glisse 25707ffd4e976fd11b8c083c2927effd25a2f79ac841Jerome Glisse if (i == 0 || i == 3) { 257157eecbbf6c57fbf5a46b8b81d8d4fbb6bd78ea12Dave Airlie alu.src[0].sel = V_SQ_ALU_SRC_1; 257257eecbbf6c57fbf5a46b8b81d8d4fbb6bd78ea12Dave Airlie } else { 257357eecbbf6c57fbf5a46b8b81d8d4fbb6bd78ea12Dave Airlie r = tgsi_src(ctx, &inst->Src[0], &alu.src[0]); 257457eecbbf6c57fbf5a46b8b81d8d4fbb6bd78ea12Dave Airlie if (r) 257557eecbbf6c57fbf5a46b8b81d8d4fbb6bd78ea12Dave Airlie return r; 257657eecbbf6c57fbf5a46b8b81d8d4fbb6bd78ea12Dave Airlie alu.src[0].chan = tgsi_chan(&inst->Src[0], i); 257757eecbbf6c57fbf5a46b8b81d8d4fbb6bd78ea12Dave Airlie } 257857eecbbf6c57fbf5a46b8b81d8d4fbb6bd78ea12Dave Airlie 257957eecbbf6c57fbf5a46b8b81d8d4fbb6bd78ea12Dave Airlie if (i == 0 || i == 2) { 258057eecbbf6c57fbf5a46b8b81d8d4fbb6bd78ea12Dave Airlie alu.src[1].sel = V_SQ_ALU_SRC_1; 258157eecbbf6c57fbf5a46b8b81d8d4fbb6bd78ea12Dave Airlie } else { 258257eecbbf6c57fbf5a46b8b81d8d4fbb6bd78ea12Dave Airlie r = tgsi_src(ctx, &inst->Src[1], &alu.src[1]); 258357eecbbf6c57fbf5a46b8b81d8d4fbb6bd78ea12Dave Airlie if 
(r) 258457eecbbf6c57fbf5a46b8b81d8d4fbb6bd78ea12Dave Airlie return r; 258557eecbbf6c57fbf5a46b8b81d8d4fbb6bd78ea12Dave Airlie alu.src[1].chan = tgsi_chan(&inst->Src[1], i); 258657eecbbf6c57fbf5a46b8b81d8d4fbb6bd78ea12Dave Airlie } 258757eecbbf6c57fbf5a46b8b81d8d4fbb6bd78ea12Dave Airlie if (i == 3) 258857eecbbf6c57fbf5a46b8b81d8d4fbb6bd78ea12Dave Airlie alu.last = 1; 258957eecbbf6c57fbf5a46b8b81d8d4fbb6bd78ea12Dave Airlie r = r600_bc_add_alu(ctx->bc, &alu); 259057eecbbf6c57fbf5a46b8b81d8d4fbb6bd78ea12Dave Airlie if (r) 259157eecbbf6c57fbf5a46b8b81d8d4fbb6bd78ea12Dave Airlie return r; 259257eecbbf6c57fbf5a46b8b81d8d4fbb6bd78ea12Dave Airlie } 259357eecbbf6c57fbf5a46b8b81d8d4fbb6bd78ea12Dave Airlie return 0; 259457eecbbf6c57fbf5a46b8b81d8d4fbb6bd78ea12Dave Airlie} 259557eecbbf6c57fbf5a46b8b81d8d4fbb6bd78ea12Dave Airlie 2596a03d456f5a41926e39194de70b2d50776e64b8a2Dave Airliestatic int emit_logic_pred(struct r600_shader_ctx *ctx, int opcode) 2597a03d456f5a41926e39194de70b2d50776e64b8a2Dave Airlie{ 2598a03d456f5a41926e39194de70b2d50776e64b8a2Dave Airlie struct tgsi_full_instruction *inst = &ctx->parse.FullToken.FullInstruction; 259909547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie struct r600_bc_alu alu; 2600a03d456f5a41926e39194de70b2d50776e64b8a2Dave Airlie int r; 2601a03d456f5a41926e39194de70b2d50776e64b8a2Dave Airlie 2602a03d456f5a41926e39194de70b2d50776e64b8a2Dave Airlie memset(&alu, 0, sizeof(struct r600_bc_alu)); 2603a03d456f5a41926e39194de70b2d50776e64b8a2Dave Airlie alu.inst = opcode; 2604a03d456f5a41926e39194de70b2d50776e64b8a2Dave Airlie alu.predicate = 1; 2605a03d456f5a41926e39194de70b2d50776e64b8a2Dave Airlie 2606a03d456f5a41926e39194de70b2d50776e64b8a2Dave Airlie alu.dst.sel = ctx->temp_reg; 2607a03d456f5a41926e39194de70b2d50776e64b8a2Dave Airlie alu.dst.write = 1; 2608a03d456f5a41926e39194de70b2d50776e64b8a2Dave Airlie alu.dst.chan = 0; 2609a03d456f5a41926e39194de70b2d50776e64b8a2Dave Airlie 2610a03d456f5a41926e39194de70b2d50776e64b8a2Dave Airlie r = 
tgsi_src(ctx, &inst->Src[0], &alu.src[0]); 2611a03d456f5a41926e39194de70b2d50776e64b8a2Dave Airlie if (r) 2612a03d456f5a41926e39194de70b2d50776e64b8a2Dave Airlie return r; 2613a03d456f5a41926e39194de70b2d50776e64b8a2Dave Airlie alu.src[0].chan = tgsi_chan(&inst->Src[0], 0); 2614a03d456f5a41926e39194de70b2d50776e64b8a2Dave Airlie alu.src[1].sel = V_SQ_ALU_SRC_0; 2615a03d456f5a41926e39194de70b2d50776e64b8a2Dave Airlie alu.src[1].chan = 0; 26167ffd4e976fd11b8c083c2927effd25a2f79ac841Jerome Glisse 2617a03d456f5a41926e39194de70b2d50776e64b8a2Dave Airlie alu.last = 1; 2618a03d456f5a41926e39194de70b2d50776e64b8a2Dave Airlie 2619a3a94554f5a12f0626d9712ddcdc81b1e21d36c2Dave Airlie r = r600_bc_add_alu_type(ctx->bc, &alu, CTX_INST(V_SQ_CF_ALU_WORD1_SQ_CF_INST_ALU_PUSH_BEFORE)); 2620a03d456f5a41926e39194de70b2d50776e64b8a2Dave Airlie if (r) 2621a03d456f5a41926e39194de70b2d50776e64b8a2Dave Airlie return r; 2622a03d456f5a41926e39194de70b2d50776e64b8a2Dave Airlie return 0; 2623a03d456f5a41926e39194de70b2d50776e64b8a2Dave Airlie} 2624a03d456f5a41926e39194de70b2d50776e64b8a2Dave Airlie 2625a03d456f5a41926e39194de70b2d50776e64b8a2Dave Airliestatic int pops(struct r600_shader_ctx *ctx, int pops) 2626a03d456f5a41926e39194de70b2d50776e64b8a2Dave Airlie{ 26278813842121d46d1be476807c98b0ba0b771f0c91Christian König int alu_pop = 3; 26288813842121d46d1be476807c98b0ba0b771f0c91Christian König if (ctx->bc->cf_last) { 26298813842121d46d1be476807c98b0ba0b771f0c91Christian König if (ctx->bc->cf_last->inst == CTX_INST(V_SQ_CF_ALU_WORD1_SQ_CF_INST_ALU) << 3) 26308813842121d46d1be476807c98b0ba0b771f0c91Christian König alu_pop = 0; 26318813842121d46d1be476807c98b0ba0b771f0c91Christian König else if (ctx->bc->cf_last->inst == CTX_INST(V_SQ_CF_ALU_WORD1_SQ_CF_INST_ALU_POP_AFTER) << 3) 26328813842121d46d1be476807c98b0ba0b771f0c91Christian König alu_pop = 1; 26338813842121d46d1be476807c98b0ba0b771f0c91Christian König } 26348813842121d46d1be476807c98b0ba0b771f0c91Christian König alu_pop += pops; 
26358813842121d46d1be476807c98b0ba0b771f0c91Christian König if (alu_pop == 1) { 26368813842121d46d1be476807c98b0ba0b771f0c91Christian König ctx->bc->cf_last->inst = CTX_INST(V_SQ_CF_ALU_WORD1_SQ_CF_INST_ALU_POP_AFTER) << 3; 26378813842121d46d1be476807c98b0ba0b771f0c91Christian König ctx->bc->force_add_cf = 1; 26388813842121d46d1be476807c98b0ba0b771f0c91Christian König } else if (alu_pop == 2) { 26398813842121d46d1be476807c98b0ba0b771f0c91Christian König ctx->bc->cf_last->inst = CTX_INST(V_SQ_CF_ALU_WORD1_SQ_CF_INST_ALU_POP2_AFTER) << 3; 26408813842121d46d1be476807c98b0ba0b771f0c91Christian König ctx->bc->force_add_cf = 1; 26418813842121d46d1be476807c98b0ba0b771f0c91Christian König } else { 26428813842121d46d1be476807c98b0ba0b771f0c91Christian König r600_bc_add_cfinst(ctx->bc, CTX_INST(V_SQ_CF_WORD1_SQ_CF_INST_POP)); 26438813842121d46d1be476807c98b0ba0b771f0c91Christian König ctx->bc->cf_last->pop_count = pops; 26448813842121d46d1be476807c98b0ba0b771f0c91Christian König ctx->bc->cf_last->cf_addr = ctx->bc->cf_last->id + 2; 26458813842121d46d1be476807c98b0ba0b771f0c91Christian König } 2646a03d456f5a41926e39194de70b2d50776e64b8a2Dave Airlie return 0; 2647a03d456f5a41926e39194de70b2d50776e64b8a2Dave Airlie} 2648a03d456f5a41926e39194de70b2d50776e64b8a2Dave Airlie 264909547e1bcee7df3444dd8682770d1b31da1a5822Dave Airliestatic inline void callstack_decrease_current(struct r600_shader_ctx *ctx, unsigned reason) 2650a03d456f5a41926e39194de70b2d50776e64b8a2Dave Airlie{ 265109547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie switch(reason) { 265209547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie case FC_PUSH_VPM: 265309547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie ctx->bc->callstack[ctx->bc->call_sp].current--; 265409547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie break; 265509547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie case FC_PUSH_WQM: 265609547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie case FC_LOOP: 265709547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie 
ctx->bc->callstack[ctx->bc->call_sp].current -= 4; 265809547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie break; 265909547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie case FC_REP: 266009547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie /* TOODO : for 16 vp asic should -= 2; */ 266109547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie ctx->bc->callstack[ctx->bc->call_sp].current --; 266209547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie break; 266309547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie } 266409547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie} 2665a03d456f5a41926e39194de70b2d50776e64b8a2Dave Airlie 266609547e1bcee7df3444dd8682770d1b31da1a5822Dave Airliestatic inline void callstack_check_depth(struct r600_shader_ctx *ctx, unsigned reason, unsigned check_max_only) 266709547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie{ 266809547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie if (check_max_only) { 266909547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie int diff; 267009547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie switch (reason) { 267109547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie case FC_PUSH_VPM: 267209547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie diff = 1; 267309547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie break; 267409547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie case FC_PUSH_WQM: 267509547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie diff = 4; 267609547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie break; 2677a712e193a3f58f4f40402c34adf16de255afa760Vinson Lee default: 2678a712e193a3f58f4f40402c34adf16de255afa760Vinson Lee assert(0); 2679a712e193a3f58f4f40402c34adf16de255afa760Vinson Lee diff = 0; 268009547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie } 268109547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie if ((ctx->bc->callstack[ctx->bc->call_sp].current + diff) > 268209547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie ctx->bc->callstack[ctx->bc->call_sp].max) { 268309547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie 
ctx->bc->callstack[ctx->bc->call_sp].max = 268409547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie ctx->bc->callstack[ctx->bc->call_sp].current + diff; 268509547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie } 268609547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie return; 26877ffd4e976fd11b8c083c2927effd25a2f79ac841Jerome Glisse } 268809547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie switch (reason) { 268909547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie case FC_PUSH_VPM: 269009547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie ctx->bc->callstack[ctx->bc->call_sp].current++; 269109547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie break; 269209547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie case FC_PUSH_WQM: 269309547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie case FC_LOOP: 269409547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie ctx->bc->callstack[ctx->bc->call_sp].current += 4; 269509547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie break; 269609547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie case FC_REP: 269709547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie ctx->bc->callstack[ctx->bc->call_sp].current++; 269809547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie break; 269909547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie } 270009547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie 270109547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie if ((ctx->bc->callstack[ctx->bc->call_sp].current) > 270209547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie ctx->bc->callstack[ctx->bc->call_sp].max) { 270309547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie ctx->bc->callstack[ctx->bc->call_sp].max = 270409547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie ctx->bc->callstack[ctx->bc->call_sp].current; 270509547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie } 270609547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie} 270709547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie 270809547e1bcee7df3444dd8682770d1b31da1a5822Dave Airliestatic void fc_set_mid(struct r600_shader_ctx 
*ctx, int fc_sp) 270909547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie{ 271009547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie struct r600_cf_stack_entry *sp = &ctx->bc->fc_stack[fc_sp]; 271109547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie 271209547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie sp->mid = (struct r600_bc_cf **)realloc((void *)sp->mid, 271309547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie sizeof(struct r600_bc_cf *) * (sp->num_mid + 1)); 271409547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie sp->mid[sp->num_mid] = ctx->bc->cf_last; 271509547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie sp->num_mid++; 271609547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie} 2717a03d456f5a41926e39194de70b2d50776e64b8a2Dave Airlie 271809547e1bcee7df3444dd8682770d1b31da1a5822Dave Airliestatic void fc_pushlevel(struct r600_shader_ctx *ctx, int type) 271909547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie{ 2720a03d456f5a41926e39194de70b2d50776e64b8a2Dave Airlie ctx->bc->fc_sp++; 272109547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie ctx->bc->fc_stack[ctx->bc->fc_sp].type = type; 272209547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie ctx->bc->fc_stack[ctx->bc->fc_sp].start = ctx->bc->cf_last; 272309547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie} 272409547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie 272509547e1bcee7df3444dd8682770d1b31da1a5822Dave Airliestatic void fc_poplevel(struct r600_shader_ctx *ctx) 272609547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie{ 272709547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie struct r600_cf_stack_entry *sp = &ctx->bc->fc_stack[ctx->bc->fc_sp]; 272809547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie if (sp->mid) { 272909547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie free(sp->mid); 273009547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie sp->mid = NULL; 273109547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie } 273209547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie sp->num_mid = 0; 
273309547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie sp->start = NULL; 273409547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie sp->type = 0; 273509547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie ctx->bc->fc_sp--; 273609547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie} 273709547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie 273809547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie#if 0 273909547e1bcee7df3444dd8682770d1b31da1a5822Dave Airliestatic int emit_return(struct r600_shader_ctx *ctx) 274009547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie{ 274109547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie r600_bc_add_cfinst(ctx->bc, V_SQ_CF_WORD1_SQ_CF_INST_RETURN); 274209547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie return 0; 274309547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie} 274409547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie 274509547e1bcee7df3444dd8682770d1b31da1a5822Dave Airliestatic int emit_jump_to_offset(struct r600_shader_ctx *ctx, int pops, int offset) 274609547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie{ 274709547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie 2748a03d456f5a41926e39194de70b2d50776e64b8a2Dave Airlie r600_bc_add_cfinst(ctx->bc, V_SQ_CF_WORD1_SQ_CF_INST_JUMP); 274909547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie ctx->bc->cf_last->pop_count = pops; 275009547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie /* TODO work out offset */ 275109547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie return 0; 275209547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie} 2753a03d456f5a41926e39194de70b2d50776e64b8a2Dave Airlie 275409547e1bcee7df3444dd8682770d1b31da1a5822Dave Airliestatic int emit_setret_in_loop_flag(struct r600_shader_ctx *ctx, unsigned flag_value) 275509547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie{ 275609547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie return 0; 275709547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie} 275809547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie 275909547e1bcee7df3444dd8682770d1b31da1a5822Dave 
Airliestatic void emit_testflag(struct r600_shader_ctx *ctx) 276009547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie{ 27617ffd4e976fd11b8c083c2927effd25a2f79ac841Jerome Glisse 276209547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie} 276309547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie 276409547e1bcee7df3444dd8682770d1b31da1a5822Dave Airliestatic void emit_return_on_flag(struct r600_shader_ctx *ctx, unsigned ifidx) 276509547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie{ 276609547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie emit_testflag(ctx); 276709547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie emit_jump_to_offset(ctx, 1, 4); 276809547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie emit_setret_in_loop_flag(ctx, V_SQ_ALU_SRC_0); 276909547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie pops(ctx, ifidx + 1); 277009547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie emit_return(ctx); 277109547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie} 277209547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie 277309547e1bcee7df3444dd8682770d1b31da1a5822Dave Airliestatic void break_loop_on_flag(struct r600_shader_ctx *ctx, unsigned fc_sp) 277409547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie{ 277509547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie emit_testflag(ctx); 277609547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie 277709547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie r600_bc_add_cfinst(ctx->bc, ctx->inst_info->r600_opcode); 277809547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie ctx->bc->cf_last->pop_count = 1; 277909547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie 278009547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie fc_set_mid(ctx, fc_sp); 278109547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie 278209547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie pops(ctx, 1); 278309547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie} 278409547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie#endif 278509547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie 
278609547e1bcee7df3444dd8682770d1b31da1a5822Dave Airliestatic int tgsi_if(struct r600_shader_ctx *ctx) 278709547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie{ 2788a3a94554f5a12f0626d9712ddcdc81b1e21d36c2Dave Airlie emit_logic_pred(ctx, CTX_INST(V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_PRED_SETNE)); 278909547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie 2790a3a94554f5a12f0626d9712ddcdc81b1e21d36c2Dave Airlie r600_bc_add_cfinst(ctx->bc, CTX_INST(V_SQ_CF_WORD1_SQ_CF_INST_JUMP)); 279109547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie 279209547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie fc_pushlevel(ctx, FC_IF); 279309547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie 279409547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie callstack_check_depth(ctx, FC_PUSH_VPM, 0); 2795a03d456f5a41926e39194de70b2d50776e64b8a2Dave Airlie return 0; 2796a03d456f5a41926e39194de70b2d50776e64b8a2Dave Airlie} 2797a03d456f5a41926e39194de70b2d50776e64b8a2Dave Airlie 2798a03d456f5a41926e39194de70b2d50776e64b8a2Dave Airliestatic int tgsi_else(struct r600_shader_ctx *ctx) 2799a03d456f5a41926e39194de70b2d50776e64b8a2Dave Airlie{ 2800a3a94554f5a12f0626d9712ddcdc81b1e21d36c2Dave Airlie r600_bc_add_cfinst(ctx->bc, CTX_INST(V_SQ_CF_WORD1_SQ_CF_INST_ELSE)); 2801a03d456f5a41926e39194de70b2d50776e64b8a2Dave Airlie ctx->bc->cf_last->pop_count = 1; 2802a03d456f5a41926e39194de70b2d50776e64b8a2Dave Airlie 280309547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie fc_set_mid(ctx, ctx->bc->fc_sp); 2804a03d456f5a41926e39194de70b2d50776e64b8a2Dave Airlie ctx->bc->fc_stack[ctx->bc->fc_sp].start->cf_addr = ctx->bc->cf_last->id; 2805a03d456f5a41926e39194de70b2d50776e64b8a2Dave Airlie return 0; 2806a03d456f5a41926e39194de70b2d50776e64b8a2Dave Airlie} 2807a03d456f5a41926e39194de70b2d50776e64b8a2Dave Airlie 2808a03d456f5a41926e39194de70b2d50776e64b8a2Dave Airliestatic int tgsi_endif(struct r600_shader_ctx *ctx) 2809a03d456f5a41926e39194de70b2d50776e64b8a2Dave Airlie{ 2810a03d456f5a41926e39194de70b2d50776e64b8a2Dave Airlie 
pops(ctx, 1); 2811a03d456f5a41926e39194de70b2d50776e64b8a2Dave Airlie if (ctx->bc->fc_stack[ctx->bc->fc_sp].type != FC_IF) { 2812a03d456f5a41926e39194de70b2d50776e64b8a2Dave Airlie R600_ERR("if/endif unbalanced in shader\n"); 2813a03d456f5a41926e39194de70b2d50776e64b8a2Dave Airlie return -1; 2814a03d456f5a41926e39194de70b2d50776e64b8a2Dave Airlie } 2815a03d456f5a41926e39194de70b2d50776e64b8a2Dave Airlie 2816a03d456f5a41926e39194de70b2d50776e64b8a2Dave Airlie if (ctx->bc->fc_stack[ctx->bc->fc_sp].mid == NULL) { 2817a03d456f5a41926e39194de70b2d50776e64b8a2Dave Airlie ctx->bc->fc_stack[ctx->bc->fc_sp].start->cf_addr = ctx->bc->cf_last->id + 2; 2818a03d456f5a41926e39194de70b2d50776e64b8a2Dave Airlie ctx->bc->fc_stack[ctx->bc->fc_sp].start->pop_count = 1; 2819a03d456f5a41926e39194de70b2d50776e64b8a2Dave Airlie } else { 282009547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie ctx->bc->fc_stack[ctx->bc->fc_sp].mid[0]->cf_addr = ctx->bc->cf_last->id + 2; 2821a03d456f5a41926e39194de70b2d50776e64b8a2Dave Airlie } 282209547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie fc_poplevel(ctx); 282309547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie 282409547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie callstack_decrease_current(ctx, FC_PUSH_VPM); 282509547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie return 0; 282609547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie} 282709547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie 282809547e1bcee7df3444dd8682770d1b31da1a5822Dave Airliestatic int tgsi_bgnloop(struct r600_shader_ctx *ctx) 282909547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie{ 2830a3a94554f5a12f0626d9712ddcdc81b1e21d36c2Dave Airlie r600_bc_add_cfinst(ctx->bc, CTX_INST(V_SQ_CF_WORD1_SQ_CF_INST_LOOP_START_NO_AL)); 283109547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie 283209547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie fc_pushlevel(ctx, FC_LOOP); 2833a03d456f5a41926e39194de70b2d50776e64b8a2Dave Airlie 283409547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie /* check stack 
depth */ 283509547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie callstack_check_depth(ctx, FC_LOOP, 0); 283609547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie return 0; 283709547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie} 283809547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie /* tgsi_endloop - handler for TGSI_OPCODE_ENDLOOP. Emits a LOOP_END control-flow (CF) instruction, requires the entry at index fc_sp of ctx->bc->fc_stack to be an FC_LOOP, then patches cf_addr on the LOOP_END, on the loop start CF and on every CF stored in mid[] for that entry, and finally pops the entry. Returns 0 on success or -EINVAL when the entry at fc_sp is not a loop. */ 283909547e1bcee7df3444dd8682770d1b31da1a5822Dave Airliestatic int tgsi_endloop(struct r600_shader_ctx *ctx) 284009547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie{ 284109547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie int i; 284209547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie /* Emit LOOP_END first; the fixups below address it through ctx->bc->cf_last. NOTE(review): the return value of r600_bc_add_cfinst is not checked here - confirm whether it can fail. */ 2843a3a94554f5a12f0626d9712ddcdc81b1e21d36c2Dave Airlie r600_bc_add_cfinst(ctx->bc, CTX_INST(V_SQ_CF_WORD1_SQ_CF_INST_LOOP_END)); 284409547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie /* Reject an ENDLOOP when the flow-control entry at fc_sp is not a loop. */ 284509547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie if (ctx->bc->fc_stack[ctx->bc->fc_sp].type != FC_LOOP) { 284609547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie R600_ERR("loop/endloop in shader code are not paired.\n"); 284709547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie return -EINVAL; 284809547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie } 284909547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie 285009547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie /* fixup loop pointers - from r600isa 285109547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie LOOP END points to CF after LOOP START, 285209547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie LOOP START point to CF after LOOP END 285309547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie BRK/CONT point to LOOP END CF 285409547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie */ /* NOTE(review): the + 2 offsets presumably step one CF instruction past the referenced one, matching the rule quoted above - confirm the id spacing in r600_asm. */ 285509547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie ctx->bc->cf_last->cf_addr = ctx->bc->fc_stack[ctx->bc->fc_sp].start->id + 2; 285609547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie 285709547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie ctx->bc->fc_stack[ctx->bc->fc_sp].start->cf_addr = ctx->bc->cf_last->id + 2; 285809547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie
/* Every CF stored in mid[] for this loop gets the id of the LOOP_END itself as its cf_addr. */ 285909547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie for (i = 0; i < ctx->bc->fc_stack[ctx->bc->fc_sp].num_mid; i++) { 286009547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie ctx->bc->fc_stack[ctx->bc->fc_sp].mid[i]->cf_addr = ctx->bc->cf_last->id; 286109547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie } 286209547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie /* TODO add LOOPRET support */ /* Presumably drops the loop entry and releases its FC_LOOP call-stack accounting - see fc_poplevel and callstack_decrease_current to confirm. */ 286309547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie fc_poplevel(ctx); 286409547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie callstack_decrease_current(ctx, FC_LOOP); 286509547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie return 0; 286609547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie} 286709547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie /* tgsi_loop_brk_cont - shared handler for TGSI_OPCODE_BRK and TGSI_OPCODE_CONT. Finds the nearest FC_LOOP entry on ctx->bc->fc_stack, emits the CF opcode taken from ctx->inst_info->r600_opcode with pop_count set to 1, and hands the index of that loop entry to fc_set_mid. Returns 0 on success or -EINVAL when no enclosing loop entry is found. */ 286809547e1bcee7df3444dd8682770d1b31da1a5822Dave Airliestatic int tgsi_loop_brk_cont(struct r600_shader_ctx *ctx) 286909547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie{ 287009547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie unsigned int fscp; 287109547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie /* Scan from index fc_sp downwards. Index 0 is never tested, so leaving the loop with fscp == 0 means no FC_LOOP entry was found. */ 287209547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie for (fscp = ctx->bc->fc_sp; fscp > 0; fscp--) 287309547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie { 287409547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie if (FC_LOOP == ctx->bc->fc_stack[fscp].type) 287509547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie break; 287609547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie } 287709547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie /* NOTE(review): the message below says Break although this handler also serves CONT. */ 287809547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie if (fscp == 0) { 287909547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie R600_ERR("Break not inside loop/endloop pair\n"); 288009547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie return -EINVAL; 288109547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie } 288209547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie /* The opcode is read from ctx->inst_info, presumably the dispatch table row of the current instruction: LOOP_BREAK for BRK, LOOP_CONTINUE for CONT. */ 288309547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie r600_bc_add_cfinst(ctx->bc, ctx->inst_info->r600_opcode);
288409547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie ctx->bc->cf_last->pop_count = 1; 288509547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie /* Tie the new CF to the enclosing loop entry; tgsi_endloop later patches cf_addr of every mid[] element (presumably what fc_set_mid appends to - confirm). */ 288609547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie fc_set_mid(ctx, fscp); 288709547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie 288809547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie pops(ctx, 1); 288909547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie callstack_check_depth(ctx, FC_PUSH_VPM, 1); 2890a03d456f5a41926e39194de70b2d50776e64b8a2Dave Airlie return 0; 2891a03d456f5a41926e39194de70b2d50776e64b8a2Dave Airlie} 2892a03d456f5a41926e39194de70b2d50776e64b8a2Dave Airlie /* Opcode dispatch table carrying the non-EG hardware opcode constants; a parallel eg_shader_tgsi_instruction table with EG_ constants follows it. Each row holds a TGSI opcode (or a bare number on the rows marked gap), a flag that is 1 only on the MAD (OP3) row of this table, the hardware opcode, and the handler function. The numbered gap rows suggest the table is indexed directly by TGSI opcode - confirm at the lookup site. */ 2893de553d906b4a205d811a9e1651f14212ec284e29Jerome Glissestatic struct r600_shader_tgsi_instruction r600_shader_tgsi_instruction[] = { 289498b3f27439ba3a48286ed0d6a4467e5482b41fecDave Airlie {TGSI_OPCODE_ARL, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_r600_arl}, 2895de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse {TGSI_OPCODE_MOV, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_MOV, tgsi_op2}, 28960bebdc230ff09f191cfa269c2cbcbb257fd2e0fcStephan Schmid {TGSI_OPCODE_LIT, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_lit}, 2897df62338c491f2cace1a48f99de78e83b5edd82fdTilman Sauerbeck 2898df62338c491f2cace1a48f99de78e83b5edd82fdTilman Sauerbeck /* FIXME: 2899df62338c491f2cace1a48f99de78e83b5edd82fdTilman Sauerbeck * For state trackers other than OpenGL, we'll want to use 2900df62338c491f2cace1a48f99de78e83b5edd82fdTilman Sauerbeck * _RECIP_IEEE instead.
2901df62338c491f2cace1a48f99de78e83b5edd82fdTilman Sauerbeck */ 2902df62338c491f2cace1a48f99de78e83b5edd82fdTilman Sauerbeck {TGSI_OPCODE_RCP, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_RECIP_CLAMPED, tgsi_trans_srcx_replicate}, 2903df62338c491f2cace1a48f99de78e83b5edd82fdTilman Sauerbeck 290442c966bc496d4049d98eb1d45dd7bb0b55fa41bdTilman Sauerbeck {TGSI_OPCODE_RSQ, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_rsq}, 290536d91be75ea9b79878fdf4b789ea022d781e87f4Dave Airlie {TGSI_OPCODE_EXP, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_exp}, 2906460c5304aba646143938b76d536a6fc13a302ca8Tilman Sauerbeck {TGSI_OPCODE_LOG, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_log}, 2907de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse {TGSI_OPCODE_MUL, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_MUL, tgsi_op2}, 2908de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse {TGSI_OPCODE_ADD, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_ADD, tgsi_op2}, 2909cf864fd58b2a4780482a108cd3ff86779e8fa965Jerome Glisse {TGSI_OPCODE_DP3, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_DOT4, tgsi_dp}, 2910cf864fd58b2a4780482a108cd3ff86779e8fa965Jerome Glisse {TGSI_OPCODE_DP4, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_DOT4, tgsi_dp}, 291157eecbbf6c57fbf5a46b8b81d8d4fbb6bd78ea12Dave Airlie {TGSI_OPCODE_DST, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_opdst}, 2912dd863bf5e7c6680075cf7c355a026b1da69ee9e3Jerome Glisse {TGSI_OPCODE_MIN, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_MIN, tgsi_op2}, 2913de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse {TGSI_OPCODE_MAX, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_MAX, tgsi_op2}, 2914d8fb13bae30b6ff214c5d5158b9bcaf430f56b43Dave Airlie {TGSI_OPCODE_SLT, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_SETGT, tgsi_op2_swap}, 2915be288c3505429811adc2743c1be2c1971f4483a2Dave Airlie {TGSI_OPCODE_SGE, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_SETGE, tgsi_op2}, 2916de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse {TGSI_OPCODE_MAD, 1, V_SQ_ALU_WORD1_OP3_SQ_OP3_INST_MULADD, tgsi_op3}, 2917de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse 
{TGSI_OPCODE_SUB, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_ADD, tgsi_op2}, 2918b346c4205dc19c9ffbff48ed8bd89687772a96f8Jerome Glisse {TGSI_OPCODE_LRP, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_lrp}, 2919de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse {TGSI_OPCODE_CND, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 2920de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse /* gap */ 2921de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse {20, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 2922de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse {TGSI_OPCODE_DP2A, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 2923de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse /* gap */ 2924de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse {22, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 2925de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse {23, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 29263af87162cd0d3107cb2af0812ce4e4680b177725Dave Airlie {TGSI_OPCODE_FRC, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_FRACT, tgsi_op2}, 2927de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse {TGSI_OPCODE_CLAMP, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 29283af87162cd0d3107cb2af0812ce4e4680b177725Dave Airlie {TGSI_OPCODE_FLR, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_FLOOR, tgsi_op2}, 2929de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse {TGSI_OPCODE_ROUND, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 29307e42b7e5d2aebcda0e6bf081b6661411731e6df2Jerome Glisse {TGSI_OPCODE_EX2, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_EXP_IEEE, tgsi_trans_srcx_replicate}, 29314558b634556f42867449a6e60d4badc72099f10dDave Airlie {TGSI_OPCODE_LG2, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_LOG_IEEE, tgsi_trans_srcx_replicate}, 2932a4b10a56145ea253def4cf958410d770d0640bc9Jerome Glisse {TGSI_OPCODE_POW, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_pow}, 29330e6a02d29915db2ca460206656ab517ddaf0b455Dave Airlie {TGSI_OPCODE_XPD, 0, 
V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_xpd}, 2934de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse /* gap */ 2935de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse {32, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 29367a73390f9126fd270d9891cd9d2bf38ef56d9b80Jerome Glisse {TGSI_OPCODE_ABS, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_MOV, tgsi_op2}, 2937de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse {TGSI_OPCODE_RCC, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 2938e57437ccd6814ffd4534fd46512afeb0b9e06eedDave Airlie {TGSI_OPCODE_DPH, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_DOT4, tgsi_dp}, 293988f5976484842671ecb2cefcfa91838a43032359Dave Airlie {TGSI_OPCODE_COS, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_COS, tgsi_trig}, 29403af87162cd0d3107cb2af0812ce4e4680b177725Dave Airlie {TGSI_OPCODE_DDX, 0, SQ_TEX_INST_GET_GRADIENTS_H, tgsi_tex}, 29413af87162cd0d3107cb2af0812ce4e4680b177725Dave Airlie {TGSI_OPCODE_DDY, 0, SQ_TEX_INST_GET_GRADIENTS_V, tgsi_tex}, 29424502b17901ad491e0598ee59a12d372c008ae03bDave Airlie {TGSI_OPCODE_KILP, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_KILLGT, tgsi_kill}, /* predicated kill */ 2943de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse {TGSI_OPCODE_PK2H, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 2944de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse {TGSI_OPCODE_PK2US, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 2945de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse {TGSI_OPCODE_PK4B, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 2946de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse {TGSI_OPCODE_PK4UB, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 2947de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse {TGSI_OPCODE_RFL, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 29480d48925a56ad4fb253386110b545abda82a25464Dave Airlie {TGSI_OPCODE_SEQ, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_SETE, tgsi_op2}, 2949de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse 
{TGSI_OPCODE_SFL, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 29500d48925a56ad4fb253386110b545abda82a25464Dave Airlie {TGSI_OPCODE_SGT, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_SETGT, tgsi_op2}, 295188f5976484842671ecb2cefcfa91838a43032359Dave Airlie {TGSI_OPCODE_SIN, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_SIN, tgsi_trig}, 2952d8fb13bae30b6ff214c5d5158b9bcaf430f56b43Dave Airlie {TGSI_OPCODE_SLE, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_SETGE, tgsi_op2_swap}, 29530d48925a56ad4fb253386110b545abda82a25464Dave Airlie {TGSI_OPCODE_SNE, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_SETNE, tgsi_op2}, 2954de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse {TGSI_OPCODE_STR, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 2955b777db32541b360516203865a0fa41f4b8cebf7cDave Airlie {TGSI_OPCODE_TEX, 0, SQ_TEX_INST_SAMPLE, tgsi_tex}, 2956de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse {TGSI_OPCODE_TXD, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 2957b777db32541b360516203865a0fa41f4b8cebf7cDave Airlie {TGSI_OPCODE_TXP, 0, SQ_TEX_INST_SAMPLE, tgsi_tex}, 2958de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse {TGSI_OPCODE_UP2H, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 2959de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse {TGSI_OPCODE_UP2US, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 2960de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse {TGSI_OPCODE_UP4B, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 2961de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse {TGSI_OPCODE_UP4UB, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 2962de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse {TGSI_OPCODE_X2D, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 2963de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse {TGSI_OPCODE_ARA, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 29649f7ec103e26c67cb077fd7d94d2fb68562b86c40Keith Whitwell {TGSI_OPCODE_ARR, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, 
tgsi_r600_arl}, 2965de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse {TGSI_OPCODE_BRA, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 2966de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse {TGSI_OPCODE_CAL, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 2967de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse {TGSI_OPCODE_RET, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 29680d48925a56ad4fb253386110b545abda82a25464Dave Airlie {TGSI_OPCODE_SSG, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_ssg}, 296987f44d5723ebb3a2efe0dddc1a6edb6536adea4dDave Airlie {TGSI_OPCODE_CMP, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_cmp}, 297092f5c7a597aaf098f4e6b4793e4b89ae539e328aDave Airlie {TGSI_OPCODE_SCS, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_scs}, 2971d01c0025e81e713d99f4de9ed7f4cdd12a1d08b5Dave Airlie {TGSI_OPCODE_TXB, 0, SQ_TEX_INST_SAMPLE_L, tgsi_tex}, 2972de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse {TGSI_OPCODE_NRM, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 2973de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse {TGSI_OPCODE_DIV, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 2974cf864fd58b2a4780482a108cd3ff86779e8fa965Jerome Glisse {TGSI_OPCODE_DP2, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_DOT4, tgsi_dp}, 2975ef2702fb2003944998ab1578119fb44fe16d1c82Dave Airlie {TGSI_OPCODE_TXL, 0, SQ_TEX_INST_SAMPLE_L, tgsi_tex}, 297609547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie {TGSI_OPCODE_BRK, 0, V_SQ_CF_WORD1_SQ_CF_INST_LOOP_BREAK, tgsi_loop_brk_cont}, 2977a03d456f5a41926e39194de70b2d50776e64b8a2Dave Airlie {TGSI_OPCODE_IF, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_if}, 2978de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse /* gap */ 2979de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse {75, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 2980de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse {76, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 
2981a03d456f5a41926e39194de70b2d50776e64b8a2Dave Airlie {TGSI_OPCODE_ELSE, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_else}, 2982a03d456f5a41926e39194de70b2d50776e64b8a2Dave Airlie {TGSI_OPCODE_ENDIF, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_endif}, 2983de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse /* gap */ 2984de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse {79, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 2985de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse {80, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 2986de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse {TGSI_OPCODE_PUSHA, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 2987de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse {TGSI_OPCODE_POPA, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 2988de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse {TGSI_OPCODE_CEIL, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 2989de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse {TGSI_OPCODE_I2F, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 2990de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse {TGSI_OPCODE_NOT, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 29914558b634556f42867449a6e60d4badc72099f10dDave Airlie {TGSI_OPCODE_TRUNC, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_TRUNC, tgsi_trans_srcx_replicate}, 2992de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse {TGSI_OPCODE_SHL, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 2993de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse /* gap */ 2994de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse {88, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 2995de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse {TGSI_OPCODE_AND, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 2996de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse {TGSI_OPCODE_OR, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 
2997de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse {TGSI_OPCODE_MOD, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 2998de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse {TGSI_OPCODE_XOR, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 2999de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse {TGSI_OPCODE_SAD, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 3000de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse {TGSI_OPCODE_TXF, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 3001de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse {TGSI_OPCODE_TXQ, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 300209547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie {TGSI_OPCODE_CONT, 0, V_SQ_CF_WORD1_SQ_CF_INST_LOOP_CONTINUE, tgsi_loop_brk_cont}, 3003de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse {TGSI_OPCODE_EMIT, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 3004de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse {TGSI_OPCODE_ENDPRIM, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 300509547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie {TGSI_OPCODE_BGNLOOP, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_bgnloop}, 3006de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse {TGSI_OPCODE_BGNSUB, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 300709547e1bcee7df3444dd8682770d1b31da1a5822Dave Airlie {TGSI_OPCODE_ENDLOOP, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_endloop}, 3008de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse {TGSI_OPCODE_ENDSUB, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 3009de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse /* gap */ 3010de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse {103, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 3011de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse {104, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 3012de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse {105, 0, 
V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 3013de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse {106, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 3014de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse {TGSI_OPCODE_NOP, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 3015de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse /* gap */ 3016de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse {108, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 3017de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse {109, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 3018de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse {110, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 3019de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse {111, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 3020de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse {TGSI_OPCODE_NRM4, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 3021de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse {TGSI_OPCODE_CALLNZ, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 3022de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse {TGSI_OPCODE_IFC, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 3023de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse {TGSI_OPCODE_BREAKC, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 3024094d66f45992830929d620782c70836b4b9b4a37Jerome Glisse {TGSI_OPCODE_KIL, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_KILLGT, tgsi_kill}, /* conditional kill */ 3025de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse {TGSI_OPCODE_END, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_end}, /* aka HALT */ 3026de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse /* gap */ 3027de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse {118, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 3028de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse {TGSI_OPCODE_F2I, 0, 
V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 3029de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse {TGSI_OPCODE_IDIV, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 3030de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse {TGSI_OPCODE_IMAX, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 3031de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse {TGSI_OPCODE_IMIN, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 3032de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse {TGSI_OPCODE_INEG, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 3033de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse {TGSI_OPCODE_ISGE, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 3034de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse {TGSI_OPCODE_ISHR, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 3035de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse {TGSI_OPCODE_ISLT, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 3036de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse {TGSI_OPCODE_F2U, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 3037de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse {TGSI_OPCODE_U2F, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 3038de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse {TGSI_OPCODE_UADD, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 3039de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse {TGSI_OPCODE_UDIV, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 3040de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse {TGSI_OPCODE_UMAD, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 3041de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse {TGSI_OPCODE_UMAX, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 3042de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse {TGSI_OPCODE_UMIN, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 3043de553d906b4a205d811a9e1651f14212ec284e29Jerome 
Glisse {TGSI_OPCODE_UMOD, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 3044de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse {TGSI_OPCODE_UMUL, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 3045de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse {TGSI_OPCODE_USEQ, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 3046de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse {TGSI_OPCODE_USGE, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 3047de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse {TGSI_OPCODE_USHR, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 3048de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse {TGSI_OPCODE_USLT, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 3049de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse {TGSI_OPCODE_USNE, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 3050de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse {TGSI_OPCODE_SWITCH, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 3051de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse {TGSI_OPCODE_CASE, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 3052de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse {TGSI_OPCODE_DEFAULT, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 3053de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse {TGSI_OPCODE_ENDSWITCH, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 3054de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse {TGSI_OPCODE_LAST, 0, V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 3055de553d906b4a205d811a9e1651f14212ec284e29Jerome Glisse}; 305650526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie 305750526e094f4c66957c7f74c190c35903bc82fb62Dave Airliestatic struct r600_shader_tgsi_instruction eg_shader_tgsi_instruction[] = { 305898b3f27439ba3a48286ed0d6a4467e5482b41fecDave Airlie {TGSI_OPCODE_ARL, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_eg_arl}, 
305950526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_MOV, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_MOV, tgsi_op2}, 306050526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_LIT, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_lit}, 306150526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_RCP, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_RECIP_IEEE, tgsi_trans_srcx_replicate}, 306250526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_RSQ, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_RECIPSQRT_IEEE, tgsi_trans_srcx_replicate}, 306350526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_EXP, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_exp}, 306450526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_LOG, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 306550526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_MUL, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_MUL, tgsi_op2}, 306650526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_ADD, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_ADD, tgsi_op2}, 306750526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_DP3, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_DOT4, tgsi_dp}, 306850526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_DP4, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_DOT4, tgsi_dp}, 306950526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_DST, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_opdst}, 307050526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_MIN, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_MIN, tgsi_op2}, 307150526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_MAX, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_MAX, tgsi_op2}, 307250526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_SLT, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_SETGT, tgsi_op2_swap}, 307350526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_SGE, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_SETGE, tgsi_op2}, 
307450526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_MAD, 1, EG_V_SQ_ALU_WORD1_OP3_SQ_OP3_INST_MULADD, tgsi_op3}, 307550526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_SUB, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_ADD, tgsi_op2}, 307650526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_LRP, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_lrp}, 307750526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_CND, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 307850526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie /* gap */ 307950526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {20, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 308050526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_DP2A, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 308150526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie /* gap */ 308250526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {22, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 308350526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {23, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 308450526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_FRC, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_FRACT, tgsi_op2}, 308550526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_CLAMP, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 308650526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_FLR, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_FLOOR, tgsi_op2}, 308750526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_ROUND, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 308850526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_EX2, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_EXP_IEEE, tgsi_trans_srcx_replicate}, 308950526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_LG2, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_LOG_IEEE, tgsi_trans_srcx_replicate}, 
309050526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_POW, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_pow}, 309150526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_XPD, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_xpd}, 309250526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie /* gap */ 309350526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {32, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 309450526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_ABS, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_MOV, tgsi_op2}, 309550526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_RCC, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 309650526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_DPH, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_DOT4, tgsi_dp}, 309750526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_COS, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_COS, tgsi_trig}, 309850526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_DDX, 0, SQ_TEX_INST_GET_GRADIENTS_H, tgsi_tex}, 309950526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_DDY, 0, SQ_TEX_INST_GET_GRADIENTS_V, tgsi_tex}, 310050526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_KILP, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_KILLGT, tgsi_kill}, /* predicated kill */ 310150526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_PK2H, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 310250526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_PK2US, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 310350526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_PK4B, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 310450526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_PK4UB, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 310550526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_RFL, 0, 
EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 310650526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_SEQ, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_SETE, tgsi_op2}, 310750526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_SFL, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 310850526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_SGT, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_SETGT, tgsi_op2}, 310950526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_SIN, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_SIN, tgsi_trig}, 311050526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_SLE, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_SETGE, tgsi_op2_swap}, 311150526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_SNE, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_SETNE, tgsi_op2}, 311250526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_STR, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 311350526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_TEX, 0, SQ_TEX_INST_SAMPLE, tgsi_tex}, 311450526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_TXD, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 311550526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_TXP, 0, SQ_TEX_INST_SAMPLE, tgsi_tex}, 311650526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_UP2H, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 311750526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_UP2US, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 311850526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_UP4B, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 311950526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_UP4UB, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 312050526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_X2D, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, 
tgsi_unsupported}, 312150526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_ARA, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 312252c66120d8c55d29af6af60f75eb1dc54d9b8062Alex Deucher {TGSI_OPCODE_ARR, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_eg_arl}, 312350526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_BRA, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 312450526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_CAL, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 312550526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_RET, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 312650526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_SSG, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_ssg}, 312750526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_CMP, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_cmp}, 312850526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_SCS, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_scs}, 312950526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_TXB, 0, SQ_TEX_INST_SAMPLE_L, tgsi_tex}, 313050526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_NRM, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 313150526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_DIV, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 313250526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_DP2, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_DOT4, tgsi_dp}, 3133ef2702fb2003944998ab1578119fb44fe16d1c82Dave Airlie {TGSI_OPCODE_TXL, 0, SQ_TEX_INST_SAMPLE_L, tgsi_tex}, 313450526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_BRK, 0, EG_V_SQ_CF_WORD1_SQ_CF_INST_LOOP_BREAK, tgsi_loop_brk_cont}, 313550526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_IF, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_if}, 313650526e094f4c66957c7f74c190c35903bc82fb62Dave 
Airlie /* gap */ 313750526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {75, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 313850526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {76, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 313950526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_ELSE, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_else}, 314050526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_ENDIF, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_endif}, 314150526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie /* gap */ 314250526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {79, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 314350526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {80, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 314450526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_PUSHA, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 314550526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_POPA, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 314650526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_CEIL, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 314750526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_I2F, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 314850526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_NOT, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 314950526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_TRUNC, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_TRUNC, tgsi_trans_srcx_replicate}, 315050526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_SHL, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 315150526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie /* gap */ 315250526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {88, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 
315350526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_AND, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 315450526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_OR, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 315550526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_MOD, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 315650526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_XOR, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 315750526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_SAD, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 315850526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_TXF, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 315950526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_TXQ, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 316050526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_CONT, 0, EG_V_SQ_CF_WORD1_SQ_CF_INST_LOOP_CONTINUE, tgsi_loop_brk_cont}, 316150526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_EMIT, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 316250526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_ENDPRIM, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 316350526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_BGNLOOP, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_bgnloop}, 316450526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_BGNSUB, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 316550526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_ENDLOOP, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_endloop}, 316650526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_ENDSUB, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 316750526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie /* gap */ 
316850526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {103, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 316950526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {104, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 317050526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {105, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 317150526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {106, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 317250526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_NOP, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 317350526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie /* gap */ 317450526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {108, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 317550526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {109, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 317650526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {110, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 317750526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {111, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 317850526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_NRM4, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 317950526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_CALLNZ, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 318050526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_IFC, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 318150526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_BREAKC, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 318250526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_KIL, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_KILLGT, tgsi_kill}, /* conditional kill */ 318350526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_END, 0, 
EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_end}, /* aka HALT */ 318450526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie /* gap */ 318550526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {118, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 318650526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_F2I, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 318750526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_IDIV, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 318850526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_IMAX, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 318950526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_IMIN, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 319050526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_INEG, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 319150526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_ISGE, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 319250526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_ISHR, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 319350526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_ISLT, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 319450526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_F2U, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 319550526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_U2F, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 319650526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_UADD, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 319750526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_UDIV, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 319850526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_UMAD, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, 
tgsi_unsupported}, 319950526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_UMAX, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 320050526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_UMIN, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 320150526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_UMOD, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 320250526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_UMUL, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 320350526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_USEQ, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 320450526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_USGE, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 320550526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_USHR, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 320650526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_USLT, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 320750526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_USNE, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 320850526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_SWITCH, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 320950526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_CASE, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 321050526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_DEFAULT, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 321150526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_ENDSWITCH, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 321250526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie {TGSI_OPCODE_LAST, 0, EG_V_SQ_ALU_WORD1_OP2_SQ_OP2_INST_NOP, tgsi_unsupported}, 321350526e094f4c66957c7f74c190c35903bc82fb62Dave Airlie}; 3214