lp_bld_tgsi_soa.c revision 3ded3e98ffc36820c8ab318d736eab99bb16f26b
/**************************************************************************
 *
 * Copyright 2009 VMware, Inc.
 * Copyright 2007-2008 Tungsten Graphics, Inc., Cedar Park, Texas.
 * All Rights Reserved.
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the
 * "Software"), to deal in the Software without restriction, including
 * without limitation the rights to use, copy, modify, merge, publish,
 * distribute, sub license, and/or sell copies of the Software, and to
 * permit persons to whom the Software is furnished to do so, subject to
 * the following conditions:
 *
 * The above copyright notice and this permission notice (including the
 * next paragraph) shall be included in all copies or substantial portions
 * of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
 * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT.
 * IN NO EVENT SHALL TUNGSTEN GRAPHICS AND/OR ITS SUPPLIERS BE LIABLE FOR
 * ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
 * TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
 * SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
 *
 **************************************************************************/
2863b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
/**
 * @file
 * TGSI to LLVM IR translation -- SoA.
 *
 * @author Jose Fonseca <jfonseca@vmware.com>
 *
 * Based on tgsi_sse2.c code written by Michal Krol, Keith Whitwell,
 * Brian Paul, and others.
 */
385811ed87d732101ab8cfbd087bc99d8c6c963f30José Fonseca
3963b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca#include "pipe/p_config.h"
4063b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca#include "pipe/p_shader_tokens.h"
4163b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca#include "util/u_debug.h"
4263b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca#include "util/u_math.h"
4363b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca#include "util/u_memory.h"
442410125d072faeb83c8373e676422f6c44c78febBrian Paul#include "tgsi/tgsi_dump.h"
457821664b15501b173b2304bbada758c33c5ff972José Fonseca#include "tgsi/tgsi_info.h"
4663b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca#include "tgsi/tgsi_parse.h"
4763b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca#include "tgsi/tgsi_util.h"
48021e0dc78b15fab29e761012860276c2597c8d8fZack Rusin#include "tgsi/tgsi_scan.h"
4963b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca#include "lp_bld_type.h"
5063b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca#include "lp_bld_const.h"
5163b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca#include "lp_bld_arit.h"
526d173da5c84142ee64f56f4c2e9e495dc1435e91José Fonseca#include "lp_bld_bitarit.h"
534363d4d0b945c4ca6c303fb337e1fac39e6e1ad6Brian Paul#include "lp_bld_gather.h"
547821664b15501b173b2304bbada758c33c5ff972José Fonseca#include "lp_bld_logic.h"
5563b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca#include "lp_bld_swizzle.h"
563d7a88674f9eb3320eeff511968f041426e25023José Fonseca#include "lp_bld_flow.h"
57ef81779850d1343b3ae284eb9beabeaf11934d4aJosé Fonseca#include "lp_bld_quad.h"
5863b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca#include "lp_bld_tgsi.h"
596c8c88f02f0dc9cf39ce51d068525a94fccd5dc7José Fonseca#include "lp_bld_limits.h"
6080f3cc36c511f62666162bca1d88c7746b98a27dZack Rusin#include "lp_bld_debug.h"
6163b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
6263b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
/** Loop header that steps CHAN over every channel index, 0 .. NUM_CHANNELS-1. */
#define FOR_EACH_CHANNEL( CHAN )\
   for (CHAN = 0; CHAN < NUM_CHANNELS; CHAN++)

/** Non-zero when bit CHAN is set in the write mask of INST's first destination. */
#define IS_DST0_CHANNEL_ENABLED( INST, CHAN )\
   ((INST)->Dst[0].Register.WriteMask & (1 << (CHAN)))

/** `if` header that guards the following statement on IS_DST0_CHANNEL_ENABLED. */
#define IF_IS_DST0_CHANNEL_ENABLED( INST, CHAN )\
   if (IS_DST0_CHANNEL_ENABLED( INST, CHAN ))

/**
 * Loop header visiting only the channels enabled in INST's first destination.
 *
 * Expands to a `for` immediately followed by an unbraced `if`, so the
 * statement that follows is the body of that `if`; a trailing `else` would
 * bind to it.
 */
#define FOR_EACH_DST0_ENABLED_CHANNEL( INST, CHAN )\
   FOR_EACH_CHANNEL( CHAN )\
      IF_IS_DST0_CHANNEL_ENABLED( INST, CHAN )

/* Channel indices, usable as the CHAN argument of the macros above. */
#define CHAN_X 0
#define CHAN_Y 1
#define CHAN_Z 2
#define CHAN_W 3
#define NUM_CHANNELS 4

/* NOTE(review): not used in this part of the file; presumably the initial
 * capacity of the stored instruction array -- confirm at the point of use. */
#define LP_MAX_INSTRUCTIONS 256
830b7ca2f8fcb187fb3aa37e0b6dc4b0a84101478fZack Rusin
8480f3cc36c511f62666162bca1d88c7746b98a27dZack Rusin
/**
 * Execution-mask bookkeeping for conditionals, loops and subroutine calls.
 *
 * All mask values are LLVM values of type int_vec_type.  The combined
 * exec_mask is recomputed by lp_exec_mask_update() whenever one of the
 * component masks or stack depths changes.
 */
struct lp_exec_mask {
   /** Build context whose builder and type are used to emit mask code. */
   struct lp_build_context *bld;

   /** Set by lp_exec_mask_update(): true while any of the three stacks is non-empty. */
   boolean has_mask;

   /** Integer vector type derived from bld->type; the type of every mask below. */
   LLVMTypeRef int_vec_type;

   /** cond_mask values of the enclosing conditionals, saved by lp_exec_mask_cond_push(). */
   LLVMValueRef cond_stack[LP_MAX_TGSI_NESTING];
   int cond_stack_size;
   /** Mask of the innermost open conditional (all ones when none is open). */
   LLVMValueRef cond_mask;

   /** Basic block at the head of the innermost loop; branch target of lp_exec_endloop(). */
   LLVMBasicBlockRef loop_block;
   /** Has bits cleared by lp_exec_continue(); restored at lp_exec_endloop(). */
   LLVMValueRef cont_mask;
   /** Has bits cleared by lp_exec_break(); kept across iterations through break_var. */
   LLVMValueRef break_mask;
   /** Alloca'd variable that carries break_mask from one loop iteration to the next. */
   LLVMValueRef break_var;
   /** Loop state of the enclosing loops, saved by lp_exec_bgnloop(). */
   struct {
      LLVMBasicBlockRef loop_block;
      LLVMValueRef cont_mask;
      LLVMValueRef break_mask;
      LLVMValueRef break_var;
   } loop_stack[LP_MAX_TGSI_NESTING];
   int loop_stack_size;

   /** Has bits cleared by lp_exec_mask_ret() while inside a subroutine. */
   LLVMValueRef ret_mask;
   /** Caller program counter and ret_mask, saved by lp_exec_mask_call(). */
   struct {
      int pc;
      LLVMValueRef ret_mask;
   } call_stack[LP_MAX_TGSI_NESTING];
   int call_stack_size;

   /** Combination of the masks above, as computed by lp_exec_mask_update(). */
   LLVMValueRef exec_mask;
};
11763b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
/**
 * State carried while translating one TGSI shader to LLVM IR in SoA form.
 *
 * NOTE(review): most members are only used outside this part of the file;
 * the per-field notes below restate the declarations and existing comments.
 */
struct lp_build_tgsi_soa_context
{
   struct lp_build_context base;

   /* Builder for integer masks and indices */
   struct lp_build_context uint_bld;

   LLVMValueRef consts_ptr;
   const LLVMValueRef *pos;
   const LLVMValueRef (*inputs)[NUM_CHANNELS];
   LLVMValueRef (*outputs)[NUM_CHANNELS];

   const struct lp_build_sampler_soa *sampler;

   /* Per-register, per-channel values for each register file. */
   LLVMValueRef immediates[LP_MAX_TGSI_IMMEDIATES][NUM_CHANNELS];
   LLVMValueRef temps[LP_MAX_TGSI_TEMPS][NUM_CHANNELS];
   LLVMValueRef addr[LP_MAX_TGSI_ADDRS][NUM_CHANNELS];
   LLVMValueRef preds[LP_MAX_TGSI_PREDS][NUM_CHANNELS];

   /* We allocate/use this array of temps if (1 << TGSI_FILE_TEMPORARY) is
    * set in the indirect_files field.
    * The temps[] array above is unused then.
    */
   LLVMValueRef temps_array;

   const struct tgsi_shader_info *info;
   /** bitmask indicating which register files are accessed indirectly */
   unsigned indirect_files;

   struct lp_build_mask_context *mask;
   /** Execution mask state for conditionals, loops and calls. */
   struct lp_exec_mask exec_mask;

   /* NOTE(review): presumably the stored instruction list and its allocated
    * capacity -- confirm where these are filled in. */
   struct tgsi_full_instruction *instructions;
   uint max_instructions;
};
15363b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
15480f3cc36c511f62666162bca1d88c7746b98a27dZack Rusinstatic void lp_exec_mask_init(struct lp_exec_mask *mask, struct lp_build_context *bld)
15580f3cc36c511f62666162bca1d88c7746b98a27dZack Rusin{
15680f3cc36c511f62666162bca1d88c7746b98a27dZack Rusin   mask->bld = bld;
15780f3cc36c511f62666162bca1d88c7746b98a27dZack Rusin   mask->has_mask = FALSE;
15880f3cc36c511f62666162bca1d88c7746b98a27dZack Rusin   mask->cond_stack_size = 0;
15918d406e8a8a838c82ee4ec5dbf244ab8bba0855eZack Rusin   mask->loop_stack_size = 0;
1600b7ca2f8fcb187fb3aa37e0b6dc4b0a84101478fZack Rusin   mask->call_stack_size = 0;
16180f3cc36c511f62666162bca1d88c7746b98a27dZack Rusin
16280f3cc36c511f62666162bca1d88c7746b98a27dZack Rusin   mask->int_vec_type = lp_build_int_vec_type(mask->bld->type);
16332a7209c0a0d5ae63f12056ed969087d942c6298José Fonseca   mask->exec_mask = mask->ret_mask = mask->break_mask = mask->cont_mask = mask->cond_mask =
1642d91903882e399e8ea7306fd37d5d214907247e6José Fonseca         LLVMConstAllOnes(mask->int_vec_type);
16580f3cc36c511f62666162bca1d88c7746b98a27dZack Rusin}
16680f3cc36c511f62666162bca1d88c7746b98a27dZack Rusin
16780f3cc36c511f62666162bca1d88c7746b98a27dZack Rusinstatic void lp_exec_mask_update(struct lp_exec_mask *mask)
16880f3cc36c511f62666162bca1d88c7746b98a27dZack Rusin{
16918d406e8a8a838c82ee4ec5dbf244ab8bba0855eZack Rusin   if (mask->loop_stack_size) {
17018a4a83ddab7655253fdb71d37393a32adcda488Zack Rusin      /*for loops we need to update the entire mask at runtime */
17118d406e8a8a838c82ee4ec5dbf244ab8bba0855eZack Rusin      LLVMValueRef tmp;
1727fe93f831d74ce46a161c0b0c89f00b9c18caa2bBrian Paul      assert(mask->break_mask);
17318d406e8a8a838c82ee4ec5dbf244ab8bba0855eZack Rusin      tmp = LLVMBuildAnd(mask->bld->builder,
17418d406e8a8a838c82ee4ec5dbf244ab8bba0855eZack Rusin                         mask->cont_mask,
17518d406e8a8a838c82ee4ec5dbf244ab8bba0855eZack Rusin                         mask->break_mask,
17618d406e8a8a838c82ee4ec5dbf244ab8bba0855eZack Rusin                         "maskcb");
17718d406e8a8a838c82ee4ec5dbf244ab8bba0855eZack Rusin      mask->exec_mask = LLVMBuildAnd(mask->bld->builder,
17818d406e8a8a838c82ee4ec5dbf244ab8bba0855eZack Rusin                                     mask->cond_mask,
17918d406e8a8a838c82ee4ec5dbf244ab8bba0855eZack Rusin                                     tmp,
18018d406e8a8a838c82ee4ec5dbf244ab8bba0855eZack Rusin                                     "maskfull");
18118d406e8a8a838c82ee4ec5dbf244ab8bba0855eZack Rusin   } else
18218d406e8a8a838c82ee4ec5dbf244ab8bba0855eZack Rusin      mask->exec_mask = mask->cond_mask;
18318d406e8a8a838c82ee4ec5dbf244ab8bba0855eZack Rusin
18432a7209c0a0d5ae63f12056ed969087d942c6298José Fonseca   if (mask->call_stack_size) {
1850b7ca2f8fcb187fb3aa37e0b6dc4b0a84101478fZack Rusin      mask->exec_mask = LLVMBuildAnd(mask->bld->builder,
1860b7ca2f8fcb187fb3aa37e0b6dc4b0a84101478fZack Rusin                                     mask->exec_mask,
18732a7209c0a0d5ae63f12056ed969087d942c6298José Fonseca                                     mask->ret_mask,
1880b7ca2f8fcb187fb3aa37e0b6dc4b0a84101478fZack Rusin                                     "callmask");
18932a7209c0a0d5ae63f12056ed969087d942c6298José Fonseca   }
19018d406e8a8a838c82ee4ec5dbf244ab8bba0855eZack Rusin
19118d406e8a8a838c82ee4ec5dbf244ab8bba0855eZack Rusin   mask->has_mask = (mask->cond_stack_size > 0 ||
1920b7ca2f8fcb187fb3aa37e0b6dc4b0a84101478fZack Rusin                     mask->loop_stack_size > 0 ||
1930b7ca2f8fcb187fb3aa37e0b6dc4b0a84101478fZack Rusin                     mask->call_stack_size > 0);
19480f3cc36c511f62666162bca1d88c7746b98a27dZack Rusin}
19580f3cc36c511f62666162bca1d88c7746b98a27dZack Rusin
19680f3cc36c511f62666162bca1d88c7746b98a27dZack Rusinstatic void lp_exec_mask_cond_push(struct lp_exec_mask *mask,
19780f3cc36c511f62666162bca1d88c7746b98a27dZack Rusin                                   LLVMValueRef val)
19880f3cc36c511f62666162bca1d88c7746b98a27dZack Rusin{
1996c8c88f02f0dc9cf39ce51d068525a94fccd5dc7José Fonseca   assert(mask->cond_stack_size < LP_MAX_TGSI_NESTING);
2002d91903882e399e8ea7306fd37d5d214907247e6José Fonseca   if (mask->cond_stack_size == 0) {
2012d91903882e399e8ea7306fd37d5d214907247e6José Fonseca      assert(mask->cond_mask == LLVMConstAllOnes(mask->int_vec_type));
2022d91903882e399e8ea7306fd37d5d214907247e6José Fonseca   }
20380f3cc36c511f62666162bca1d88c7746b98a27dZack Rusin   mask->cond_stack[mask->cond_stack_size++] = mask->cond_mask;
2042d91903882e399e8ea7306fd37d5d214907247e6José Fonseca   assert(LLVMTypeOf(val) == mask->int_vec_type);
2053fa3c33844b8491a204cda6ae8d67cd6ada78b3bBrian Paul   mask->cond_mask = LLVMBuildAnd(mask->bld->builder,
2063fa3c33844b8491a204cda6ae8d67cd6ada78b3bBrian Paul                                  mask->cond_mask,
2073fa3c33844b8491a204cda6ae8d67cd6ada78b3bBrian Paul                                  val,
2083fa3c33844b8491a204cda6ae8d67cd6ada78b3bBrian Paul                                  "");
20980f3cc36c511f62666162bca1d88c7746b98a27dZack Rusin   lp_exec_mask_update(mask);
21080f3cc36c511f62666162bca1d88c7746b98a27dZack Rusin}
21180f3cc36c511f62666162bca1d88c7746b98a27dZack Rusin
21280f3cc36c511f62666162bca1d88c7746b98a27dZack Rusinstatic void lp_exec_mask_cond_invert(struct lp_exec_mask *mask)
21380f3cc36c511f62666162bca1d88c7746b98a27dZack Rusin{
2142d91903882e399e8ea7306fd37d5d214907247e6José Fonseca   LLVMValueRef prev_mask;
2152d91903882e399e8ea7306fd37d5d214907247e6José Fonseca   LLVMValueRef inv_mask;
2162d91903882e399e8ea7306fd37d5d214907247e6José Fonseca
2172d91903882e399e8ea7306fd37d5d214907247e6José Fonseca   assert(mask->cond_stack_size);
2182d91903882e399e8ea7306fd37d5d214907247e6José Fonseca   prev_mask = mask->cond_stack[mask->cond_stack_size - 1];
2192d91903882e399e8ea7306fd37d5d214907247e6José Fonseca   if (mask->cond_stack_size == 1) {
2202d91903882e399e8ea7306fd37d5d214907247e6José Fonseca      assert(prev_mask == LLVMConstAllOnes(mask->int_vec_type));
221faf8215bae70f020420242dc812ef141fdcf5417Zack Rusin   }
222faf8215bae70f020420242dc812ef141fdcf5417Zack Rusin
2232d91903882e399e8ea7306fd37d5d214907247e6José Fonseca   inv_mask = LLVMBuildNot(mask->bld->builder, mask->cond_mask, "");
2242d91903882e399e8ea7306fd37d5d214907247e6José Fonseca
22580f3cc36c511f62666162bca1d88c7746b98a27dZack Rusin   mask->cond_mask = LLVMBuildAnd(mask->bld->builder,
22680f3cc36c511f62666162bca1d88c7746b98a27dZack Rusin                                  inv_mask,
22780f3cc36c511f62666162bca1d88c7746b98a27dZack Rusin                                  prev_mask, "");
22880f3cc36c511f62666162bca1d88c7746b98a27dZack Rusin   lp_exec_mask_update(mask);
22980f3cc36c511f62666162bca1d88c7746b98a27dZack Rusin}
23080f3cc36c511f62666162bca1d88c7746b98a27dZack Rusin
23180f3cc36c511f62666162bca1d88c7746b98a27dZack Rusinstatic void lp_exec_mask_cond_pop(struct lp_exec_mask *mask)
23280f3cc36c511f62666162bca1d88c7746b98a27dZack Rusin{
2332d91903882e399e8ea7306fd37d5d214907247e6José Fonseca   assert(mask->cond_stack_size);
23480f3cc36c511f62666162bca1d88c7746b98a27dZack Rusin   mask->cond_mask = mask->cond_stack[--mask->cond_stack_size];
23580f3cc36c511f62666162bca1d88c7746b98a27dZack Rusin   lp_exec_mask_update(mask);
23680f3cc36c511f62666162bca1d88c7746b98a27dZack Rusin}
23780f3cc36c511f62666162bca1d88c7746b98a27dZack Rusin
23818d406e8a8a838c82ee4ec5dbf244ab8bba0855eZack Rusinstatic void lp_exec_bgnloop(struct lp_exec_mask *mask)
23918d406e8a8a838c82ee4ec5dbf244ab8bba0855eZack Rusin{
2402d91903882e399e8ea7306fd37d5d214907247e6José Fonseca   if (mask->loop_stack_size == 0) {
2412d91903882e399e8ea7306fd37d5d214907247e6José Fonseca      assert(mask->loop_block == NULL);
2422d91903882e399e8ea7306fd37d5d214907247e6José Fonseca      assert(mask->cont_mask == LLVMConstAllOnes(mask->int_vec_type));
2432d91903882e399e8ea7306fd37d5d214907247e6José Fonseca      assert(mask->break_mask == LLVMConstAllOnes(mask->int_vec_type));
2442d91903882e399e8ea7306fd37d5d214907247e6José Fonseca      assert(mask->break_var == NULL);
2452d91903882e399e8ea7306fd37d5d214907247e6José Fonseca   }
2462d91903882e399e8ea7306fd37d5d214907247e6José Fonseca
2472d91903882e399e8ea7306fd37d5d214907247e6José Fonseca   assert(mask->loop_stack_size < LP_MAX_TGSI_NESTING);
24818d406e8a8a838c82ee4ec5dbf244ab8bba0855eZack Rusin
2492d91903882e399e8ea7306fd37d5d214907247e6José Fonseca   mask->loop_stack[mask->loop_stack_size].loop_block = mask->loop_block;
2502d91903882e399e8ea7306fd37d5d214907247e6José Fonseca   mask->loop_stack[mask->loop_stack_size].cont_mask = mask->cont_mask;
2512d91903882e399e8ea7306fd37d5d214907247e6José Fonseca   mask->loop_stack[mask->loop_stack_size].break_mask = mask->break_mask;
2522d91903882e399e8ea7306fd37d5d214907247e6José Fonseca   mask->loop_stack[mask->loop_stack_size].break_var = mask->break_var;
2532d91903882e399e8ea7306fd37d5d214907247e6José Fonseca   ++mask->loop_stack_size;
2543a423dcf9dfa725a4e5dca60f0f2b02599d2ed9bZack Rusin
2552d91903882e399e8ea7306fd37d5d214907247e6José Fonseca   mask->break_var = lp_build_alloca(mask->bld->builder, mask->int_vec_type, "");
2562d91903882e399e8ea7306fd37d5d214907247e6José Fonseca   LLVMBuildStore(mask->bld->builder, mask->break_mask, mask->break_var);
2576c8c88f02f0dc9cf39ce51d068525a94fccd5dc7José Fonseca
25818d406e8a8a838c82ee4ec5dbf244ab8bba0855eZack Rusin   mask->loop_block = lp_build_insert_new_block(mask->bld->builder, "bgnloop");
25918d406e8a8a838c82ee4ec5dbf244ab8bba0855eZack Rusin   LLVMBuildBr(mask->bld->builder, mask->loop_block);
26018d406e8a8a838c82ee4ec5dbf244ab8bba0855eZack Rusin   LLVMPositionBuilderAtEnd(mask->bld->builder, mask->loop_block);
26118d406e8a8a838c82ee4ec5dbf244ab8bba0855eZack Rusin
2622d91903882e399e8ea7306fd37d5d214907247e6José Fonseca   mask->break_mask = LLVMBuildLoad(mask->bld->builder, mask->break_var, "");
2632d91903882e399e8ea7306fd37d5d214907247e6José Fonseca
26418d406e8a8a838c82ee4ec5dbf244ab8bba0855eZack Rusin   lp_exec_mask_update(mask);
26518d406e8a8a838c82ee4ec5dbf244ab8bba0855eZack Rusin}
26618d406e8a8a838c82ee4ec5dbf244ab8bba0855eZack Rusin
26718d406e8a8a838c82ee4ec5dbf244ab8bba0855eZack Rusinstatic void lp_exec_break(struct lp_exec_mask *mask)
26818d406e8a8a838c82ee4ec5dbf244ab8bba0855eZack Rusin{
26918d406e8a8a838c82ee4ec5dbf244ab8bba0855eZack Rusin   LLVMValueRef exec_mask = LLVMBuildNot(mask->bld->builder,
27018d406e8a8a838c82ee4ec5dbf244ab8bba0855eZack Rusin                                         mask->exec_mask,
27118d406e8a8a838c82ee4ec5dbf244ab8bba0855eZack Rusin                                         "break");
27218d406e8a8a838c82ee4ec5dbf244ab8bba0855eZack Rusin
273d2b6ed7c4daf094bfe3fa4e0318133d0a8ea3cf6Zack Rusin   mask->break_mask = LLVMBuildAnd(mask->bld->builder,
274d2b6ed7c4daf094bfe3fa4e0318133d0a8ea3cf6Zack Rusin                                   mask->break_mask,
275d2b6ed7c4daf094bfe3fa4e0318133d0a8ea3cf6Zack Rusin                                   exec_mask, "break_full");
27618d406e8a8a838c82ee4ec5dbf244ab8bba0855eZack Rusin
27718d406e8a8a838c82ee4ec5dbf244ab8bba0855eZack Rusin   lp_exec_mask_update(mask);
27818d406e8a8a838c82ee4ec5dbf244ab8bba0855eZack Rusin}
27918d406e8a8a838c82ee4ec5dbf244ab8bba0855eZack Rusin
28018d406e8a8a838c82ee4ec5dbf244ab8bba0855eZack Rusinstatic void lp_exec_continue(struct lp_exec_mask *mask)
28118d406e8a8a838c82ee4ec5dbf244ab8bba0855eZack Rusin{
28218d406e8a8a838c82ee4ec5dbf244ab8bba0855eZack Rusin   LLVMValueRef exec_mask = LLVMBuildNot(mask->bld->builder,
28318d406e8a8a838c82ee4ec5dbf244ab8bba0855eZack Rusin                                         mask->exec_mask,
28418d406e8a8a838c82ee4ec5dbf244ab8bba0855eZack Rusin                                         "");
28518d406e8a8a838c82ee4ec5dbf244ab8bba0855eZack Rusin
286d2b6ed7c4daf094bfe3fa4e0318133d0a8ea3cf6Zack Rusin   mask->cont_mask = LLVMBuildAnd(mask->bld->builder,
287d2b6ed7c4daf094bfe3fa4e0318133d0a8ea3cf6Zack Rusin                                  mask->cont_mask,
288d2b6ed7c4daf094bfe3fa4e0318133d0a8ea3cf6Zack Rusin                                  exec_mask, "");
28918d406e8a8a838c82ee4ec5dbf244ab8bba0855eZack Rusin
29018d406e8a8a838c82ee4ec5dbf244ab8bba0855eZack Rusin   lp_exec_mask_update(mask);
29118d406e8a8a838c82ee4ec5dbf244ab8bba0855eZack Rusin}
29218d406e8a8a838c82ee4ec5dbf244ab8bba0855eZack Rusin
29318d406e8a8a838c82ee4ec5dbf244ab8bba0855eZack Rusin
29418d406e8a8a838c82ee4ec5dbf244ab8bba0855eZack Rusinstatic void lp_exec_endloop(struct lp_exec_mask *mask)
29518d406e8a8a838c82ee4ec5dbf244ab8bba0855eZack Rusin{
29618d406e8a8a838c82ee4ec5dbf244ab8bba0855eZack Rusin   LLVMBasicBlockRef endloop;
297d42229707ad4be9be5a8e122354be7102d6ec348Jose Fonseca   LLVMTypeRef reg_type = LLVMIntType(mask->bld->type.width*
298d42229707ad4be9be5a8e122354be7102d6ec348Jose Fonseca                                      mask->bld->type.length);
2997fe93f831d74ce46a161c0b0c89f00b9c18caa2bBrian Paul   LLVMValueRef i1cond;
3007fe93f831d74ce46a161c0b0c89f00b9c18caa2bBrian Paul
3017fe93f831d74ce46a161c0b0c89f00b9c18caa2bBrian Paul   assert(mask->break_mask);
3027fe93f831d74ce46a161c0b0c89f00b9c18caa2bBrian Paul
3032d91903882e399e8ea7306fd37d5d214907247e6José Fonseca   /*
3042d91903882e399e8ea7306fd37d5d214907247e6José Fonseca    * Restore the cont_mask, but don't pop
3052d91903882e399e8ea7306fd37d5d214907247e6José Fonseca    */
3062d91903882e399e8ea7306fd37d5d214907247e6José Fonseca   assert(mask->loop_stack_size);
3072d91903882e399e8ea7306fd37d5d214907247e6José Fonseca   mask->cont_mask = mask->loop_stack[mask->loop_stack_size - 1].cont_mask;
3082d91903882e399e8ea7306fd37d5d214907247e6José Fonseca   lp_exec_mask_update(mask);
3092d91903882e399e8ea7306fd37d5d214907247e6José Fonseca
3102d91903882e399e8ea7306fd37d5d214907247e6José Fonseca   /*
3112d91903882e399e8ea7306fd37d5d214907247e6José Fonseca    * Unlike the continue mask, the break_mask must be preserved across loop
3122d91903882e399e8ea7306fd37d5d214907247e6José Fonseca    * iterations
3132d91903882e399e8ea7306fd37d5d214907247e6José Fonseca    */
3142d91903882e399e8ea7306fd37d5d214907247e6José Fonseca   LLVMBuildStore(mask->bld->builder, mask->break_mask, mask->break_var);
3152d91903882e399e8ea7306fd37d5d214907247e6José Fonseca
316d42229707ad4be9be5a8e122354be7102d6ec348Jose Fonseca   /* i1cond = (mask == 0) */
3177fe93f831d74ce46a161c0b0c89f00b9c18caa2bBrian Paul   i1cond = LLVMBuildICmp(
318d42229707ad4be9be5a8e122354be7102d6ec348Jose Fonseca      mask->bld->builder,
319d42229707ad4be9be5a8e122354be7102d6ec348Jose Fonseca      LLVMIntNE,
3202d91903882e399e8ea7306fd37d5d214907247e6José Fonseca      LLVMBuildBitCast(mask->bld->builder, mask->exec_mask, reg_type, ""),
321d42229707ad4be9be5a8e122354be7102d6ec348Jose Fonseca      LLVMConstNull(reg_type), "");
32218d406e8a8a838c82ee4ec5dbf244ab8bba0855eZack Rusin
32318d406e8a8a838c82ee4ec5dbf244ab8bba0855eZack Rusin   endloop = lp_build_insert_new_block(mask->bld->builder, "endloop");
32418d406e8a8a838c82ee4ec5dbf244ab8bba0855eZack Rusin
32518d406e8a8a838c82ee4ec5dbf244ab8bba0855eZack Rusin   LLVMBuildCondBr(mask->bld->builder,
326ac33e7752d22f03db84e6a4c822b3a3f41d05f77Zack Rusin                   i1cond, mask->loop_block, endloop);
32718d406e8a8a838c82ee4ec5dbf244ab8bba0855eZack Rusin
32818d406e8a8a838c82ee4ec5dbf244ab8bba0855eZack Rusin   LLVMPositionBuilderAtEnd(mask->bld->builder, endloop);
32918d406e8a8a838c82ee4ec5dbf244ab8bba0855eZack Rusin
3302d91903882e399e8ea7306fd37d5d214907247e6José Fonseca   assert(mask->loop_stack_size);
3312d91903882e399e8ea7306fd37d5d214907247e6José Fonseca   --mask->loop_stack_size;
3322d91903882e399e8ea7306fd37d5d214907247e6José Fonseca   mask->loop_block = mask->loop_stack[mask->loop_stack_size].loop_block;
3332d91903882e399e8ea7306fd37d5d214907247e6José Fonseca   mask->cont_mask = mask->loop_stack[mask->loop_stack_size].cont_mask;
3342d91903882e399e8ea7306fd37d5d214907247e6José Fonseca   mask->break_mask = mask->loop_stack[mask->loop_stack_size].break_mask;
3352d91903882e399e8ea7306fd37d5d214907247e6José Fonseca   mask->break_var = mask->loop_stack[mask->loop_stack_size].break_var;
33618d406e8a8a838c82ee4ec5dbf244ab8bba0855eZack Rusin
33718d406e8a8a838c82ee4ec5dbf244ab8bba0855eZack Rusin   lp_exec_mask_update(mask);
33818d406e8a8a838c82ee4ec5dbf244ab8bba0855eZack Rusin}
33918d406e8a8a838c82ee4ec5dbf244ab8bba0855eZack Rusin
34018a4a83ddab7655253fdb71d37393a32adcda488Zack Rusin/* stores val into an address pointed to by dst.
34118a4a83ddab7655253fdb71d37393a32adcda488Zack Rusin * mask->exec_mask is used to figure out which bits of val
34218a4a83ddab7655253fdb71d37393a32adcda488Zack Rusin * should be stored into the address
34318a4a83ddab7655253fdb71d37393a32adcda488Zack Rusin * (0 means don't store this bit, 1 means do store).
34418a4a83ddab7655253fdb71d37393a32adcda488Zack Rusin */
34580f3cc36c511f62666162bca1d88c7746b98a27dZack Rusinstatic void lp_exec_mask_store(struct lp_exec_mask *mask,
346ff6c78f44f2f741f4825b07dbc15b3a951fe9b2cJosé Fonseca                               LLVMValueRef pred,
34780f3cc36c511f62666162bca1d88c7746b98a27dZack Rusin                               LLVMValueRef val,
34880f3cc36c511f62666162bca1d88c7746b98a27dZack Rusin                               LLVMValueRef dst)
34980f3cc36c511f62666162bca1d88c7746b98a27dZack Rusin{
350ff6c78f44f2f741f4825b07dbc15b3a951fe9b2cJosé Fonseca   /* Mix the predicate and execution mask */
35180f3cc36c511f62666162bca1d88c7746b98a27dZack Rusin   if (mask->has_mask) {
352ff6c78f44f2f741f4825b07dbc15b3a951fe9b2cJosé Fonseca      if (pred) {
35354b94ee96a6d750d57d99ae9819fcf8206d4680dJosé Fonseca         pred = LLVMBuildAnd(mask->bld->builder, pred, mask->exec_mask, "");
354ff6c78f44f2f741f4825b07dbc15b3a951fe9b2cJosé Fonseca      } else {
355ff6c78f44f2f741f4825b07dbc15b3a951fe9b2cJosé Fonseca         pred = mask->exec_mask;
356ff6c78f44f2f741f4825b07dbc15b3a951fe9b2cJosé Fonseca      }
357ff6c78f44f2f741f4825b07dbc15b3a951fe9b2cJosé Fonseca   }
358ff6c78f44f2f741f4825b07dbc15b3a951fe9b2cJosé Fonseca
359ff6c78f44f2f741f4825b07dbc15b3a951fe9b2cJosé Fonseca   if (pred) {
36080f3cc36c511f62666162bca1d88c7746b98a27dZack Rusin      LLVMValueRef real_val, dst_val;
36180f3cc36c511f62666162bca1d88c7746b98a27dZack Rusin
36280f3cc36c511f62666162bca1d88c7746b98a27dZack Rusin      dst_val = LLVMBuildLoad(mask->bld->builder, dst, "");
36380f3cc36c511f62666162bca1d88c7746b98a27dZack Rusin      real_val = lp_build_select(mask->bld,
364ff6c78f44f2f741f4825b07dbc15b3a951fe9b2cJosé Fonseca                                 pred,
36580f3cc36c511f62666162bca1d88c7746b98a27dZack Rusin                                 val, dst_val);
36680f3cc36c511f62666162bca1d88c7746b98a27dZack Rusin
36780f3cc36c511f62666162bca1d88c7746b98a27dZack Rusin      LLVMBuildStore(mask->bld->builder, real_val, dst);
36880f3cc36c511f62666162bca1d88c7746b98a27dZack Rusin   } else
36980f3cc36c511f62666162bca1d88c7746b98a27dZack Rusin      LLVMBuildStore(mask->bld->builder, val, dst);
37080f3cc36c511f62666162bca1d88c7746b98a27dZack Rusin}
37180f3cc36c511f62666162bca1d88c7746b98a27dZack Rusin
3720b7ca2f8fcb187fb3aa37e0b6dc4b0a84101478fZack Rusinstatic void lp_exec_mask_call(struct lp_exec_mask *mask,
3730b7ca2f8fcb187fb3aa37e0b6dc4b0a84101478fZack Rusin                              int func,
3740b7ca2f8fcb187fb3aa37e0b6dc4b0a84101478fZack Rusin                              int *pc)
3750b7ca2f8fcb187fb3aa37e0b6dc4b0a84101478fZack Rusin{
37632a7209c0a0d5ae63f12056ed969087d942c6298José Fonseca   assert(mask->call_stack_size < LP_MAX_TGSI_NESTING);
3770b7ca2f8fcb187fb3aa37e0b6dc4b0a84101478fZack Rusin   mask->call_stack[mask->call_stack_size].pc = *pc;
37832a7209c0a0d5ae63f12056ed969087d942c6298José Fonseca   mask->call_stack[mask->call_stack_size].ret_mask = mask->ret_mask;
37932a7209c0a0d5ae63f12056ed969087d942c6298José Fonseca   mask->call_stack_size++;
3800b7ca2f8fcb187fb3aa37e0b6dc4b0a84101478fZack Rusin   *pc = func;
3810b7ca2f8fcb187fb3aa37e0b6dc4b0a84101478fZack Rusin}
3820b7ca2f8fcb187fb3aa37e0b6dc4b0a84101478fZack Rusin
3830b7ca2f8fcb187fb3aa37e0b6dc4b0a84101478fZack Rusinstatic void lp_exec_mask_ret(struct lp_exec_mask *mask, int *pc)
3840b7ca2f8fcb187fb3aa37e0b6dc4b0a84101478fZack Rusin{
3850b7ca2f8fcb187fb3aa37e0b6dc4b0a84101478fZack Rusin   LLVMValueRef exec_mask;
38632a7209c0a0d5ae63f12056ed969087d942c6298José Fonseca
3870b7ca2f8fcb187fb3aa37e0b6dc4b0a84101478fZack Rusin   if (mask->call_stack_size == 0) {
3880b7ca2f8fcb187fb3aa37e0b6dc4b0a84101478fZack Rusin      /* returning from main() */
3890b7ca2f8fcb187fb3aa37e0b6dc4b0a84101478fZack Rusin      *pc = -1;
3900b7ca2f8fcb187fb3aa37e0b6dc4b0a84101478fZack Rusin      return;
3910b7ca2f8fcb187fb3aa37e0b6dc4b0a84101478fZack Rusin   }
3920b7ca2f8fcb187fb3aa37e0b6dc4b0a84101478fZack Rusin   exec_mask = LLVMBuildNot(mask->bld->builder,
3930b7ca2f8fcb187fb3aa37e0b6dc4b0a84101478fZack Rusin                            mask->exec_mask,
3940b7ca2f8fcb187fb3aa37e0b6dc4b0a84101478fZack Rusin                            "ret");
3950b7ca2f8fcb187fb3aa37e0b6dc4b0a84101478fZack Rusin
39632a7209c0a0d5ae63f12056ed969087d942c6298José Fonseca   mask->ret_mask = LLVMBuildAnd(mask->bld->builder,
39732a7209c0a0d5ae63f12056ed969087d942c6298José Fonseca                                 mask->ret_mask,
39832a7209c0a0d5ae63f12056ed969087d942c6298José Fonseca                                 exec_mask, "ret_full");
3990b7ca2f8fcb187fb3aa37e0b6dc4b0a84101478fZack Rusin
4000b7ca2f8fcb187fb3aa37e0b6dc4b0a84101478fZack Rusin   lp_exec_mask_update(mask);
4010b7ca2f8fcb187fb3aa37e0b6dc4b0a84101478fZack Rusin}
4020b7ca2f8fcb187fb3aa37e0b6dc4b0a84101478fZack Rusin
/**
 * Hook for the beginning of a subroutine body.
 * Currently performs no work.
 */
static void lp_exec_mask_bgnsub(struct lp_exec_mask *mask)
{
   (void) mask;
}
4060b7ca2f8fcb187fb3aa37e0b6dc4b0a84101478fZack Rusin
4070b7ca2f8fcb187fb3aa37e0b6dc4b0a84101478fZack Rusinstatic void lp_exec_mask_endsub(struct lp_exec_mask *mask, int *pc)
4080b7ca2f8fcb187fb3aa37e0b6dc4b0a84101478fZack Rusin{
40932a7209c0a0d5ae63f12056ed969087d942c6298José Fonseca   assert(mask->call_stack_size);
4100b7ca2f8fcb187fb3aa37e0b6dc4b0a84101478fZack Rusin   mask->call_stack_size--;
4110b7ca2f8fcb187fb3aa37e0b6dc4b0a84101478fZack Rusin   *pc = mask->call_stack[mask->call_stack_size].pc;
41232a7209c0a0d5ae63f12056ed969087d942c6298José Fonseca   mask->ret_mask = mask->call_stack[mask->call_stack_size].ret_mask;
41332a7209c0a0d5ae63f12056ed969087d942c6298José Fonseca   lp_exec_mask_update(mask);
4140b7ca2f8fcb187fb3aa37e0b6dc4b0a84101478fZack Rusin}
41586226d5ea186d3fc6013bc40a341e0c0a891de39José Fonseca
416695814a15b4d64e1fa829d51f18c4089837929c3Brian Paul
417695814a15b4d64e1fa829d51f18c4089837929c3Brian Paul/**
418695814a15b4d64e1fa829d51f18c4089837929c3Brian Paul * Return pointer to a temporary register channel (src or dest).
419f674ed6b0662a15ab8298da0848a4c82694e0c95Brian Paul * Note that indirect addressing cannot be handled here.
420695814a15b4d64e1fa829d51f18c4089837929c3Brian Paul * \param index  which temporary register
421695814a15b4d64e1fa829d51f18c4089837929c3Brian Paul * \param chan  which channel of the temp register.
422695814a15b4d64e1fa829d51f18c4089837929c3Brian Paul */
42386226d5ea186d3fc6013bc40a341e0c0a891de39José Fonsecastatic LLVMValueRef
424263e038431f24f24aaec252e135ffc9f2f09640eJosé Fonsecaget_temp_ptr(struct lp_build_tgsi_soa_context *bld,
425263e038431f24f24aaec252e135ffc9f2f09640eJosé Fonseca             unsigned index,
426f674ed6b0662a15ab8298da0848a4c82694e0c95Brian Paul             unsigned chan)
427263e038431f24f24aaec252e135ffc9f2f09640eJosé Fonseca{
428263e038431f24f24aaec252e135ffc9f2f09640eJosé Fonseca   assert(chan < 4);
4293662afd87d61e3f65843b210a7e8c9c8a6cb27f0Brian Paul   if (bld->indirect_files & (1 << TGSI_FILE_TEMPORARY)) {
430f674ed6b0662a15ab8298da0848a4c82694e0c95Brian Paul      LLVMValueRef lindex = lp_build_const_int32(index * 4 + chan);
431263e038431f24f24aaec252e135ffc9f2f09640eJosé Fonseca      return LLVMBuildGEP(bld->base.builder, bld->temps_array, &lindex, 1, "");
432263e038431f24f24aaec252e135ffc9f2f09640eJosé Fonseca   }
433695814a15b4d64e1fa829d51f18c4089837929c3Brian Paul   else {
434695814a15b4d64e1fa829d51f18c4089837929c3Brian Paul      return bld->temps[index][chan];
435695814a15b4d64e1fa829d51f18c4089837929c3Brian Paul   }
436263e038431f24f24aaec252e135ffc9f2f09640eJosé Fonseca}
437263e038431f24f24aaec252e135ffc9f2f09640eJosé Fonseca
4384363d4d0b945c4ca6c303fb337e1fac39e6e1ad6Brian Paul
4394363d4d0b945c4ca6c303fb337e1fac39e6e1ad6Brian Paul/**
4404363d4d0b945c4ca6c303fb337e1fac39e6e1ad6Brian Paul * Gather vector.
4414363d4d0b945c4ca6c303fb337e1fac39e6e1ad6Brian Paul * XXX the lp_build_gather() function should be capable of doing this
4424363d4d0b945c4ca6c303fb337e1fac39e6e1ad6Brian Paul * with a little work.
4434363d4d0b945c4ca6c303fb337e1fac39e6e1ad6Brian Paul */
4444363d4d0b945c4ca6c303fb337e1fac39e6e1ad6Brian Paulstatic LLVMValueRef
4454363d4d0b945c4ca6c303fb337e1fac39e6e1ad6Brian Paulbuild_gather(struct lp_build_tgsi_soa_context *bld,
4464363d4d0b945c4ca6c303fb337e1fac39e6e1ad6Brian Paul             LLVMValueRef base_ptr,
4474363d4d0b945c4ca6c303fb337e1fac39e6e1ad6Brian Paul             LLVMValueRef indexes)
4484363d4d0b945c4ca6c303fb337e1fac39e6e1ad6Brian Paul{
4494363d4d0b945c4ca6c303fb337e1fac39e6e1ad6Brian Paul   LLVMValueRef res = bld->base.undef;
4504363d4d0b945c4ca6c303fb337e1fac39e6e1ad6Brian Paul   unsigned i;
4514363d4d0b945c4ca6c303fb337e1fac39e6e1ad6Brian Paul
4524363d4d0b945c4ca6c303fb337e1fac39e6e1ad6Brian Paul   /*
4534363d4d0b945c4ca6c303fb337e1fac39e6e1ad6Brian Paul    * Loop over elements of index_vec, load scalar value, insert it into 'res'.
4544363d4d0b945c4ca6c303fb337e1fac39e6e1ad6Brian Paul    */
4554363d4d0b945c4ca6c303fb337e1fac39e6e1ad6Brian Paul   for (i = 0; i < bld->base.type.length; i++) {
4564363d4d0b945c4ca6c303fb337e1fac39e6e1ad6Brian Paul      LLVMValueRef ii = LLVMConstInt(LLVMInt32Type(), i, 0);
4574363d4d0b945c4ca6c303fb337e1fac39e6e1ad6Brian Paul      LLVMValueRef index = LLVMBuildExtractElement(bld->base.builder,
4584363d4d0b945c4ca6c303fb337e1fac39e6e1ad6Brian Paul                                                   indexes, ii, "");
4594363d4d0b945c4ca6c303fb337e1fac39e6e1ad6Brian Paul      LLVMValueRef scalar_ptr = LLVMBuildGEP(bld->base.builder, base_ptr,
4603ded3e98ffc36820c8ab318d736eab99bb16f26bBrian Paul                                             &index, 1, "gather_ptr");
4614363d4d0b945c4ca6c303fb337e1fac39e6e1ad6Brian Paul      LLVMValueRef scalar = LLVMBuildLoad(bld->base.builder, scalar_ptr, "");
4624363d4d0b945c4ca6c303fb337e1fac39e6e1ad6Brian Paul
4634363d4d0b945c4ca6c303fb337e1fac39e6e1ad6Brian Paul      res = LLVMBuildInsertElement(bld->base.builder, res, scalar, ii, "");
4644363d4d0b945c4ca6c303fb337e1fac39e6e1ad6Brian Paul   }
4654363d4d0b945c4ca6c303fb337e1fac39e6e1ad6Brian Paul
4664363d4d0b945c4ca6c303fb337e1fac39e6e1ad6Brian Paul   return res;
4674363d4d0b945c4ca6c303fb337e1fac39e6e1ad6Brian Paul}
4684363d4d0b945c4ca6c303fb337e1fac39e6e1ad6Brian Paul
4694363d4d0b945c4ca6c303fb337e1fac39e6e1ad6Brian Paul
47063b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca/**
4712fefbc79ac8bb55197ff817feeca2626585d7a8cBrian Paul * Scatter/store vector.
4722fefbc79ac8bb55197ff817feeca2626585d7a8cBrian Paul */
4732fefbc79ac8bb55197ff817feeca2626585d7a8cBrian Paulstatic void
4742fefbc79ac8bb55197ff817feeca2626585d7a8cBrian Paulbuild_scatter(struct lp_build_tgsi_soa_context *bld,
4752fefbc79ac8bb55197ff817feeca2626585d7a8cBrian Paul              LLVMValueRef base_ptr,
4762fefbc79ac8bb55197ff817feeca2626585d7a8cBrian Paul              LLVMValueRef indexes,
4772fefbc79ac8bb55197ff817feeca2626585d7a8cBrian Paul              LLVMValueRef values)
4782fefbc79ac8bb55197ff817feeca2626585d7a8cBrian Paul{
4792fefbc79ac8bb55197ff817feeca2626585d7a8cBrian Paul   LLVMBuilderRef builder = bld->base.builder;
4802fefbc79ac8bb55197ff817feeca2626585d7a8cBrian Paul   unsigned i;
4812fefbc79ac8bb55197ff817feeca2626585d7a8cBrian Paul
4822fefbc79ac8bb55197ff817feeca2626585d7a8cBrian Paul   /*
4832fefbc79ac8bb55197ff817feeca2626585d7a8cBrian Paul    * Loop over elements of index_vec, store scalar value.
4842fefbc79ac8bb55197ff817feeca2626585d7a8cBrian Paul    */
4852fefbc79ac8bb55197ff817feeca2626585d7a8cBrian Paul   for (i = 0; i < bld->base.type.length; i++) {
4862fefbc79ac8bb55197ff817feeca2626585d7a8cBrian Paul      LLVMValueRef ii = LLVMConstInt(LLVMInt32Type(), i, 0);
4872fefbc79ac8bb55197ff817feeca2626585d7a8cBrian Paul      LLVMValueRef index = LLVMBuildExtractElement(builder, indexes, ii, "");
4882fefbc79ac8bb55197ff817feeca2626585d7a8cBrian Paul      LLVMValueRef scalar_ptr = LLVMBuildGEP(builder, base_ptr, &index, 1, "scatter_ptr");
4892fefbc79ac8bb55197ff817feeca2626585d7a8cBrian Paul      LLVMValueRef val = LLVMBuildExtractElement(builder, values, ii, "scatter_val");
4902fefbc79ac8bb55197ff817feeca2626585d7a8cBrian Paul
4912fefbc79ac8bb55197ff817feeca2626585d7a8cBrian Paul      LLVMBuildStore(builder, val, scalar_ptr);
4922fefbc79ac8bb55197ff817feeca2626585d7a8cBrian Paul   }
4932fefbc79ac8bb55197ff817feeca2626585d7a8cBrian Paul}
4942fefbc79ac8bb55197ff817feeca2626585d7a8cBrian Paul
4952fefbc79ac8bb55197ff817feeca2626585d7a8cBrian Paul
4962fefbc79ac8bb55197ff817feeca2626585d7a8cBrian Paul/**
4970115f07507fc661a0a19564c496a781c3dcbc7a0Brian Paul * Read the current value of the ADDR register, convert the floats to
4982fefbc79ac8bb55197ff817feeca2626585d7a8cBrian Paul * ints, add the base index and return the vector of offsets.
4990115f07507fc661a0a19564c496a781c3dcbc7a0Brian Paul * The offsets will be used to index into the constant buffer or
5000115f07507fc661a0a19564c496a781c3dcbc7a0Brian Paul * temporary register file.
5010115f07507fc661a0a19564c496a781c3dcbc7a0Brian Paul */
5020115f07507fc661a0a19564c496a781c3dcbc7a0Brian Paulstatic LLVMValueRef
5036d173da5c84142ee64f56f4c2e9e495dc1435e91José Fonsecaget_indirect_index(struct lp_build_tgsi_soa_context *bld,
5046d173da5c84142ee64f56f4c2e9e495dc1435e91José Fonseca                   unsigned reg_file, unsigned reg_index,
5056d173da5c84142ee64f56f4c2e9e495dc1435e91José Fonseca                   const struct tgsi_src_register *indirect_reg)
5060115f07507fc661a0a19564c496a781c3dcbc7a0Brian Paul{
5076d173da5c84142ee64f56f4c2e9e495dc1435e91José Fonseca   struct lp_build_context *uint_bld = &bld->uint_bld;
5080115f07507fc661a0a19564c496a781c3dcbc7a0Brian Paul   /* always use X component of address register */
5093d5b9c1f2d3340259dd0d8765090a5a963074f29José Fonseca   unsigned swizzle = indirect_reg->SwizzleX;
5106d173da5c84142ee64f56f4c2e9e495dc1435e91José Fonseca   LLVMValueRef base;
5116d173da5c84142ee64f56f4c2e9e495dc1435e91José Fonseca   LLVMValueRef rel;
5126d173da5c84142ee64f56f4c2e9e495dc1435e91José Fonseca   LLVMValueRef max_index;
5136d173da5c84142ee64f56f4c2e9e495dc1435e91José Fonseca   LLVMValueRef index;
5140115f07507fc661a0a19564c496a781c3dcbc7a0Brian Paul
5156d173da5c84142ee64f56f4c2e9e495dc1435e91José Fonseca   assert(bld->indirect_files & (1 << reg_file));
5166d173da5c84142ee64f56f4c2e9e495dc1435e91José Fonseca
5176d173da5c84142ee64f56f4c2e9e495dc1435e91José Fonseca   base = lp_build_const_int_vec(uint_bld->type, reg_index);
5186d173da5c84142ee64f56f4c2e9e495dc1435e91José Fonseca
5196d173da5c84142ee64f56f4c2e9e495dc1435e91José Fonseca   assert(swizzle < 4);
5206d173da5c84142ee64f56f4c2e9e495dc1435e91José Fonseca   rel = LLVMBuildLoad(bld->base.builder,
5216d173da5c84142ee64f56f4c2e9e495dc1435e91José Fonseca                        bld->addr[indirect_reg->Index][swizzle],
5226d173da5c84142ee64f56f4c2e9e495dc1435e91José Fonseca                        "load addr reg");
5230115f07507fc661a0a19564c496a781c3dcbc7a0Brian Paul
5240115f07507fc661a0a19564c496a781c3dcbc7a0Brian Paul   /* for indexing we want integers */
5256d173da5c84142ee64f56f4c2e9e495dc1435e91José Fonseca   rel = LLVMBuildFPToSI(bld->base.builder,
5266d173da5c84142ee64f56f4c2e9e495dc1435e91José Fonseca                         rel,
5276d173da5c84142ee64f56f4c2e9e495dc1435e91José Fonseca                         uint_bld->vec_type, "");
5286d173da5c84142ee64f56f4c2e9e495dc1435e91José Fonseca
5296d173da5c84142ee64f56f4c2e9e495dc1435e91José Fonseca   index = lp_build_add(uint_bld, base, rel);
5300115f07507fc661a0a19564c496a781c3dcbc7a0Brian Paul
5316d173da5c84142ee64f56f4c2e9e495dc1435e91José Fonseca   max_index = lp_build_const_int_vec(uint_bld->type,
5326d173da5c84142ee64f56f4c2e9e495dc1435e91José Fonseca                                      bld->info->file_max[reg_file]);
5330115f07507fc661a0a19564c496a781c3dcbc7a0Brian Paul
5346d173da5c84142ee64f56f4c2e9e495dc1435e91José Fonseca   assert(!uint_bld->type.sign);
5356d173da5c84142ee64f56f4c2e9e495dc1435e91José Fonseca   index = lp_build_min(uint_bld, index, max_index);
5366d173da5c84142ee64f56f4c2e9e495dc1435e91José Fonseca
5376d173da5c84142ee64f56f4c2e9e495dc1435e91José Fonseca   return index;
5380115f07507fc661a0a19564c496a781c3dcbc7a0Brian Paul}
5390115f07507fc661a0a19564c496a781c3dcbc7a0Brian Paul
5400115f07507fc661a0a19564c496a781c3dcbc7a0Brian Paul
5410115f07507fc661a0a19564c496a781c3dcbc7a0Brian Paul/**
54263b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca * Register fetch.
54363b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca */
54463b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonsecastatic LLVMValueRef
54563b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonsecaemit_fetch(
54663b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   struct lp_build_tgsi_soa_context *bld,
5472fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca   const struct tgsi_full_instruction *inst,
548ec0e7b16bb6753bedbd611a97062934bfca03aa7Brian Paul   unsigned src_op,
54963b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   const unsigned chan_index )
55063b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca{
5516d173da5c84142ee64f56f4c2e9e495dc1435e91José Fonseca   struct lp_build_context *uint_bld = &bld->uint_bld;
552ec0e7b16bb6753bedbd611a97062934bfca03aa7Brian Paul   const struct tgsi_full_src_register *reg = &inst->Src[src_op];
55385c6799f6e2645e708eb03201e91f3285de7d9e1Brian Paul   const unsigned swizzle =
55485c6799f6e2645e708eb03201e91f3285de7d9e1Brian Paul      tgsi_util_get_full_src_register_swizzle(reg, chan_index);
55563b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   LLVMValueRef res;
5566d173da5c84142ee64f56f4c2e9e495dc1435e91José Fonseca   LLVMValueRef indirect_index = NULL;
55763b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
55885c6799f6e2645e708eb03201e91f3285de7d9e1Brian Paul   if (swizzle > 3) {
55985c6799f6e2645e708eb03201e91f3285de7d9e1Brian Paul      assert(0 && "invalid swizzle in emit_fetch()");
56085c6799f6e2645e708eb03201e91f3285de7d9e1Brian Paul      return bld->base.undef;
56185c6799f6e2645e708eb03201e91f3285de7d9e1Brian Paul   }
56285c6799f6e2645e708eb03201e91f3285de7d9e1Brian Paul
56385c6799f6e2645e708eb03201e91f3285de7d9e1Brian Paul   if (reg->Register.Indirect) {
5646d173da5c84142ee64f56f4c2e9e495dc1435e91José Fonseca      indirect_index = get_indirect_index(bld,
5656d173da5c84142ee64f56f4c2e9e495dc1435e91José Fonseca                                          reg->Register.File,
5666d173da5c84142ee64f56f4c2e9e495dc1435e91José Fonseca                                          reg->Register.Index,
5676d173da5c84142ee64f56f4c2e9e495dc1435e91José Fonseca                                          &reg->Indirect);
5686d173da5c84142ee64f56f4c2e9e495dc1435e91José Fonseca   } else {
5696d173da5c84142ee64f56f4c2e9e495dc1435e91José Fonseca      assert(reg->Register.Index <= bld->info->file_max[reg->Register.File]);
57085c6799f6e2645e708eb03201e91f3285de7d9e1Brian Paul   }
571ded2374e67bdc2c24e868775d2ff77b39b339d56Zack Rusin
57285c6799f6e2645e708eb03201e91f3285de7d9e1Brian Paul   switch (reg->Register.File) {
57385c6799f6e2645e708eb03201e91f3285de7d9e1Brian Paul   case TGSI_FILE_CONSTANT:
574be22e1e781094decfb408ad6d74e3d833b297c87Brian Paul      if (reg->Register.Indirect) {
5756d173da5c84142ee64f56f4c2e9e495dc1435e91José Fonseca         LLVMValueRef swizzle_vec =
5766d173da5c84142ee64f56f4c2e9e495dc1435e91José Fonseca            lp_build_const_int_vec(uint_bld->type, swizzle);
577be22e1e781094decfb408ad6d74e3d833b297c87Brian Paul         LLVMValueRef index_vec;  /* index into the const buffer */
5784363d4d0b945c4ca6c303fb337e1fac39e6e1ad6Brian Paul
5796d173da5c84142ee64f56f4c2e9e495dc1435e91José Fonseca         /* index_vec = indirect_index * 4 + swizzle */
5806d173da5c84142ee64f56f4c2e9e495dc1435e91José Fonseca         index_vec = lp_build_shl_imm(uint_bld, indirect_index, 2);
5816d173da5c84142ee64f56f4c2e9e495dc1435e91José Fonseca         index_vec = lp_build_add(uint_bld, index_vec, swizzle_vec);
5824363d4d0b945c4ca6c303fb337e1fac39e6e1ad6Brian Paul
583be22e1e781094decfb408ad6d74e3d833b297c87Brian Paul         /* Gather values from the constant buffer */
584be22e1e781094decfb408ad6d74e3d833b297c87Brian Paul         res = build_gather(bld, bld->consts_ptr, index_vec);
585be22e1e781094decfb408ad6d74e3d833b297c87Brian Paul      }
586be22e1e781094decfb408ad6d74e3d833b297c87Brian Paul      else {
587be22e1e781094decfb408ad6d74e3d833b297c87Brian Paul         LLVMValueRef index;  /* index into the const buffer */
588be22e1e781094decfb408ad6d74e3d833b297c87Brian Paul         LLVMValueRef scalar, scalar_ptr;
589ded2374e67bdc2c24e868775d2ff77b39b339d56Zack Rusin
590be22e1e781094decfb408ad6d74e3d833b297c87Brian Paul         index = lp_build_const_int32(reg->Register.Index*4 + swizzle);
5914363d4d0b945c4ca6c303fb337e1fac39e6e1ad6Brian Paul
592be22e1e781094decfb408ad6d74e3d833b297c87Brian Paul         scalar_ptr = LLVMBuildGEP(bld->base.builder, bld->consts_ptr,
593be22e1e781094decfb408ad6d74e3d833b297c87Brian Paul                                   &index, 1, "");
594be22e1e781094decfb408ad6d74e3d833b297c87Brian Paul         scalar = LLVMBuildLoad(bld->base.builder, scalar_ptr, "");
5954363d4d0b945c4ca6c303fb337e1fac39e6e1ad6Brian Paul
596be22e1e781094decfb408ad6d74e3d833b297c87Brian Paul         res = lp_build_broadcast_scalar(&bld->base, scalar);
59763b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      }
59885c6799f6e2645e708eb03201e91f3285de7d9e1Brian Paul      break;
59963b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
60085c6799f6e2645e708eb03201e91f3285de7d9e1Brian Paul   case TGSI_FILE_IMMEDIATE:
601263e038431f24f24aaec252e135ffc9f2f09640eJosé Fonseca      res = bld->immediates[reg->Register.Index][swizzle];
60285c6799f6e2645e708eb03201e91f3285de7d9e1Brian Paul      assert(res);
60385c6799f6e2645e708eb03201e91f3285de7d9e1Brian Paul      break;
60463b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
60585c6799f6e2645e708eb03201e91f3285de7d9e1Brian Paul   case TGSI_FILE_INPUT:
606263e038431f24f24aaec252e135ffc9f2f09640eJosé Fonseca      res = bld->inputs[reg->Register.Index][swizzle];
60785c6799f6e2645e708eb03201e91f3285de7d9e1Brian Paul      assert(res);
60885c6799f6e2645e708eb03201e91f3285de7d9e1Brian Paul      break;
60963b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
61085c6799f6e2645e708eb03201e91f3285de7d9e1Brian Paul   case TGSI_FILE_TEMPORARY:
611105ed7dfd4abc94db1ce0cba2967ac0491158389Brian Paul      if (reg->Register.Indirect) {
6126d173da5c84142ee64f56f4c2e9e495dc1435e91José Fonseca         LLVMValueRef swizzle_vec =
6136d173da5c84142ee64f56f4c2e9e495dc1435e91José Fonseca            lp_build_const_int_vec(uint_bld->type, swizzle);
6146d173da5c84142ee64f56f4c2e9e495dc1435e91José Fonseca         LLVMValueRef length_vec =
6156d173da5c84142ee64f56f4c2e9e495dc1435e91José Fonseca            lp_build_const_int_vec(uint_bld->type, bld->base.type.length);
616105ed7dfd4abc94db1ce0cba2967ac0491158389Brian Paul         LLVMValueRef index_vec;  /* index into the const buffer */
617105ed7dfd4abc94db1ce0cba2967ac0491158389Brian Paul         LLVMValueRef temps_array;
618105ed7dfd4abc94db1ce0cba2967ac0491158389Brian Paul         LLVMTypeRef float4_ptr_type;
6194363d4d0b945c4ca6c303fb337e1fac39e6e1ad6Brian Paul
6206d173da5c84142ee64f56f4c2e9e495dc1435e91José Fonseca         /* index_vec = (indirect_index * 4 + swizzle) * length */
6216d173da5c84142ee64f56f4c2e9e495dc1435e91José Fonseca         index_vec = lp_build_shl_imm(uint_bld, indirect_index, 2);
6226d173da5c84142ee64f56f4c2e9e495dc1435e91José Fonseca         index_vec = lp_build_add(uint_bld, index_vec, swizzle_vec);
6236d173da5c84142ee64f56f4c2e9e495dc1435e91José Fonseca         index_vec = lp_build_mul(uint_bld, index_vec, length_vec);
624105ed7dfd4abc94db1ce0cba2967ac0491158389Brian Paul
625105ed7dfd4abc94db1ce0cba2967ac0491158389Brian Paul         /* cast temps_array pointer to float* */
626105ed7dfd4abc94db1ce0cba2967ac0491158389Brian Paul         float4_ptr_type = LLVMPointerType(LLVMFloatType(), 0);
6276d173da5c84142ee64f56f4c2e9e495dc1435e91José Fonseca         temps_array = LLVMBuildBitCast(uint_bld->builder, bld->temps_array,
628105ed7dfd4abc94db1ce0cba2967ac0491158389Brian Paul                                        float4_ptr_type, "");
629105ed7dfd4abc94db1ce0cba2967ac0491158389Brian Paul
630105ed7dfd4abc94db1ce0cba2967ac0491158389Brian Paul         /* Gather values from the temporary register array */
631105ed7dfd4abc94db1ce0cba2967ac0491158389Brian Paul         res = build_gather(bld, temps_array, index_vec);
632105ed7dfd4abc94db1ce0cba2967ac0491158389Brian Paul      }
633105ed7dfd4abc94db1ce0cba2967ac0491158389Brian Paul      else {
634105ed7dfd4abc94db1ce0cba2967ac0491158389Brian Paul         LLVMValueRef temp_ptr;
635f674ed6b0662a15ab8298da0848a4c82694e0c95Brian Paul         temp_ptr = get_temp_ptr(bld, reg->Register.Index, swizzle);
636021e0dc78b15fab29e761012860276c2597c8d8fZack Rusin         res = LLVMBuildLoad(bld->base.builder, temp_ptr, "");
637105ed7dfd4abc94db1ce0cba2967ac0491158389Brian Paul         if (!res)
63863b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca            return bld->base.undef;
63963b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      }
64063b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      break;
64163b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
64263b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   default:
64385c6799f6e2645e708eb03201e91f3285de7d9e1Brian Paul      assert(0 && "invalid src register in emit_fetch()");
6444d7a8194c5763f70ba559f32f58dfda36237b666José Fonseca      return bld->base.undef;
64563b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   }
64663b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
64763b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   switch( tgsi_util_get_full_src_register_sign_mode( reg, chan_index ) ) {
64863b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   case TGSI_UTIL_SIGN_CLEAR:
64963b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      res = lp_build_abs( &bld->base, res );
65063b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      break;
65163b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
65263b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   case TGSI_UTIL_SIGN_SET:
65363b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      res = lp_build_abs( &bld->base, res );
654fc9a49b638c26801951c33a570178bbb2b67ec60nobled      /* fall through */
65563b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   case TGSI_UTIL_SIGN_TOGGLE:
6568a3a971743a90463e65b44f1769a5301a31ce4cdJosé Fonseca      res = lp_build_negate( &bld->base, res );
65763b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      break;
65863b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
65963b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   case TGSI_UTIL_SIGN_KEEP:
66063b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      break;
66163b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   }
66263b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
66363b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   return res;
66463b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca}
66563b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
66663b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
66763b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca/**
66886226d5ea186d3fc6013bc40a341e0c0a891de39José Fonseca * Register fetch with derivatives.
66986226d5ea186d3fc6013bc40a341e0c0a891de39José Fonseca */
67086226d5ea186d3fc6013bc40a341e0c0a891de39José Fonsecastatic void
67186226d5ea186d3fc6013bc40a341e0c0a891de39José Fonsecaemit_fetch_deriv(
67286226d5ea186d3fc6013bc40a341e0c0a891de39José Fonseca   struct lp_build_tgsi_soa_context *bld,
67386226d5ea186d3fc6013bc40a341e0c0a891de39José Fonseca   const struct tgsi_full_instruction *inst,
67486226d5ea186d3fc6013bc40a341e0c0a891de39José Fonseca   unsigned index,
67586226d5ea186d3fc6013bc40a341e0c0a891de39José Fonseca   const unsigned chan_index,
67686226d5ea186d3fc6013bc40a341e0c0a891de39José Fonseca   LLVMValueRef *res,
67786226d5ea186d3fc6013bc40a341e0c0a891de39José Fonseca   LLVMValueRef *ddx,
67886226d5ea186d3fc6013bc40a341e0c0a891de39José Fonseca   LLVMValueRef *ddy)
67986226d5ea186d3fc6013bc40a341e0c0a891de39José Fonseca{
68086226d5ea186d3fc6013bc40a341e0c0a891de39José Fonseca   LLVMValueRef src;
68186226d5ea186d3fc6013bc40a341e0c0a891de39José Fonseca
68286226d5ea186d3fc6013bc40a341e0c0a891de39José Fonseca   src = emit_fetch(bld, inst, index, chan_index);
68386226d5ea186d3fc6013bc40a341e0c0a891de39José Fonseca
68486226d5ea186d3fc6013bc40a341e0c0a891de39José Fonseca   if(res)
68586226d5ea186d3fc6013bc40a341e0c0a891de39José Fonseca      *res = src;
68686226d5ea186d3fc6013bc40a341e0c0a891de39José Fonseca
68786226d5ea186d3fc6013bc40a341e0c0a891de39José Fonseca   /* TODO: use interpolation coeffs for inputs */
68886226d5ea186d3fc6013bc40a341e0c0a891de39José Fonseca
68986226d5ea186d3fc6013bc40a341e0c0a891de39José Fonseca   if(ddx)
690ef81779850d1343b3ae284eb9beabeaf11934d4aJosé Fonseca      *ddx = lp_build_ddx(&bld->base, src);
69186226d5ea186d3fc6013bc40a341e0c0a891de39José Fonseca
69286226d5ea186d3fc6013bc40a341e0c0a891de39José Fonseca   if(ddy)
693ef81779850d1343b3ae284eb9beabeaf11934d4aJosé Fonseca      *ddy = lp_build_ddy(&bld->base, src);
69486226d5ea186d3fc6013bc40a341e0c0a891de39José Fonseca}
69586226d5ea186d3fc6013bc40a341e0c0a891de39José Fonseca
69686226d5ea186d3fc6013bc40a341e0c0a891de39José Fonseca
69786226d5ea186d3fc6013bc40a341e0c0a891de39José Fonseca/**
698ff6c78f44f2f741f4825b07dbc15b3a951fe9b2cJosé Fonseca * Predicate.
699ff6c78f44f2f741f4825b07dbc15b3a951fe9b2cJosé Fonseca */
700ff6c78f44f2f741f4825b07dbc15b3a951fe9b2cJosé Fonsecastatic void
701ff6c78f44f2f741f4825b07dbc15b3a951fe9b2cJosé Fonsecaemit_fetch_predicate(
702ff6c78f44f2f741f4825b07dbc15b3a951fe9b2cJosé Fonseca   struct lp_build_tgsi_soa_context *bld,
703ff6c78f44f2f741f4825b07dbc15b3a951fe9b2cJosé Fonseca   const struct tgsi_full_instruction *inst,
704ff6c78f44f2f741f4825b07dbc15b3a951fe9b2cJosé Fonseca   LLVMValueRef *pred)
705ff6c78f44f2f741f4825b07dbc15b3a951fe9b2cJosé Fonseca{
706ff6c78f44f2f741f4825b07dbc15b3a951fe9b2cJosé Fonseca   unsigned index;
707ff6c78f44f2f741f4825b07dbc15b3a951fe9b2cJosé Fonseca   unsigned char swizzles[4];
708ff6c78f44f2f741f4825b07dbc15b3a951fe9b2cJosé Fonseca   LLVMValueRef unswizzled[4] = {NULL, NULL, NULL, NULL};
709ff6c78f44f2f741f4825b07dbc15b3a951fe9b2cJosé Fonseca   LLVMValueRef value;
710ff6c78f44f2f741f4825b07dbc15b3a951fe9b2cJosé Fonseca   unsigned chan;
711ff6c78f44f2f741f4825b07dbc15b3a951fe9b2cJosé Fonseca
712ff6c78f44f2f741f4825b07dbc15b3a951fe9b2cJosé Fonseca   if (!inst->Instruction.Predicate) {
713ff6c78f44f2f741f4825b07dbc15b3a951fe9b2cJosé Fonseca      FOR_EACH_CHANNEL( chan ) {
714ff6c78f44f2f741f4825b07dbc15b3a951fe9b2cJosé Fonseca         pred[chan] = NULL;
715ff6c78f44f2f741f4825b07dbc15b3a951fe9b2cJosé Fonseca      }
716ff6c78f44f2f741f4825b07dbc15b3a951fe9b2cJosé Fonseca      return;
717ff6c78f44f2f741f4825b07dbc15b3a951fe9b2cJosé Fonseca   }
718ff6c78f44f2f741f4825b07dbc15b3a951fe9b2cJosé Fonseca
719ff6c78f44f2f741f4825b07dbc15b3a951fe9b2cJosé Fonseca   swizzles[0] = inst->Predicate.SwizzleX;
720ff6c78f44f2f741f4825b07dbc15b3a951fe9b2cJosé Fonseca   swizzles[1] = inst->Predicate.SwizzleY;
721ff6c78f44f2f741f4825b07dbc15b3a951fe9b2cJosé Fonseca   swizzles[2] = inst->Predicate.SwizzleZ;
722ff6c78f44f2f741f4825b07dbc15b3a951fe9b2cJosé Fonseca   swizzles[3] = inst->Predicate.SwizzleW;
723ff6c78f44f2f741f4825b07dbc15b3a951fe9b2cJosé Fonseca
724ff6c78f44f2f741f4825b07dbc15b3a951fe9b2cJosé Fonseca   index = inst->Predicate.Index;
725ff6c78f44f2f741f4825b07dbc15b3a951fe9b2cJosé Fonseca   assert(index < LP_MAX_TGSI_PREDS);
726ff6c78f44f2f741f4825b07dbc15b3a951fe9b2cJosé Fonseca
727ff6c78f44f2f741f4825b07dbc15b3a951fe9b2cJosé Fonseca   FOR_EACH_CHANNEL( chan ) {
728ff6c78f44f2f741f4825b07dbc15b3a951fe9b2cJosé Fonseca      unsigned swizzle = swizzles[chan];
729ff6c78f44f2f741f4825b07dbc15b3a951fe9b2cJosé Fonseca
730ff6c78f44f2f741f4825b07dbc15b3a951fe9b2cJosé Fonseca      /*
731ff6c78f44f2f741f4825b07dbc15b3a951fe9b2cJosé Fonseca       * Only fetch the predicate register channels that are actually listed
732ff6c78f44f2f741f4825b07dbc15b3a951fe9b2cJosé Fonseca       * in the swizzles
733ff6c78f44f2f741f4825b07dbc15b3a951fe9b2cJosé Fonseca       */
734ff6c78f44f2f741f4825b07dbc15b3a951fe9b2cJosé Fonseca      if (!unswizzled[swizzle]) {
735ff6c78f44f2f741f4825b07dbc15b3a951fe9b2cJosé Fonseca         value = LLVMBuildLoad(bld->base.builder,
736263e038431f24f24aaec252e135ffc9f2f09640eJosé Fonseca                               bld->preds[index][swizzle], "");
737ff6c78f44f2f741f4825b07dbc15b3a951fe9b2cJosé Fonseca
738ff6c78f44f2f741f4825b07dbc15b3a951fe9b2cJosé Fonseca         /*
739ff6c78f44f2f741f4825b07dbc15b3a951fe9b2cJosé Fonseca          * Convert the value to an integer mask.
740ff6c78f44f2f741f4825b07dbc15b3a951fe9b2cJosé Fonseca          *
741ff6c78f44f2f741f4825b07dbc15b3a951fe9b2cJosé Fonseca          * TODO: Short-circuit this comparison -- a D3D setp_xx instructions
742ff6c78f44f2f741f4825b07dbc15b3a951fe9b2cJosé Fonseca          * is needlessly causing two comparisons due to storing the intermediate
743ff6c78f44f2f741f4825b07dbc15b3a951fe9b2cJosé Fonseca          * result as float vector instead of an integer mask vector.
744ff6c78f44f2f741f4825b07dbc15b3a951fe9b2cJosé Fonseca          */
745ff6c78f44f2f741f4825b07dbc15b3a951fe9b2cJosé Fonseca         value = lp_build_compare(bld->base.builder,
746ff6c78f44f2f741f4825b07dbc15b3a951fe9b2cJosé Fonseca                                  bld->base.type,
747ff6c78f44f2f741f4825b07dbc15b3a951fe9b2cJosé Fonseca                                  PIPE_FUNC_NOTEQUAL,
748ff6c78f44f2f741f4825b07dbc15b3a951fe9b2cJosé Fonseca                                  value,
749ff6c78f44f2f741f4825b07dbc15b3a951fe9b2cJosé Fonseca                                  bld->base.zero);
750ff6c78f44f2f741f4825b07dbc15b3a951fe9b2cJosé Fonseca         if (inst->Predicate.Negate) {
751ff6c78f44f2f741f4825b07dbc15b3a951fe9b2cJosé Fonseca            value = LLVMBuildNot(bld->base.builder, value, "");
752ff6c78f44f2f741f4825b07dbc15b3a951fe9b2cJosé Fonseca         }
753ff6c78f44f2f741f4825b07dbc15b3a951fe9b2cJosé Fonseca
754ff6c78f44f2f741f4825b07dbc15b3a951fe9b2cJosé Fonseca         unswizzled[swizzle] = value;
755ff6c78f44f2f741f4825b07dbc15b3a951fe9b2cJosé Fonseca      } else {
756ff6c78f44f2f741f4825b07dbc15b3a951fe9b2cJosé Fonseca         value = unswizzled[swizzle];
757ff6c78f44f2f741f4825b07dbc15b3a951fe9b2cJosé Fonseca      }
758ff6c78f44f2f741f4825b07dbc15b3a951fe9b2cJosé Fonseca
759ff6c78f44f2f741f4825b07dbc15b3a951fe9b2cJosé Fonseca      pred[chan] = value;
760ff6c78f44f2f741f4825b07dbc15b3a951fe9b2cJosé Fonseca   }
761ff6c78f44f2f741f4825b07dbc15b3a951fe9b2cJosé Fonseca}
762ff6c78f44f2f741f4825b07dbc15b3a951fe9b2cJosé Fonseca
763ff6c78f44f2f741f4825b07dbc15b3a951fe9b2cJosé Fonseca
764ff6c78f44f2f741f4825b07dbc15b3a951fe9b2cJosé Fonseca/**
76563b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca * Register store.
76663b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca */
76763b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonsecastatic void
76863b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonsecaemit_store(
76963b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   struct lp_build_tgsi_soa_context *bld,
77063b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   const struct tgsi_full_instruction *inst,
7712fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca   unsigned index,
77263b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   unsigned chan_index,
773ff6c78f44f2f741f4825b07dbc15b3a951fe9b2cJosé Fonseca   LLVMValueRef pred,
77463b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   LLVMValueRef value)
77563b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca{
7767d6c8f980d1e23ad6f557d650e89c715861a3b0cKeith Whitwell   const struct tgsi_full_dst_register *reg = &inst->Dst[index];
7772fefbc79ac8bb55197ff817feeca2626585d7a8cBrian Paul   struct lp_build_context *uint_bld = &bld->uint_bld;
7786d173da5c84142ee64f56f4c2e9e495dc1435e91José Fonseca   LLVMValueRef indirect_index = NULL;
7792fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca
78063b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   switch( inst->Instruction.Saturate ) {
78163b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   case TGSI_SAT_NONE:
78263b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      break;
78363b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
78463b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   case TGSI_SAT_ZERO_ONE:
7857926b42d41058e5d2b99ba0e8810f93bc7c12d36José Fonseca      value = lp_build_max(&bld->base, value, bld->base.zero);
7867926b42d41058e5d2b99ba0e8810f93bc7c12d36José Fonseca      value = lp_build_min(&bld->base, value, bld->base.one);
78763b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      break;
78863b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
78963b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   case TGSI_SAT_MINUS_PLUS_ONE:
790185be3a87a5b38e8821a560c073975c11dcbd3e9Brian Paul      value = lp_build_max(&bld->base, value, lp_build_const_vec(bld->base.type, -1.0));
7917926b42d41058e5d2b99ba0e8810f93bc7c12d36José Fonseca      value = lp_build_min(&bld->base, value, bld->base.one);
79263b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      break;
7937926b42d41058e5d2b99ba0e8810f93bc7c12d36José Fonseca
7947926b42d41058e5d2b99ba0e8810f93bc7c12d36José Fonseca   default:
7957926b42d41058e5d2b99ba0e8810f93bc7c12d36José Fonseca      assert(0);
79663b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   }
79763b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
798021e0dc78b15fab29e761012860276c2597c8d8fZack Rusin   if (reg->Register.Indirect) {
7996d173da5c84142ee64f56f4c2e9e495dc1435e91José Fonseca      indirect_index = get_indirect_index(bld,
8006d173da5c84142ee64f56f4c2e9e495dc1435e91José Fonseca                                          reg->Register.File,
8016d173da5c84142ee64f56f4c2e9e495dc1435e91José Fonseca                                          reg->Register.Index,
8026d173da5c84142ee64f56f4c2e9e495dc1435e91José Fonseca                                          &reg->Indirect);
8036d173da5c84142ee64f56f4c2e9e495dc1435e91José Fonseca   } else {
8046d173da5c84142ee64f56f4c2e9e495dc1435e91José Fonseca      assert(reg->Register.Index <= bld->info->file_max[reg->Register.File]);
805021e0dc78b15fab29e761012860276c2597c8d8fZack Rusin   }
806021e0dc78b15fab29e761012860276c2597c8d8fZack Rusin
8075b0824dfe5eaf59fa87134e7482b3d147b262901Keith Whitwell   switch( reg->Register.File ) {
80863b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   case TGSI_FILE_OUTPUT:
809ff6c78f44f2f741f4825b07dbc15b3a951fe9b2cJosé Fonseca      lp_exec_mask_store(&bld->exec_mask, pred, value,
810263e038431f24f24aaec252e135ffc9f2f09640eJosé Fonseca                         bld->outputs[reg->Register.Index][chan_index]);
81163b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      break;
81263b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
813f674ed6b0662a15ab8298da0848a4c82694e0c95Brian Paul   case TGSI_FILE_TEMPORARY:
814f674ed6b0662a15ab8298da0848a4c82694e0c95Brian Paul      if (reg->Register.Indirect) {
8152fefbc79ac8bb55197ff817feeca2626585d7a8cBrian Paul         LLVMValueRef chan_vec =
8162fefbc79ac8bb55197ff817feeca2626585d7a8cBrian Paul            lp_build_const_int_vec(uint_bld->type, chan_index);
8172fefbc79ac8bb55197ff817feeca2626585d7a8cBrian Paul         LLVMValueRef length_vec =
8182fefbc79ac8bb55197ff817feeca2626585d7a8cBrian Paul            lp_build_const_int_vec(uint_bld->type, bld->base.type.length);
8192fefbc79ac8bb55197ff817feeca2626585d7a8cBrian Paul         LLVMValueRef index_vec;  /* indexes into the temp registers */
8202fefbc79ac8bb55197ff817feeca2626585d7a8cBrian Paul         LLVMValueRef temps_array;
8212fefbc79ac8bb55197ff817feeca2626585d7a8cBrian Paul         LLVMTypeRef float_ptr_type;
8222fefbc79ac8bb55197ff817feeca2626585d7a8cBrian Paul
8232fefbc79ac8bb55197ff817feeca2626585d7a8cBrian Paul         /* index_vec = (indirect_index * 4 + chan_index) * length */
8242fefbc79ac8bb55197ff817feeca2626585d7a8cBrian Paul         index_vec = lp_build_shl_imm(uint_bld, indirect_index, 2);
8252fefbc79ac8bb55197ff817feeca2626585d7a8cBrian Paul         index_vec = lp_build_add(uint_bld, index_vec, chan_vec);
8262fefbc79ac8bb55197ff817feeca2626585d7a8cBrian Paul         index_vec = lp_build_mul(uint_bld, index_vec, length_vec);
8272fefbc79ac8bb55197ff817feeca2626585d7a8cBrian Paul
8282fefbc79ac8bb55197ff817feeca2626585d7a8cBrian Paul         float_ptr_type = LLVMPointerType(LLVMFloatType(), 0);
8292fefbc79ac8bb55197ff817feeca2626585d7a8cBrian Paul         temps_array = LLVMBuildBitCast(bld->base.builder, bld->temps_array,
8302fefbc79ac8bb55197ff817feeca2626585d7a8cBrian Paul                                        float_ptr_type, "");
8312fefbc79ac8bb55197ff817feeca2626585d7a8cBrian Paul
8322fefbc79ac8bb55197ff817feeca2626585d7a8cBrian Paul         /* Scatter store values into temp registers */
8332fefbc79ac8bb55197ff817feeca2626585d7a8cBrian Paul         build_scatter(bld, temps_array, index_vec, value);
834f674ed6b0662a15ab8298da0848a4c82694e0c95Brian Paul      }
835f674ed6b0662a15ab8298da0848a4c82694e0c95Brian Paul      else {
836f674ed6b0662a15ab8298da0848a4c82694e0c95Brian Paul         LLVMValueRef temp_ptr = get_temp_ptr(bld, reg->Register.Index,
837f674ed6b0662a15ab8298da0848a4c82694e0c95Brian Paul                                              chan_index);
838f674ed6b0662a15ab8298da0848a4c82694e0c95Brian Paul         lp_exec_mask_store(&bld->exec_mask, pred, value, temp_ptr);
839f674ed6b0662a15ab8298da0848a4c82694e0c95Brian Paul      }
84063b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      break;
84163b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
84263b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   case TGSI_FILE_ADDRESS:
843ff6c78f44f2f741f4825b07dbc15b3a951fe9b2cJosé Fonseca      lp_exec_mask_store(&bld->exec_mask, pred, value,
844263e038431f24f24aaec252e135ffc9f2f09640eJosé Fonseca                         bld->addr[reg->Indirect.Index][chan_index]);
84563b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      break;
84663b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
847ccf57af93f7118a044fa21e874847fa3ed555bcaJosé Fonseca   case TGSI_FILE_PREDICATE:
848ff6c78f44f2f741f4825b07dbc15b3a951fe9b2cJosé Fonseca      lp_exec_mask_store(&bld->exec_mask, pred, value,
8498690c6a6b4fb0b48e2ae75cd0f64de86b039081cmichal                         bld->preds[reg->Register.Index][chan_index]);
850ccf57af93f7118a044fa21e874847fa3ed555bcaJosé Fonseca      break;
851ccf57af93f7118a044fa21e874847fa3ed555bcaJosé Fonseca
85263b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   default:
85363b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      assert( 0 );
85463b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   }
85563b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca}
85663b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
85763b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
85863b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca/**
85963b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca * High-level instruction translators.
86063b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca */
86163b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
86263b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonsecastatic void
86363b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonsecaemit_tex( struct lp_build_tgsi_soa_context *bld,
86463b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca          const struct tgsi_full_instruction *inst,
86558daea741fa21fe3f89fd7bf106df1545c5b21afJosé Fonseca          enum lp_build_tex_modifier modifier,
866faec23387e035bcdd413b7364933d36a8ec22dbaJosé Fonseca          LLVMValueRef *texel)
86763b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca{
868962558daaed43b0111cd062e32821aad106869d7José Fonseca   unsigned unit;
869ec43b2eb45a1b2e33f328f76624c987484e329f3José Fonseca   LLVMValueRef lod_bias, explicit_lod;
87031d1822473bf9d4105bb82b67572cfeea53aaf94Vinson Lee   LLVMValueRef oow = NULL;
871c40eddd294abfe8af3619d08ccd7e9c8f1660fcbJosé Fonseca   LLVMValueRef coords[3];
872962558daaed43b0111cd062e32821aad106869d7José Fonseca   LLVMValueRef ddx[3];
873962558daaed43b0111cd062e32821aad106869d7José Fonseca   LLVMValueRef ddy[3];
874c40eddd294abfe8af3619d08ccd7e9c8f1660fcbJosé Fonseca   unsigned num_coords;
87563b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   unsigned i;
87663b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
8779db4a211e96356deb963223038eea074a5fe0edaJosé Fonseca   if (!bld->sampler) {
8789db4a211e96356deb963223038eea074a5fe0edaJosé Fonseca      _debug_printf("warning: found texture instruction but no sampler generator supplied\n");
8799db4a211e96356deb963223038eea074a5fe0edaJosé Fonseca      for (i = 0; i < 4; i++) {
8809db4a211e96356deb963223038eea074a5fe0edaJosé Fonseca         texel[i] = bld->base.undef;
8819db4a211e96356deb963223038eea074a5fe0edaJosé Fonseca      }
8829db4a211e96356deb963223038eea074a5fe0edaJosé Fonseca      return;
8839db4a211e96356deb963223038eea074a5fe0edaJosé Fonseca   }
8849db4a211e96356deb963223038eea074a5fe0edaJosé Fonseca
8857d6c8f980d1e23ad6f557d650e89c715861a3b0cKeith Whitwell   switch (inst->Texture.Texture) {
88663b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   case TGSI_TEXTURE_1D:
887c40eddd294abfe8af3619d08ccd7e9c8f1660fcbJosé Fonseca      num_coords = 1;
88863b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      break;
88963b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   case TGSI_TEXTURE_2D:
89063b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   case TGSI_TEXTURE_RECT:
891c40eddd294abfe8af3619d08ccd7e9c8f1660fcbJosé Fonseca      num_coords = 2;
89263b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      break;
893f04ce6276b64f24cf26ca522f012a1e1a28937feJosé Fonseca   case TGSI_TEXTURE_SHADOW1D:
894f04ce6276b64f24cf26ca522f012a1e1a28937feJosé Fonseca   case TGSI_TEXTURE_SHADOW2D:
895f04ce6276b64f24cf26ca522f012a1e1a28937feJosé Fonseca   case TGSI_TEXTURE_SHADOWRECT:
89663b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   case TGSI_TEXTURE_3D:
89763b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   case TGSI_TEXTURE_CUBE:
898c40eddd294abfe8af3619d08ccd7e9c8f1660fcbJosé Fonseca      num_coords = 3;
89963b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      break;
90063b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   default:
90163b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      assert(0);
90263b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      return;
90363b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   }
90463b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
90558daea741fa21fe3f89fd7bf106df1545c5b21afJosé Fonseca   if (modifier == LP_BLD_TEX_MODIFIER_LOD_BIAS) {
906ec43b2eb45a1b2e33f328f76624c987484e329f3José Fonseca      lod_bias = emit_fetch( bld, inst, 0, 3 );
907ec43b2eb45a1b2e33f328f76624c987484e329f3José Fonseca      explicit_lod = NULL;
908ec43b2eb45a1b2e33f328f76624c987484e329f3José Fonseca   }
90958daea741fa21fe3f89fd7bf106df1545c5b21afJosé Fonseca   else if (modifier == LP_BLD_TEX_MODIFIER_EXPLICIT_LOD) {
910ec43b2eb45a1b2e33f328f76624c987484e329f3José Fonseca      lod_bias = NULL;
911ec43b2eb45a1b2e33f328f76624c987484e329f3José Fonseca      explicit_lod = emit_fetch( bld, inst, 0, 3 );
912ec43b2eb45a1b2e33f328f76624c987484e329f3José Fonseca   }
913ec43b2eb45a1b2e33f328f76624c987484e329f3José Fonseca   else {
914ec43b2eb45a1b2e33f328f76624c987484e329f3José Fonseca      lod_bias = NULL;
915ec43b2eb45a1b2e33f328f76624c987484e329f3José Fonseca      explicit_lod = NULL;
916ec43b2eb45a1b2e33f328f76624c987484e329f3José Fonseca   }
91763b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
91858daea741fa21fe3f89fd7bf106df1545c5b21afJosé Fonseca   if (modifier == LP_BLD_TEX_MODIFIER_PROJECTED) {
9192fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca      oow = emit_fetch( bld, inst, 0, 3 );
92063b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      oow = lp_build_rcp(&bld->base, oow);
92163b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   }
92263b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
923c40eddd294abfe8af3619d08ccd7e9c8f1660fcbJosé Fonseca   for (i = 0; i < num_coords; i++) {
924c40eddd294abfe8af3619d08ccd7e9c8f1660fcbJosé Fonseca      coords[i] = emit_fetch( bld, inst, 0, i );
92558daea741fa21fe3f89fd7bf106df1545c5b21afJosé Fonseca      if (modifier == LP_BLD_TEX_MODIFIER_PROJECTED)
926c40eddd294abfe8af3619d08ccd7e9c8f1660fcbJosé Fonseca         coords[i] = lp_build_mul(&bld->base, coords[i], oow);
92763b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   }
928ba33ef00118d1c6017585af1498b89e99fe045beJosé Fonseca   for (i = num_coords; i < 3; i++) {
929ba33ef00118d1c6017585af1498b89e99fe045beJosé Fonseca      coords[i] = bld->base.undef;
930ba33ef00118d1c6017585af1498b89e99fe045beJosé Fonseca   }
93163b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
93258daea741fa21fe3f89fd7bf106df1545c5b21afJosé Fonseca   if (modifier == LP_BLD_TEX_MODIFIER_EXPLICIT_DERIV) {
93317dbd41cf23e7e7de2f27e5e9252d7f792d932f3José Fonseca      LLVMTypeRef i32t = LLVMInt32Type();
93417dbd41cf23e7e7de2f27e5e9252d7f792d932f3José Fonseca      LLVMValueRef index0 = LLVMConstInt(i32t, 0, 0);
935962558daaed43b0111cd062e32821aad106869d7José Fonseca      for (i = 0; i < num_coords; i++) {
93617dbd41cf23e7e7de2f27e5e9252d7f792d932f3José Fonseca         LLVMValueRef src1 = emit_fetch( bld, inst, 1, i );
93717dbd41cf23e7e7de2f27e5e9252d7f792d932f3José Fonseca         LLVMValueRef src2 = emit_fetch( bld, inst, 2, i );
93817dbd41cf23e7e7de2f27e5e9252d7f792d932f3José Fonseca         ddx[i] = LLVMBuildExtractElement(bld->base.builder, src1, index0, "");
93917dbd41cf23e7e7de2f27e5e9252d7f792d932f3José Fonseca         ddy[i] = LLVMBuildExtractElement(bld->base.builder, src2, index0, "");
940962558daaed43b0111cd062e32821aad106869d7José Fonseca      }
941962558daaed43b0111cd062e32821aad106869d7José Fonseca      unit = inst->Src[3].Register.Index;
942962558daaed43b0111cd062e32821aad106869d7José Fonseca   }  else {
943962558daaed43b0111cd062e32821aad106869d7José Fonseca      for (i = 0; i < num_coords; i++) {
94417dbd41cf23e7e7de2f27e5e9252d7f792d932f3José Fonseca         ddx[i] = lp_build_scalar_ddx( &bld->base, coords[i] );
94517dbd41cf23e7e7de2f27e5e9252d7f792d932f3José Fonseca         ddy[i] = lp_build_scalar_ddy( &bld->base, coords[i] );
946962558daaed43b0111cd062e32821aad106869d7José Fonseca      }
947962558daaed43b0111cd062e32821aad106869d7José Fonseca      unit = inst->Src[1].Register.Index;
948962558daaed43b0111cd062e32821aad106869d7José Fonseca   }
9494554cdc289f1d97855825127c0bf8c0e7f6a2edaJosé Fonseca   for (i = num_coords; i < 3; i++) {
95017dbd41cf23e7e7de2f27e5e9252d7f792d932f3José Fonseca      ddx[i] = LLVMGetUndef(bld->base.elem_type);
95117dbd41cf23e7e7de2f27e5e9252d7f792d932f3José Fonseca      ddy[i] = LLVMGetUndef(bld->base.elem_type);
9524554cdc289f1d97855825127c0bf8c0e7f6a2edaJosé Fonseca   }
953962558daaed43b0111cd062e32821aad106869d7José Fonseca
9548be72bb7646d430e66cb36e09c13c13bee030d53José Fonseca   bld->sampler->emit_fetch_texel(bld->sampler,
9558be72bb7646d430e66cb36e09c13c13bee030d53José Fonseca                                  bld->base.builder,
9568be72bb7646d430e66cb36e09c13c13bee030d53José Fonseca                                  bld->base.type,
957962558daaed43b0111cd062e32821aad106869d7José Fonseca                                  unit, num_coords, coords,
958ec43b2eb45a1b2e33f328f76624c987484e329f3José Fonseca                                  ddx, ddy,
959ec43b2eb45a1b2e33f328f76624c987484e329f3José Fonseca                                  lod_bias, explicit_lod,
9608be72bb7646d430e66cb36e09c13c13bee030d53José Fonseca                                  texel);
96163b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca}
96263b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
96322ec25e2bf5c9309610b68e8e40472a8ea695ba9Keith Whitwellstatic boolean
96422ec25e2bf5c9309610b68e8e40472a8ea695ba9Keith Whitwellnear_end_of_shader(struct lp_build_tgsi_soa_context *bld,
96522ec25e2bf5c9309610b68e8e40472a8ea695ba9Keith Whitwell		   int pc)
96622ec25e2bf5c9309610b68e8e40472a8ea695ba9Keith Whitwell{
96722ec25e2bf5c9309610b68e8e40472a8ea695ba9Keith Whitwell   int i;
96822ec25e2bf5c9309610b68e8e40472a8ea695ba9Keith Whitwell
96922ec25e2bf5c9309610b68e8e40472a8ea695ba9Keith Whitwell   for (i = 0; i < 5; i++) {
97022ec25e2bf5c9309610b68e8e40472a8ea695ba9Keith Whitwell      unsigned opcode;
97122ec25e2bf5c9309610b68e8e40472a8ea695ba9Keith Whitwell
97222ec25e2bf5c9309610b68e8e40472a8ea695ba9Keith Whitwell      if (pc + i >= bld->info->num_instructions)
97322ec25e2bf5c9309610b68e8e40472a8ea695ba9Keith Whitwell	 return TRUE;
97422ec25e2bf5c9309610b68e8e40472a8ea695ba9Keith Whitwell
97522ec25e2bf5c9309610b68e8e40472a8ea695ba9Keith Whitwell      opcode = bld->instructions[pc + i].Instruction.Opcode;
97622ec25e2bf5c9309610b68e8e40472a8ea695ba9Keith Whitwell
97722ec25e2bf5c9309610b68e8e40472a8ea695ba9Keith Whitwell      if (opcode == TGSI_OPCODE_END)
97822ec25e2bf5c9309610b68e8e40472a8ea695ba9Keith Whitwell	 return TRUE;
97922ec25e2bf5c9309610b68e8e40472a8ea695ba9Keith Whitwell
98022ec25e2bf5c9309610b68e8e40472a8ea695ba9Keith Whitwell      if (opcode == TGSI_OPCODE_TEX ||
98122ec25e2bf5c9309610b68e8e40472a8ea695ba9Keith Whitwell	  opcode == TGSI_OPCODE_TXP ||
98222ec25e2bf5c9309610b68e8e40472a8ea695ba9Keith Whitwell	  opcode == TGSI_OPCODE_TXD ||
98322ec25e2bf5c9309610b68e8e40472a8ea695ba9Keith Whitwell	  opcode == TGSI_OPCODE_TXB ||
98422ec25e2bf5c9309610b68e8e40472a8ea695ba9Keith Whitwell	  opcode == TGSI_OPCODE_TXL ||
98522ec25e2bf5c9309610b68e8e40472a8ea695ba9Keith Whitwell	  opcode == TGSI_OPCODE_TXF ||
98622ec25e2bf5c9309610b68e8e40472a8ea695ba9Keith Whitwell	  opcode == TGSI_OPCODE_TXQ ||
98722ec25e2bf5c9309610b68e8e40472a8ea695ba9Keith Whitwell	  opcode == TGSI_OPCODE_CAL ||
98822ec25e2bf5c9309610b68e8e40472a8ea695ba9Keith Whitwell	  opcode == TGSI_OPCODE_CALLNZ ||
98922ec25e2bf5c9309610b68e8e40472a8ea695ba9Keith Whitwell	  opcode == TGSI_OPCODE_IF ||
99022ec25e2bf5c9309610b68e8e40472a8ea695ba9Keith Whitwell	  opcode == TGSI_OPCODE_IFC ||
99122ec25e2bf5c9309610b68e8e40472a8ea695ba9Keith Whitwell	  opcode == TGSI_OPCODE_BGNLOOP ||
99222ec25e2bf5c9309610b68e8e40472a8ea695ba9Keith Whitwell	  opcode == TGSI_OPCODE_SWITCH)
99322ec25e2bf5c9309610b68e8e40472a8ea695ba9Keith Whitwell	 return FALSE;
99422ec25e2bf5c9309610b68e8e40472a8ea695ba9Keith Whitwell   }
99522ec25e2bf5c9309610b68e8e40472a8ea695ba9Keith Whitwell
99622ec25e2bf5c9309610b68e8e40472a8ea695ba9Keith Whitwell   return TRUE;
99722ec25e2bf5c9309610b68e8e40472a8ea695ba9Keith Whitwell}
99822ec25e2bf5c9309610b68e8e40472a8ea695ba9Keith Whitwell
99922ec25e2bf5c9309610b68e8e40472a8ea695ba9Keith Whitwell
100063b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
1001feffd259da5f2655222a2f26e2e5665a9e28173fBrian Paul/**
1002feffd259da5f2655222a2f26e2e5665a9e28173fBrian Paul * Kill fragment if any of the src register values are negative.
1003feffd259da5f2655222a2f26e2e5665a9e28173fBrian Paul */
100463b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonsecastatic void
100563b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonsecaemit_kil(
100663b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   struct lp_build_tgsi_soa_context *bld,
100722ec25e2bf5c9309610b68e8e40472a8ea695ba9Keith Whitwell   const struct tgsi_full_instruction *inst,
100822ec25e2bf5c9309610b68e8e40472a8ea695ba9Keith Whitwell   int pc)
100963b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca{
10107d6c8f980d1e23ad6f557d650e89c715861a3b0cKeith Whitwell   const struct tgsi_full_src_register *reg = &inst->Src[0];
10117821664b15501b173b2304bbada758c33c5ff972José Fonseca   LLVMValueRef terms[NUM_CHANNELS];
10123d7a88674f9eb3320eeff511968f041426e25023José Fonseca   LLVMValueRef mask;
101363b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   unsigned chan_index;
101463b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
10157821664b15501b173b2304bbada758c33c5ff972José Fonseca   memset(&terms, 0, sizeof terms);
101663b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
101763b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   FOR_EACH_CHANNEL( chan_index ) {
101863b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      unsigned swizzle;
101963b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
10207821664b15501b173b2304bbada758c33c5ff972José Fonseca      /* Unswizzle channel */
1021b9cb74c7f826dfd320f5e5b54aa933898f7ddd3dKeith Whitwell      swizzle = tgsi_util_get_full_src_register_swizzle( reg, chan_index );
102263b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
10237821664b15501b173b2304bbada758c33c5ff972José Fonseca      /* Check if the component has not been already tested. */
10247821664b15501b173b2304bbada758c33c5ff972José Fonseca      assert(swizzle < NUM_CHANNELS);
10257821664b15501b173b2304bbada758c33c5ff972José Fonseca      if( !terms[swizzle] )
10267821664b15501b173b2304bbada758c33c5ff972José Fonseca         /* TODO: change the comparison operator instead of setting the sign */
10272fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca         terms[swizzle] =  emit_fetch(bld, inst, 0, chan_index );
102863b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   }
102963b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
10303d7a88674f9eb3320eeff511968f041426e25023José Fonseca   mask = NULL;
10317821664b15501b173b2304bbada758c33c5ff972José Fonseca   FOR_EACH_CHANNEL( chan_index ) {
1032aede39efd86d200ffbace8fc012104e31f673973José Fonseca      if(terms[chan_index]) {
10333d7a88674f9eb3320eeff511968f041426e25023José Fonseca         LLVMValueRef chan_mask;
1034aede39efd86d200ffbace8fc012104e31f673973José Fonseca
1035feffd259da5f2655222a2f26e2e5665a9e28173fBrian Paul         /*
1036feffd259da5f2655222a2f26e2e5665a9e28173fBrian Paul          * If term < 0 then mask = 0 else mask = ~0.
1037feffd259da5f2655222a2f26e2e5665a9e28173fBrian Paul          */
10383d7a88674f9eb3320eeff511968f041426e25023José Fonseca         chan_mask = lp_build_cmp(&bld->base, PIPE_FUNC_GEQUAL, terms[chan_index], bld->base.zero);
1039aede39efd86d200ffbace8fc012104e31f673973José Fonseca
10403d7a88674f9eb3320eeff511968f041426e25023José Fonseca         if(mask)
10413d7a88674f9eb3320eeff511968f041426e25023José Fonseca            mask = LLVMBuildAnd(bld->base.builder, mask, chan_mask, "");
10423d7a88674f9eb3320eeff511968f041426e25023José Fonseca         else
10433d7a88674f9eb3320eeff511968f041426e25023José Fonseca            mask = chan_mask;
1044aede39efd86d200ffbace8fc012104e31f673973José Fonseca      }
104563b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   }
10463d7a88674f9eb3320eeff511968f041426e25023José Fonseca
1047aa4cb5e2d8d48c7dcc9653c61a9e25494e3e7b2aKeith Whitwell   if(mask) {
10483d7a88674f9eb3320eeff511968f041426e25023José Fonseca      lp_build_mask_update(bld->mask, mask);
1049aa4cb5e2d8d48c7dcc9653c61a9e25494e3e7b2aKeith Whitwell
105022ec25e2bf5c9309610b68e8e40472a8ea695ba9Keith Whitwell      if (!near_end_of_shader(bld, pc))
105122ec25e2bf5c9309610b68e8e40472a8ea695ba9Keith Whitwell	 lp_build_mask_check(bld->mask);
1052aa4cb5e2d8d48c7dcc9653c61a9e25494e3e7b2aKeith Whitwell   }
105363b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca}
105463b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
105563b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
105663b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca/**
1057feffd259da5f2655222a2f26e2e5665a9e28173fBrian Paul * Predicated fragment kill.
1058feffd259da5f2655222a2f26e2e5665a9e28173fBrian Paul * XXX Actually, we do an unconditional kill (as in tgsi_exec.c).
1059feffd259da5f2655222a2f26e2e5665a9e28173fBrian Paul * The only predication is the execution mask which will apply if
1060feffd259da5f2655222a2f26e2e5665a9e28173fBrian Paul * we're inside a loop or conditional.
1061feffd259da5f2655222a2f26e2e5665a9e28173fBrian Paul */
1062feffd259da5f2655222a2f26e2e5665a9e28173fBrian Paulstatic void
1063feffd259da5f2655222a2f26e2e5665a9e28173fBrian Paulemit_kilp(struct lp_build_tgsi_soa_context *bld,
106422ec25e2bf5c9309610b68e8e40472a8ea695ba9Keith Whitwell          const struct tgsi_full_instruction *inst,
106522ec25e2bf5c9309610b68e8e40472a8ea695ba9Keith Whitwell	  int pc)
1066feffd259da5f2655222a2f26e2e5665a9e28173fBrian Paul{
1067feffd259da5f2655222a2f26e2e5665a9e28173fBrian Paul   LLVMValueRef mask;
1068feffd259da5f2655222a2f26e2e5665a9e28173fBrian Paul
1069feffd259da5f2655222a2f26e2e5665a9e28173fBrian Paul   /* For those channels which are "alive", disable fragment shader
1070feffd259da5f2655222a2f26e2e5665a9e28173fBrian Paul    * execution.
1071feffd259da5f2655222a2f26e2e5665a9e28173fBrian Paul    */
1072feffd259da5f2655222a2f26e2e5665a9e28173fBrian Paul   if (bld->exec_mask.has_mask) {
1073feffd259da5f2655222a2f26e2e5665a9e28173fBrian Paul      mask = LLVMBuildNot(bld->base.builder, bld->exec_mask.exec_mask, "kilp");
1074feffd259da5f2655222a2f26e2e5665a9e28173fBrian Paul   }
1075feffd259da5f2655222a2f26e2e5665a9e28173fBrian Paul   else {
1076ec2824cd867d3b782588be1f3b1d5d802eb381abBrian Paul      LLVMValueRef zero = LLVMConstNull(bld->base.int_vec_type);
1077ec2824cd867d3b782588be1f3b1d5d802eb381abBrian Paul      mask = zero;
1078feffd259da5f2655222a2f26e2e5665a9e28173fBrian Paul   }
1079feffd259da5f2655222a2f26e2e5665a9e28173fBrian Paul
1080feffd259da5f2655222a2f26e2e5665a9e28173fBrian Paul   lp_build_mask_update(bld->mask, mask);
1081aa4cb5e2d8d48c7dcc9653c61a9e25494e3e7b2aKeith Whitwell
108222ec25e2bf5c9309610b68e8e40472a8ea695ba9Keith Whitwell   if (!near_end_of_shader(bld, pc))
108322ec25e2bf5c9309610b68e8e40472a8ea695ba9Keith Whitwell      lp_build_mask_check(bld->mask);
1084feffd259da5f2655222a2f26e2e5665a9e28173fBrian Paul}
1085feffd259da5f2655222a2f26e2e5665a9e28173fBrian Paul
1086e27983bc08d4eff5effbbcffbf5c9f5862fca2cfJosé Fonsecastatic void
108785c7ec70ad41c8ada75a4cbace83d16815d3e2c5Zack Rusinemit_declaration(
108885c7ec70ad41c8ada75a4cbace83d16815d3e2c5Zack Rusin   struct lp_build_tgsi_soa_context *bld,
108985c7ec70ad41c8ada75a4cbace83d16815d3e2c5Zack Rusin   const struct tgsi_full_declaration *decl)
109085c7ec70ad41c8ada75a4cbace83d16815d3e2c5Zack Rusin{
10916d173da5c84142ee64f56f4c2e9e495dc1435e91José Fonseca   LLVMTypeRef vec_type = bld->base.vec_type;
1092a18c210a95794c79c6f26dbf4c66d4a85e29169dJosé Fonseca
109385c7ec70ad41c8ada75a4cbace83d16815d3e2c5Zack Rusin   unsigned first = decl->Range.First;
109485c7ec70ad41c8ada75a4cbace83d16815d3e2c5Zack Rusin   unsigned last = decl->Range.Last;
109585c7ec70ad41c8ada75a4cbace83d16815d3e2c5Zack Rusin   unsigned idx, i;
109685c7ec70ad41c8ada75a4cbace83d16815d3e2c5Zack Rusin
109785c7ec70ad41c8ada75a4cbace83d16815d3e2c5Zack Rusin   for (idx = first; idx <= last; ++idx) {
10986d173da5c84142ee64f56f4c2e9e495dc1435e91José Fonseca      assert(last <= bld->info->file_max[decl->Declaration.File]);
109985c7ec70ad41c8ada75a4cbace83d16815d3e2c5Zack Rusin      switch (decl->Declaration.File) {
110085c7ec70ad41c8ada75a4cbace83d16815d3e2c5Zack Rusin      case TGSI_FILE_TEMPORARY:
11016c8c88f02f0dc9cf39ce51d068525a94fccd5dc7José Fonseca         assert(idx < LP_MAX_TGSI_TEMPS);
11023662afd87d61e3f65843b210a7e8c9c8a6cb27f0Brian Paul         if (bld->indirect_files & (1 << TGSI_FILE_TEMPORARY)) {
1103846b2fccc2a67b08acc6da51f4970fe66ed4559bBrian Paul            LLVMValueRef array_size = LLVMConstInt(LLVMInt32Type(),
1104846b2fccc2a67b08acc6da51f4970fe66ed4559bBrian Paul                                                   last*4 + 4, 0);
1105263e038431f24f24aaec252e135ffc9f2f09640eJosé Fonseca            bld->temps_array = lp_build_array_alloca(bld->base.builder,
11063ded3e98ffc36820c8ab318d736eab99bb16f26bBrian Paul                                                     vec_type, array_size, "temparray");
1107263e038431f24f24aaec252e135ffc9f2f09640eJosé Fonseca         } else {
1108021e0dc78b15fab29e761012860276c2597c8d8fZack Rusin            for (i = 0; i < NUM_CHANNELS; i++)
1109a18c210a95794c79c6f26dbf4c66d4a85e29169dJosé Fonseca               bld->temps[idx][i] = lp_build_alloca(bld->base.builder,
11103ded3e98ffc36820c8ab318d736eab99bb16f26bBrian Paul                                                    vec_type, "temp");
1111021e0dc78b15fab29e761012860276c2597c8d8fZack Rusin         }
111285c7ec70ad41c8ada75a4cbace83d16815d3e2c5Zack Rusin         break;
111385c7ec70ad41c8ada75a4cbace83d16815d3e2c5Zack Rusin
111485c7ec70ad41c8ada75a4cbace83d16815d3e2c5Zack Rusin      case TGSI_FILE_OUTPUT:
1115263e038431f24f24aaec252e135ffc9f2f09640eJosé Fonseca         for (i = 0; i < NUM_CHANNELS; i++)
1116263e038431f24f24aaec252e135ffc9f2f09640eJosé Fonseca            bld->outputs[idx][i] = lp_build_alloca(bld->base.builder,
11173ded3e98ffc36820c8ab318d736eab99bb16f26bBrian Paul                                                   vec_type, "output");
111885c7ec70ad41c8ada75a4cbace83d16815d3e2c5Zack Rusin         break;
111985c7ec70ad41c8ada75a4cbace83d16815d3e2c5Zack Rusin
1120ded2374e67bdc2c24e868775d2ff77b39b339d56Zack Rusin      case TGSI_FILE_ADDRESS:
11216c8c88f02f0dc9cf39ce51d068525a94fccd5dc7José Fonseca         assert(idx < LP_MAX_TGSI_ADDRS);
1122263e038431f24f24aaec252e135ffc9f2f09640eJosé Fonseca         for (i = 0; i < NUM_CHANNELS; i++)
1123263e038431f24f24aaec252e135ffc9f2f09640eJosé Fonseca            bld->addr[idx][i] = lp_build_alloca(bld->base.builder,
11243ded3e98ffc36820c8ab318d736eab99bb16f26bBrian Paul                                                vec_type, "addr");
1125ded2374e67bdc2c24e868775d2ff77b39b339d56Zack Rusin         break;
1126ded2374e67bdc2c24e868775d2ff77b39b339d56Zack Rusin
1127e27983bc08d4eff5effbbcffbf5c9f5862fca2cfJosé Fonseca      case TGSI_FILE_PREDICATE:
1128ff6c78f44f2f741f4825b07dbc15b3a951fe9b2cJosé Fonseca         assert(idx < LP_MAX_TGSI_PREDS);
1129263e038431f24f24aaec252e135ffc9f2f09640eJosé Fonseca         for (i = 0; i < NUM_CHANNELS; i++)
1130263e038431f24f24aaec252e135ffc9f2f09640eJosé Fonseca            bld->preds[idx][i] = lp_build_alloca(bld->base.builder,
11313ded3e98ffc36820c8ab318d736eab99bb16f26bBrian Paul                                                 vec_type, "predicate");
1132e27983bc08d4eff5effbbcffbf5c9f5862fca2cfJosé Fonseca         break;
1133e27983bc08d4eff5effbbcffbf5c9f5862fca2cfJosé Fonseca
113485c7ec70ad41c8ada75a4cbace83d16815d3e2c5Zack Rusin      default:
113585c7ec70ad41c8ada75a4cbace83d16815d3e2c5Zack Rusin         /* don't need to declare other vars */
1136dc886ba1391d7d890bd1f5532bc14553e883a418Zack Rusin         break;
1137012fabca722494162c244a367913562b8cfa4677Zack Rusin      }
113885c7ec70ad41c8ada75a4cbace83d16815d3e2c5Zack Rusin   }
113985c7ec70ad41c8ada75a4cbace83d16815d3e2c5Zack Rusin}
114063b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
1141fc9b8cd9dda946d8415732aeeed1eff5541cd1eeBrian Paul
1142fc9b8cd9dda946d8415732aeeed1eff5541cd1eeBrian Paul/**
1143fc9b8cd9dda946d8415732aeeed1eff5541cd1eeBrian Paul * Emit LLVM for one TGSI instruction.
1144fc9b8cd9dda946d8415732aeeed1eff5541cd1eeBrian Paul * \return TRUE for success, FALSE otherwise
1145fc9b8cd9dda946d8415732aeeed1eff5541cd1eeBrian Paul */
1146fc9b8cd9dda946d8415732aeeed1eff5541cd1eeBrian Paulstatic boolean
114763b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonsecaemit_instruction(
114863b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   struct lp_build_tgsi_soa_context *bld,
1149faec23387e035bcdd413b7364933d36a8ec22dbaJosé Fonseca   const struct tgsi_full_instruction *inst,
11500b7ca2f8fcb187fb3aa37e0b6dc4b0a84101478fZack Rusin   const struct tgsi_opcode_info *info,
11510b7ca2f8fcb187fb3aa37e0b6dc4b0a84101478fZack Rusin   int *pc)
115263b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca{
115363b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   unsigned chan_index;
115490e9a4d4f99e722d8f0f2050e134a3c69863541bJosé Fonseca   LLVMValueRef src0, src1, src2;
1155e049ddb7549a45adde521d6f2899c2b74b4ff972Vinson Lee   LLVMValueRef tmp0, tmp1, tmp2;
1156e049ddb7549a45adde521d6f2899c2b74b4ff972Vinson Lee   LLVMValueRef tmp3 = NULL;
1157e049ddb7549a45adde521d6f2899c2b74b4ff972Vinson Lee   LLVMValueRef tmp4 = NULL;
1158e049ddb7549a45adde521d6f2899c2b74b4ff972Vinson Lee   LLVMValueRef tmp5 = NULL;
1159e049ddb7549a45adde521d6f2899c2b74b4ff972Vinson Lee   LLVMValueRef tmp6 = NULL;
1160e049ddb7549a45adde521d6f2899c2b74b4ff972Vinson Lee   LLVMValueRef tmp7 = NULL;
1161faec23387e035bcdd413b7364933d36a8ec22dbaJosé Fonseca   LLVMValueRef res;
1162faec23387e035bcdd413b7364933d36a8ec22dbaJosé Fonseca   LLVMValueRef dst0[NUM_CHANNELS];
116363b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
116489258652b6a1d282bed14549907892bdfda752f0José Fonseca   /*
116589258652b6a1d282bed14549907892bdfda752f0José Fonseca    * Stores and write masks are handled in a general fashion after the long
116689258652b6a1d282bed14549907892bdfda752f0José Fonseca    * instruction opcode switch statement.
116789258652b6a1d282bed14549907892bdfda752f0José Fonseca    *
116889258652b6a1d282bed14549907892bdfda752f0José Fonseca    * Although not strictly necessary, we avoid generating instructions for
116989258652b6a1d282bed14549907892bdfda752f0José Fonseca    * channels which won't be stored, in cases where that's easy. For some
117089258652b6a1d282bed14549907892bdfda752f0José Fonseca    * complex instructions, like texture sampling, it is more convenient to
117189258652b6a1d282bed14549907892bdfda752f0José Fonseca    * assume a full writemask and then let LLVM optimization passes eliminate
117289258652b6a1d282bed14549907892bdfda752f0José Fonseca    * redundant code.
117389258652b6a1d282bed14549907892bdfda752f0José Fonseca    */
117489258652b6a1d282bed14549907892bdfda752f0José Fonseca
11750b7ca2f8fcb187fb3aa37e0b6dc4b0a84101478fZack Rusin   (*pc)++;
11760b7ca2f8fcb187fb3aa37e0b6dc4b0a84101478fZack Rusin
1177faec23387e035bcdd413b7364933d36a8ec22dbaJosé Fonseca   assert(info->num_dst <= 1);
1178ff6c78f44f2f741f4825b07dbc15b3a951fe9b2cJosé Fonseca   if (info->num_dst) {
1179faec23387e035bcdd413b7364933d36a8ec22dbaJosé Fonseca      FOR_EACH_DST0_ENABLED_CHANNEL( inst, chan_index ) {
1180faec23387e035bcdd413b7364933d36a8ec22dbaJosé Fonseca         dst0[chan_index] = bld->base.undef;
1181faec23387e035bcdd413b7364933d36a8ec22dbaJosé Fonseca      }
1182faec23387e035bcdd413b7364933d36a8ec22dbaJosé Fonseca   }
1183faec23387e035bcdd413b7364933d36a8ec22dbaJosé Fonseca
118463b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   switch (inst->Instruction.Opcode) {
118563b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   case TGSI_OPCODE_ARL:
11862fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca      FOR_EACH_DST0_ENABLED_CHANNEL( inst, chan_index ) {
11872fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca         tmp0 = emit_fetch( bld, inst, 0, chan_index );
1188ded2374e67bdc2c24e868775d2ff77b39b339d56Zack Rusin         tmp0 = lp_build_floor(&bld->base, tmp0);
1189faec23387e035bcdd413b7364933d36a8ec22dbaJosé Fonseca         dst0[chan_index] = tmp0;
119063b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      }
119163b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      break;
119263b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
119363b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   case TGSI_OPCODE_MOV:
11942fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca      FOR_EACH_DST0_ENABLED_CHANNEL( inst, chan_index ) {
1195faec23387e035bcdd413b7364933d36a8ec22dbaJosé Fonseca         dst0[chan_index] = emit_fetch( bld, inst, 0, chan_index );
119663b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      }
119763b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      break;
119863b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
119963b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   case TGSI_OPCODE_LIT:
12002fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca      if( IS_DST0_CHANNEL_ENABLED( inst, CHAN_X ) ) {
1201faec23387e035bcdd413b7364933d36a8ec22dbaJosé Fonseca         dst0[CHAN_X] = bld->base.one;
120263b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      }
12032fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca      if( IS_DST0_CHANNEL_ENABLED( inst, CHAN_Y ) ) {
12042fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca         src0 = emit_fetch( bld, inst, 0, CHAN_X );
1205faec23387e035bcdd413b7364933d36a8ec22dbaJosé Fonseca         dst0[CHAN_Y] = lp_build_max( &bld->base, src0, bld->base.zero);
1206ef1fddb36a91a3b272a3c74d104033cd99556cfaJosé Fonseca      }
12072fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca      if( IS_DST0_CHANNEL_ENABLED( inst, CHAN_Z ) ) {
1208ef1fddb36a91a3b272a3c74d104033cd99556cfaJosé Fonseca         /* XMM[1] = SrcReg[0].yyyy */
12092fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca         tmp1 = emit_fetch( bld, inst, 0, CHAN_Y );
1210ef1fddb36a91a3b272a3c74d104033cd99556cfaJosé Fonseca         /* XMM[1] = max(XMM[1], 0) */
1211ef1fddb36a91a3b272a3c74d104033cd99556cfaJosé Fonseca         tmp1 = lp_build_max( &bld->base, tmp1, bld->base.zero);
1212ef1fddb36a91a3b272a3c74d104033cd99556cfaJosé Fonseca         /* XMM[2] = SrcReg[0].wwww */
12132fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca         tmp2 = emit_fetch( bld, inst, 0, CHAN_W );
1214ef1fddb36a91a3b272a3c74d104033cd99556cfaJosé Fonseca         tmp1 = lp_build_pow( &bld->base, tmp1, tmp2);
12152fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca         tmp0 = emit_fetch( bld, inst, 0, CHAN_X );
1216c5abcac7ef7ebd0167093285b5fc9cf3829c1febJosé Fonseca         tmp2 = lp_build_cmp(&bld->base, PIPE_FUNC_GREATER, tmp0, bld->base.zero);
1217faec23387e035bcdd413b7364933d36a8ec22dbaJosé Fonseca         dst0[CHAN_Z] = lp_build_select(&bld->base, tmp2, tmp1, bld->base.zero);
1218c5abcac7ef7ebd0167093285b5fc9cf3829c1febJosé Fonseca      }
12192fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca      if( IS_DST0_CHANNEL_ENABLED( inst, CHAN_W ) ) {
1220faec23387e035bcdd413b7364933d36a8ec22dbaJosé Fonseca         dst0[CHAN_W] = bld->base.one;
122163b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      }
122263b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      break;
122363b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
122463b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   case TGSI_OPCODE_RCP:
122563b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   /* TGSI_OPCODE_RECIP */
12262fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca      src0 = emit_fetch( bld, inst, 0, CHAN_X );
1227faec23387e035bcdd413b7364933d36a8ec22dbaJosé Fonseca      res = lp_build_rcp(&bld->base, src0);
12282fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca      FOR_EACH_DST0_ENABLED_CHANNEL( inst, chan_index ) {
1229faec23387e035bcdd413b7364933d36a8ec22dbaJosé Fonseca         dst0[chan_index] = res;
123063b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      }
123163b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      break;
123263b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
123363b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   case TGSI_OPCODE_RSQ:
123463b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   /* TGSI_OPCODE_RECIPSQRT */
12352fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca      src0 = emit_fetch( bld, inst, 0, CHAN_X );
123690e9a4d4f99e722d8f0f2050e134a3c69863541bJosé Fonseca      src0 = lp_build_abs(&bld->base, src0);
1237faec23387e035bcdd413b7364933d36a8ec22dbaJosé Fonseca      res = lp_build_rsqrt(&bld->base, src0);
12382fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca      FOR_EACH_DST0_ENABLED_CHANNEL( inst, chan_index ) {
1239faec23387e035bcdd413b7364933d36a8ec22dbaJosé Fonseca         dst0[chan_index] = res;
124063b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      }
124163b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      break;
124263b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
124363b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   case TGSI_OPCODE_EXP:
12442fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca      if (IS_DST0_CHANNEL_ENABLED( inst, CHAN_X ) ||
12452fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca          IS_DST0_CHANNEL_ENABLED( inst, CHAN_Y ) ||
12462fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca          IS_DST0_CHANNEL_ENABLED( inst, CHAN_Z )) {
124757907e7fd9fc63b9023d0e2b08934c2d0acf2953José Fonseca         LLVMValueRef *p_exp2_int_part = NULL;
124857907e7fd9fc63b9023d0e2b08934c2d0acf2953José Fonseca         LLVMValueRef *p_frac_part = NULL;
124957907e7fd9fc63b9023d0e2b08934c2d0acf2953José Fonseca         LLVMValueRef *p_exp2 = NULL;
125057907e7fd9fc63b9023d0e2b08934c2d0acf2953José Fonseca
12512fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca         src0 = emit_fetch( bld, inst, 0, CHAN_X );
125257907e7fd9fc63b9023d0e2b08934c2d0acf2953José Fonseca
12532fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca         if (IS_DST0_CHANNEL_ENABLED( inst, CHAN_X ))
125457907e7fd9fc63b9023d0e2b08934c2d0acf2953José Fonseca            p_exp2_int_part = &tmp0;
12552fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca         if (IS_DST0_CHANNEL_ENABLED( inst, CHAN_Y ))
125657907e7fd9fc63b9023d0e2b08934c2d0acf2953José Fonseca            p_frac_part = &tmp1;
12572fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca         if (IS_DST0_CHANNEL_ENABLED( inst, CHAN_Z ))
125857907e7fd9fc63b9023d0e2b08934c2d0acf2953José Fonseca            p_exp2 = &tmp2;
125957907e7fd9fc63b9023d0e2b08934c2d0acf2953José Fonseca
126057907e7fd9fc63b9023d0e2b08934c2d0acf2953José Fonseca         lp_build_exp2_approx(&bld->base, src0, p_exp2_int_part, p_frac_part, p_exp2);
126157907e7fd9fc63b9023d0e2b08934c2d0acf2953José Fonseca
12622fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca         if (IS_DST0_CHANNEL_ENABLED( inst, CHAN_X ))
1263faec23387e035bcdd413b7364933d36a8ec22dbaJosé Fonseca            dst0[CHAN_X] = tmp0;
12642fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca         if (IS_DST0_CHANNEL_ENABLED( inst, CHAN_Y ))
1265faec23387e035bcdd413b7364933d36a8ec22dbaJosé Fonseca            dst0[CHAN_Y] = tmp1;
12662fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca         if (IS_DST0_CHANNEL_ENABLED( inst, CHAN_Z ))
1267faec23387e035bcdd413b7364933d36a8ec22dbaJosé Fonseca            dst0[CHAN_Z] = tmp2;
126863b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      }
126963b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      /* dst.w = 1.0 */
12702fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca      if (IS_DST0_CHANNEL_ENABLED( inst, CHAN_W )) {
1271faec23387e035bcdd413b7364933d36a8ec22dbaJosé Fonseca         dst0[CHAN_W] = bld->base.one;
127263b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      }
127363b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      break;
127463b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
127563b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   case TGSI_OPCODE_LOG:
12762fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca      if (IS_DST0_CHANNEL_ENABLED( inst, CHAN_X ) ||
12772fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca          IS_DST0_CHANNEL_ENABLED( inst, CHAN_Y ) ||
12782fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca          IS_DST0_CHANNEL_ENABLED( inst, CHAN_Z )) {
1279add6dfbba64260c9b314b4a95c8def084e05bd3bVinson Lee         LLVMValueRef *p_floor_log2 = NULL;
1280add6dfbba64260c9b314b4a95c8def084e05bd3bVinson Lee         LLVMValueRef *p_exp = NULL;
1281add6dfbba64260c9b314b4a95c8def084e05bd3bVinson Lee         LLVMValueRef *p_log2 = NULL;
128257907e7fd9fc63b9023d0e2b08934c2d0acf2953José Fonseca
12832fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca         src0 = emit_fetch( bld, inst, 0, CHAN_X );
128457907e7fd9fc63b9023d0e2b08934c2d0acf2953José Fonseca         src0 = lp_build_abs( &bld->base, src0 );
128557907e7fd9fc63b9023d0e2b08934c2d0acf2953José Fonseca
12862fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca         if (IS_DST0_CHANNEL_ENABLED( inst, CHAN_X ))
128757907e7fd9fc63b9023d0e2b08934c2d0acf2953José Fonseca            p_floor_log2 = &tmp0;
12882fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca         if (IS_DST0_CHANNEL_ENABLED( inst, CHAN_Y ))
128957907e7fd9fc63b9023d0e2b08934c2d0acf2953José Fonseca            p_exp = &tmp1;
12902fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca         if (IS_DST0_CHANNEL_ENABLED( inst, CHAN_Z ))
129157907e7fd9fc63b9023d0e2b08934c2d0acf2953José Fonseca            p_log2 = &tmp2;
129257907e7fd9fc63b9023d0e2b08934c2d0acf2953José Fonseca
129357907e7fd9fc63b9023d0e2b08934c2d0acf2953José Fonseca         lp_build_log2_approx(&bld->base, src0, p_exp, p_floor_log2, p_log2);
129457907e7fd9fc63b9023d0e2b08934c2d0acf2953José Fonseca
129557907e7fd9fc63b9023d0e2b08934c2d0acf2953José Fonseca         /* dst.x = floor(lg2(abs(src.x))) */
12962fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca         if (IS_DST0_CHANNEL_ENABLED( inst, CHAN_X ))
1297faec23387e035bcdd413b7364933d36a8ec22dbaJosé Fonseca            dst0[CHAN_X] = tmp0;
129857907e7fd9fc63b9023d0e2b08934c2d0acf2953José Fonseca         /* dst.y = abs(src)/ex2(floor(lg2(abs(src.x)))) */
12992fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca         if (IS_DST0_CHANNEL_ENABLED( inst, CHAN_Y )) {
1300faec23387e035bcdd413b7364933d36a8ec22dbaJosé Fonseca            dst0[CHAN_Y] = lp_build_div( &bld->base, src0, tmp1);
130163b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca         }
130257907e7fd9fc63b9023d0e2b08934c2d0acf2953José Fonseca         /* dst.z = lg2(abs(src.x)) */
13032fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca         if (IS_DST0_CHANNEL_ENABLED( inst, CHAN_Z ))
1304faec23387e035bcdd413b7364933d36a8ec22dbaJosé Fonseca            dst0[CHAN_Z] = tmp2;
130563b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      }
130663b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      /* dst.w = 1.0 */
13072fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca      if (IS_DST0_CHANNEL_ENABLED( inst, CHAN_W )) {
1308faec23387e035bcdd413b7364933d36a8ec22dbaJosé Fonseca         dst0[CHAN_W] = bld->base.one;
130963b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      }
131063b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      break;
131163b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
131263b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   case TGSI_OPCODE_MUL:
13132fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca      FOR_EACH_DST0_ENABLED_CHANNEL( inst, chan_index ) {
13142fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca         src0 = emit_fetch( bld, inst, 0, chan_index );
13152fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca         src1 = emit_fetch( bld, inst, 1, chan_index );
1316faec23387e035bcdd413b7364933d36a8ec22dbaJosé Fonseca         dst0[chan_index] = lp_build_mul(&bld->base, src0, src1);
131763b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      }
131863b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      break;
131963b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
132063b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   case TGSI_OPCODE_ADD:
13212fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca      FOR_EACH_DST0_ENABLED_CHANNEL( inst, chan_index ) {
13222fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca         src0 = emit_fetch( bld, inst, 0, chan_index );
13232fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca         src1 = emit_fetch( bld, inst, 1, chan_index );
1324faec23387e035bcdd413b7364933d36a8ec22dbaJosé Fonseca         dst0[chan_index] = lp_build_add(&bld->base, src0, src1);
132563b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      }
132663b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      break;
132763b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
132863b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   case TGSI_OPCODE_DP3:
132963b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   /* TGSI_OPCODE_DOT3 */
13302fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca      tmp0 = emit_fetch( bld, inst, 0, CHAN_X );
13312fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca      tmp1 = emit_fetch( bld, inst, 1, CHAN_X );
133290e9a4d4f99e722d8f0f2050e134a3c69863541bJosé Fonseca      tmp0 = lp_build_mul( &bld->base, tmp0, tmp1);
13332fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca      tmp1 = emit_fetch( bld, inst, 0, CHAN_Y );
13342fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca      tmp2 = emit_fetch( bld, inst, 1, CHAN_Y );
133590e9a4d4f99e722d8f0f2050e134a3c69863541bJosé Fonseca      tmp1 = lp_build_mul( &bld->base, tmp1, tmp2);
133690e9a4d4f99e722d8f0f2050e134a3c69863541bJosé Fonseca      tmp0 = lp_build_add( &bld->base, tmp0, tmp1);
13372fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca      tmp1 = emit_fetch( bld, inst, 0, CHAN_Z );
13382fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca      tmp2 = emit_fetch( bld, inst, 1, CHAN_Z );
133990e9a4d4f99e722d8f0f2050e134a3c69863541bJosé Fonseca      tmp1 = lp_build_mul( &bld->base, tmp1, tmp2);
134090e9a4d4f99e722d8f0f2050e134a3c69863541bJosé Fonseca      tmp0 = lp_build_add( &bld->base, tmp0, tmp1);
13412fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca      FOR_EACH_DST0_ENABLED_CHANNEL( inst, chan_index ) {
1342faec23387e035bcdd413b7364933d36a8ec22dbaJosé Fonseca         dst0[chan_index] = tmp0;
134363b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      }
134463b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      break;
134563b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
134663b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   case TGSI_OPCODE_DP4:
134763b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   /* TGSI_OPCODE_DOT4 */
13482fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca      tmp0 = emit_fetch( bld, inst, 0, CHAN_X );
13492fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca      tmp1 = emit_fetch( bld, inst, 1, CHAN_X );
135090e9a4d4f99e722d8f0f2050e134a3c69863541bJosé Fonseca      tmp0 = lp_build_mul( &bld->base, tmp0, tmp1);
13512fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca      tmp1 = emit_fetch( bld, inst, 0, CHAN_Y );
13522fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca      tmp2 = emit_fetch( bld, inst, 1, CHAN_Y );
135390e9a4d4f99e722d8f0f2050e134a3c69863541bJosé Fonseca      tmp1 = lp_build_mul( &bld->base, tmp1, tmp2);
135490e9a4d4f99e722d8f0f2050e134a3c69863541bJosé Fonseca      tmp0 = lp_build_add( &bld->base, tmp0, tmp1);
13552fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca      tmp1 = emit_fetch( bld, inst, 0, CHAN_Z );
13562fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca      tmp2 = emit_fetch( bld, inst, 1, CHAN_Z );
135790e9a4d4f99e722d8f0f2050e134a3c69863541bJosé Fonseca      tmp1 = lp_build_mul( &bld->base, tmp1, tmp2);
135890e9a4d4f99e722d8f0f2050e134a3c69863541bJosé Fonseca      tmp0 = lp_build_add( &bld->base, tmp0, tmp1);
13592fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca      tmp1 = emit_fetch( bld, inst, 0, CHAN_W );
13602fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca      tmp2 = emit_fetch( bld, inst, 1, CHAN_W );
136190e9a4d4f99e722d8f0f2050e134a3c69863541bJosé Fonseca      tmp1 = lp_build_mul( &bld->base, tmp1, tmp2);
136290e9a4d4f99e722d8f0f2050e134a3c69863541bJosé Fonseca      tmp0 = lp_build_add( &bld->base, tmp0, tmp1);
13632fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca      FOR_EACH_DST0_ENABLED_CHANNEL( inst, chan_index ) {
1364faec23387e035bcdd413b7364933d36a8ec22dbaJosé Fonseca         dst0[chan_index] = tmp0;
136563b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      }
136663b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      break;
136763b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
136863b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   case TGSI_OPCODE_DST:
13692fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca      IF_IS_DST0_CHANNEL_ENABLED( inst, CHAN_X ) {
1370faec23387e035bcdd413b7364933d36a8ec22dbaJosé Fonseca         dst0[CHAN_X] = bld->base.one;
137163b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      }
13722fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca      IF_IS_DST0_CHANNEL_ENABLED( inst, CHAN_Y ) {
13732fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca         tmp0 = emit_fetch( bld, inst, 0, CHAN_Y );
13742fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca         tmp1 = emit_fetch( bld, inst, 1, CHAN_Y );
1375faec23387e035bcdd413b7364933d36a8ec22dbaJosé Fonseca         dst0[CHAN_Y] = lp_build_mul( &bld->base, tmp0, tmp1);
137663b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      }
13772fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca      IF_IS_DST0_CHANNEL_ENABLED( inst, CHAN_Z ) {
1378faec23387e035bcdd413b7364933d36a8ec22dbaJosé Fonseca         dst0[CHAN_Z] = emit_fetch( bld, inst, 0, CHAN_Z );
137963b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      }
13802fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca      IF_IS_DST0_CHANNEL_ENABLED( inst, CHAN_W ) {
1381faec23387e035bcdd413b7364933d36a8ec22dbaJosé Fonseca         dst0[CHAN_W] = emit_fetch( bld, inst, 1, CHAN_W );
138263b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      }
138363b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      break;
138463b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
138563b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   case TGSI_OPCODE_MIN:
13862fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca      FOR_EACH_DST0_ENABLED_CHANNEL( inst, chan_index ) {
13872fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca         src0 = emit_fetch( bld, inst, 0, chan_index );
13882fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca         src1 = emit_fetch( bld, inst, 1, chan_index );
1389faec23387e035bcdd413b7364933d36a8ec22dbaJosé Fonseca         dst0[chan_index] = lp_build_min( &bld->base, src0, src1 );
139063b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      }
139163b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      break;
139263b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
139363b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   case TGSI_OPCODE_MAX:
13942fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca      FOR_EACH_DST0_ENABLED_CHANNEL( inst, chan_index ) {
13952fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca         src0 = emit_fetch( bld, inst, 0, chan_index );
13962fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca         src1 = emit_fetch( bld, inst, 1, chan_index );
1397faec23387e035bcdd413b7364933d36a8ec22dbaJosé Fonseca         dst0[chan_index] = lp_build_max( &bld->base, src0, src1 );
139863b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      }
139963b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      break;
140063b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
140163b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   case TGSI_OPCODE_SLT:
140263b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   /* TGSI_OPCODE_SETLT */
14032fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca      FOR_EACH_DST0_ENABLED_CHANNEL( inst, chan_index ) {
14042fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca         src0 = emit_fetch( bld, inst, 0, chan_index );
14052fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca         src1 = emit_fetch( bld, inst, 1, chan_index );
14061aae039ee279f8ad300919d8af0fc4691ca2f514José Fonseca         tmp0 = lp_build_cmp( &bld->base, PIPE_FUNC_LESS, src0, src1 );
1407faec23387e035bcdd413b7364933d36a8ec22dbaJosé Fonseca         dst0[chan_index] = lp_build_select( &bld->base, tmp0, bld->base.one, bld->base.zero );
14081aae039ee279f8ad300919d8af0fc4691ca2f514José Fonseca      }
140963b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      break;
141063b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
141163b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   case TGSI_OPCODE_SGE:
141263b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   /* TGSI_OPCODE_SETGE */
14132fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca      FOR_EACH_DST0_ENABLED_CHANNEL( inst, chan_index ) {
14142fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca         src0 = emit_fetch( bld, inst, 0, chan_index );
14152fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca         src1 = emit_fetch( bld, inst, 1, chan_index );
14161aae039ee279f8ad300919d8af0fc4691ca2f514José Fonseca         tmp0 = lp_build_cmp( &bld->base, PIPE_FUNC_GEQUAL, src0, src1 );
1417faec23387e035bcdd413b7364933d36a8ec22dbaJosé Fonseca         dst0[chan_index] = lp_build_select( &bld->base, tmp0, bld->base.one, bld->base.zero );
14181aae039ee279f8ad300919d8af0fc4691ca2f514José Fonseca      }
141963b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      break;
142063b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
142163b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   case TGSI_OPCODE_MAD:
142263b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   /* TGSI_OPCODE_MADD */
14232fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca      FOR_EACH_DST0_ENABLED_CHANNEL( inst, chan_index ) {
14242fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca         tmp0 = emit_fetch( bld, inst, 0, chan_index );
14252fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca         tmp1 = emit_fetch( bld, inst, 1, chan_index );
14262fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca         tmp2 = emit_fetch( bld, inst, 2, chan_index );
142790e9a4d4f99e722d8f0f2050e134a3c69863541bJosé Fonseca         tmp0 = lp_build_mul( &bld->base, tmp0, tmp1);
142890e9a4d4f99e722d8f0f2050e134a3c69863541bJosé Fonseca         tmp0 = lp_build_add( &bld->base, tmp0, tmp2);
1429faec23387e035bcdd413b7364933d36a8ec22dbaJosé Fonseca         dst0[chan_index] = tmp0;
143063b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      }
143163b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      break;
143263b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
143363b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   case TGSI_OPCODE_SUB:
14342fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca      FOR_EACH_DST0_ENABLED_CHANNEL( inst, chan_index ) {
14352fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca         tmp0 = emit_fetch( bld, inst, 0, chan_index );
14362fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca         tmp1 = emit_fetch( bld, inst, 1, chan_index );
1437faec23387e035bcdd413b7364933d36a8ec22dbaJosé Fonseca         dst0[chan_index] = lp_build_sub( &bld->base, tmp0, tmp1);
143863b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      }
143963b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      break;
144063b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
144163b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   case TGSI_OPCODE_LRP:
14422fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca      FOR_EACH_DST0_ENABLED_CHANNEL( inst, chan_index ) {
14432fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca         src0 = emit_fetch( bld, inst, 0, chan_index );
14442fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca         src1 = emit_fetch( bld, inst, 1, chan_index );
14452fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca         src2 = emit_fetch( bld, inst, 2, chan_index );
144690e9a4d4f99e722d8f0f2050e134a3c69863541bJosé Fonseca         tmp0 = lp_build_sub( &bld->base, src1, src2 );
144790e9a4d4f99e722d8f0f2050e134a3c69863541bJosé Fonseca         tmp0 = lp_build_mul( &bld->base, src0, tmp0 );
1448faec23387e035bcdd413b7364933d36a8ec22dbaJosé Fonseca         dst0[chan_index] = lp_build_add( &bld->base, tmp0, src2 );
144963b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      }
145063b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      break;
145163b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
145263b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   case TGSI_OPCODE_CND:
1453873773ee2b034e8df72ddfacc764915b8a76ebe2José Fonseca      FOR_EACH_DST0_ENABLED_CHANNEL( inst, chan_index ) {
1454873773ee2b034e8df72ddfacc764915b8a76ebe2José Fonseca         src0 = emit_fetch( bld, inst, 0, chan_index );
1455873773ee2b034e8df72ddfacc764915b8a76ebe2José Fonseca         src1 = emit_fetch( bld, inst, 1, chan_index );
1456873773ee2b034e8df72ddfacc764915b8a76ebe2José Fonseca         src2 = emit_fetch( bld, inst, 2, chan_index );
1457185be3a87a5b38e8821a560c073975c11dcbd3e9Brian Paul         tmp1 = lp_build_const_vec(bld->base.type, 0.5);
1458873773ee2b034e8df72ddfacc764915b8a76ebe2José Fonseca         tmp0 = lp_build_cmp( &bld->base, PIPE_FUNC_GREATER, src2, tmp1);
1459faec23387e035bcdd413b7364933d36a8ec22dbaJosé Fonseca         dst0[chan_index] = lp_build_select( &bld->base, tmp0, src0, src1 );
1460873773ee2b034e8df72ddfacc764915b8a76ebe2José Fonseca      }
146163b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      break;
146263b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
146363b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   case TGSI_OPCODE_DP2A:
14642fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca      tmp0 = emit_fetch( bld, inst, 0, CHAN_X );  /* xmm0 = src[0].x */
14652fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca      tmp1 = emit_fetch( bld, inst, 1, CHAN_X );  /* xmm1 = src[1].x */
146690e9a4d4f99e722d8f0f2050e134a3c69863541bJosé Fonseca      tmp0 = lp_build_mul( &bld->base, tmp0, tmp1);              /* xmm0 = xmm0 * xmm1 */
14672fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca      tmp1 = emit_fetch( bld, inst, 0, CHAN_Y );  /* xmm1 = src[0].y */
14682fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca      tmp2 = emit_fetch( bld, inst, 1, CHAN_Y );  /* xmm2 = src[1].y */
146990e9a4d4f99e722d8f0f2050e134a3c69863541bJosé Fonseca      tmp1 = lp_build_mul( &bld->base, tmp1, tmp2);              /* xmm1 = xmm1 * xmm2 */
147090e9a4d4f99e722d8f0f2050e134a3c69863541bJosé Fonseca      tmp0 = lp_build_add( &bld->base, tmp0, tmp1);              /* xmm0 = xmm0 + xmm1 */
14712fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca      tmp1 = emit_fetch( bld, inst, 2, CHAN_X );  /* xmm1 = src[2].x */
147290e9a4d4f99e722d8f0f2050e134a3c69863541bJosé Fonseca      tmp0 = lp_build_add( &bld->base, tmp0, tmp1);              /* xmm0 = xmm0 + xmm1 */
14732fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca      FOR_EACH_DST0_ENABLED_CHANNEL( inst, chan_index ) {
1474faec23387e035bcdd413b7364933d36a8ec22dbaJosé Fonseca         dst0[chan_index] = tmp0;  /* dest[ch] = xmm0 */
147563b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      }
147663b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      break;
147763b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
147863b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   case TGSI_OPCODE_FRC:
14792fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca      FOR_EACH_DST0_ENABLED_CHANNEL( inst, chan_index ) {
1480873773ee2b034e8df72ddfacc764915b8a76ebe2José Fonseca         src0 = emit_fetch( bld, inst, 0, chan_index );
1481873773ee2b034e8df72ddfacc764915b8a76ebe2José Fonseca         tmp0 = lp_build_floor(&bld->base, src0);
1482f1f49bd465b899d1c85aa07650ca5b62a50303b0Brian Paul         tmp0 = lp_build_sub(&bld->base, src0, tmp0);
1483faec23387e035bcdd413b7364933d36a8ec22dbaJosé Fonseca         dst0[chan_index] = tmp0;
148463b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      }
148563b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      break;
148663b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
148763b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   case TGSI_OPCODE_CLAMP:
1488873773ee2b034e8df72ddfacc764915b8a76ebe2José Fonseca      FOR_EACH_DST0_ENABLED_CHANNEL( inst, chan_index ) {
1489873773ee2b034e8df72ddfacc764915b8a76ebe2José Fonseca         tmp0 = emit_fetch( bld, inst, 0, chan_index );
1490873773ee2b034e8df72ddfacc764915b8a76ebe2José Fonseca         src1 = emit_fetch( bld, inst, 1, chan_index );
1491873773ee2b034e8df72ddfacc764915b8a76ebe2José Fonseca         src2 = emit_fetch( bld, inst, 2, chan_index );
1492873773ee2b034e8df72ddfacc764915b8a76ebe2José Fonseca         tmp0 = lp_build_max(&bld->base, tmp0, src1);
1493873773ee2b034e8df72ddfacc764915b8a76ebe2José Fonseca         tmp0 = lp_build_min(&bld->base, tmp0, src2);
1494faec23387e035bcdd413b7364933d36a8ec22dbaJosé Fonseca         dst0[chan_index] = tmp0;
1495873773ee2b034e8df72ddfacc764915b8a76ebe2José Fonseca      }
149663b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      break;
149763b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
149863b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   case TGSI_OPCODE_FLR:
14992fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca      FOR_EACH_DST0_ENABLED_CHANNEL( inst, chan_index ) {
15002fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca         tmp0 = emit_fetch( bld, inst, 0, chan_index );
1501faec23387e035bcdd413b7364933d36a8ec22dbaJosé Fonseca         dst0[chan_index] = lp_build_floor(&bld->base, tmp0);
150263b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      }
150363b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      break;
150463b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
150563b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   case TGSI_OPCODE_ROUND:
15062fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca      FOR_EACH_DST0_ENABLED_CHANNEL( inst, chan_index ) {
15072fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca         tmp0 = emit_fetch( bld, inst, 0, chan_index );
1508faec23387e035bcdd413b7364933d36a8ec22dbaJosé Fonseca         dst0[chan_index] = lp_build_round(&bld->base, tmp0);
150963b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      }
151063b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      break;
151163b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
151290e9a4d4f99e722d8f0f2050e134a3c69863541bJosé Fonseca   case TGSI_OPCODE_EX2: {
15132fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca      tmp0 = emit_fetch( bld, inst, 0, CHAN_X );
151490e9a4d4f99e722d8f0f2050e134a3c69863541bJosé Fonseca      tmp0 = lp_build_exp2( &bld->base, tmp0);
15152fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca      FOR_EACH_DST0_ENABLED_CHANNEL( inst, chan_index ) {
1516faec23387e035bcdd413b7364933d36a8ec22dbaJosé Fonseca         dst0[chan_index] = tmp0;
151763b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      }
151863b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      break;
151990e9a4d4f99e722d8f0f2050e134a3c69863541bJosé Fonseca   }
152063b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
152163b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   case TGSI_OPCODE_LG2:
15222fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca      tmp0 = emit_fetch( bld, inst, 0, CHAN_X );
152390e9a4d4f99e722d8f0f2050e134a3c69863541bJosé Fonseca      tmp0 = lp_build_log2( &bld->base, tmp0);
15242fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca      FOR_EACH_DST0_ENABLED_CHANNEL( inst, chan_index ) {
1525faec23387e035bcdd413b7364933d36a8ec22dbaJosé Fonseca         dst0[chan_index] = tmp0;
152663b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      }
152763b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      break;
152863b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
152963b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   case TGSI_OPCODE_POW:
15302fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca      src0 = emit_fetch( bld, inst, 0, CHAN_X );
15312fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca      src1 = emit_fetch( bld, inst, 1, CHAN_X );
1532faec23387e035bcdd413b7364933d36a8ec22dbaJosé Fonseca      res = lp_build_pow( &bld->base, src0, src1 );
15332fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca      FOR_EACH_DST0_ENABLED_CHANNEL( inst, chan_index ) {
1534faec23387e035bcdd413b7364933d36a8ec22dbaJosé Fonseca         dst0[chan_index] = res;
153563b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      }
153663b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      break;
153763b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
153863b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   case TGSI_OPCODE_XPD:
15392fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca      if( IS_DST0_CHANNEL_ENABLED( inst, CHAN_X ) ||
15402fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca          IS_DST0_CHANNEL_ENABLED( inst, CHAN_Y ) ) {
15412fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca         tmp1 = emit_fetch( bld, inst, 1, CHAN_Z );
15422fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca         tmp3 = emit_fetch( bld, inst, 0, CHAN_Z );
154363b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      }
15442fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca      if( IS_DST0_CHANNEL_ENABLED( inst, CHAN_X ) ||
15452fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca          IS_DST0_CHANNEL_ENABLED( inst, CHAN_Z ) ) {
15462fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca         tmp0 = emit_fetch( bld, inst, 0, CHAN_Y );
15472fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca         tmp4 = emit_fetch( bld, inst, 1, CHAN_Y );
154863b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      }
15492fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca      IF_IS_DST0_CHANNEL_ENABLED( inst, CHAN_X ) {
155090e9a4d4f99e722d8f0f2050e134a3c69863541bJosé Fonseca         tmp2 = tmp0;
155190e9a4d4f99e722d8f0f2050e134a3c69863541bJosé Fonseca         tmp2 = lp_build_mul( &bld->base, tmp2, tmp1);
155290e9a4d4f99e722d8f0f2050e134a3c69863541bJosé Fonseca         tmp5 = tmp3;
155390e9a4d4f99e722d8f0f2050e134a3c69863541bJosé Fonseca         tmp5 = lp_build_mul( &bld->base, tmp5, tmp4);
155490e9a4d4f99e722d8f0f2050e134a3c69863541bJosé Fonseca         tmp2 = lp_build_sub( &bld->base, tmp2, tmp5);
1555faec23387e035bcdd413b7364933d36a8ec22dbaJosé Fonseca         dst0[CHAN_X] = tmp2;
155663b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      }
15572fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca      if( IS_DST0_CHANNEL_ENABLED( inst, CHAN_Y ) ||
15582fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca          IS_DST0_CHANNEL_ENABLED( inst, CHAN_Z ) ) {
15592fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca         tmp2 = emit_fetch( bld, inst, 1, CHAN_X );
15602fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca         tmp5 = emit_fetch( bld, inst, 0, CHAN_X );
156163b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      }
15622fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca      IF_IS_DST0_CHANNEL_ENABLED( inst, CHAN_Y ) {
156390e9a4d4f99e722d8f0f2050e134a3c69863541bJosé Fonseca         tmp3 = lp_build_mul( &bld->base, tmp3, tmp2);
156490e9a4d4f99e722d8f0f2050e134a3c69863541bJosé Fonseca         tmp1 = lp_build_mul( &bld->base, tmp1, tmp5);
156590e9a4d4f99e722d8f0f2050e134a3c69863541bJosé Fonseca         tmp3 = lp_build_sub( &bld->base, tmp3, tmp1);
1566faec23387e035bcdd413b7364933d36a8ec22dbaJosé Fonseca         dst0[CHAN_Y] = tmp3;
156763b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      }
15682fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca      IF_IS_DST0_CHANNEL_ENABLED( inst, CHAN_Z ) {
156990e9a4d4f99e722d8f0f2050e134a3c69863541bJosé Fonseca         tmp5 = lp_build_mul( &bld->base, tmp5, tmp4);
157090e9a4d4f99e722d8f0f2050e134a3c69863541bJosé Fonseca         tmp0 = lp_build_mul( &bld->base, tmp0, tmp2);
157190e9a4d4f99e722d8f0f2050e134a3c69863541bJosé Fonseca         tmp5 = lp_build_sub( &bld->base, tmp5, tmp0);
1572faec23387e035bcdd413b7364933d36a8ec22dbaJosé Fonseca         dst0[CHAN_Z] = tmp5;
157363b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      }
15742fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca      IF_IS_DST0_CHANNEL_ENABLED( inst, CHAN_W ) {
1575faec23387e035bcdd413b7364933d36a8ec22dbaJosé Fonseca         dst0[CHAN_W] = bld->base.one;
157663b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      }
157763b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      break;
157863b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
157963b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   case TGSI_OPCODE_ABS:
15802fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca      FOR_EACH_DST0_ENABLED_CHANNEL( inst, chan_index ) {
15812fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca         tmp0 = emit_fetch( bld, inst, 0, chan_index );
1582faec23387e035bcdd413b7364933d36a8ec22dbaJosé Fonseca         dst0[chan_index] = lp_build_abs( &bld->base, tmp0 );
158363b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      }
158463b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      break;
158563b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
158663b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   case TGSI_OPCODE_RCC:
1587873773ee2b034e8df72ddfacc764915b8a76ebe2José Fonseca      /* deprecated? */
1588873773ee2b034e8df72ddfacc764915b8a76ebe2José Fonseca      assert(0);
1589fc9b8cd9dda946d8415732aeeed1eff5541cd1eeBrian Paul      return FALSE;
159063b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
159163b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   case TGSI_OPCODE_DPH:
15922fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca      tmp0 = emit_fetch( bld, inst, 0, CHAN_X );
15932fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca      tmp1 = emit_fetch( bld, inst, 1, CHAN_X );
159490e9a4d4f99e722d8f0f2050e134a3c69863541bJosé Fonseca      tmp0 = lp_build_mul( &bld->base, tmp0, tmp1);
15952fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca      tmp1 = emit_fetch( bld, inst, 0, CHAN_Y );
15962fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca      tmp2 = emit_fetch( bld, inst, 1, CHAN_Y );
159790e9a4d4f99e722d8f0f2050e134a3c69863541bJosé Fonseca      tmp1 = lp_build_mul( &bld->base, tmp1, tmp2);
159890e9a4d4f99e722d8f0f2050e134a3c69863541bJosé Fonseca      tmp0 = lp_build_add( &bld->base, tmp0, tmp1);
15992fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca      tmp1 = emit_fetch( bld, inst, 0, CHAN_Z );
16002fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca      tmp2 = emit_fetch( bld, inst, 1, CHAN_Z );
160190e9a4d4f99e722d8f0f2050e134a3c69863541bJosé Fonseca      tmp1 = lp_build_mul( &bld->base, tmp1, tmp2);
160290e9a4d4f99e722d8f0f2050e134a3c69863541bJosé Fonseca      tmp0 = lp_build_add( &bld->base, tmp0, tmp1);
16032fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca      tmp1 = emit_fetch( bld, inst, 1, CHAN_W );
160490e9a4d4f99e722d8f0f2050e134a3c69863541bJosé Fonseca      tmp0 = lp_build_add( &bld->base, tmp0, tmp1);
16052fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca      FOR_EACH_DST0_ENABLED_CHANNEL( inst, chan_index ) {
1606faec23387e035bcdd413b7364933d36a8ec22dbaJosé Fonseca         dst0[chan_index] = tmp0;
160763b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      }
160863b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      break;
160963b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
161063b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   case TGSI_OPCODE_COS:
16112fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca      tmp0 = emit_fetch( bld, inst, 0, CHAN_X );
161290e9a4d4f99e722d8f0f2050e134a3c69863541bJosé Fonseca      tmp0 = lp_build_cos( &bld->base, tmp0 );
16132fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca      FOR_EACH_DST0_ENABLED_CHANNEL( inst, chan_index ) {
1614faec23387e035bcdd413b7364933d36a8ec22dbaJosé Fonseca         dst0[chan_index] = tmp0;
161563b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      }
161663b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      break;
161763b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
161863b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   case TGSI_OPCODE_DDX:
161986226d5ea186d3fc6013bc40a341e0c0a891de39José Fonseca      FOR_EACH_DST0_ENABLED_CHANNEL( inst, chan_index ) {
162086226d5ea186d3fc6013bc40a341e0c0a891de39José Fonseca         emit_fetch_deriv( bld, inst, 0, chan_index, NULL, &dst0[chan_index], NULL);
162186226d5ea186d3fc6013bc40a341e0c0a891de39José Fonseca      }
162263b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      break;
162363b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
162463b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   case TGSI_OPCODE_DDY:
162586226d5ea186d3fc6013bc40a341e0c0a891de39José Fonseca      FOR_EACH_DST0_ENABLED_CHANNEL( inst, chan_index ) {
162686226d5ea186d3fc6013bc40a341e0c0a891de39José Fonseca         emit_fetch_deriv( bld, inst, 0, chan_index, NULL, NULL, &dst0[chan_index]);
162786226d5ea186d3fc6013bc40a341e0c0a891de39José Fonseca      }
162863b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      break;
162963b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
163063b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   case TGSI_OPCODE_KILP:
163163b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      /* predicated kill */
163222ec25e2bf5c9309610b68e8e40472a8ea695ba9Keith Whitwell      emit_kilp( bld, inst, (*pc)-1 );
163363b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      break;
163463b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
163563b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   case TGSI_OPCODE_KIL:
163663b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      /* conditional kill */
163722ec25e2bf5c9309610b68e8e40472a8ea695ba9Keith Whitwell      emit_kil( bld, inst, (*pc)-1 );
163863b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      break;
163963b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
164063b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   case TGSI_OPCODE_PK2H:
1641fc9b8cd9dda946d8415732aeeed1eff5541cd1eeBrian Paul      return FALSE;
164263b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      break;
164363b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
164463b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   case TGSI_OPCODE_PK2US:
1645fc9b8cd9dda946d8415732aeeed1eff5541cd1eeBrian Paul      return FALSE;
164663b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      break;
164763b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
164863b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   case TGSI_OPCODE_PK4B:
1649fc9b8cd9dda946d8415732aeeed1eff5541cd1eeBrian Paul      return FALSE;
165063b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      break;
165163b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
165263b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   case TGSI_OPCODE_PK4UB:
1653fc9b8cd9dda946d8415732aeeed1eff5541cd1eeBrian Paul      return FALSE;
165463b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      break;
165563b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
165663b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   case TGSI_OPCODE_RFL:
1657fc9b8cd9dda946d8415732aeeed1eff5541cd1eeBrian Paul      return FALSE;
165863b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      break;
165963b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
166063b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   case TGSI_OPCODE_SEQ:
16612fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca      FOR_EACH_DST0_ENABLED_CHANNEL( inst, chan_index ) {
16622fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca         src0 = emit_fetch( bld, inst, 0, chan_index );
16632fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca         src1 = emit_fetch( bld, inst, 1, chan_index );
16641aae039ee279f8ad300919d8af0fc4691ca2f514José Fonseca         tmp0 = lp_build_cmp( &bld->base, PIPE_FUNC_EQUAL, src0, src1 );
1665faec23387e035bcdd413b7364933d36a8ec22dbaJosé Fonseca         dst0[chan_index] = lp_build_select( &bld->base, tmp0, bld->base.one, bld->base.zero );
16661aae039ee279f8ad300919d8af0fc4691ca2f514José Fonseca      }
166763b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      break;
166863b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
166963b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   case TGSI_OPCODE_SFL:
1670873773ee2b034e8df72ddfacc764915b8a76ebe2José Fonseca      FOR_EACH_DST0_ENABLED_CHANNEL( inst, chan_index ) {
1671faec23387e035bcdd413b7364933d36a8ec22dbaJosé Fonseca         dst0[chan_index] = bld->base.zero;
1672873773ee2b034e8df72ddfacc764915b8a76ebe2José Fonseca      }
167363b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      break;
167463b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
167563b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   case TGSI_OPCODE_SGT:
16762fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca      FOR_EACH_DST0_ENABLED_CHANNEL( inst, chan_index ) {
16772fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca         src0 = emit_fetch( bld, inst, 0, chan_index );
16782fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca         src1 = emit_fetch( bld, inst, 1, chan_index );
16791aae039ee279f8ad300919d8af0fc4691ca2f514José Fonseca         tmp0 = lp_build_cmp( &bld->base, PIPE_FUNC_GREATER, src0, src1 );
1680faec23387e035bcdd413b7364933d36a8ec22dbaJosé Fonseca         dst0[chan_index] = lp_build_select( &bld->base, tmp0, bld->base.one, bld->base.zero );
16811aae039ee279f8ad300919d8af0fc4691ca2f514José Fonseca      }
168263b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      break;
168363b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
168463b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   case TGSI_OPCODE_SIN:
16852fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca      tmp0 = emit_fetch( bld, inst, 0, CHAN_X );
168690e9a4d4f99e722d8f0f2050e134a3c69863541bJosé Fonseca      tmp0 = lp_build_sin( &bld->base, tmp0 );
16872fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca      FOR_EACH_DST0_ENABLED_CHANNEL( inst, chan_index ) {
1688faec23387e035bcdd413b7364933d36a8ec22dbaJosé Fonseca         dst0[chan_index] = tmp0;
168963b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      }
169063b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      break;
169163b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
169263b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   case TGSI_OPCODE_SLE:
16932fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca      FOR_EACH_DST0_ENABLED_CHANNEL( inst, chan_index ) {
16942fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca         src0 = emit_fetch( bld, inst, 0, chan_index );
16952fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca         src1 = emit_fetch( bld, inst, 1, chan_index );
16961aae039ee279f8ad300919d8af0fc4691ca2f514José Fonseca         tmp0 = lp_build_cmp( &bld->base, PIPE_FUNC_LEQUAL, src0, src1 );
1697faec23387e035bcdd413b7364933d36a8ec22dbaJosé Fonseca         dst0[chan_index] = lp_build_select( &bld->base, tmp0, bld->base.one, bld->base.zero );
16981aae039ee279f8ad300919d8af0fc4691ca2f514José Fonseca      }
169963b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      break;
170063b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
170163b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   case TGSI_OPCODE_SNE:
17022fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca      FOR_EACH_DST0_ENABLED_CHANNEL( inst, chan_index ) {
17032fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca         src0 = emit_fetch( bld, inst, 0, chan_index );
17042fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca         src1 = emit_fetch( bld, inst, 1, chan_index );
17051aae039ee279f8ad300919d8af0fc4691ca2f514José Fonseca         tmp0 = lp_build_cmp( &bld->base, PIPE_FUNC_NOTEQUAL, src0, src1 );
1706faec23387e035bcdd413b7364933d36a8ec22dbaJosé Fonseca         dst0[chan_index] = lp_build_select( &bld->base, tmp0, bld->base.one, bld->base.zero );
17071aae039ee279f8ad300919d8af0fc4691ca2f514José Fonseca      }
170863b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      break;
170963b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
171063b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   case TGSI_OPCODE_STR:
1711873773ee2b034e8df72ddfacc764915b8a76ebe2José Fonseca      FOR_EACH_DST0_ENABLED_CHANNEL( inst, chan_index ) {
1712faec23387e035bcdd413b7364933d36a8ec22dbaJosé Fonseca         dst0[chan_index] = bld->base.one;
1713873773ee2b034e8df72ddfacc764915b8a76ebe2José Fonseca      }
171463b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      break;
171563b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
171663b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   case TGSI_OPCODE_TEX:
171758daea741fa21fe3f89fd7bf106df1545c5b21afJosé Fonseca      emit_tex( bld, inst, LP_BLD_TEX_MODIFIER_NONE, dst0 );
171863b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      break;
171963b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
172063b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   case TGSI_OPCODE_TXD:
172158daea741fa21fe3f89fd7bf106df1545c5b21afJosé Fonseca      emit_tex( bld, inst, LP_BLD_TEX_MODIFIER_EXPLICIT_DERIV, dst0 );
172263b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      break;
172363b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
172463b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   case TGSI_OPCODE_UP2H:
1725873773ee2b034e8df72ddfacc764915b8a76ebe2José Fonseca      /* deprecated */
1726873773ee2b034e8df72ddfacc764915b8a76ebe2José Fonseca      assert (0);
1727fc9b8cd9dda946d8415732aeeed1eff5541cd1eeBrian Paul      return FALSE;
172863b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      break;
172963b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
173063b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   case TGSI_OPCODE_UP2US:
1731873773ee2b034e8df72ddfacc764915b8a76ebe2José Fonseca      /* deprecated */
1732873773ee2b034e8df72ddfacc764915b8a76ebe2José Fonseca      assert(0);
1733fc9b8cd9dda946d8415732aeeed1eff5541cd1eeBrian Paul      return FALSE;
173463b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      break;
173563b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
173663b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   case TGSI_OPCODE_UP4B:
1737873773ee2b034e8df72ddfacc764915b8a76ebe2José Fonseca      /* deprecated */
1738873773ee2b034e8df72ddfacc764915b8a76ebe2José Fonseca      assert(0);
1739fc9b8cd9dda946d8415732aeeed1eff5541cd1eeBrian Paul      return FALSE;
174063b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      break;
174163b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
174263b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   case TGSI_OPCODE_UP4UB:
1743873773ee2b034e8df72ddfacc764915b8a76ebe2José Fonseca      /* deprecated */
1744873773ee2b034e8df72ddfacc764915b8a76ebe2José Fonseca      assert(0);
1745fc9b8cd9dda946d8415732aeeed1eff5541cd1eeBrian Paul      return FALSE;
174663b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      break;
174763b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
174863b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   case TGSI_OPCODE_X2D:
1749873773ee2b034e8df72ddfacc764915b8a76ebe2José Fonseca      /* deprecated? */
1750873773ee2b034e8df72ddfacc764915b8a76ebe2José Fonseca      assert(0);
1751fc9b8cd9dda946d8415732aeeed1eff5541cd1eeBrian Paul      return FALSE;
175263b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      break;
175363b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
175463b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   case TGSI_OPCODE_ARA:
1755873773ee2b034e8df72ddfacc764915b8a76ebe2José Fonseca      /* deprecated */
1756873773ee2b034e8df72ddfacc764915b8a76ebe2José Fonseca      assert(0);
1757fc9b8cd9dda946d8415732aeeed1eff5541cd1eeBrian Paul      return FALSE;
175863b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      break;
175963b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
176063b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   case TGSI_OPCODE_ARR:
17612fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca      FOR_EACH_DST0_ENABLED_CHANNEL( inst, chan_index ) {
17622fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca         tmp0 = emit_fetch( bld, inst, 0, chan_index );
1763ded2374e67bdc2c24e868775d2ff77b39b339d56Zack Rusin         tmp0 = lp_build_round(&bld->base, tmp0);
1764faec23387e035bcdd413b7364933d36a8ec22dbaJosé Fonseca         dst0[chan_index] = tmp0;
176563b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      }
176663b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      break;
176763b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
176863b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   case TGSI_OPCODE_BRA:
1769873773ee2b034e8df72ddfacc764915b8a76ebe2José Fonseca      /* deprecated */
1770873773ee2b034e8df72ddfacc764915b8a76ebe2José Fonseca      assert(0);
1771fc9b8cd9dda946d8415732aeeed1eff5541cd1eeBrian Paul      return FALSE;
177263b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      break;
177363b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
1774263e038431f24f24aaec252e135ffc9f2f09640eJosé Fonseca   case TGSI_OPCODE_CAL:
17750b7ca2f8fcb187fb3aa37e0b6dc4b0a84101478fZack Rusin      lp_exec_mask_call(&bld->exec_mask,
17760b7ca2f8fcb187fb3aa37e0b6dc4b0a84101478fZack Rusin                        inst->Label.Label,
17770b7ca2f8fcb187fb3aa37e0b6dc4b0a84101478fZack Rusin                        pc);
17780b7ca2f8fcb187fb3aa37e0b6dc4b0a84101478fZack Rusin
177963b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      break;
178063b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
178163b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   case TGSI_OPCODE_RET:
17820b7ca2f8fcb187fb3aa37e0b6dc4b0a84101478fZack Rusin      lp_exec_mask_ret(&bld->exec_mask, pc);
178363b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      break;
178463b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
178563b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   case TGSI_OPCODE_END:
17860b7ca2f8fcb187fb3aa37e0b6dc4b0a84101478fZack Rusin      *pc = -1;
178763b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      break;
178863b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
178963b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   case TGSI_OPCODE_SSG:
179063b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   /* TGSI_OPCODE_SGN */
17912fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca      FOR_EACH_DST0_ENABLED_CHANNEL( inst, chan_index ) {
17922fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca         tmp0 = emit_fetch( bld, inst, 0, chan_index );
1793faec23387e035bcdd413b7364933d36a8ec22dbaJosé Fonseca         dst0[chan_index] = lp_build_sgn( &bld->base, tmp0 );
179463b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      }
179563b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      break;
179663b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
179763b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   case TGSI_OPCODE_CMP:
17982fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca      FOR_EACH_DST0_ENABLED_CHANNEL( inst, chan_index ) {
17992fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca         src0 = emit_fetch( bld, inst, 0, chan_index );
18002fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca         src1 = emit_fetch( bld, inst, 1, chan_index );
18012fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca         src2 = emit_fetch( bld, inst, 2, chan_index );
18021aae039ee279f8ad300919d8af0fc4691ca2f514José Fonseca         tmp0 = lp_build_cmp( &bld->base, PIPE_FUNC_LESS, src0, bld->base.zero );
1803faec23387e035bcdd413b7364933d36a8ec22dbaJosé Fonseca         dst0[chan_index] = lp_build_select( &bld->base, tmp0, src1, src2);
18041aae039ee279f8ad300919d8af0fc4691ca2f514José Fonseca      }
180563b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      break;
180663b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
180763b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   case TGSI_OPCODE_SCS:
18082fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca      IF_IS_DST0_CHANNEL_ENABLED( inst, CHAN_X ) {
18092fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca         tmp0 = emit_fetch( bld, inst, 0, CHAN_X );
1810faec23387e035bcdd413b7364933d36a8ec22dbaJosé Fonseca         dst0[CHAN_X] = lp_build_cos( &bld->base, tmp0 );
181163b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      }
18122fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca      IF_IS_DST0_CHANNEL_ENABLED( inst, CHAN_Y ) {
18132fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca         tmp0 = emit_fetch( bld, inst, 0, CHAN_X );
1814faec23387e035bcdd413b7364933d36a8ec22dbaJosé Fonseca         dst0[CHAN_Y] = lp_build_sin( &bld->base, tmp0 );
181563b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      }
18162fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca      IF_IS_DST0_CHANNEL_ENABLED( inst, CHAN_Z ) {
1817faec23387e035bcdd413b7364933d36a8ec22dbaJosé Fonseca         dst0[CHAN_Z] = bld->base.zero;
181863b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      }
18192fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca      IF_IS_DST0_CHANNEL_ENABLED( inst, CHAN_W ) {
1820faec23387e035bcdd413b7364933d36a8ec22dbaJosé Fonseca         dst0[CHAN_W] = bld->base.one;
182163b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      }
182263b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      break;
182363b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
182463b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   case TGSI_OPCODE_TXB:
182558daea741fa21fe3f89fd7bf106df1545c5b21afJosé Fonseca      emit_tex( bld, inst, LP_BLD_TEX_MODIFIER_LOD_BIAS, dst0 );
182663b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      break;
182763b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
182863b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   case TGSI_OPCODE_NRM:
182963b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      /* fall-through */
183063b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   case TGSI_OPCODE_NRM4:
183163b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      /* 3 or 4-component normalization */
183263b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      {
183363b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca         uint dims = (inst->Instruction.Opcode == TGSI_OPCODE_NRM) ? 3 : 4;
183463b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
18352fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca         if (IS_DST0_CHANNEL_ENABLED(inst, CHAN_X) ||
18362fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca             IS_DST0_CHANNEL_ENABLED(inst, CHAN_Y) ||
18372fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca             IS_DST0_CHANNEL_ENABLED(inst, CHAN_Z) ||
18382fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca             (IS_DST0_CHANNEL_ENABLED(inst, CHAN_W) && dims == 4)) {
183963b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
184063b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca            /* NOTE: Cannot use xmm regs 2/3 here (see emit_rsqrt() above). */
184163b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
184263b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca            /* xmm4 = src.x */
184363b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca            /* xmm0 = src.x * src.x */
18442fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca            tmp0 = emit_fetch(bld, inst, 0, CHAN_X);
18452fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca            if (IS_DST0_CHANNEL_ENABLED(inst, CHAN_X)) {
184690e9a4d4f99e722d8f0f2050e134a3c69863541bJosé Fonseca               tmp4 = tmp0;
184763b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca            }
184890e9a4d4f99e722d8f0f2050e134a3c69863541bJosé Fonseca            tmp0 = lp_build_mul( &bld->base, tmp0, tmp0);
184963b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
185063b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca            /* xmm5 = src.y */
185163b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca            /* xmm0 = xmm0 + src.y * src.y */
18522fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca            tmp1 = emit_fetch(bld, inst, 0, CHAN_Y);
18532fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca            if (IS_DST0_CHANNEL_ENABLED(inst, CHAN_Y)) {
185490e9a4d4f99e722d8f0f2050e134a3c69863541bJosé Fonseca               tmp5 = tmp1;
185563b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca            }
185690e9a4d4f99e722d8f0f2050e134a3c69863541bJosé Fonseca            tmp1 = lp_build_mul( &bld->base, tmp1, tmp1);
185790e9a4d4f99e722d8f0f2050e134a3c69863541bJosé Fonseca            tmp0 = lp_build_add( &bld->base, tmp0, tmp1);
185863b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
185963b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca            /* xmm6 = src.z */
186063b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca            /* xmm0 = xmm0 + src.z * src.z */
18612fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca            tmp1 = emit_fetch(bld, inst, 0, CHAN_Z);
18622fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca            if (IS_DST0_CHANNEL_ENABLED(inst, CHAN_Z)) {
186390e9a4d4f99e722d8f0f2050e134a3c69863541bJosé Fonseca               tmp6 = tmp1;
186463b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca            }
186590e9a4d4f99e722d8f0f2050e134a3c69863541bJosé Fonseca            tmp1 = lp_build_mul( &bld->base, tmp1, tmp1);
186690e9a4d4f99e722d8f0f2050e134a3c69863541bJosé Fonseca            tmp0 = lp_build_add( &bld->base, tmp0, tmp1);
186763b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
186863b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca            if (dims == 4) {
186963b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca               /* xmm7 = src.w */
187063b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca               /* xmm0 = xmm0 + src.w * src.w */
18712fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca               tmp1 = emit_fetch(bld, inst, 0, CHAN_W);
18722fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca               if (IS_DST0_CHANNEL_ENABLED(inst, CHAN_W)) {
187390e9a4d4f99e722d8f0f2050e134a3c69863541bJosé Fonseca                  tmp7 = tmp1;
187463b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca               }
187590e9a4d4f99e722d8f0f2050e134a3c69863541bJosé Fonseca               tmp1 = lp_build_mul( &bld->base, tmp1, tmp1);
187690e9a4d4f99e722d8f0f2050e134a3c69863541bJosé Fonseca               tmp0 = lp_build_add( &bld->base, tmp0, tmp1);
187763b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca            }
187863b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
187963b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca            /* xmm1 = 1 / sqrt(xmm0) */
188090e9a4d4f99e722d8f0f2050e134a3c69863541bJosé Fonseca            tmp1 = lp_build_rsqrt( &bld->base, tmp0);
188163b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
188263b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca            /* dst.x = xmm1 * src.x */
18832fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca            if (IS_DST0_CHANNEL_ENABLED(inst, CHAN_X)) {
1884faec23387e035bcdd413b7364933d36a8ec22dbaJosé Fonseca               dst0[CHAN_X] = lp_build_mul( &bld->base, tmp4, tmp1);
188563b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca            }
188663b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
188763b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca            /* dst.y = xmm1 * src.y */
18882fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca            if (IS_DST0_CHANNEL_ENABLED(inst, CHAN_Y)) {
1889faec23387e035bcdd413b7364933d36a8ec22dbaJosé Fonseca               dst0[CHAN_Y] = lp_build_mul( &bld->base, tmp5, tmp1);
189063b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca            }
189163b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
189263b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca            /* dst.z = xmm1 * src.z */
18932fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca            if (IS_DST0_CHANNEL_ENABLED(inst, CHAN_Z)) {
1894faec23387e035bcdd413b7364933d36a8ec22dbaJosé Fonseca               dst0[CHAN_Z] = lp_build_mul( &bld->base, tmp6, tmp1);
189563b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca            }
189663b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
189763b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca            /* dst.w = xmm1 * src.w */
18982fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca            if (IS_DST0_CHANNEL_ENABLED(inst, CHAN_X) && dims == 4) {
1899faec23387e035bcdd413b7364933d36a8ec22dbaJosé Fonseca               dst0[CHAN_W] = lp_build_mul( &bld->base, tmp7, tmp1);
190063b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca            }
190163b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca         }
190263b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
1903faec23387e035bcdd413b7364933d36a8ec22dbaJosé Fonseca         /* dst.w = 1.0 */
19042fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca         if (IS_DST0_CHANNEL_ENABLED(inst, CHAN_W) && dims == 3) {
1905faec23387e035bcdd413b7364933d36a8ec22dbaJosé Fonseca            dst0[CHAN_W] = bld->base.one;
190663b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca         }
190763b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      }
190863b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      break;
190963b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
191063b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   case TGSI_OPCODE_DIV:
1911873773ee2b034e8df72ddfacc764915b8a76ebe2José Fonseca      /* deprecated */
1912873773ee2b034e8df72ddfacc764915b8a76ebe2José Fonseca      assert( 0 );
1913fc9b8cd9dda946d8415732aeeed1eff5541cd1eeBrian Paul      return FALSE;
191463b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      break;
191563b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
191663b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   case TGSI_OPCODE_DP2:
19172fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca      tmp0 = emit_fetch( bld, inst, 0, CHAN_X );  /* xmm0 = src[0].x */
19182fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca      tmp1 = emit_fetch( bld, inst, 1, CHAN_X );  /* xmm1 = src[1].x */
191990e9a4d4f99e722d8f0f2050e134a3c69863541bJosé Fonseca      tmp0 = lp_build_mul( &bld->base, tmp0, tmp1);              /* xmm0 = xmm0 * xmm1 */
19202fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca      tmp1 = emit_fetch( bld, inst, 0, CHAN_Y );  /* xmm1 = src[0].y */
19212fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca      tmp2 = emit_fetch( bld, inst, 1, CHAN_Y );  /* xmm2 = src[1].y */
192290e9a4d4f99e722d8f0f2050e134a3c69863541bJosé Fonseca      tmp1 = lp_build_mul( &bld->base, tmp1, tmp2);              /* xmm1 = xmm1 * xmm2 */
192390e9a4d4f99e722d8f0f2050e134a3c69863541bJosé Fonseca      tmp0 = lp_build_add( &bld->base, tmp0, tmp1);              /* xmm0 = xmm0 + xmm1 */
19242fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca      FOR_EACH_DST0_ENABLED_CHANNEL( inst, chan_index ) {
1925faec23387e035bcdd413b7364933d36a8ec22dbaJosé Fonseca         dst0[chan_index] = tmp0;  /* dest[ch] = xmm0 */
192663b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      }
192763b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      break;
192863b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
192963b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   case TGSI_OPCODE_TXL:
193058daea741fa21fe3f89fd7bf106df1545c5b21afJosé Fonseca      emit_tex( bld, inst, LP_BLD_TEX_MODIFIER_EXPLICIT_LOD, dst0 );
193163b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      break;
193263b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
193363b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   case TGSI_OPCODE_TXP:
193458daea741fa21fe3f89fd7bf106df1545c5b21afJosé Fonseca      emit_tex( bld, inst, LP_BLD_TEX_MODIFIER_PROJECTED, dst0 );
193563b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      break;
193618d406e8a8a838c82ee4ec5dbf244ab8bba0855eZack Rusin
193763b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   case TGSI_OPCODE_BRK:
193818d406e8a8a838c82ee4ec5dbf244ab8bba0855eZack Rusin      lp_exec_break(&bld->exec_mask);
193963b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      break;
194063b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
194163b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   case TGSI_OPCODE_IF:
194280f3cc36c511f62666162bca1d88c7746b98a27dZack Rusin      tmp0 = emit_fetch(bld, inst, 0, CHAN_X);
1943ac33e7752d22f03db84e6a4c822b3a3f41d05f77Zack Rusin      tmp0 = lp_build_cmp(&bld->base, PIPE_FUNC_NOTEQUAL,
1944ac33e7752d22f03db84e6a4c822b3a3f41d05f77Zack Rusin                          tmp0, bld->base.zero);
194580f3cc36c511f62666162bca1d88c7746b98a27dZack Rusin      lp_exec_mask_cond_push(&bld->exec_mask, tmp0);
194663b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      break;
194763b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
194818d406e8a8a838c82ee4ec5dbf244ab8bba0855eZack Rusin   case TGSI_OPCODE_BGNLOOP:
194918d406e8a8a838c82ee4ec5dbf244ab8bba0855eZack Rusin      lp_exec_bgnloop(&bld->exec_mask);
195018d406e8a8a838c82ee4ec5dbf244ab8bba0855eZack Rusin      break;
195118d406e8a8a838c82ee4ec5dbf244ab8bba0855eZack Rusin
19520b7ca2f8fcb187fb3aa37e0b6dc4b0a84101478fZack Rusin   case TGSI_OPCODE_BGNSUB:
19530b7ca2f8fcb187fb3aa37e0b6dc4b0a84101478fZack Rusin      lp_exec_mask_bgnsub(&bld->exec_mask);
19540b7ca2f8fcb187fb3aa37e0b6dc4b0a84101478fZack Rusin      break;
19550b7ca2f8fcb187fb3aa37e0b6dc4b0a84101478fZack Rusin
195663b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   case TGSI_OPCODE_ELSE:
195780f3cc36c511f62666162bca1d88c7746b98a27dZack Rusin      lp_exec_mask_cond_invert(&bld->exec_mask);
195863b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      break;
195963b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
196063b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   case TGSI_OPCODE_ENDIF:
196180f3cc36c511f62666162bca1d88c7746b98a27dZack Rusin      lp_exec_mask_cond_pop(&bld->exec_mask);
196263b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      break;
196363b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
196418d406e8a8a838c82ee4ec5dbf244ab8bba0855eZack Rusin   case TGSI_OPCODE_ENDLOOP:
196518d406e8a8a838c82ee4ec5dbf244ab8bba0855eZack Rusin      lp_exec_endloop(&bld->exec_mask);
196618d406e8a8a838c82ee4ec5dbf244ab8bba0855eZack Rusin      break;
196718d406e8a8a838c82ee4ec5dbf244ab8bba0855eZack Rusin
19680b7ca2f8fcb187fb3aa37e0b6dc4b0a84101478fZack Rusin   case TGSI_OPCODE_ENDSUB:
19690b7ca2f8fcb187fb3aa37e0b6dc4b0a84101478fZack Rusin      lp_exec_mask_endsub(&bld->exec_mask, pc);
19700b7ca2f8fcb187fb3aa37e0b6dc4b0a84101478fZack Rusin      break;
19710b7ca2f8fcb187fb3aa37e0b6dc4b0a84101478fZack Rusin
197263b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   case TGSI_OPCODE_PUSHA:
1973873773ee2b034e8df72ddfacc764915b8a76ebe2José Fonseca      /* deprecated? */
1974873773ee2b034e8df72ddfacc764915b8a76ebe2José Fonseca      assert(0);
1975fc9b8cd9dda946d8415732aeeed1eff5541cd1eeBrian Paul      return FALSE;
197663b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      break;
197763b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
197863b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   case TGSI_OPCODE_POPA:
1979873773ee2b034e8df72ddfacc764915b8a76ebe2José Fonseca      /* deprecated? */
1980873773ee2b034e8df72ddfacc764915b8a76ebe2José Fonseca      assert(0);
1981fc9b8cd9dda946d8415732aeeed1eff5541cd1eeBrian Paul      return FALSE;
198263b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      break;
198363b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
198463b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   case TGSI_OPCODE_CEIL:
1985873773ee2b034e8df72ddfacc764915b8a76ebe2José Fonseca      FOR_EACH_DST0_ENABLED_CHANNEL( inst, chan_index ) {
1986873773ee2b034e8df72ddfacc764915b8a76ebe2José Fonseca         tmp0 = emit_fetch( bld, inst, 0, chan_index );
1987faec23387e035bcdd413b7364933d36a8ec22dbaJosé Fonseca         dst0[chan_index] = lp_build_ceil(&bld->base, tmp0);
1988873773ee2b034e8df72ddfacc764915b8a76ebe2José Fonseca      }
198963b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      break;
199063b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
199163b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   case TGSI_OPCODE_I2F:
1992873773ee2b034e8df72ddfacc764915b8a76ebe2José Fonseca      /* deprecated? */
1993873773ee2b034e8df72ddfacc764915b8a76ebe2José Fonseca      assert(0);
1994fc9b8cd9dda946d8415732aeeed1eff5541cd1eeBrian Paul      return FALSE;
199563b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      break;
199663b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
199763b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   case TGSI_OPCODE_NOT:
1998873773ee2b034e8df72ddfacc764915b8a76ebe2José Fonseca      /* deprecated? */
1999873773ee2b034e8df72ddfacc764915b8a76ebe2José Fonseca      assert(0);
2000fc9b8cd9dda946d8415732aeeed1eff5541cd1eeBrian Paul      return FALSE;
200163b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      break;
200263b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
200363b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   case TGSI_OPCODE_TRUNC:
20042fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca      FOR_EACH_DST0_ENABLED_CHANNEL( inst, chan_index ) {
20052fef9b3369d1b017a5360d53a75286234ace2c9dJosé Fonseca         tmp0 = emit_fetch( bld, inst, 0, chan_index );
2006faec23387e035bcdd413b7364933d36a8ec22dbaJosé Fonseca         dst0[chan_index] = lp_build_trunc(&bld->base, tmp0);
200763b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      }
200863b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      break;
200963b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
201063b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   case TGSI_OPCODE_SHL:
2011873773ee2b034e8df72ddfacc764915b8a76ebe2José Fonseca      /* deprecated? */
2012873773ee2b034e8df72ddfacc764915b8a76ebe2José Fonseca      assert(0);
2013fc9b8cd9dda946d8415732aeeed1eff5541cd1eeBrian Paul      return FALSE;
201463b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      break;
201563b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
20162c046034dc5c95dd2fe84d0b4fd44f25235480b9Michal Krol   case TGSI_OPCODE_ISHR:
2017873773ee2b034e8df72ddfacc764915b8a76ebe2José Fonseca      /* deprecated? */
2018873773ee2b034e8df72ddfacc764915b8a76ebe2José Fonseca      assert(0);
2019fc9b8cd9dda946d8415732aeeed1eff5541cd1eeBrian Paul      return FALSE;
202063b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      break;
202163b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
202263b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   case TGSI_OPCODE_AND:
2023873773ee2b034e8df72ddfacc764915b8a76ebe2José Fonseca      /* deprecated? */
2024873773ee2b034e8df72ddfacc764915b8a76ebe2José Fonseca      assert(0);
2025fc9b8cd9dda946d8415732aeeed1eff5541cd1eeBrian Paul      return FALSE;
202663b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      break;
202763b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
202863b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   case TGSI_OPCODE_OR:
2029873773ee2b034e8df72ddfacc764915b8a76ebe2José Fonseca      /* deprecated? */
2030873773ee2b034e8df72ddfacc764915b8a76ebe2José Fonseca      assert(0);
2031fc9b8cd9dda946d8415732aeeed1eff5541cd1eeBrian Paul      return FALSE;
203263b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      break;
203363b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
203463b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   case TGSI_OPCODE_MOD:
2035873773ee2b034e8df72ddfacc764915b8a76ebe2José Fonseca      /* deprecated? */
2036873773ee2b034e8df72ddfacc764915b8a76ebe2José Fonseca      assert(0);
2037fc9b8cd9dda946d8415732aeeed1eff5541cd1eeBrian Paul      return FALSE;
203863b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      break;
203963b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
204063b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   case TGSI_OPCODE_XOR:
2041873773ee2b034e8df72ddfacc764915b8a76ebe2José Fonseca      /* deprecated? */
2042873773ee2b034e8df72ddfacc764915b8a76ebe2José Fonseca      assert(0);
2043fc9b8cd9dda946d8415732aeeed1eff5541cd1eeBrian Paul      return FALSE;
204463b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      break;
204563b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
204663b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   case TGSI_OPCODE_SAD:
2047873773ee2b034e8df72ddfacc764915b8a76ebe2José Fonseca      /* deprecated? */
2048873773ee2b034e8df72ddfacc764915b8a76ebe2José Fonseca      assert(0);
2049fc9b8cd9dda946d8415732aeeed1eff5541cd1eeBrian Paul      return FALSE;
205063b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      break;
205163b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
205263b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   case TGSI_OPCODE_TXF:
2053873773ee2b034e8df72ddfacc764915b8a76ebe2José Fonseca      /* deprecated? */
2054873773ee2b034e8df72ddfacc764915b8a76ebe2José Fonseca      assert(0);
2055fc9b8cd9dda946d8415732aeeed1eff5541cd1eeBrian Paul      return FALSE;
205663b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      break;
205763b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
205863b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   case TGSI_OPCODE_TXQ:
2059873773ee2b034e8df72ddfacc764915b8a76ebe2José Fonseca      /* deprecated? */
2060873773ee2b034e8df72ddfacc764915b8a76ebe2José Fonseca      assert(0);
2061fc9b8cd9dda946d8415732aeeed1eff5541cd1eeBrian Paul      return FALSE;
206263b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      break;
206363b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
206463b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   case TGSI_OPCODE_CONT:
206518d406e8a8a838c82ee4ec5dbf244ab8bba0855eZack Rusin      lp_exec_continue(&bld->exec_mask);
206663b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      break;
206763b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
206863b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   case TGSI_OPCODE_EMIT:
2069fc9b8cd9dda946d8415732aeeed1eff5541cd1eeBrian Paul      return FALSE;
207063b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      break;
207163b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
207263b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   case TGSI_OPCODE_ENDPRIM:
2073fc9b8cd9dda946d8415732aeeed1eff5541cd1eeBrian Paul      return FALSE;
207463b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      break;
207563b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
2076873773ee2b034e8df72ddfacc764915b8a76ebe2José Fonseca   case TGSI_OPCODE_NOP:
2077873773ee2b034e8df72ddfacc764915b8a76ebe2José Fonseca      break;
2078873773ee2b034e8df72ddfacc764915b8a76ebe2José Fonseca
207963b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   default:
2080fc9b8cd9dda946d8415732aeeed1eff5541cd1eeBrian Paul      return FALSE;
208163b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   }
208263b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
2083faec23387e035bcdd413b7364933d36a8ec22dbaJosé Fonseca   if(info->num_dst) {
2084ff6c78f44f2f741f4825b07dbc15b3a951fe9b2cJosé Fonseca      LLVMValueRef pred[NUM_CHANNELS];
2085ff6c78f44f2f741f4825b07dbc15b3a951fe9b2cJosé Fonseca
2086ff6c78f44f2f741f4825b07dbc15b3a951fe9b2cJosé Fonseca      emit_fetch_predicate( bld, inst, pred );
2087ff6c78f44f2f741f4825b07dbc15b3a951fe9b2cJosé Fonseca
2088faec23387e035bcdd413b7364933d36a8ec22dbaJosé Fonseca      FOR_EACH_DST0_ENABLED_CHANNEL( inst, chan_index ) {
2089ff6c78f44f2f741f4825b07dbc15b3a951fe9b2cJosé Fonseca         emit_store( bld, inst, 0, chan_index, pred[chan_index], dst0[chan_index]);
2090faec23387e035bcdd413b7364933d36a8ec22dbaJosé Fonseca      }
2091faec23387e035bcdd413b7364933d36a8ec22dbaJosé Fonseca   }
2092faec23387e035bcdd413b7364933d36a8ec22dbaJosé Fonseca
2093fc9b8cd9dda946d8415732aeeed1eff5541cd1eeBrian Paul   return TRUE;
209463b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca}
209563b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
2096c0472f9c34da78bccecb2c790b54b9dd9712a0b9José Fonseca
2097c0472f9c34da78bccecb2c790b54b9dd9712a0b9José Fonsecavoid
209863b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonsecalp_build_tgsi_soa(LLVMBuilderRef builder,
209963b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca                  const struct tgsi_token *tokens,
2100b4835ea03d64261da5a892f9590c9977b06920e8José Fonseca                  struct lp_type type,
21013d7a88674f9eb3320eeff511968f041426e25023José Fonseca                  struct lp_build_mask_context *mask,
210263b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca                  LLVMValueRef consts_ptr,
2103f85c5f8621382ba1c8baa1582d87b46b388258d2José Fonseca                  const LLVMValueRef *pos,
2104f85c5f8621382ba1c8baa1582d87b46b388258d2José Fonseca                  const LLVMValueRef (*inputs)[NUM_CHANNELS],
2105f85c5f8621382ba1c8baa1582d87b46b388258d2José Fonseca                  LLVMValueRef (*outputs)[NUM_CHANNELS],
2106021e0dc78b15fab29e761012860276c2597c8d8fZack Rusin                  struct lp_build_sampler_soa *sampler,
21073f6dc8e79d918283a6dfcf9c8937a6d52f3bb4f5Brian Paul                  const struct tgsi_shader_info *info)
210863b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca{
210963b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   struct lp_build_tgsi_soa_context bld;
211063b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   struct tgsi_parse_context parse;
211163b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   uint num_immediates = 0;
21120b7ca2f8fcb187fb3aa37e0b6dc4b0a84101478fZack Rusin   uint num_instructions = 0;
211363b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   unsigned i;
21140b7ca2f8fcb187fb3aa37e0b6dc4b0a84101478fZack Rusin   int pc = 0;
211563b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
21166d173da5c84142ee64f56f4c2e9e495dc1435e91José Fonseca   struct lp_type res_type;
21176d173da5c84142ee64f56f4c2e9e495dc1435e91José Fonseca
21186d173da5c84142ee64f56f4c2e9e495dc1435e91José Fonseca   assert(type.length <= LP_MAX_VECTOR_LENGTH);
21196d173da5c84142ee64f56f4c2e9e495dc1435e91José Fonseca   memset(&res_type, 0, sizeof res_type);
21206d173da5c84142ee64f56f4c2e9e495dc1435e91José Fonseca   res_type.width = type.width;
21216d173da5c84142ee64f56f4c2e9e495dc1435e91José Fonseca   res_type.length = type.length;
21226d173da5c84142ee64f56f4c2e9e495dc1435e91José Fonseca   res_type.sign = 1;
21236d173da5c84142ee64f56f4c2e9e495dc1435e91José Fonseca
212463b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   /* Setup build context */
212563b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   memset(&bld, 0, sizeof bld);
212663b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   lp_build_context_init(&bld.base, builder, type);
21276d173da5c84142ee64f56f4c2e9e495dc1435e91José Fonseca   lp_build_context_init(&bld.uint_bld, builder, lp_uint_type(type));
2128c0472f9c34da78bccecb2c790b54b9dd9712a0b9José Fonseca   bld.mask = mask;
2129f85c5f8621382ba1c8baa1582d87b46b388258d2José Fonseca   bld.pos = pos;
2130f85c5f8621382ba1c8baa1582d87b46b388258d2José Fonseca   bld.inputs = inputs;
213163b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   bld.outputs = outputs;
213263b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   bld.consts_ptr = consts_ptr;
21338be72bb7646d430e66cb36e09c13c13bee030d53José Fonseca   bld.sampler = sampler;
21346d173da5c84142ee64f56f4c2e9e495dc1435e91José Fonseca   bld.info = info;
21353662afd87d61e3f65843b210a7e8c9c8a6cb27f0Brian Paul   bld.indirect_files = info->indirect_files;
21360b7ca2f8fcb187fb3aa37e0b6dc4b0a84101478fZack Rusin   bld.instructions = (struct tgsi_full_instruction *)
21370b7ca2f8fcb187fb3aa37e0b6dc4b0a84101478fZack Rusin                      MALLOC( LP_MAX_INSTRUCTIONS * sizeof(struct tgsi_full_instruction) );
21380b7ca2f8fcb187fb3aa37e0b6dc4b0a84101478fZack Rusin   bld.max_instructions = LP_MAX_INSTRUCTIONS;
21390b7ca2f8fcb187fb3aa37e0b6dc4b0a84101478fZack Rusin
21400b7ca2f8fcb187fb3aa37e0b6dc4b0a84101478fZack Rusin   if (!bld.instructions) {
21410b7ca2f8fcb187fb3aa37e0b6dc4b0a84101478fZack Rusin      return;
21420b7ca2f8fcb187fb3aa37e0b6dc4b0a84101478fZack Rusin   }
214363b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
214480f3cc36c511f62666162bca1d88c7746b98a27dZack Rusin   lp_exec_mask_init(&bld.exec_mask, &bld.base);
214580f3cc36c511f62666162bca1d88c7746b98a27dZack Rusin
214663b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   tgsi_parse_init( &parse, tokens );
214763b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
214863b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   while( !tgsi_parse_end_of_tokens( &parse ) ) {
214963b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      tgsi_parse_token( &parse );
215063b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
215163b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      switch( parse.FullToken.Token.Type ) {
215263b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      case TGSI_TOKEN_TYPE_DECLARATION:
21531fc41002252419f4688c24ea8c3814553b3d76adJosé Fonseca         /* Inputs already interpolated */
2154e27983bc08d4eff5effbbcffbf5c9f5862fca2cfJosé Fonseca         emit_declaration( &bld, &parse.FullToken.FullDeclaration );
215563b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca         break;
215663b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
215763b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      case TGSI_TOKEN_TYPE_INSTRUCTION:
2158faec23387e035bcdd413b7364933d36a8ec22dbaJosé Fonseca         {
21590b7ca2f8fcb187fb3aa37e0b6dc4b0a84101478fZack Rusin            /* save expanded instruction */
21600b7ca2f8fcb187fb3aa37e0b6dc4b0a84101478fZack Rusin            if (num_instructions == bld.max_instructions) {
2161079763f74648fef051ee5b8f7d730f7fc1ba27d5José Fonseca               struct tgsi_full_instruction *instructions;
2162079763f74648fef051ee5b8f7d730f7fc1ba27d5José Fonseca               instructions = REALLOC(bld.instructions,
2163079763f74648fef051ee5b8f7d730f7fc1ba27d5José Fonseca                                      bld.max_instructions
2164079763f74648fef051ee5b8f7d730f7fc1ba27d5José Fonseca                                      * sizeof(struct tgsi_full_instruction),
2165079763f74648fef051ee5b8f7d730f7fc1ba27d5José Fonseca                                      (bld.max_instructions + LP_MAX_INSTRUCTIONS)
2166079763f74648fef051ee5b8f7d730f7fc1ba27d5José Fonseca                                      * sizeof(struct tgsi_full_instruction));
2167079763f74648fef051ee5b8f7d730f7fc1ba27d5José Fonseca               if (!instructions) {
2168079763f74648fef051ee5b8f7d730f7fc1ba27d5José Fonseca                  break;
2169079763f74648fef051ee5b8f7d730f7fc1ba27d5José Fonseca               }
2170079763f74648fef051ee5b8f7d730f7fc1ba27d5José Fonseca               bld.instructions = instructions;
21710b7ca2f8fcb187fb3aa37e0b6dc4b0a84101478fZack Rusin               bld.max_instructions += LP_MAX_INSTRUCTIONS;
21720b7ca2f8fcb187fb3aa37e0b6dc4b0a84101478fZack Rusin            }
21730b7ca2f8fcb187fb3aa37e0b6dc4b0a84101478fZack Rusin
21740b7ca2f8fcb187fb3aa37e0b6dc4b0a84101478fZack Rusin            memcpy(bld.instructions + num_instructions,
21750b7ca2f8fcb187fb3aa37e0b6dc4b0a84101478fZack Rusin                   &parse.FullToken.FullInstruction,
21760b7ca2f8fcb187fb3aa37e0b6dc4b0a84101478fZack Rusin                   sizeof(bld.instructions[0]));
21770b7ca2f8fcb187fb3aa37e0b6dc4b0a84101478fZack Rusin
21780b7ca2f8fcb187fb3aa37e0b6dc4b0a84101478fZack Rusin            num_instructions++;
2179faec23387e035bcdd413b7364933d36a8ec22dbaJosé Fonseca         }
2180faec23387e035bcdd413b7364933d36a8ec22dbaJosé Fonseca
218163b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca         break;
218263b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
218363b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      case TGSI_TOKEN_TYPE_IMMEDIATE:
218463b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca         /* simply copy the immediate values into the next immediates[] slot */
218563b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca         {
218663b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca            const uint size = parse.FullToken.FullImmediate.Immediate.NrTokens - 1;
218763b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca            assert(size <= 4);
21886c8c88f02f0dc9cf39ce51d068525a94fccd5dc7José Fonseca            assert(num_immediates < LP_MAX_TGSI_IMMEDIATES);
218963b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca            for( i = 0; i < size; ++i )
219063b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca               bld.immediates[num_immediates][i] =
2191185be3a87a5b38e8821a560c073975c11dcbd3e9Brian Paul                  lp_build_const_vec(type, parse.FullToken.FullImmediate.u[i].Float);
219263b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca            for( i = size; i < 4; ++i )
219363b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca               bld.immediates[num_immediates][i] = bld.base.undef;
219463b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca            num_immediates++;
219563b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca         }
219663b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca         break;
219763b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
21989381dd590f2e45acb8fbb0aa5503c917b832204dJosé Fonseca      case TGSI_TOKEN_TYPE_PROPERTY:
21999381dd590f2e45acb8fbb0aa5503c917b832204dJosé Fonseca         break;
22009381dd590f2e45acb8fbb0aa5503c917b832204dJosé Fonseca
220163b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      default:
220263b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca         assert( 0 );
220363b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca      }
220463b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   }
22050b7ca2f8fcb187fb3aa37e0b6dc4b0a84101478fZack Rusin
22060b7ca2f8fcb187fb3aa37e0b6dc4b0a84101478fZack Rusin   while (pc != -1) {
22070b7ca2f8fcb187fb3aa37e0b6dc4b0a84101478fZack Rusin      struct tgsi_full_instruction *instr = bld.instructions + pc;
22080b7ca2f8fcb187fb3aa37e0b6dc4b0a84101478fZack Rusin      const struct tgsi_opcode_info *opcode_info =
22090b7ca2f8fcb187fb3aa37e0b6dc4b0a84101478fZack Rusin         tgsi_get_opcode_info(instr->Instruction.Opcode);
22100b7ca2f8fcb187fb3aa37e0b6dc4b0a84101478fZack Rusin      if (!emit_instruction( &bld, instr, opcode_info, &pc ))
22110b7ca2f8fcb187fb3aa37e0b6dc4b0a84101478fZack Rusin         _debug_printf("warning: failed to translate tgsi opcode %s to LLVM\n",
22120b7ca2f8fcb187fb3aa37e0b6dc4b0a84101478fZack Rusin                       opcode_info->mnemonic);
22130b7ca2f8fcb187fb3aa37e0b6dc4b0a84101478fZack Rusin   }
22140b7ca2f8fcb187fb3aa37e0b6dc4b0a84101478fZack Rusin
221518d406e8a8a838c82ee4ec5dbf244ab8bba0855eZack Rusin   if (0) {
221618d406e8a8a838c82ee4ec5dbf244ab8bba0855eZack Rusin      LLVMBasicBlockRef block = LLVMGetInsertBlock(builder);
221718d406e8a8a838c82ee4ec5dbf244ab8bba0855eZack Rusin      LLVMValueRef function = LLVMGetBasicBlockParent(block);
2218263e038431f24f24aaec252e135ffc9f2f09640eJosé Fonseca      debug_printf("11111111111111111111111111111 \n");
221918d406e8a8a838c82ee4ec5dbf244ab8bba0855eZack Rusin      tgsi_dump(tokens, 0);
22208ad3e0b55df50beac8ba3c5cafa0be79641a4977José Fonseca      lp_debug_dump_value(function);
2221263e038431f24f24aaec252e135ffc9f2f09640eJosé Fonseca      debug_printf("2222222222222222222222222222 \n");
222218d406e8a8a838c82ee4ec5dbf244ab8bba0855eZack Rusin   }
222363b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca   tgsi_parse_free( &parse );
22240b7ca2f8fcb187fb3aa37e0b6dc4b0a84101478fZack Rusin
22250b7ca2f8fcb187fb3aa37e0b6dc4b0a84101478fZack Rusin   if (0) {
22260b7ca2f8fcb187fb3aa37e0b6dc4b0a84101478fZack Rusin      LLVMModuleRef module = LLVMGetGlobalParent(
22270b7ca2f8fcb187fb3aa37e0b6dc4b0a84101478fZack Rusin         LLVMGetBasicBlockParent(LLVMGetInsertBlock(bld.base.builder)));
22280b7ca2f8fcb187fb3aa37e0b6dc4b0a84101478fZack Rusin      LLVMDumpModule(module);
22290b7ca2f8fcb187fb3aa37e0b6dc4b0a84101478fZack Rusin
22300b7ca2f8fcb187fb3aa37e0b6dc4b0a84101478fZack Rusin   }
22310b7ca2f8fcb187fb3aa37e0b6dc4b0a84101478fZack Rusin
22320b7ca2f8fcb187fb3aa37e0b6dc4b0a84101478fZack Rusin   FREE( bld.instructions );
223363b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca}
223463b07618b3e4034e11968f1c5323445dc4a0377fJosé Fonseca
2235