nv50_ir.h revision 9d60793a03e40e1d139b78fce0144cad57438741
/*
 * Copyright 2011 Christoph Bumiller
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the "Software"),
 * to deal in the Software without restriction, including without limitation
 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
 * and/or sell copies of the Software, and to permit persons to whom the
 * Software is furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in
 * all copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.
IN NO EVENT SHALL 173d8d5b298a268b119d840bc9bae0ee9e0c9244a9Kenneth Graunke * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR 183d8d5b298a268b119d840bc9bae0ee9e0c9244a9Kenneth Graunke * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, 193d8d5b298a268b119d840bc9bae0ee9e0c9244a9Kenneth Graunke * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR 203d8d5b298a268b119d840bc9bae0ee9e0c9244a9Kenneth Graunke * OTHER DEALINGS IN THE SOFTWARE. 21d2d19ea51fa3575a8d014a69a9b835c335728817Christoph Bumiller */ 2257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 2357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller#ifndef __NV50_IR_H__ 2457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller#define __NV50_IR_H__ 2557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 2657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller#include <stdio.h> 2757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller#include <stdlib.h> 2857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller#include <stdint.h> 298cc2eca5df0116aa7fb8233a9ab6ad1c9e4203cdFrancisco Jerez#include <deque> 308cc2eca5df0116aa7fb8233a9ab6ad1c9e4203cdFrancisco Jerez#include <list> 318cc2eca5df0116aa7fb8233a9ab6ad1c9e4203cdFrancisco Jerez#include <vector> 32a9b21015f5e3a6a37e53a8b3c755519f7b70479eTobias Klausmann#include <tr1/unordered_set> 3357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 345eb7ff1175a644ffe3b0f1a75cb235400355f9fbJohannes Obermayr#include "codegen/nv50_ir_util.h" 355eb7ff1175a644ffe3b0f1a75cb235400355f9fbJohannes Obermayr#include "codegen/nv50_ir_graph.h" 3657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 375eb7ff1175a644ffe3b0f1a75cb235400355f9fbJohannes Obermayr#include "codegen/nv50_ir_driver.h" 3857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 3957594065c30feec9376be9b2132659f7d87362eeChristoph Bumillernamespace nv50_ir { 4057594065c30feec9376be9b2132659f7d87362eeChristoph 
// Opcodes of the IR. Enumerators are numbered consecutively starting at
// OP_NOP = 0, so OP_LAST (the final enumerator) equals the number of opcodes.
enum operation
{
   OP_NOP = 0,
   OP_PHI,
   OP_UNION, // unify a new definition and several source values
   OP_SPLIT, // $r0d -> { $r0, $r1 } ($r0d and $r0/$r1 will be coalesced)
   OP_MERGE, // opposite of split, e.g. combine 2 32 bit into a 64 bit value
   OP_CONSTRAINT, // copy values into consecutive registers
   OP_MOV, // simple copy, no modifiers allowed
   OP_LOAD,
   OP_STORE,
   OP_ADD, // NOTE: add u64 + u32 is legal for targets w/o 64-bit integer adds
   OP_SUB,
   OP_MUL,
   OP_DIV,
   OP_MOD,
   OP_MAD,
   OP_FMA,
   OP_SAD, // abs(src0 - src1) + src2
   OP_ABS,
   OP_NEG,
   OP_NOT,
   OP_AND,
   OP_OR,
   OP_XOR,
   OP_SHL,
   OP_SHR,
   OP_MAX,
   OP_MIN,
   OP_SAT, // CLAMP(f32, 0.0, 1.0)
   OP_CEIL,
   OP_FLOOR,
   OP_TRUNC,
   OP_CVT,
   OP_SET_AND, // dst = (src0 CMP src1) & src2
   OP_SET_OR,
   OP_SET_XOR,
   OP_SET,
   OP_SELP, // dst = src2 ? src0 : src1
   OP_SLCT, // dst = (src2 CMP 0) ? src0 : src1
   OP_RCP,
   OP_RSQ,
   OP_LG2,
   OP_SIN,
   OP_COS,
   OP_EX2,
   OP_EXP, // exponential (base M_E)
   OP_LOG, // natural logarithm
   OP_PRESIN,
   OP_PREEX2,
   OP_SQRT,
   OP_POW,
   OP_BRA,
   OP_CALL,
   OP_RET,
   OP_CONT,
   OP_BREAK,
   OP_PRERET,
   OP_PRECONT,
   OP_PREBREAK,
   OP_BRKPT, // breakpoint (not related to loops)
   OP_JOINAT, // push control flow convergence point
   OP_JOIN, // converge
   OP_DISCARD,
   OP_EXIT,
   OP_MEMBAR, // memory barrier (mfence, lfence, sfence)
   OP_VFETCH, // indirection 0 in attribute space, indirection 1 is vertex base
   OP_PFETCH, // fetch base address of vertex src0 (immediate) [+ src1]
   OP_AFETCH, // fetch base address of shader input (a[%r1+0x10])
   OP_EXPORT,
   OP_LINTERP,
   OP_PINTERP,
   OP_EMIT, // emit vertex
   OP_RESTART, // restart primitive
   OP_TEX,
   OP_TXB, // texture bias
   OP_TXL, // texture lod
   OP_TXF, // texel fetch
   OP_TXQ, // texture size query
   OP_TXD, // texture derivatives
   OP_TXG, // texture gather
   OP_TXLQ, // texture query lod
   OP_TEXCSAA, // texture op for coverage sampling
   OP_TEXPREP, // turn cube map array into 2d array coordinates
   OP_SULDB, // surface load (raw)
   OP_SULDP, // surface load (formatted)
   OP_SUSTB, // surface store (raw)
   OP_SUSTP, // surface store (formatted)
   OP_SUREDB,
   OP_SUREDP, // surface reduction (atomic op)
   OP_SULEA, // surface load effective address
   OP_SUBFM, // surface bitfield manipulation
   OP_SUCLAMP, // clamp surface coordinates
   OP_SUEAU, // surface effective address
   OP_MADSP, // special integer multiply-add
   OP_TEXBAR, // texture dependency barrier
   OP_DFDX,
   OP_DFDY,
   OP_RDSV, // read system value
   OP_WRSV, // write system value
   OP_PIXLD, // get info about raster object or surfaces
   OP_QUADOP,
   OP_QUADON,
   OP_QUADPOP,
   OP_POPCNT, // bitcount(src0 & src1)
   OP_INSBF, // insert first src1[8:15] bits of src0 into src2 at src1[0:7]
   OP_EXTBF, // place bits [K,K+N) of src0 into dst, src1 = 0xNNKK
   OP_BFIND, // find highest/lowest set bit
   OP_PERMT, // dst = bytes from src2,src0 selected by src1 (nvc0's src order)
   OP_ATOM,
   OP_BAR, // execution barrier, sources = { id, thread count, predicate }
   OP_VADD, // byte/word vector operations
   OP_VAVG,
   OP_VMIN,
   OP_VMAX,
   OP_VSAD,
   OP_VSET,
   OP_VSHR,
   OP_VSHL,
   OP_VSEL,
   OP_CCTL, // cache control
   OP_SHFL, // warp shuffle
   OP_LAST
};

// various instruction-specific modifier definitions Instruction::subOp
// MOV_FINAL marks a MOV originating from an EXPORT (used for placing TEXBARs)
#define NV50_IR_SUBOP_MUL_HIGH     1
#define NV50_IR_SUBOP_EMIT_RESTART 1
#define NV50_IR_SUBOP_LDC_IL       1
// Sub-operation codes. The numeric values are reused between groups; the
// group prefix in each macro name (LDC, PERMT, BAR, MEMBAR, ATOM, ...) tells
// the groups apart.
#define NV50_IR_SUBOP_LDC_IS       2
#define NV50_IR_SUBOP_LDC_ISL      3
#define NV50_IR_SUBOP_SHIFT_WRAP   1
#define NV50_IR_SUBOP_EMU_PRERET   1
// The argument is parenthesized so that an expression argument keeps its
// value when the expansion is embedded in a larger expression.
#define NV50_IR_SUBOP_TEXBAR(n)    (n)
#define NV50_IR_SUBOP_MOV_FINAL    1
#define NV50_IR_SUBOP_EXTBF_REV    1
#define NV50_IR_SUBOP_BFIND_SAMT   1
#define NV50_IR_SUBOP_RCPRSQ_64H   1
#define NV50_IR_SUBOP_PERMT_F4E    1
#define NV50_IR_SUBOP_PERMT_B4E    2
#define NV50_IR_SUBOP_PERMT_RC8    3
#define NV50_IR_SUBOP_PERMT_ECL    4
#define NV50_IR_SUBOP_PERMT_ECR    5
#define NV50_IR_SUBOP_PERMT_RC16   6
#define NV50_IR_SUBOP_BAR_SYNC     0
#define NV50_IR_SUBOP_BAR_ARRIVE   1
#define NV50_IR_SUBOP_BAR_RED_AND  2
#define NV50_IR_SUBOP_BAR_RED_OR   3
#define NV50_IR_SUBOP_BAR_RED_POPC 4
// MEMBAR sub-op layout: bits [1:0] hold the L/S/M value, the bits above hold
// the CTA/GL/SYS value. MEMBAR_DIR() and MEMBAR_SCOPE() mask out each part;
// MEMBAR(d,s) pastes the two suffixes and ORs the resulting constants.
#define NV50_IR_SUBOP_MEMBAR_L     1
#define NV50_IR_SUBOP_MEMBAR_S     2
#define NV50_IR_SUBOP_MEMBAR_M     3
#define NV50_IR_SUBOP_MEMBAR_CTA  (0 << 2)
#define NV50_IR_SUBOP_MEMBAR_GL   (1 << 2)
#define NV50_IR_SUBOP_MEMBAR_SYS  (2 << 2)
#define NV50_IR_SUBOP_MEMBAR_DIR(m)   ((m) & 0x3)
#define NV50_IR_SUBOP_MEMBAR_SCOPE(m) ((m) & ~0x3)
#define NV50_IR_SUBOP_MEMBAR(d,s) \
   (NV50_IR_SUBOP_MEMBAR_##d | NV50_IR_SUBOP_MEMBAR_##s)
#define NV50_IR_SUBOP_ATOM_ADD      0
#define NV50_IR_SUBOP_ATOM_MIN      1
#define NV50_IR_SUBOP_ATOM_MAX      2
#define NV50_IR_SUBOP_ATOM_INC      3
#define NV50_IR_SUBOP_ATOM_DEC      4
#define NV50_IR_SUBOP_ATOM_AND      5
#define NV50_IR_SUBOP_ATOM_OR       6
#define NV50_IR_SUBOP_ATOM_XOR      7
#define NV50_IR_SUBOP_ATOM_CAS      8
#define NV50_IR_SUBOP_ATOM_EXCH     9
#define NV50_IR_SUBOP_CCTL_IV       5
#define NV50_IR_SUBOP_CCTL_IVALL    6
#define NV50_IR_SUBOP_SUST_IGN      0
#define NV50_IR_SUBOP_SUST_TRAP     1
#define NV50_IR_SUBOP_SUST_SDCL     3
#define NV50_IR_SUBOP_SULD_ZERO     0
#define NV50_IR_SUBOP_SULD_TRAP     1
#define NV50_IR_SUBOP_SULD_SDCL     3
#define NV50_IR_SUBOP_SUBFM_3D      1
#define NV50_IR_SUBOP_SUCLAMP_2D    0x10
// SUCLAMP sub-op builders: a per-mode base (0, 5 or 10) plus r, with bit 0x10
// set when d equals 2. Both arguments are parenthesized so that expression
// arguments (e.g. "x & 3") are compared as a whole.
#define NV50_IR_SUBOP_SUCLAMP_SD(r, d) (( 0 + (r)) | (((d) == 2) ? 0x10 : 0))
#define NV50_IR_SUBOP_SUCLAMP_PL(r, d) (( 5 + (r)) | (((d) == 2) ? 0x10 : 0))
#define NV50_IR_SUBOP_SUCLAMP_BL(r, d) ((10 + (r)) | (((d) == 2) ? 0x10 : 0))
#define NV50_IR_SUBOP_PIXLD_COUNT       0
#define NV50_IR_SUBOP_PIXLD_COVMASK     1
#define NV50_IR_SUBOP_PIXLD_COVERED     2
#define NV50_IR_SUBOP_PIXLD_OFFSET      3
#define NV50_IR_SUBOP_PIXLD_CENT_OFFSET 4
#define NV50_IR_SUBOP_PIXLD_SAMPLEID    5
#define NV50_IR_SUBOP_SHFL_IDX  0
#define NV50_IR_SUBOP_SHFL_UP   1
#define NV50_IR_SUBOP_SHFL_DOWN 2
#define NV50_IR_SUBOP_SHFL_BFLY 3
#define NV50_IR_SUBOP_MADSP_SD     0xffff
// Yes, we could represent those with DataType.
// Or put the type into operation and have a couple 1000 values in that enum.
// This will have to do for now.
// The bitfields are supposed to correspond to nve4 ISA.
// MADSP packs three fields: a in bits [3:0], b from bit 4, c from bit 8.
#define NV50_IR_SUBOP_MADSP(a,b,c) (((c) << 8) | ((b) << 4) | (a))
// V1/V2/V4 pack a from bit 0, b from bit 5 and d from bit 10, and tag the
// result with 0, 1 or 2 in bits [15:14]; Vn() shifts that tag back down.
#define NV50_IR_SUBOP_V1(d,a,b)    (((d) << 10) | ((b) << 5) | (a) | 0x0000)
#define NV50_IR_SUBOP_V2(d,a,b)    (((d) << 10) | ((b) << 5) | (a) | 0x4000)
#define NV50_IR_SUBOP_V4(d,a,b)    (((d) << 10) | ((b) << 5) | (a) | 0x8000)
#define NV50_IR_SUBOP_Vn(n)        ((n) >> 14)

// Value types, numbered consecutively from TYPE_NONE = 0.
enum DataType
{
   TYPE_NONE,
   TYPE_U8,
   TYPE_S8,
   TYPE_U16,
   TYPE_S16,
   TYPE_U32,
   TYPE_S32,
   TYPE_U64, // 64 bit operations are only lowered after register allocation
   TYPE_S64,
   TYPE_F16,
   TYPE_F32,
   TYPE_F64,
   TYPE_B96,
   TYPE_B128
};
26257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 26357594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerenum CondCode 26457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller{ 26557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CC_FL = 0, 26657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CC_NEVER = CC_FL, // when used with FILE_FLAGS 26757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CC_LT = 1, 26857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CC_EQ = 2, 26957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CC_NOT_P = CC_EQ, // when used with FILE_PREDICATE 27057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CC_LE = 3, 27157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CC_GT = 4, 27257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CC_NE = 5, 27357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CC_P = CC_NE, 27457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CC_GE = 6, 27557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CC_TR = 7, 27657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CC_ALWAYS = CC_TR, 27757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CC_U = 8, 27857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CC_LTU = 9, 27957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CC_EQU = 10, 28057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CC_LEU = 11, 28157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CC_GTU = 12, 28257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CC_NEU = 13, 28357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CC_GEU = 14, 28457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CC_NO = 0x10, 28557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CC_NC = 0x11, 28657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CC_NS = 0x12, 28757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CC_NA = 0x13, 
28857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CC_A = 0x14, 28957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CC_S = 0x15, 29057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CC_C = 0x16, 29157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CC_O = 0x17 29257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller}; 29357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 29457594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerenum RoundMode 29557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller{ 29657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller ROUND_N, // nearest 29757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller ROUND_M, // towards -inf 29857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller ROUND_Z, // towards 0 29957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller ROUND_P, // towards +inf 30057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller ROUND_NI, // nearest integer 30157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller ROUND_MI, // to integer towards -inf 30257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller ROUND_ZI, // to integer towards 0 30357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller ROUND_PI, // to integer towards +inf 30457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller}; 30557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 30657594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerenum CacheMode 30757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller{ 30857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CACHE_CA, // cache at all levels 30957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CACHE_WB = CACHE_CA, // cache write back 31057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CACHE_CG, // cache at global level 31157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CACHE_CS, // cache streaming 31257594065c30feec9376be9b2132659f7d87362eeChristoph 
Bumiller CACHE_CV, // cache as volatile 31357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CACHE_WT = CACHE_CV // cache write-through 31457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller}; 31557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 31657594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerenum DataFile 31757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller{ 31857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller FILE_NULL = 0, 31957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller FILE_GPR, 32057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller FILE_PREDICATE, // boolean predicate 32157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller FILE_FLAGS, // zero/sign/carry/overflow bits 32257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller FILE_ADDRESS, 323e43a3a66a9d8a99021d76ff4d07dec7b8cfd62caChristoph Bumiller LAST_REGISTER_FILE = FILE_ADDRESS, 32457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller FILE_IMMEDIATE, 32557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller FILE_MEMORY_CONST, 32657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller FILE_SHADER_INPUT, 32757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller FILE_SHADER_OUTPUT, 32857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller FILE_MEMORY_GLOBAL, 32957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller FILE_MEMORY_SHARED, 33057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller FILE_MEMORY_LOCAL, 33157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller FILE_SYSTEM_VALUE, 33257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller DATA_FILE_COUNT 33357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller}; 33457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 33557594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerenum TexTarget 33657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller{ 33757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 
TEX_TARGET_1D, 33857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller TEX_TARGET_2D, 33957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller TEX_TARGET_2D_MS, 34057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller TEX_TARGET_3D, 34157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller TEX_TARGET_CUBE, 34257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller TEX_TARGET_1D_SHADOW, 34357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller TEX_TARGET_2D_SHADOW, 34457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller TEX_TARGET_CUBE_SHADOW, 34557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller TEX_TARGET_1D_ARRAY, 34657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller TEX_TARGET_2D_ARRAY, 34757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller TEX_TARGET_2D_MS_ARRAY, 34857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller TEX_TARGET_CUBE_ARRAY, 34957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller TEX_TARGET_1D_ARRAY_SHADOW, 35057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller TEX_TARGET_2D_ARRAY_SHADOW, 35157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller TEX_TARGET_RECT, 35257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller TEX_TARGET_RECT_SHADOW, 35357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller TEX_TARGET_CUBE_ARRAY_SHADOW, 35457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller TEX_TARGET_BUFFER, 35557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller TEX_TARGET_COUNT 35657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller}; 35757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 35857594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerenum SVSemantic 35957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller{ 36057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller SV_POSITION, // WPOS 36157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller SV_VERTEX_ID, 36257594065c30feec9376be9b2132659f7d87362eeChristoph 
Bumiller SV_INSTANCE_ID, 36357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller SV_INVOCATION_ID, 36457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller SV_PRIMITIVE_ID, 36557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller SV_VERTEX_COUNT, // gl_PatchVerticesIn 36657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller SV_LAYER, 36757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller SV_VIEWPORT_INDEX, 36857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller SV_YDIR, 36957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller SV_FACE, 37057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller SV_POINT_SIZE, 37157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller SV_POINT_COORD, 37257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller SV_CLIP_DISTANCE, 37357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller SV_SAMPLE_INDEX, 374f715a0a39a0f7f19443e7721ae792878ba504eedIlia Mirkin SV_SAMPLE_POS, 375b3a2398aded19e25124a4a1d228eb3843827f6b2Ilia Mirkin SV_SAMPLE_MASK, 3767e0036a49258326cc2d875f2960d18c6b3665036Ilia Mirkin SV_TESS_OUTER, 3777e0036a49258326cc2d875f2960d18c6b3665036Ilia Mirkin SV_TESS_INNER, 37857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller SV_TESS_COORD, 37957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller SV_TID, 38057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller SV_CTAID, 38157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller SV_NTID, 38257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller SV_GRIDID, 38357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller SV_NCTAID, 38457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller SV_LANEID, 38557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller SV_PHYSID, 38657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller SV_NPHYSID, 38757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller SV_CLOCK, 38857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller SV_LBASE, 
38957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller SV_SBASE, 39067250acbaba924ccaab696f2b348dfa898c41d0bChristoph Bumiller SV_VERTEX_STRIDE, 391d548d47edf9f05e6dbf9656abc2f8e78d02cb2f6Ben Skeggs SV_INVOCATION_INFO, 39257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller SV_UNDEFINED, 39357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller SV_LAST 39457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller}; 39557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 39657594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerclass Program; 39757594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerclass Function; 39857594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerclass BasicBlock; 39957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 40057594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerclass Target; 40157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 40257594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerclass Instruction; 40357594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerclass CmpInstruction; 40457594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerclass TexInstruction; 40557594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerclass FlowInstruction; 40657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 40757594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerclass Value; 40857594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerclass LValue; 40957594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerclass Symbol; 41057594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerclass ImmediateValue; 41157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 41257594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerstruct Storage 41357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller{ 41457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller DataFile file; 41557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller int8_t fileIndex; // signed, 
may be indirect for CONST[] 41657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller uint8_t size; // this should match the Instruction type's size 41757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller DataType type; // mainly for pretty printing 41857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller union { 41957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller uint64_t u64; // immediate values 42057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller uint32_t u32; 42157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller uint16_t u16; 42257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller uint8_t u8; 42357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller int64_t s64; 42457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller int32_t s32; 42557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller int16_t s16; 42657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller int8_t s8; 42757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller float f32; 42857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller double f64; 42957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller int32_t offset; // offset from 0 (base of address space) 430e43a3a66a9d8a99021d76ff4d07dec7b8cfd62caChristoph Bumiller int32_t id; // register id (< 0 if virtual/unassigned, in units <= 4) 43157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller struct { 43257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller SVSemantic sv; 43357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller int index; 43457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller } sv; 43557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller } data; 43657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller}; 43757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 43857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller// precedence: NOT after SAT after NEG after ABS 43957594065c30feec9376be9b2132659f7d87362eeChristoph 
Bumiller#define NV50_IR_MOD_ABS (1 << 0) 44057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller#define NV50_IR_MOD_NEG (1 << 1) 44157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller#define NV50_IR_MOD_SAT (1 << 2) 44257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller#define NV50_IR_MOD_NOT (1 << 3) 44357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller#define NV50_IR_MOD_NEG_ABS (NV50_IR_MOD_NEG | NV50_IR_MOD_ABS) 44457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 44557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller#define NV50_IR_INTERP_MODE_MASK 0x3 44657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller#define NV50_IR_INTERP_LINEAR (0 << 0) 44757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller#define NV50_IR_INTERP_PERSPECTIVE (1 << 0) 44857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller#define NV50_IR_INTERP_FLAT (2 << 0) 44957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller#define NV50_IR_INTERP_SC (3 << 0) // what exactly is that ? 45057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller#define NV50_IR_INTERP_SAMPLE_MASK 0xc 45157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller#define NV50_IR_INTERP_DEFAULT (0 << 2) 45257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller#define NV50_IR_INTERP_CENTROID (1 << 2) 45357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller#define NV50_IR_INTERP_OFFSET (2 << 2) 45457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller#define NV50_IR_INTERP_SAMPLEID (3 << 2) 45557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 45657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller// do we really want this to be a class ? 
45757594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerclass Modifier 45857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller{ 45957594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerpublic: 46057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Modifier() : bits(0) { } 46157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Modifier(unsigned int m) : bits(m) { } 46257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Modifier(operation op); 46357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 46457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller // @return new Modifier applying a after b (asserts if unrepresentable) 46557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Modifier operator*(const Modifier) const; 46614d5f975a65c57830077dabf2f95261afbc51773Francisco Jerez Modifier operator*=(const Modifier m) { *this = *this * m; return *this; } 46757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Modifier operator==(const Modifier m) const { return m.bits == bits; } 46857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Modifier operator!=(const Modifier m) const { return m.bits != bits; } 46957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 47057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline Modifier operator&(const Modifier m) const { return bits & m.bits; } 47157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline Modifier operator|(const Modifier m) const { return bits | m.bits; } 47257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline Modifier operator^(const Modifier m) const { return bits ^ m.bits; } 47357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 47457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller operation getOp() const; 47557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 47657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline int neg() const { return (bits & NV50_IR_MOD_NEG) ? 
1 : 0; } 47757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline int abs() const { return (bits & NV50_IR_MOD_ABS) ? 1 : 0; } 47857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 47914d5f975a65c57830077dabf2f95261afbc51773Francisco Jerez inline operator bool() const { return bits ? true : false; } 48057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 48157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller void applyTo(ImmediateValue &imm) const; 48257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 48357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller int print(char *buf, size_t size) const; 48457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 48557594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerprivate: 48657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller uint8_t bits; 48757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller}; 48857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 48957594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerclass ValueRef 49057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller{ 49157594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerpublic: 49214d5f975a65c57830077dabf2f95261afbc51773Francisco Jerez ValueRef(Value * = NULL); 4938cc2eca5df0116aa7fb8233a9ab6ad1c9e4203cdFrancisco Jerez ValueRef(const ValueRef&); 49457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller ~ValueRef(); 49557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 49657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline bool exists() const { return value != NULL; } 49757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 49857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller void set(Value *); 49957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller void set(const ValueRef&); 50057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline Value *get() const { return value; } 
50157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline Value *rep() const; 50257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 50357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline Instruction *getInsn() const { return insn; } 50457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline void setInsn(Instruction *inst) { insn = inst; } 50557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 50657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline bool isIndirect(int dim) const { return indirect[dim] >= 0; } 50757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline const ValueRef *getIndirect(int dim) const; 50857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 50957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline DataFile getFile() const; 51057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline unsigned getSize() const; 51157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 51257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller // SSA: return eventual (traverse MOVs) literal value, if it exists 513d6d1f0e4a25c9fbefce7485d77617855a8ea956aFrancisco Jerez bool getImmediate(ImmediateValue&) const; 51457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 51557594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerpublic: 51657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Modifier mod; 5179362d4bc0a03860ec386156cf499e855a9c2d2a5Christoph Bumiller int8_t indirect[2]; // >= 0 if relative to lvalue in insn->src(indirect[i]) 51857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller uint8_t swizzle; 51957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 52057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller bool usedAsPtr; // for printing 52157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 52257594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerprivate: 52357594065c30feec9376be9b2132659f7d87362eeChristoph 
Bumiller Value *value; 52457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Instruction *insn; 52557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller}; 52657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 52757594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerclass ValueDef 52857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller{ 52957594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerpublic: 53014d5f975a65c57830077dabf2f95261afbc51773Francisco Jerez ValueDef(Value * = NULL); 5318cc2eca5df0116aa7fb8233a9ab6ad1c9e4203cdFrancisco Jerez ValueDef(const ValueDef&); 53257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller ~ValueDef(); 53357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 53457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline bool exists() const { return value != NULL; } 53557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 53657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline Value *get() const { return value; } 53757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline Value *rep() const; 53857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller void set(Value *); 53914d5f975a65c57830077dabf2f95261afbc51773Francisco Jerez bool mayReplace(const ValueRef &); 54014d5f975a65c57830077dabf2f95261afbc51773Francisco Jerez void replace(const ValueRef &, bool doSet); // replace all uses of the old value 54157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 54257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline Instruction *getInsn() const { return insn; } 54357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline void setInsn(Instruction *inst) { insn = inst; } 54457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 54557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline DataFile getFile() const; 54657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline unsigned getSize() const; 
54757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 54857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline void setSSA(LValue *); 54957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline const LValue *preSSA() const; 55057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 55157594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerprivate: 55257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Value *value; // should make this LValue * ... 5538cc2eca5df0116aa7fb8233a9ab6ad1c9e4203cdFrancisco Jerez LValue *origin; // pre SSA value 55457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Instruction *insn; 55557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller}; 55657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 55757594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerclass Value 55857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller{ 55957594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerpublic: 56057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Value(); 561da28ba00d84f59650bf180769d9d9a1609eb6164Francisco Jerez virtual ~Value() { } 56257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 563a05e6a3fa28168d58a13cfb07f7a664e84b925aeFrancisco Jerez virtual Value *clone(ClonePolicy<Function>&) const = 0; 56457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 56557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller virtual int print(char *, size_t, DataType ty = TYPE_NONE) const = 0; 56657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 56757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller virtual bool equals(const Value *, bool strict = false) const; 56857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller virtual bool interfers(const Value *) const; 569a765d7880f80d01be261a5d1f4b356a2b6fcfaadChristoph Bumiller virtual bool isUniform() const { return true; } 57057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 
5719362d4bc0a03860ec386156cf499e855a9c2d2a5Christoph Bumiller inline Value *rep() const { return join; } 5729362d4bc0a03860ec386156cf499e855a9c2d2a5Christoph Bumiller 57357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline Instruction *getUniqueInsn() const; 57457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline Instruction *getInsn() const; // use when uniqueness is certain 57557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 5768cc2eca5df0116aa7fb8233a9ab6ad1c9e4203cdFrancisco Jerez inline int refCount() { return uses.size(); } 57757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 57857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline LValue *asLValue(); 57957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline Symbol *asSym(); 58057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline ImmediateValue *asImm(); 58157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline const Symbol *asSym() const; 58257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline const ImmediateValue *asImm() const; 58357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 58457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline bool inFile(DataFile f) { return reg.file == f; } 58557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 58657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller static inline Value *get(Iterator&); 58757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 588a9b21015f5e3a6a37e53a8b3c755519f7b70479eTobias Klausmann std::tr1::unordered_set<ValueRef *> uses; 5898cc2eca5df0116aa7fb8233a9ab6ad1c9e4203cdFrancisco Jerez std::list<ValueDef *> defs; 590a9b21015f5e3a6a37e53a8b3c755519f7b70479eTobias Klausmann typedef std::tr1::unordered_set<ValueRef *>::iterator UseIterator; 591a9b21015f5e3a6a37e53a8b3c755519f7b70479eTobias Klausmann typedef std::tr1::unordered_set<ValueRef *>::const_iterator UseCIterator; 
5928cc2eca5df0116aa7fb8233a9ab6ad1c9e4203cdFrancisco Jerez typedef std::list<ValueDef *>::iterator DefIterator; 5938cc2eca5df0116aa7fb8233a9ab6ad1c9e4203cdFrancisco Jerez typedef std::list<ValueDef *>::const_iterator DefCIterator; 59457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 59557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller int id; 59657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Storage reg; 59757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 59857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller // TODO: these should be in LValue: 59957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Interval livei; 60057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Value *join; 60157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller}; 60257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 60357594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerclass LValue : public Value 60457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller{ 60557594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerpublic: 60657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller LValue(Function *, DataFile file); 60757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller LValue(Function *, LValue *); 608da28ba00d84f59650bf180769d9d9a1609eb6164Francisco Jerez ~LValue() { } 60957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 610a765d7880f80d01be261a5d1f4b356a2b6fcfaadChristoph Bumiller virtual bool isUniform() const; 611a765d7880f80d01be261a5d1f4b356a2b6fcfaadChristoph Bumiller 612a05e6a3fa28168d58a13cfb07f7a664e84b925aeFrancisco Jerez virtual LValue *clone(ClonePolicy<Function>&) const; 61357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 61457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller virtual int print(char *, size_t, DataType ty = TYPE_NONE) const; 61557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 61657594065c30feec9376be9b2132659f7d87362eeChristoph 
Bumillerpublic: 617e43a3a66a9d8a99021d76ff4d07dec7b8cfd62caChristoph Bumiller unsigned compMask : 8; // compound/component mask 618e43a3a66a9d8a99021d76ff4d07dec7b8cfd62caChristoph Bumiller unsigned compound : 1; // used by RA, value involved in split/merge 619e43a3a66a9d8a99021d76ff4d07dec7b8cfd62caChristoph Bumiller unsigned ssa : 1; 620e43a3a66a9d8a99021d76ff4d07dec7b8cfd62caChristoph Bumiller unsigned fixedReg : 1; // set & used by RA, earlier just use (id < 0) 621e43a3a66a9d8a99021d76ff4d07dec7b8cfd62caChristoph Bumiller unsigned noSpill : 1; // do not spill (e.g. if spill temporary already) 62257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller}; 62357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 62457594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerclass Symbol : public Value 62557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller{ 62657594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerpublic: 62757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Symbol(Program *, DataFile file = FILE_MEMORY_CONST, ubyte fileIdx = 0); 628da28ba00d84f59650bf180769d9d9a1609eb6164Francisco Jerez ~Symbol() { } 62957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 630a05e6a3fa28168d58a13cfb07f7a664e84b925aeFrancisco Jerez virtual Symbol *clone(ClonePolicy<Function>&) const; 63157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 63257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller virtual bool equals(const Value *that, bool strict) const; 63357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 634a765d7880f80d01be261a5d1f4b356a2b6fcfaadChristoph Bumiller virtual bool isUniform() const; 635a765d7880f80d01be261a5d1f4b356a2b6fcfaadChristoph Bumiller 63657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller virtual int print(char *, size_t, DataType ty = TYPE_NONE) const; 63757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 63857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller // print with 
indirect values 63957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller int print(char *, size_t, Value *, Value *, DataType ty = TYPE_NONE) const; 64057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 64157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline void setFile(DataFile file, ubyte fileIndex = 0) 64257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller { 64357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller reg.file = file; 64457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller reg.fileIndex = fileIndex; 64557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller } 64657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 64757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline void setOffset(int32_t offset); 64857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline void setAddress(Symbol *base, int32_t offset); 64957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline void setSV(SVSemantic sv, uint32_t idx = 0); 65057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 65157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline const Symbol *getBase() const { return baseSym; } 65257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 65357594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerprivate: 65457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Symbol *baseSym; // array base for Symbols representing array elements 65557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller}; 65657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 65757594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerclass ImmediateValue : public Value 65857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller{ 65957594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerpublic: 660d6d1f0e4a25c9fbefce7485d77617855a8ea956aFrancisco Jerez ImmediateValue() { } 66157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller ImmediateValue(Program *, 
uint32_t); 66257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller ImmediateValue(Program *, float); 66357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller ImmediateValue(Program *, double); 66457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller // NOTE: not added to program with 66557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller ImmediateValue(const ImmediateValue *, DataType ty); 666da28ba00d84f59650bf180769d9d9a1609eb6164Francisco Jerez ~ImmediateValue() { }; 66757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 668784848a94d621b11020838fc058fc04a7fc57aa9Francisco Jerez virtual ImmediateValue *clone(ClonePolicy<Function>&) const; 669784848a94d621b11020838fc058fc04a7fc57aa9Francisco Jerez 67057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller virtual bool equals(const Value *that, bool strict) const; 67157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 67257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller // these only work if 'type' is valid (we mostly use untyped literals): 67357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller bool isInteger(const int ival) const; // ival is cast to this' type 67457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller bool isNegative() const; 67557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller bool isPow2() const; 67657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 67757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller void applyLog2(); 67857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 67957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller // for constant folding: 68057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller ImmediateValue operator+(const ImmediateValue&) const; 68157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller ImmediateValue operator-(const ImmediateValue&) const; 68257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller ImmediateValue operator*(const ImmediateValue&) const; 
68357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller ImmediateValue operator/(const ImmediateValue&) const; 68457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 685d6d1f0e4a25c9fbefce7485d77617855a8ea956aFrancisco Jerez ImmediateValue& operator=(const ImmediateValue&); // only sets value ! 686d6d1f0e4a25c9fbefce7485d77617855a8ea956aFrancisco Jerez 68757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller bool compare(CondCode cc, float fval) const; 68857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 68957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller virtual int print(char *, size_t, DataType ty = TYPE_NONE) const; 69057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller}; 69157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 69257594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerclass Instruction 69357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller{ 69457594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerpublic: 69557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Instruction(); 69657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Instruction(Function *, operation, DataType); 69757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller virtual ~Instruction(); 69857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 699a05e6a3fa28168d58a13cfb07f7a664e84b925aeFrancisco Jerez virtual Instruction *clone(ClonePolicy<Function>&, 700a05e6a3fa28168d58a13cfb07f7a664e84b925aeFrancisco Jerez Instruction * = NULL) const; 70157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 7028cc2eca5df0116aa7fb8233a9ab6ad1c9e4203cdFrancisco Jerez void setDef(int i, Value *); 7038cc2eca5df0116aa7fb8233a9ab6ad1c9e4203cdFrancisco Jerez void setSrc(int s, Value *); 7048cc2eca5df0116aa7fb8233a9ab6ad1c9e4203cdFrancisco Jerez void setSrc(int s, const ValueRef&); 70557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller void swapSources(int a, int b); 
706ce1951daed9a4685bf559b4222f50510cb412301Christoph Bumiller void moveSources(int s, int delta); 70757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller bool setIndirect(int s, int dim, Value *); 70857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 7099362d4bc0a03860ec386156cf499e855a9c2d2a5Christoph Bumiller inline ValueRef& src(int s) { return srcs[s]; } 7109362d4bc0a03860ec386156cf499e855a9c2d2a5Christoph Bumiller inline ValueDef& def(int s) { return defs[s]; } 7119362d4bc0a03860ec386156cf499e855a9c2d2a5Christoph Bumiller inline const ValueRef& src(int s) const { return srcs[s]; } 7129362d4bc0a03860ec386156cf499e855a9c2d2a5Christoph Bumiller inline const ValueDef& def(int s) const { return defs[s]; } 7139362d4bc0a03860ec386156cf499e855a9c2d2a5Christoph Bumiller 7149362d4bc0a03860ec386156cf499e855a9c2d2a5Christoph Bumiller inline Value *getDef(int d) const { return defs[d].get(); } 7159362d4bc0a03860ec386156cf499e855a9c2d2a5Christoph Bumiller inline Value *getSrc(int s) const { return srcs[s].get(); } 71657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline Value *getIndirect(int s, int dim) const; 71757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 7188cc2eca5df0116aa7fb8233a9ab6ad1c9e4203cdFrancisco Jerez inline bool defExists(unsigned d) const 7198cc2eca5df0116aa7fb8233a9ab6ad1c9e4203cdFrancisco Jerez { 7209362d4bc0a03860ec386156cf499e855a9c2d2a5Christoph Bumiller return d < defs.size() && defs[d].exists(); 7218cc2eca5df0116aa7fb8233a9ab6ad1c9e4203cdFrancisco Jerez } 7228cc2eca5df0116aa7fb8233a9ab6ad1c9e4203cdFrancisco Jerez inline bool srcExists(unsigned s) const 7238cc2eca5df0116aa7fb8233a9ab6ad1c9e4203cdFrancisco Jerez { 7249362d4bc0a03860ec386156cf499e855a9c2d2a5Christoph Bumiller return s < srcs.size() && srcs[s].exists(); 7258cc2eca5df0116aa7fb8233a9ab6ad1c9e4203cdFrancisco Jerez } 72657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 727e43a3a66a9d8a99021d76ff4d07dec7b8cfd62caChristoph Bumiller inline bool 
constrainedDefs() const; 72857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 72957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller bool setPredicate(CondCode ccode, Value *); 73057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline Value *getPredicate() const; 73157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller bool writesPredicate() const; 732ca1fc2b86400e3fc9dd0517863e22721b5e91c77Christoph Bumiller inline bool isPredicated() const { return predSrc >= 0; } 73357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 73456cf2da02226aee6b7476675c0e05ac7c218756eChristoph Bumiller inline void setFlagsSrc(int s, Value *); 73556cf2da02226aee6b7476675c0e05ac7c218756eChristoph Bumiller inline void setFlagsDef(int d, Value *); 73699e4eba669f13a0dc80880f4f91e2338377c1667Christoph Bumiller inline bool usesFlags() const { return flagsSrc >= 0; } 73756cf2da02226aee6b7476675c0e05ac7c218756eChristoph Bumiller 7389362d4bc0a03860ec386156cf499e855a9c2d2a5Christoph Bumiller unsigned int defCount() const { return defs.size(); }; 739e43a3a66a9d8a99021d76ff4d07dec7b8cfd62caChristoph Bumiller unsigned int defCount(unsigned int mask, bool singleFile = false) const; 7409362d4bc0a03860ec386156cf499e855a9c2d2a5Christoph Bumiller unsigned int srcCount() const { return srcs.size(); }; 741e43a3a66a9d8a99021d76ff4d07dec7b8cfd62caChristoph Bumiller unsigned int srcCount(unsigned int mask, bool singleFile = false) const; 74257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 74357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller // save & remove / set indirect[0,1] and predicate source 74457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller void takeExtraSources(int s, Value *[3]); 74557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller void putExtraSources(int s, Value *[3]); 74657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 74757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline void setType(DataType 
type) { dType = sType = type; } 74857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 74957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline void setType(DataType dtype, DataType stype) 75057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller { 75157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller dType = dtype; 75257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller sType = stype; 75357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller } 75457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 75557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline bool isPseudo() const { return op < OP_MOV; } 75657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller bool isDead() const; 75757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller bool isNop() const; 75857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller bool isCommutationLegal(const Instruction *) const; // must be adjacent ! 75957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller bool isActionEqual(const Instruction *) const; 76057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller bool isResultEqual(const Instruction *) const; 76157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 76257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller void print() const; 76357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 76457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline CmpInstruction *asCmp(); 76557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline TexInstruction *asTex(); 76657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline FlowInstruction *asFlow(); 76757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline const TexInstruction *asTex() const; 76857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline const CmpInstruction *asCmp() const; 76957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline const FlowInstruction *asFlow() const; 
77057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 77157594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerpublic: 77257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Instruction *next; 77357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Instruction *prev; 77457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller int id; 77557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller int serial; // CFG order 77657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 77757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller operation op; 77857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller DataType dType; // destination or defining type 77957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller DataType sType; // source or secondary type 78057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CondCode cc; 78157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller RoundMode rnd; 78257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CacheMode cache; 78357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 78422b762f9b495b14400f30bd6537f7c5a6d262325Christoph Bumiller uint16_t subOp; // quadop, 1 for mul-high, etc. 
785afcd7b5d1614a8a758ccb4353a9c31a601c9b9b4Christoph Bumiller 78657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller unsigned encSize : 4; // encoding size in bytes 78757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller unsigned saturate : 1; // to [0.0f, 1.0f] 78857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller unsigned join : 1; // converge control flow (use OP_JOIN until end) 78957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller unsigned fixed : 1; // prevent dead code elimination 79057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller unsigned terminator : 1; // end of basic block 79157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller unsigned ftz : 1; // flush denormal to zero 79257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller unsigned dnz : 1; // denormals, NaN are zero 79357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller unsigned ipa : 4; // interpolation mode 79457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller unsigned lanes : 4; 79557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller unsigned perPatch : 1; 79657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller unsigned exit : 1; // terminate program after insn 79722b762f9b495b14400f30bd6537f7c5a6d262325Christoph Bumiller unsigned mask : 4; // for vector ops 79857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 79957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller int8_t postFactor; // MUL/DIV(if < 0) by 1 << postFactor 80057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 80157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller int8_t predSrc; 80257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller int8_t flagsDef; 80357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller int8_t flagsSrc; 80457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 805bede1bdb4828ea673bc7859db4058da7e35c6774Ben Skeggs uint32_t sched; // scheduling data (NOTE: maybe move to separate storage) 
80622b762f9b495b14400f30bd6537f7c5a6d262325Christoph Bumiller 80757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller BasicBlock *bb; 80857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 8099362d4bc0a03860ec386156cf499e855a9c2d2a5Christoph Bumillerprotected: 8109362d4bc0a03860ec386156cf499e855a9c2d2a5Christoph Bumiller std::deque<ValueDef> defs; // no gaps ! 8119362d4bc0a03860ec386156cf499e855a9c2d2a5Christoph Bumiller std::deque<ValueRef> srcs; // no gaps ! 8129362d4bc0a03860ec386156cf499e855a9c2d2a5Christoph Bumiller 81357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller // instruction specific methods: 81457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller // (don't want to subclass, would need more constructors and memory pools) 81557594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerpublic: 81657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline void setInterpolate(unsigned int mode) { ipa = mode; } 81757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 81857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller unsigned int getInterpMode() const { return ipa & 0x3; } 81957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller unsigned int getSampleMode() const { return ipa & 0xc; } 82057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 82157594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerprivate: 82257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller void init(); 82357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller}; 82457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 82557594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerenum TexQuery 82657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller{ 82757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller TXQ_DIMS, 82857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller TXQ_TYPE, 82957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller TXQ_SAMPLE_POSITION, 
83057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller TXQ_FILTER, 83157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller TXQ_LOD, 83257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller TXQ_WRAP, 83357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller TXQ_BORDER_COLOUR 83457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller}; 83557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 83657594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerclass TexInstruction : public Instruction 83757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller{ 83857594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerpublic: 83957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller class Target 84057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller { 84157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller public: 84257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Target(TexTarget targ = TEX_TARGET_2D) : target(targ) { } 84357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 84457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller const char *getName() const { return descTable[target].name; } 84557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller unsigned int getArgCount() const { return descTable[target].argc; } 84657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller unsigned int getDim() const { return descTable[target].dim; } 84757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller int isArray() const { return descTable[target].array ? 1 : 0; } 84857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller int isCube() const { return descTable[target].cube ? 1 : 0; } 84957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller int isShadow() const { return descTable[target].shadow ? 
1 : 0; } 8504da54c91d24da891c56957f29274e7821c8254f6Christoph Bumiller int isMS() const { 8514da54c91d24da891c56957f29274e7821c8254f6Christoph Bumiller return target == TEX_TARGET_2D_MS || target == TEX_TARGET_2D_MS_ARRAY; } 8523bd40073b9803baf62f77ed5ac79979e037d2ed6Ilia Mirkin void clearMS() { 8533bd40073b9803baf62f77ed5ac79979e037d2ed6Ilia Mirkin if (isMS()) { 8543bd40073b9803baf62f77ed5ac79979e037d2ed6Ilia Mirkin if (isArray()) 8553bd40073b9803baf62f77ed5ac79979e037d2ed6Ilia Mirkin target = TEX_TARGET_2D_ARRAY; 8563bd40073b9803baf62f77ed5ac79979e037d2ed6Ilia Mirkin else 8573bd40073b9803baf62f77ed5ac79979e037d2ed6Ilia Mirkin target = TEX_TARGET_2D; 8583bd40073b9803baf62f77ed5ac79979e037d2ed6Ilia Mirkin } 8593bd40073b9803baf62f77ed5ac79979e037d2ed6Ilia Mirkin } 86057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 86157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Target& operator=(TexTarget targ) 86257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller { 86357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller assert(targ < TEX_TARGET_COUNT); 864f7599b2c32185535b4c215de0ba0454129fa523fChristoph Bumiller target = targ; 86557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller return *this; 86657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller } 86757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 86857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline bool operator==(TexTarget targ) const { return target == targ; } 8694506ed28de7f9d76bbc99c0758a7891b84528729Christoph Bumiller inline bool operator!=(TexTarget targ) const { return target != targ; } 8704506ed28de7f9d76bbc99c0758a7891b84528729Christoph Bumiller 8714506ed28de7f9d76bbc99c0758a7891b84528729Christoph Bumiller enum TexTarget getEnum() const { return target; } 87257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 87357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller private: 87457594065c30feec9376be9b2132659f7d87362eeChristoph 
Bumiller struct Desc 87557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller { 87657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller char name[19]; 87757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller uint8_t dim; 87857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller uint8_t argc; 87957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller bool array; 88057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller bool cube; 88157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller bool shadow; 88257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller }; 88357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 88457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller static const struct Desc descTable[TEX_TARGET_COUNT]; 88557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 88657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller private: 88757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller enum TexTarget target; 88857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller }; 88957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 89057594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerpublic: 89157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller TexInstruction(Function *, operation); 89257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller virtual ~TexInstruction(); 89357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 894a05e6a3fa28168d58a13cfb07f7a664e84b925aeFrancisco Jerez virtual TexInstruction *clone(ClonePolicy<Function>&, 895a05e6a3fa28168d58a13cfb07f7a664e84b925aeFrancisco Jerez Instruction * = NULL) const; 89657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 89757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline void setTexture(Target targ, uint8_t r, uint8_t s) 89857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller { 89957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller tex.r = r; 
90057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller tex.s = s; 90157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller tex.target = targ; 90257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller } 90357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 9047a91d3a2a4c4e7851fdb46465224213ce1874c9bChristoph Bumiller void setIndirectR(Value *); 9057a91d3a2a4c4e7851fdb46465224213ce1874c9bChristoph Bumiller void setIndirectS(Value *); 90657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline Value *getIndirectR() const; 90757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline Value *getIndirectS() const; 90857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 90957594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerpublic: 91057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller struct { 91157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Target target; 91257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 913c2dfcd7f0eaf4eda375eb320e0e87793a80ef92dChristoph Bumiller uint16_t r; 914c2dfcd7f0eaf4eda375eb320e0e87793a80ef92dChristoph Bumiller uint16_t s; 91557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller int8_t rIndirectSrc; 91657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller int8_t sIndirectSrc; 91757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 91857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller uint8_t mask; 91957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller uint8_t gatherComp; 92057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 92157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller bool liveOnly; // only execute on live pixels of a quad (optimization) 92257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller bool levelZero; 9239c930639d9f6d713ccfd16b390a41a9f584f348cChristoph Bumiller bool derivAll; 92457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 92557594065c30feec9376be9b2132659f7d87362eeChristoph 
Bumiller int8_t useOffsets; // 0, 1, or 4 for textureGatherOffsets 926f3aa999383074d666d6e3f3506e66b0c937904caIlia Mirkin int8_t offset[3]; // only used on nv50 92757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 92857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller enum TexQuery query; 92957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller } tex; 93057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 93157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller ValueRef dPdx[3]; 93257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller ValueRef dPdy[3]; 933f3aa999383074d666d6e3f3506e66b0c937904caIlia Mirkin ValueRef offset[4][3]; 93457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller}; 93557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 93657594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerclass CmpInstruction : public Instruction 93757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller{ 93857594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerpublic: 93957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CmpInstruction(Function *, operation); 94057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 941a05e6a3fa28168d58a13cfb07f7a664e84b925aeFrancisco Jerez virtual CmpInstruction *clone(ClonePolicy<Function>&, 942a05e6a3fa28168d58a13cfb07f7a664e84b925aeFrancisco Jerez Instruction * = NULL) const; 94357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 94457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller void setCondition(CondCode cond) { setCond = cond; } 94557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CondCode getCondition() const { return setCond; } 94657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 94757594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerpublic: 94857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CondCode setCond; 94957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller}; 
95057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 95157594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerclass FlowInstruction : public Instruction 95257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller{ 95357594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerpublic: 9549bb36d54a2c69ebdc9d1c9c4c71945060de8c860Francisco Jerez FlowInstruction(Function *, operation, void *target); 95557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 956784848a94d621b11020838fc058fc04a7fc57aa9Francisco Jerez virtual FlowInstruction *clone(ClonePolicy<Function>&, 957784848a94d621b11020838fc058fc04a7fc57aa9Francisco Jerez Instruction * = NULL) const; 958784848a94d621b11020838fc058fc04a7fc57aa9Francisco Jerez 95957594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerpublic: 96057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller unsigned allWarp : 1; 96157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller unsigned absolute : 1; 96257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller unsigned limit : 1; 96357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller unsigned builtin : 1; // true for calls to emulation code 964c893b9406060d3735b2c9e307ae89f6d83a4be40Christoph Bumiller unsigned indirect : 1; // target in src(0) 96557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 96657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller union { 96757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller BasicBlock *bb; 96857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller int builtin; 96957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Function *fn; 97057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller } target; 97157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller}; 97257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 97357594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerclass BasicBlock 97457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller{ 
97557594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerpublic: 97657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller BasicBlock(Function *); 97757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller ~BasicBlock(); 97857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 979784848a94d621b11020838fc058fc04a7fc57aa9Francisco Jerez BasicBlock *clone(ClonePolicy<Function>&) const; 980784848a94d621b11020838fc058fc04a7fc57aa9Francisco Jerez 98157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline int getId() const { return id; } 98257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline unsigned int getInsnCount() const { return numInsns; } 98357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline bool isTerminated() const { return exit && exit->terminator; } 98457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 98557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller bool dominatedBy(BasicBlock *bb); 98640c224a573f2b763046001e622aafca90f68c693Christoph Bumiller inline bool reachableBy(const BasicBlock *by, const BasicBlock *term); 98757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 98857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller // returns mask of conditional out blocks 98957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller // e.g. 3 for IF { .. } ELSE { .. } ENDIF, 1 for IF { .. 
} ENDIF 99057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller unsigned int initiatesSimpleConditional() const; 99157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 99257594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerpublic: 99357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Function *getFunction() const { return func; } 99457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Program *getProgram() const { return program; } 99557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 99657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Instruction *getEntry() const { return entry; } // first non-phi instruction 99757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Instruction *getPhi() const { return phi; } 99857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Instruction *getFirst() const { return phi ? phi : entry; } 99957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Instruction *getExit() const { return exit; } 100057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 100157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller void insertHead(Instruction *); 100257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller void insertTail(Instruction *); 100357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller void insertBefore(Instruction *, Instruction *); 100457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller void insertAfter(Instruction *, Instruction *); 100557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller void remove(Instruction *); 100657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller void permuteAdjacent(Instruction *, Instruction *); 100757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 100857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller BasicBlock *idom() const; 100957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 1010c04d6d95e0efb8eea4d788d8d7b629209a3afaeaChristoph Bumiller // NOTE: currently does not 
rebuild the dominator tree 1011c04d6d95e0efb8eea4d788d8d7b629209a3afaeaChristoph Bumiller BasicBlock *splitBefore(Instruction *, bool attach = true); 1012c04d6d95e0efb8eea4d788d8d7b629209a3afaeaChristoph Bumiller BasicBlock *splitAfter(Instruction *, bool attach = true); 1013c04d6d95e0efb8eea4d788d8d7b629209a3afaeaChristoph Bumiller 101457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller DLList& getDF() { return df; } 101557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller DLList::Iterator iterDF() { return df.iterator(); } 101657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 101757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller static inline BasicBlock *get(Iterator&); 101857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller static inline BasicBlock *get(Graph::Node *); 101957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 102057594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerpublic: 102157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Graph::Node cfg; // first edge is branch *taken* (the ELSE branch) 102257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Graph::Node dom; 102357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 102457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller BitSet liveSet; 10253e9150cd961b2399e402e940400deae11ec7852fFrancisco Jerez BitSet defSet; 102657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 102757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller uint32_t binPos; 102857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller uint32_t binSize; 102957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 103057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Instruction *joinAt; // for quick reference 103157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 103257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller bool explicitCont; // loop headers: true if loop contains continue stmts 
103357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 103457594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerprivate: 103557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller int id; 103657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller DLList df; 103757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 103857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Instruction *phi; 103957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Instruction *entry; 104057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Instruction *exit; 104157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 104257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller unsigned int numInsns; 104357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 104457594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerprivate: 104557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Function *func; 104657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Program *program; 1047c04d6d95e0efb8eea4d788d8d7b629209a3afaeaChristoph Bumiller 1048c04d6d95e0efb8eea4d788d8d7b629209a3afaeaChristoph Bumiller void splitCommon(Instruction *, BasicBlock *, bool attach); 104957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller}; 105057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 105157594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerclass Function 105257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller{ 105357594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerpublic: 105498116cc3dc3fc2cd84990cc2c968f05fe2978b4aFrancisco Jerez Function(Program *, const char *name, uint32_t label); 105557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller ~Function(); 105657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 1057d32ebb8c304725fa6bb7ec2d3d40ce828c713917Francisco Jerez static inline Function *get(Graph::Node *node); 1058d32ebb8c304725fa6bb7ec2d3d40ce828c713917Francisco Jerez 
105957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline Program *getProgram() const { return prog; } 106057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline const char *getName() const { return name; } 106157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline int getId() const { return id; } 106298116cc3dc3fc2cd84990cc2c968f05fe2978b4aFrancisco Jerez inline uint32_t getLabel() const { return label; } 106357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 106457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller void print(); 106557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller void printLiveIntervals() const; 106657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller void printCFGraph(const char *filePath); 106757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 106857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller bool setEntry(BasicBlock *); 106957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller bool setExit(BasicBlock *); 107057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 107157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller unsigned int orderInstructions(ArrayList&); 107257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 107357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline void add(BasicBlock *bb, int& id) { allBBlocks.insert(bb, id); } 107457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline void add(Instruction *insn, int& id) { allInsns.insert(insn, id); } 107557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline void add(LValue *lval, int& id) { allLValues.insert(lval, id); } 107657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 107757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline LValue *getLValue(int id); 107857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 1079898b0981b6c90d2f1e446a532b6ac3cbbb49747dFrancisco Jerez void buildLiveSets(); 
10803e9150cd961b2399e402e940400deae11ec7852fFrancisco Jerez void buildDefSets(); 108157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller bool convertToSSA(); 108257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 108357594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerpublic: 1084a3dd45e1c27e4e55dadb9467c2ea428f58083ac1Francisco Jerez std::deque<ValueDef> ins; 1085a3dd45e1c27e4e55dadb9467c2ea428f58083ac1Francisco Jerez std::deque<ValueRef> outs; 1086a3dd45e1c27e4e55dadb9467c2ea428f58083ac1Francisco Jerez std::deque<Value *> clobbers; 1087a3dd45e1c27e4e55dadb9467c2ea428f58083ac1Francisco Jerez 108857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Graph cfg; 108957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Graph::Node *cfgExit; 109057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Graph *domTree; 109157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Graph::Node call; // node in the call graph 109257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 109357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller BasicBlock **bbArray; // BBs in emission order 109457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller int bbCount; 109557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 109657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller unsigned int loopNestingBound; 109757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller int regClobberMax; 109857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 109957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller uint32_t binPos; 110057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller uint32_t binSize; 110157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 1102e43a3a66a9d8a99021d76ff4d07dec7b8cfd62caChristoph Bumiller Value *stackPtr; 1103e43a3a66a9d8a99021d76ff4d07dec7b8cfd62caChristoph Bumiller 1104e43a3a66a9d8a99021d76ff4d07dec7b8cfd62caChristoph Bumiller uint32_t tlsBase; // base address for l[] space (if 
no stack pointer is used) 1105e43a3a66a9d8a99021d76ff4d07dec7b8cfd62caChristoph Bumiller uint32_t tlsSize; 1106e43a3a66a9d8a99021d76ff4d07dec7b8cfd62caChristoph Bumiller 110757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller ArrayList allBBlocks; 110857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller ArrayList allInsns; 110957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller ArrayList allLValues; 111057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 111157594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerprivate: 111257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller void buildLiveSetsPreSSA(BasicBlock *, const int sequence); 11133e9150cd961b2399e402e940400deae11ec7852fFrancisco Jerez void buildDefSetsPreSSA(BasicBlock *bb, const int seq); 111457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 111557594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerprivate: 111698116cc3dc3fc2cd84990cc2c968f05fe2978b4aFrancisco Jerez uint32_t label; 111757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller int id; 111857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller const char *const name; 111957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Program *prog; 112057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller}; 112157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 112257594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerenum CGStage 112357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller{ 112457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CG_STAGE_PRE_SSA, 112557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CG_STAGE_SSA, // expected directly before register allocation 112657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CG_STAGE_POST_RA 112757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller}; 112857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 112957594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerclass Program 
113057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller{ 113157594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerpublic: 113257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller enum Type 113357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller { 113457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller TYPE_VERTEX, 113557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller TYPE_TESSELLATION_CONTROL, 113657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller TYPE_TESSELLATION_EVAL, 113757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller TYPE_GEOMETRY, 113857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller TYPE_FRAGMENT, 113957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller TYPE_COMPUTE 114057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller }; 114157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 114257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Program(Type type, Target *targ); 114357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller ~Program(); 114457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 114557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller void print(); 114657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 114757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Type getType() const { return progType; } 114857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 114957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline void add(Function *fn, int& id) { allFuncs.insert(fn, id); } 11505e4b2a1a47ca9a173f6419ed2f12c9fba80e757cFrancisco Jerez inline void del(Function *fn, int& id) { allFuncs.remove(id); } 115157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline void add(Value *rval, int& id) { allRValues.insert(rval, id); } 115257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 115357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller bool makeFromTGSI(struct nv50_ir_prog_info *); 
115457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller bool makeFromSM4(struct nv50_ir_prog_info *); 115557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller bool convertToSSA(); 115657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller bool optimizeSSA(int level); 115757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller bool optimizePostRA(int level); 115857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller bool registerAllocation(); 115957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller bool emitBinary(struct nv50_ir_prog_info *); 116057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 116157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller const Target *getTarget() const { return target; } 116257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 116357594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerprivate: 116498116cc3dc3fc2cd84990cc2c968f05fe2978b4aFrancisco Jerez void emitSymbolTable(struct nv50_ir_prog_info *); 116598116cc3dc3fc2cd84990cc2c968f05fe2978b4aFrancisco Jerez 116657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Type progType; 116757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Target *target; 116857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 116957594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerpublic: 117057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Function *main; 117157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Graph calls; 117257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 117357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller ArrayList allFuncs; 117457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller ArrayList allRValues; 117557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 117657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller uint32_t *code; 117757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller uint32_t binSize; 
1178e43a3a66a9d8a99021d76ff4d07dec7b8cfd62caChristoph Bumiller uint32_t tlsSize; // size required for FILE_MEMORY_LOCAL 117957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 118057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller int maxGPR; 118157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 118257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller MemoryPool mem_Instruction; 118357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller MemoryPool mem_CmpInstruction; 118457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller MemoryPool mem_TexInstruction; 118557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller MemoryPool mem_FlowInstruction; 118657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller MemoryPool mem_LValue; 118757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller MemoryPool mem_Symbol; 118857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller MemoryPool mem_ImmediateValue; 118957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 119057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller uint32_t dbgFlags; 1191322bc7ed68ed92233c97168c036d0aa50c11a20eChristoph Bumiller uint8_t optLevel; 1192322bc7ed68ed92233c97168c036d0aa50c11a20eChristoph Bumiller 1193322bc7ed68ed92233c97168c036d0aa50c11a20eChristoph Bumiller void *targetPriv; // e.g. 
to carry information between passes 119457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 11954506ed28de7f9d76bbc99c0758a7891b84528729Christoph Bumiller const struct nv50_ir_prog_info *driver; // for driver configuration 11964506ed28de7f9d76bbc99c0758a7891b84528729Christoph Bumiller 119757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller void releaseInstruction(Instruction *); 119857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller void releaseValue(Value *); 119957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller}; 120057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 120157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller// TODO: add const version 120257594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerclass Pass 120357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller{ 120457594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerpublic: 120557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller bool run(Program *, bool ordered = false, bool skipPhi = false); 120657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller bool run(Function *, bool ordered = false, bool skipPhi = false); 120757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 120857594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerprivate: 120957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller // return false to continue with next entity on next higher level 121057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller virtual bool visit(Function *) { return true; } 121157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller virtual bool visit(BasicBlock *) { return true; } 121257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller virtual bool visit(Instruction *) { return false; } 121357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 121457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller bool doRun(Program *, bool ordered, bool skipPhi); 
121557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller bool doRun(Function *, bool ordered, bool skipPhi); 121657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 121757594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerprotected: 121857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller bool err; 121957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Function *func; 122057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Program *prog; 122157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller}; 122257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 122357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller// ============================================================================= 122457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 12255eb7ff1175a644ffe3b0f1a75cb235400355f9fbJohannes Obermayr#include "codegen/nv50_ir_inlines.h" 122657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 122757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller} // namespace nv50_ir 122857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 122957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller#endif // __NV50_IR_H__ 1230