nv50_ir.h revision b87b498b88c51fb8c80901b8f581331d3fbcd972
1d2d19ea51fa3575a8d014a69a9b835c335728817Christoph Bumiller/* 2d2d19ea51fa3575a8d014a69a9b835c335728817Christoph Bumiller * Copyright 2011 Christoph Bumiller 3d2d19ea51fa3575a8d014a69a9b835c335728817Christoph Bumiller * 4d2d19ea51fa3575a8d014a69a9b835c335728817Christoph Bumiller * Permission is hereby granted, free of charge, to any person obtaining a 5d2d19ea51fa3575a8d014a69a9b835c335728817Christoph Bumiller * copy of this software and associated documentation files (the "Software"), 6d2d19ea51fa3575a8d014a69a9b835c335728817Christoph Bumiller * to deal in the Software without restriction, including without limitation 7d2d19ea51fa3575a8d014a69a9b835c335728817Christoph Bumiller * the rights to use, copy, modify, merge, publish, distribute, sublicense, 8d2d19ea51fa3575a8d014a69a9b835c335728817Christoph Bumiller * and/or sell copies of the Software, and to permit persons to whom the 9d2d19ea51fa3575a8d014a69a9b835c335728817Christoph Bumiller * Software is furnished to do so, subject to the following conditions: 10d2d19ea51fa3575a8d014a69a9b835c335728817Christoph Bumiller * 11d2d19ea51fa3575a8d014a69a9b835c335728817Christoph Bumiller * The above copyright notice and this permission notice shall be included in 12d2d19ea51fa3575a8d014a69a9b835c335728817Christoph Bumiller * all copies or substantial portions of the Software. 13d2d19ea51fa3575a8d014a69a9b835c335728817Christoph Bumiller * 14d2d19ea51fa3575a8d014a69a9b835c335728817Christoph Bumiller * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR 15d2d19ea51fa3575a8d014a69a9b835c335728817Christoph Bumiller * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, 16d2d19ea51fa3575a8d014a69a9b835c335728817Christoph Bumiller * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. 
IN NO EVENT SHALL 173d8d5b298a268b119d840bc9bae0ee9e0c9244a9Kenneth Graunke * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR 183d8d5b298a268b119d840bc9bae0ee9e0c9244a9Kenneth Graunke * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, 193d8d5b298a268b119d840bc9bae0ee9e0c9244a9Kenneth Graunke * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR 203d8d5b298a268b119d840bc9bae0ee9e0c9244a9Kenneth Graunke * OTHER DEALINGS IN THE SOFTWARE. 21d2d19ea51fa3575a8d014a69a9b835c335728817Christoph Bumiller */ 2257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 2357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller#ifndef __NV50_IR_H__ 2457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller#define __NV50_IR_H__ 2557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 2657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller#include <stdio.h> 2757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller#include <stdlib.h> 2857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller#include <stdint.h> 298cc2eca5df0116aa7fb8233a9ab6ad1c9e4203cdFrancisco Jerez#include <deque> 308cc2eca5df0116aa7fb8233a9ab6ad1c9e4203cdFrancisco Jerez#include <list> 318cc2eca5df0116aa7fb8233a9ab6ad1c9e4203cdFrancisco Jerez#include <vector> 32a9b21015f5e3a6a37e53a8b3c755519f7b70479eTobias Klausmann#include <tr1/unordered_set> 3357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 345eb7ff1175a644ffe3b0f1a75cb235400355f9fbJohannes Obermayr#include "codegen/nv50_ir_util.h" 355eb7ff1175a644ffe3b0f1a75cb235400355f9fbJohannes Obermayr#include "codegen/nv50_ir_graph.h" 3657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 375eb7ff1175a644ffe3b0f1a75cb235400355f9fbJohannes Obermayr#include "codegen/nv50_ir_driver.h" 3857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 3957594065c30feec9376be9b2132659f7d87362eeChristoph Bumillernamespace nv50_ir { 4057594065c30feec9376be9b2132659f7d87362eeChristoph 
// Opcodes of the IR.
// Enumerators are numbered consecutively starting at OP_NOP = 0; OP_LAST is
// not an operation but a sentinel whose value equals the number of opcodes.
enum operation
{
   OP_NOP = 0,
   OP_PHI,
   OP_UNION, // unify a new definition and several source values
   OP_SPLIT, // $r0d -> { $r0, $r1 } ($r0d and $r0/$r1 will be coalesced)
   OP_MERGE, // opposite of split, e.g. combine 2 32 bit into a 64 bit value
   OP_CONSTRAINT, // copy values into consecutive registers
   OP_MOV, // simple copy, no modifiers allowed
   OP_LOAD,
   OP_STORE,
   OP_ADD, // NOTE: add u64 + u32 is legal for targets w/o 64-bit integer adds
   OP_SUB,
   OP_MUL,
   OP_DIV,
   OP_MOD,
   OP_MAD,
   OP_FMA,
   OP_SAD, // abs(src0 - src1) + src2
   OP_ABS,
   OP_NEG,
   OP_NOT,
   OP_AND,
   OP_OR,
   OP_XOR,
   OP_SHL,
   OP_SHR,
   OP_MAX,
   OP_MIN,
   OP_SAT, // CLAMP(f32, 0.0, 1.0)
   OP_CEIL,
   OP_FLOOR,
   OP_TRUNC,
   OP_CVT,
   OP_SET_AND, // dst = (src0 CMP src1) & src2
   OP_SET_OR,
   OP_SET_XOR,
   OP_SET,
   OP_SELP, // dst = src2 ? src0 : src1
   OP_SLCT, // dst = (src2 CMP 0) ? src0 : src1
   OP_RCP,
   OP_RSQ,
   OP_LG2,
   OP_SIN,
   OP_COS,
   OP_EX2,
   OP_EXP, // exponential (base M_E)
   OP_LOG, // natural logarithm
   OP_PRESIN,
   OP_PREEX2,
   OP_SQRT,
   OP_POW,
   OP_BRA,
   OP_CALL,
   OP_RET,
   OP_CONT,
   OP_BREAK,
   OP_PRERET,
   OP_PRECONT,
   OP_PREBREAK,
   OP_BRKPT, // breakpoint (not related to loops)
   OP_JOINAT, // push control flow convergence point
   OP_JOIN, // converge
   OP_DISCARD,
   OP_EXIT,
   OP_MEMBAR, // memory barrier (mfence, lfence, sfence)
   OP_VFETCH, // indirection 0 in attribute space, indirection 1 is vertex base
   OP_PFETCH, // fetch base address of vertex src0 (immediate) [+ src1]
   OP_EXPORT,
   OP_LINTERP,
   OP_PINTERP,
   OP_EMIT, // emit vertex
   OP_RESTART, // restart primitive
   OP_TEX,
   OP_TXB, // texture bias
   OP_TXL, // texture lod
   OP_TXF, // texel fetch
   OP_TXQ, // texture size query
   OP_TXD, // texture derivatives
   OP_TXG, // texture gather
   OP_TXLQ, // texture query lod
   OP_TEXCSAA, // texture op for coverage sampling
   OP_TEXPREP, // turn cube map array into 2d array coordinates
   OP_SULDB, // surface load (raw)
   OP_SULDP, // surface load (formatted)
   OP_SUSTB, // surface store (raw)
   OP_SUSTP, // surface store (formatted)
   OP_SUREDB,
   OP_SUREDP, // surface reduction (atomic op)
   OP_SULEA, // surface load effective address
   OP_SUBFM, // surface bitfield manipulation
   OP_SUCLAMP, // clamp surface coordinates
   OP_SUEAU, // surface effective address
   OP_MADSP, // special integer multiply-add
   OP_TEXBAR, // texture dependency barrier
   OP_DFDX,
   OP_DFDY,
   OP_RDSV, // read system value
   OP_WRSV, // write system value
   OP_PIXLD, // get info about raster object or surfaces
   OP_QUADOP,
   OP_QUADON,
   OP_QUADPOP,
   OP_POPCNT, // bitcount(src0 & src1)
   OP_INSBF, // insert first src1[8:15] bits of src0 into src2 at src1[0:7]
   OP_EXTBF, // place bits [K,K+N) of src0 into dst, src1 = 0xNNKK
   OP_BFIND, // find highest/lowest set bit
   OP_PERMT, // dst = bytes from src2,src0 selected by src1 (nvc0's src order)
   OP_ATOM,
   OP_BAR, // execution barrier, sources = { id, thread count, predicate }
   OP_VADD, // byte/word vector operations
   OP_VAVG,
   OP_VMIN,
   OP_VMAX,
   OP_VSAD,
   OP_VSET,
   OP_VSHR,
   OP_VSHL,
   OP_VSEL,
   OP_CCTL, // cache control
   OP_SHFL, // warp shuffle
   OP_LAST
};

// various instruction-specific modifier definitions Instruction::subOp
// MOV_FINAL marks a MOV originating from an EXPORT (used for placing TEXBARs)
// The same number is reused by different NV50_IR_SUBOP_<op>_* groups.
#define NV50_IR_SUBOP_MUL_HIGH     1
#define NV50_IR_SUBOP_EMIT_RESTART 1
#define NV50_IR_SUBOP_LDC_IL       1
#define NV50_IR_SUBOP_LDC_IS       2
// Instruction sub-operation codes, grouped by the NV50_IR_SUBOP_<op>_ prefix.
// Numbers are reused between groups.
#define NV50_IR_SUBOP_LDC_ISL      3
#define NV50_IR_SUBOP_SHIFT_WRAP   1
#define NV50_IR_SUBOP_EMU_PRERET   1
// Parenthesized so that an expression argument keeps its own grouping when
// the macro is used inside a larger expression.
#define NV50_IR_SUBOP_TEXBAR(n)    (n)
#define NV50_IR_SUBOP_MOV_FINAL    1
#define NV50_IR_SUBOP_EXTBF_REV    1
#define NV50_IR_SUBOP_BFIND_SAMT   1
#define NV50_IR_SUBOP_RCPRSQ_64H   1
#define NV50_IR_SUBOP_PERMT_F4E    1
#define NV50_IR_SUBOP_PERMT_B4E    2
#define NV50_IR_SUBOP_PERMT_RC8    3
#define NV50_IR_SUBOP_PERMT_ECL    4
#define NV50_IR_SUBOP_PERMT_ECR    5
#define NV50_IR_SUBOP_PERMT_RC16   6
#define NV50_IR_SUBOP_BAR_SYNC     0
#define NV50_IR_SUBOP_BAR_ARRIVE   1
#define NV50_IR_SUBOP_BAR_RED_AND  2
#define NV50_IR_SUBOP_BAR_RED_OR   3
#define NV50_IR_SUBOP_BAR_RED_POPC 4
#define NV50_IR_SUBOP_MEMBAR_L     1
#define NV50_IR_SUBOP_MEMBAR_S     2
// MEMBAR subOp layout: bits 0-1 hold the direction (L/S/M), the bits above
// hold the scope (CTA/GL/SYS, pre-shifted by 2).
#define NV50_IR_SUBOP_MEMBAR_M     3
#define NV50_IR_SUBOP_MEMBAR_CTA  (0 << 2)
#define NV50_IR_SUBOP_MEMBAR_GL   (1 << 2)
#define NV50_IR_SUBOP_MEMBAR_SYS  (2 << 2)
#define NV50_IR_SUBOP_MEMBAR_DIR(m)   ((m) & 0x3)
#define NV50_IR_SUBOP_MEMBAR_SCOPE(m) ((m) & ~0x3)
// d and s are name suffixes (e.g. M, GL), pasted onto NV50_IR_SUBOP_MEMBAR_.
#define NV50_IR_SUBOP_MEMBAR(d,s) \
   (NV50_IR_SUBOP_MEMBAR_##d | NV50_IR_SUBOP_MEMBAR_##s)
#define NV50_IR_SUBOP_ATOM_ADD     0
#define NV50_IR_SUBOP_ATOM_MIN     1
#define NV50_IR_SUBOP_ATOM_MAX     2
#define NV50_IR_SUBOP_ATOM_INC     3
#define NV50_IR_SUBOP_ATOM_DEC     4
#define NV50_IR_SUBOP_ATOM_AND     5
#define NV50_IR_SUBOP_ATOM_OR      6
#define NV50_IR_SUBOP_ATOM_XOR     7
#define NV50_IR_SUBOP_ATOM_CAS     8
#define NV50_IR_SUBOP_ATOM_EXCH    9
#define NV50_IR_SUBOP_CCTL_IV      5
#define NV50_IR_SUBOP_CCTL_IVALL   6
#define NV50_IR_SUBOP_SUST_IGN     0
#define NV50_IR_SUBOP_SUST_TRAP    1
#define NV50_IR_SUBOP_SUST_SDCL    3
#define NV50_IR_SUBOP_SULD_ZERO    0
#define NV50_IR_SUBOP_SULD_TRAP    1
#define NV50_IR_SUBOP_SULD_SDCL    3
#define NV50_IR_SUBOP_SUBFM_3D     1
#define NV50_IR_SUBOP_SUCLAMP_2D   0x10
// SUCLAMP subOp builders: the low part is a per-mode base (SD = 0, PL = 5,
// BL = 10) plus r; d == 2 additionally sets bit 0x10, which is the value of
// NV50_IR_SUBOP_SUCLAMP_2D. Both arguments are parenthesized so that
// expression arguments are compared and added as a whole.
#define NV50_IR_SUBOP_SUCLAMP_SD(r, d) (( 0 + (r)) | (((d) == 2) ? 0x10 : 0))
#define NV50_IR_SUBOP_SUCLAMP_PL(r, d) (( 5 + (r)) | (((d) == 2) ? 0x10 : 0))
#define NV50_IR_SUBOP_SUCLAMP_BL(r, d) ((10 + (r)) | (((d) == 2) ? 0x10 : 0))
#define NV50_IR_SUBOP_PIXLD_COUNT       0
#define NV50_IR_SUBOP_PIXLD_COVMASK     1
#define NV50_IR_SUBOP_PIXLD_COVERED     2
#define NV50_IR_SUBOP_PIXLD_OFFSET      3
#define NV50_IR_SUBOP_PIXLD_CENT_OFFSET 4
#define NV50_IR_SUBOP_PIXLD_SAMPLEID    5
#define NV50_IR_SUBOP_SHFL_IDX     0
#define NV50_IR_SUBOP_SHFL_UP      1
#define NV50_IR_SUBOP_SHFL_DOWN    2
#define NV50_IR_SUBOP_SHFL_BFLY    3
#define NV50_IR_SUBOP_MADSP_SD     0xffff
// Yes, we could represent those with DataType.
// Or put the type into operation and have a couple 1000 values in that enum.
// This will have to do for now.
// The bitfields are supposed to correspond to nve4 ISA.
// Packs three fields into one subOp value: a in bits 0-3, b in bits 4-7,
// c from bit 8 upwards.
#define NV50_IR_SUBOP_MADSP(a,b,c) (((c) << 8) | ((b) << 4) | (a))
// Vector-op subOp builders: a in the low bits, b shifted by 5, d shifted by
// 10; bits 14-15 carry a tag (V1 = 0, V2 = 1, V4 = 2) that
// NV50_IR_SUBOP_Vn() extracts again.
#define NV50_IR_SUBOP_V1(d,a,b)    (((d) << 10) | ((b) << 5) | (a) | 0x0000)
#define NV50_IR_SUBOP_V2(d,a,b)    (((d) << 10) | ((b) << 5) | (a) | 0x4000)
#define NV50_IR_SUBOP_V4(d,a,b)    (((d) << 10) | ((b) << 5) | (a) | 0x8000)
#define NV50_IR_SUBOP_Vn(n)        ((n) >> 14)

// Operand/result data types, numbered consecutively from TYPE_NONE = 0.
enum DataType
{
   TYPE_NONE,
   TYPE_U8,
   TYPE_S8,
   TYPE_U16,
   TYPE_S16,
   TYPE_U32,
   TYPE_S32,
   TYPE_U64, // 64 bit operations are only lowered after register allocation
   TYPE_S64,
   TYPE_F16,
   TYPE_F32,
   TYPE_F64,
   TYPE_B96,
   TYPE_B128
};
26157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 26257594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerenum CondCode 26357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller{ 26457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CC_FL = 0, 26557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CC_NEVER = CC_FL, // when used with FILE_FLAGS 26657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CC_LT = 1, 26757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CC_EQ = 2, 26857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CC_NOT_P = CC_EQ, // when used with FILE_PREDICATE 26957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CC_LE = 3, 27057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CC_GT = 4, 27157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CC_NE = 5, 27257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CC_P = CC_NE, 27357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CC_GE = 6, 27457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CC_TR = 7, 27557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CC_ALWAYS = CC_TR, 27657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CC_U = 8, 27757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CC_LTU = 9, 27857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CC_EQU = 10, 27957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CC_LEU = 11, 28057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CC_GTU = 12, 28157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CC_NEU = 13, 28257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CC_GEU = 14, 28357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CC_NO = 0x10, 28457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CC_NC = 0x11, 28557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CC_NS = 0x12, 28657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CC_NA = 0x13, 
28757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CC_A = 0x14, 28857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CC_S = 0x15, 28957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CC_C = 0x16, 29057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CC_O = 0x17 29157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller}; 29257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 29357594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerenum RoundMode 29457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller{ 29557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller ROUND_N, // nearest 29657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller ROUND_M, // towards -inf 29757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller ROUND_Z, // towards 0 29857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller ROUND_P, // towards +inf 29957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller ROUND_NI, // nearest integer 30057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller ROUND_MI, // to integer towards -inf 30157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller ROUND_ZI, // to integer towards 0 30257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller ROUND_PI, // to integer towards +inf 30357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller}; 30457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 30557594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerenum CacheMode 30657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller{ 30757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CACHE_CA, // cache at all levels 30857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CACHE_WB = CACHE_CA, // cache write back 30957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CACHE_CG, // cache at global level 31057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CACHE_CS, // cache streaming 31157594065c30feec9376be9b2132659f7d87362eeChristoph 
Bumiller CACHE_CV, // cache as volatile 31257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CACHE_WT = CACHE_CV // cache write-through 31357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller}; 31457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 31557594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerenum DataFile 31657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller{ 31757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller FILE_NULL = 0, 31857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller FILE_GPR, 31957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller FILE_PREDICATE, // boolean predicate 32057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller FILE_FLAGS, // zero/sign/carry/overflow bits 32157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller FILE_ADDRESS, 322e43a3a66a9d8a99021d76ff4d07dec7b8cfd62caChristoph Bumiller LAST_REGISTER_FILE = FILE_ADDRESS, 32357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller FILE_IMMEDIATE, 32457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller FILE_MEMORY_CONST, 32557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller FILE_SHADER_INPUT, 32657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller FILE_SHADER_OUTPUT, 32757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller FILE_MEMORY_GLOBAL, 32857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller FILE_MEMORY_SHARED, 32957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller FILE_MEMORY_LOCAL, 33057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller FILE_SYSTEM_VALUE, 33157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller DATA_FILE_COUNT 33257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller}; 33357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 33457594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerenum TexTarget 33557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller{ 33657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 
TEX_TARGET_1D, 33757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller TEX_TARGET_2D, 33857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller TEX_TARGET_2D_MS, 33957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller TEX_TARGET_3D, 34057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller TEX_TARGET_CUBE, 34157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller TEX_TARGET_1D_SHADOW, 34257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller TEX_TARGET_2D_SHADOW, 34357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller TEX_TARGET_CUBE_SHADOW, 34457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller TEX_TARGET_1D_ARRAY, 34557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller TEX_TARGET_2D_ARRAY, 34657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller TEX_TARGET_2D_MS_ARRAY, 34757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller TEX_TARGET_CUBE_ARRAY, 34857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller TEX_TARGET_1D_ARRAY_SHADOW, 34957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller TEX_TARGET_2D_ARRAY_SHADOW, 35057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller TEX_TARGET_RECT, 35157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller TEX_TARGET_RECT_SHADOW, 35257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller TEX_TARGET_CUBE_ARRAY_SHADOW, 35357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller TEX_TARGET_BUFFER, 35457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller TEX_TARGET_COUNT 35557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller}; 35657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 35757594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerenum SVSemantic 35857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller{ 35957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller SV_POSITION, // WPOS 36057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller SV_VERTEX_ID, 36157594065c30feec9376be9b2132659f7d87362eeChristoph 
Bumiller SV_INSTANCE_ID, 36257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller SV_INVOCATION_ID, 36357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller SV_PRIMITIVE_ID, 36457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller SV_VERTEX_COUNT, // gl_PatchVerticesIn 36557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller SV_LAYER, 36657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller SV_VIEWPORT_INDEX, 36757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller SV_YDIR, 36857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller SV_FACE, 36957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller SV_POINT_SIZE, 37057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller SV_POINT_COORD, 37157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller SV_CLIP_DISTANCE, 37257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller SV_SAMPLE_INDEX, 373f715a0a39a0f7f19443e7721ae792878ba504eedIlia Mirkin SV_SAMPLE_POS, 374b3a2398aded19e25124a4a1d228eb3843827f6b2Ilia Mirkin SV_SAMPLE_MASK, 37557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller SV_TESS_FACTOR, 37657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller SV_TESS_COORD, 37757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller SV_TID, 37857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller SV_CTAID, 37957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller SV_NTID, 38057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller SV_GRIDID, 38157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller SV_NCTAID, 38257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller SV_LANEID, 38357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller SV_PHYSID, 38457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller SV_NPHYSID, 38557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller SV_CLOCK, 38657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller SV_LBASE, 38757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller SV_SBASE, 
38867250acbaba924ccaab696f2b348dfa898c41d0bChristoph Bumiller SV_VERTEX_STRIDE, 389d548d47edf9f05e6dbf9656abc2f8e78d02cb2f6Ben Skeggs SV_INVOCATION_INFO, 39057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller SV_UNDEFINED, 39157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller SV_LAST 39257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller}; 39357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 39457594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerclass Program; 39557594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerclass Function; 39657594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerclass BasicBlock; 39757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 39857594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerclass Target; 39957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 40057594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerclass Instruction; 40157594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerclass CmpInstruction; 40257594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerclass TexInstruction; 40357594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerclass FlowInstruction; 40457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 40557594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerclass Value; 40657594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerclass LValue; 40757594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerclass Symbol; 40857594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerclass ImmediateValue; 40957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 41057594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerstruct Storage 41157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller{ 41257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller DataFile file; 41357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller int8_t fileIndex; // signed, may be indirect for CONST[] 
41457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller uint8_t size; // this should match the Instruction type's size 41557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller DataType type; // mainly for pretty printing 41657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller union { 41757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller uint64_t u64; // immediate values 41857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller uint32_t u32; 41957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller uint16_t u16; 42057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller uint8_t u8; 42157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller int64_t s64; 42257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller int32_t s32; 42357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller int16_t s16; 42457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller int8_t s8; 42557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller float f32; 42657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller double f64; 42757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller int32_t offset; // offset from 0 (base of address space) 428e43a3a66a9d8a99021d76ff4d07dec7b8cfd62caChristoph Bumiller int32_t id; // register id (< 0 if virtual/unassigned, in units <= 4) 42957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller struct { 43057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller SVSemantic sv; 43157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller int index; 43257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller } sv; 43357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller } data; 43457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller}; 43557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 43657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller// precedence: NOT after SAT after NEG after ABS 43757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller#define NV50_IR_MOD_ABS 
(1 << 0) 43857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller#define NV50_IR_MOD_NEG (1 << 1) 43957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller#define NV50_IR_MOD_SAT (1 << 2) 44057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller#define NV50_IR_MOD_NOT (1 << 3) 44157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller#define NV50_IR_MOD_NEG_ABS (NV50_IR_MOD_NEG | NV50_IR_MOD_ABS) 44257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 44357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller#define NV50_IR_INTERP_MODE_MASK 0x3 44457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller#define NV50_IR_INTERP_LINEAR (0 << 0) 44557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller#define NV50_IR_INTERP_PERSPECTIVE (1 << 0) 44657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller#define NV50_IR_INTERP_FLAT (2 << 0) 44757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller#define NV50_IR_INTERP_SC (3 << 0) // what exactly is that ? 44857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller#define NV50_IR_INTERP_SAMPLE_MASK 0xc 44957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller#define NV50_IR_INTERP_DEFAULT (0 << 2) 45057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller#define NV50_IR_INTERP_CENTROID (1 << 2) 45157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller#define NV50_IR_INTERP_OFFSET (2 << 2) 45257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller#define NV50_IR_INTERP_SAMPLEID (3 << 2) 45357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 45457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller// do we really want this to be a class ? 
45557594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerclass Modifier 45657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller{ 45757594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerpublic: 45857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Modifier() : bits(0) { } 45957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Modifier(unsigned int m) : bits(m) { } 46057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Modifier(operation op); 46157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 46257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller // @return new Modifier applying a after b (asserts if unrepresentable) 46357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Modifier operator*(const Modifier) const; 46414d5f975a65c57830077dabf2f95261afbc51773Francisco Jerez Modifier operator*=(const Modifier m) { *this = *this * m; return *this; } 46557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Modifier operator==(const Modifier m) const { return m.bits == bits; } 46657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Modifier operator!=(const Modifier m) const { return m.bits != bits; } 46757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 46857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline Modifier operator&(const Modifier m) const { return bits & m.bits; } 46957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline Modifier operator|(const Modifier m) const { return bits | m.bits; } 47057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline Modifier operator^(const Modifier m) const { return bits ^ m.bits; } 47157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 47257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller operation getOp() const; 47357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 47457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline int neg() const { return (bits & NV50_IR_MOD_NEG) ? 
1 : 0; } 47557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline int abs() const { return (bits & NV50_IR_MOD_ABS) ? 1 : 0; } 47657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 47714d5f975a65c57830077dabf2f95261afbc51773Francisco Jerez inline operator bool() const { return bits ? true : false; } 47857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 47957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller void applyTo(ImmediateValue &imm) const; 48057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 48157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller int print(char *buf, size_t size) const; 48257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 48357594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerprivate: 48457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller uint8_t bits; 48557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller}; 48657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 48757594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerclass ValueRef 48857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller{ 48957594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerpublic: 49014d5f975a65c57830077dabf2f95261afbc51773Francisco Jerez ValueRef(Value * = NULL); 4918cc2eca5df0116aa7fb8233a9ab6ad1c9e4203cdFrancisco Jerez ValueRef(const ValueRef&); 49257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller ~ValueRef(); 49357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 49457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline bool exists() const { return value != NULL; } 49557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 49657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller void set(Value *); 49757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller void set(const ValueRef&); 49857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline Value *get() const { return value; } 
49957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline Value *rep() const; 50057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 50157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline Instruction *getInsn() const { return insn; } 50257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline void setInsn(Instruction *inst) { insn = inst; } 50357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 50457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline bool isIndirect(int dim) const { return indirect[dim] >= 0; } 50557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline const ValueRef *getIndirect(int dim) const; 50657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 50757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline DataFile getFile() const; 50857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline unsigned getSize() const; 50957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 51057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller // SSA: return eventual (traverse MOVs) literal value, if it exists 511d6d1f0e4a25c9fbefce7485d77617855a8ea956aFrancisco Jerez bool getImmediate(ImmediateValue&) const; 51257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 51357594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerpublic: 51457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Modifier mod; 5159362d4bc0a03860ec386156cf499e855a9c2d2a5Christoph Bumiller int8_t indirect[2]; // >= 0 if relative to lvalue in insn->src(indirect[i]) 51657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller uint8_t swizzle; 51757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 51857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller bool usedAsPtr; // for printing 51957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 52057594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerprivate: 52157594065c30feec9376be9b2132659f7d87362eeChristoph 
Bumiller Value *value; 52257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Instruction *insn; 52357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller}; 52457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 52557594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerclass ValueDef 52657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller{ 52757594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerpublic: 52814d5f975a65c57830077dabf2f95261afbc51773Francisco Jerez ValueDef(Value * = NULL); 5298cc2eca5df0116aa7fb8233a9ab6ad1c9e4203cdFrancisco Jerez ValueDef(const ValueDef&); 53057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller ~ValueDef(); 53157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 53257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline bool exists() const { return value != NULL; } 53357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 53457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline Value *get() const { return value; } 53557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline Value *rep() const; 53657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller void set(Value *); 53714d5f975a65c57830077dabf2f95261afbc51773Francisco Jerez bool mayReplace(const ValueRef &); 53814d5f975a65c57830077dabf2f95261afbc51773Francisco Jerez void replace(const ValueRef &, bool doSet); // replace all uses of the old value 53957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 54057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline Instruction *getInsn() const { return insn; } 54157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline void setInsn(Instruction *inst) { insn = inst; } 54257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 54357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline DataFile getFile() const; 54457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline unsigned getSize() const; 
54557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 54657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline void setSSA(LValue *); 54757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline const LValue *preSSA() const; 54857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 54957594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerprivate: 55057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Value *value; // should make this LValue * ... 5518cc2eca5df0116aa7fb8233a9ab6ad1c9e4203cdFrancisco Jerez LValue *origin; // pre SSA value 55257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Instruction *insn; 55357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller}; 55457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 55557594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerclass Value 55657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller{ 55757594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerpublic: 55857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Value(); 559da28ba00d84f59650bf180769d9d9a1609eb6164Francisco Jerez virtual ~Value() { } 56057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 561a05e6a3fa28168d58a13cfb07f7a664e84b925aeFrancisco Jerez virtual Value *clone(ClonePolicy<Function>&) const = 0; 56257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 56357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller virtual int print(char *, size_t, DataType ty = TYPE_NONE) const = 0; 56457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 56557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller virtual bool equals(const Value *, bool strict = false) const; 56657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller virtual bool interfers(const Value *) const; 567a765d7880f80d01be261a5d1f4b356a2b6fcfaadChristoph Bumiller virtual bool isUniform() const { return true; } 56857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 
5699362d4bc0a03860ec386156cf499e855a9c2d2a5Christoph Bumiller inline Value *rep() const { return join; } 5709362d4bc0a03860ec386156cf499e855a9c2d2a5Christoph Bumiller 57157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline Instruction *getUniqueInsn() const; 57257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline Instruction *getInsn() const; // use when uniqueness is certain 57357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 5748cc2eca5df0116aa7fb8233a9ab6ad1c9e4203cdFrancisco Jerez inline int refCount() { return uses.size(); } 57557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 57657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline LValue *asLValue(); 57757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline Symbol *asSym(); 57857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline ImmediateValue *asImm(); 57957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline const Symbol *asSym() const; 58057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline const ImmediateValue *asImm() const; 58157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 58257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline bool inFile(DataFile f) { return reg.file == f; } 58357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 58457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller static inline Value *get(Iterator&); 58557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 586a9b21015f5e3a6a37e53a8b3c755519f7b70479eTobias Klausmann std::tr1::unordered_set<ValueRef *> uses; 5878cc2eca5df0116aa7fb8233a9ab6ad1c9e4203cdFrancisco Jerez std::list<ValueDef *> defs; 588a9b21015f5e3a6a37e53a8b3c755519f7b70479eTobias Klausmann typedef std::tr1::unordered_set<ValueRef *>::iterator UseIterator; 589a9b21015f5e3a6a37e53a8b3c755519f7b70479eTobias Klausmann typedef std::tr1::unordered_set<ValueRef *>::const_iterator UseCIterator; 
5908cc2eca5df0116aa7fb8233a9ab6ad1c9e4203cdFrancisco Jerez typedef std::list<ValueDef *>::iterator DefIterator; 5918cc2eca5df0116aa7fb8233a9ab6ad1c9e4203cdFrancisco Jerez typedef std::list<ValueDef *>::const_iterator DefCIterator; 59257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 59357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller int id; 59457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Storage reg; 59557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 59657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller // TODO: these should be in LValue: 59757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Interval livei; 59857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Value *join; 59957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller}; 60057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 60157594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerclass LValue : public Value 60257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller{ 60357594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerpublic: 60457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller LValue(Function *, DataFile file); 60557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller LValue(Function *, LValue *); 606da28ba00d84f59650bf180769d9d9a1609eb6164Francisco Jerez ~LValue() { } 60757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 608a765d7880f80d01be261a5d1f4b356a2b6fcfaadChristoph Bumiller virtual bool isUniform() const; 609a765d7880f80d01be261a5d1f4b356a2b6fcfaadChristoph Bumiller 610a05e6a3fa28168d58a13cfb07f7a664e84b925aeFrancisco Jerez virtual LValue *clone(ClonePolicy<Function>&) const; 61157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 61257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller virtual int print(char *, size_t, DataType ty = TYPE_NONE) const; 61357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 61457594065c30feec9376be9b2132659f7d87362eeChristoph 
Bumillerpublic: 615e43a3a66a9d8a99021d76ff4d07dec7b8cfd62caChristoph Bumiller unsigned compMask : 8; // compound/component mask 616e43a3a66a9d8a99021d76ff4d07dec7b8cfd62caChristoph Bumiller unsigned compound : 1; // used by RA, value involved in split/merge 617e43a3a66a9d8a99021d76ff4d07dec7b8cfd62caChristoph Bumiller unsigned ssa : 1; 618e43a3a66a9d8a99021d76ff4d07dec7b8cfd62caChristoph Bumiller unsigned fixedReg : 1; // set & used by RA, earlier just use (id < 0) 619e43a3a66a9d8a99021d76ff4d07dec7b8cfd62caChristoph Bumiller unsigned noSpill : 1; // do not spill (e.g. if spill temporary already) 62057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller}; 62157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 62257594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerclass Symbol : public Value 62357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller{ 62457594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerpublic: 62557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Symbol(Program *, DataFile file = FILE_MEMORY_CONST, ubyte fileIdx = 0); 626da28ba00d84f59650bf180769d9d9a1609eb6164Francisco Jerez ~Symbol() { } 62757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 628a05e6a3fa28168d58a13cfb07f7a664e84b925aeFrancisco Jerez virtual Symbol *clone(ClonePolicy<Function>&) const; 62957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 63057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller virtual bool equals(const Value *that, bool strict) const; 63157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 632a765d7880f80d01be261a5d1f4b356a2b6fcfaadChristoph Bumiller virtual bool isUniform() const; 633a765d7880f80d01be261a5d1f4b356a2b6fcfaadChristoph Bumiller 63457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller virtual int print(char *, size_t, DataType ty = TYPE_NONE) const; 63557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 63657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller // print with 
indirect values 63757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller int print(char *, size_t, Value *, Value *, DataType ty = TYPE_NONE) const; 63857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 63957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline void setFile(DataFile file, ubyte fileIndex = 0) 64057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller { 64157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller reg.file = file; 64257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller reg.fileIndex = fileIndex; 64357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller } 64457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 64557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline void setOffset(int32_t offset); 64657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline void setAddress(Symbol *base, int32_t offset); 64757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline void setSV(SVSemantic sv, uint32_t idx = 0); 64857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 64957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline const Symbol *getBase() const { return baseSym; } 65057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 65157594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerprivate: 65257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Symbol *baseSym; // array base for Symbols representing array elements 65357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller}; 65457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 65557594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerclass ImmediateValue : public Value 65657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller{ 65757594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerpublic: 658d6d1f0e4a25c9fbefce7485d77617855a8ea956aFrancisco Jerez ImmediateValue() { } 65957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller ImmediateValue(Program *, 
uint32_t); 66057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller ImmediateValue(Program *, float); 66157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller ImmediateValue(Program *, double); 66257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller // NOTE: not added to program with 66357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller ImmediateValue(const ImmediateValue *, DataType ty); 664da28ba00d84f59650bf180769d9d9a1609eb6164Francisco Jerez ~ImmediateValue() { }; 66557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 666784848a94d621b11020838fc058fc04a7fc57aa9Francisco Jerez virtual ImmediateValue *clone(ClonePolicy<Function>&) const; 667784848a94d621b11020838fc058fc04a7fc57aa9Francisco Jerez 66857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller virtual bool equals(const Value *that, bool strict) const; 66957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 67057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller // these only work if 'type' is valid (we mostly use untyped literals): 67157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller bool isInteger(const int ival) const; // ival is cast to this' type 67257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller bool isNegative() const; 67357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller bool isPow2() const; 67457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 67557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller void applyLog2(); 67657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 67757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller // for constant folding: 67857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller ImmediateValue operator+(const ImmediateValue&) const; 67957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller ImmediateValue operator-(const ImmediateValue&) const; 68057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller ImmediateValue operator*(const ImmediateValue&) const; 
68157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller ImmediateValue operator/(const ImmediateValue&) const; 68257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 683d6d1f0e4a25c9fbefce7485d77617855a8ea956aFrancisco Jerez ImmediateValue& operator=(const ImmediateValue&); // only sets value ! 684d6d1f0e4a25c9fbefce7485d77617855a8ea956aFrancisco Jerez 68557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller bool compare(CondCode cc, float fval) const; 68657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 68757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller virtual int print(char *, size_t, DataType ty = TYPE_NONE) const; 68857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller}; 68957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 69057594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerclass Instruction 69157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller{ 69257594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerpublic: 69357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Instruction(); 69457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Instruction(Function *, operation, DataType); 69557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller virtual ~Instruction(); 69657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 697a05e6a3fa28168d58a13cfb07f7a664e84b925aeFrancisco Jerez virtual Instruction *clone(ClonePolicy<Function>&, 698a05e6a3fa28168d58a13cfb07f7a664e84b925aeFrancisco Jerez Instruction * = NULL) const; 69957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 7008cc2eca5df0116aa7fb8233a9ab6ad1c9e4203cdFrancisco Jerez void setDef(int i, Value *); 7018cc2eca5df0116aa7fb8233a9ab6ad1c9e4203cdFrancisco Jerez void setSrc(int s, Value *); 7028cc2eca5df0116aa7fb8233a9ab6ad1c9e4203cdFrancisco Jerez void setSrc(int s, const ValueRef&); 70357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller void swapSources(int a, int b); 
704ce1951daed9a4685bf559b4222f50510cb412301Christoph Bumiller void moveSources(int s, int delta); 70557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller bool setIndirect(int s, int dim, Value *); 70657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 7079362d4bc0a03860ec386156cf499e855a9c2d2a5Christoph Bumiller inline ValueRef& src(int s) { return srcs[s]; } 7089362d4bc0a03860ec386156cf499e855a9c2d2a5Christoph Bumiller inline ValueDef& def(int s) { return defs[s]; } 7099362d4bc0a03860ec386156cf499e855a9c2d2a5Christoph Bumiller inline const ValueRef& src(int s) const { return srcs[s]; } 7109362d4bc0a03860ec386156cf499e855a9c2d2a5Christoph Bumiller inline const ValueDef& def(int s) const { return defs[s]; } 7119362d4bc0a03860ec386156cf499e855a9c2d2a5Christoph Bumiller 7129362d4bc0a03860ec386156cf499e855a9c2d2a5Christoph Bumiller inline Value *getDef(int d) const { return defs[d].get(); } 7139362d4bc0a03860ec386156cf499e855a9c2d2a5Christoph Bumiller inline Value *getSrc(int s) const { return srcs[s].get(); } 71457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline Value *getIndirect(int s, int dim) const; 71557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 7168cc2eca5df0116aa7fb8233a9ab6ad1c9e4203cdFrancisco Jerez inline bool defExists(unsigned d) const 7178cc2eca5df0116aa7fb8233a9ab6ad1c9e4203cdFrancisco Jerez { 7189362d4bc0a03860ec386156cf499e855a9c2d2a5Christoph Bumiller return d < defs.size() && defs[d].exists(); 7198cc2eca5df0116aa7fb8233a9ab6ad1c9e4203cdFrancisco Jerez } 7208cc2eca5df0116aa7fb8233a9ab6ad1c9e4203cdFrancisco Jerez inline bool srcExists(unsigned s) const 7218cc2eca5df0116aa7fb8233a9ab6ad1c9e4203cdFrancisco Jerez { 7229362d4bc0a03860ec386156cf499e855a9c2d2a5Christoph Bumiller return s < srcs.size() && srcs[s].exists(); 7238cc2eca5df0116aa7fb8233a9ab6ad1c9e4203cdFrancisco Jerez } 72457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 725e43a3a66a9d8a99021d76ff4d07dec7b8cfd62caChristoph Bumiller inline bool 
constrainedDefs() const; 72657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 72757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller bool setPredicate(CondCode ccode, Value *); 72857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline Value *getPredicate() const; 72957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller bool writesPredicate() const; 730ca1fc2b86400e3fc9dd0517863e22721b5e91c77Christoph Bumiller inline bool isPredicated() const { return predSrc >= 0; } 73157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 73256cf2da02226aee6b7476675c0e05ac7c218756eChristoph Bumiller inline void setFlagsSrc(int s, Value *); 73356cf2da02226aee6b7476675c0e05ac7c218756eChristoph Bumiller inline void setFlagsDef(int d, Value *); 73499e4eba669f13a0dc80880f4f91e2338377c1667Christoph Bumiller inline bool usesFlags() const { return flagsSrc >= 0; } 73556cf2da02226aee6b7476675c0e05ac7c218756eChristoph Bumiller 7369362d4bc0a03860ec386156cf499e855a9c2d2a5Christoph Bumiller unsigned int defCount() const { return defs.size(); }; 737e43a3a66a9d8a99021d76ff4d07dec7b8cfd62caChristoph Bumiller unsigned int defCount(unsigned int mask, bool singleFile = false) const; 7389362d4bc0a03860ec386156cf499e855a9c2d2a5Christoph Bumiller unsigned int srcCount() const { return srcs.size(); }; 739e43a3a66a9d8a99021d76ff4d07dec7b8cfd62caChristoph Bumiller unsigned int srcCount(unsigned int mask, bool singleFile = false) const; 74057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 74157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller // save & remove / set indirect[0,1] and predicate source 74257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller void takeExtraSources(int s, Value *[3]); 74357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller void putExtraSources(int s, Value *[3]); 74457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 74557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline void setType(DataType 
type) { dType = sType = type; } 74657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 74757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline void setType(DataType dtype, DataType stype) 74857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller { 74957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller dType = dtype; 75057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller sType = stype; 75157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller } 75257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 75357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline bool isPseudo() const { return op < OP_MOV; } 75457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller bool isDead() const; 75557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller bool isNop() const; 75657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller bool isCommutationLegal(const Instruction *) const; // must be adjacent ! 75757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller bool isActionEqual(const Instruction *) const; 75857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller bool isResultEqual(const Instruction *) const; 75957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 76057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller void print() const; 76157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 76257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline CmpInstruction *asCmp(); 76357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline TexInstruction *asTex(); 76457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline FlowInstruction *asFlow(); 76557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline const TexInstruction *asTex() const; 76657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline const CmpInstruction *asCmp() const; 76757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline const FlowInstruction *asFlow() const; 
76857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 76957594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerpublic: 77057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Instruction *next; 77157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Instruction *prev; 77257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller int id; 77357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller int serial; // CFG order 77457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 77557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller operation op; 77657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller DataType dType; // destination or defining type 77757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller DataType sType; // source or secondary type 77857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CondCode cc; 77957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller RoundMode rnd; 78057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CacheMode cache; 78157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 78222b762f9b495b14400f30bd6537f7c5a6d262325Christoph Bumiller uint16_t subOp; // quadop, 1 for mul-high, etc. 
783afcd7b5d1614a8a758ccb4353a9c31a601c9b9b4Christoph Bumiller 78457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller unsigned encSize : 4; // encoding size in bytes 78557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller unsigned saturate : 1; // to [0.0f, 1.0f] 78657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller unsigned join : 1; // converge control flow (use OP_JOIN until end) 78757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller unsigned fixed : 1; // prevent dead code elimination 78857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller unsigned terminator : 1; // end of basic block 78957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller unsigned ftz : 1; // flush denormal to zero 79057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller unsigned dnz : 1; // denormals, NaN are zero 79157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller unsigned ipa : 4; // interpolation mode 79257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller unsigned lanes : 4; 79357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller unsigned perPatch : 1; 79457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller unsigned exit : 1; // terminate program after insn 79522b762f9b495b14400f30bd6537f7c5a6d262325Christoph Bumiller unsigned mask : 4; // for vector ops 79657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 79757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller int8_t postFactor; // MUL/DIV(if < 0) by 1 << postFactor 79857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 79957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller int8_t predSrc; 80057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller int8_t flagsDef; 80157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller int8_t flagsSrc; 80257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 803bede1bdb4828ea673bc7859db4058da7e35c6774Ben Skeggs uint32_t sched; // scheduling data (NOTE: maybe move to separate storage) 
80422b762f9b495b14400f30bd6537f7c5a6d262325Christoph Bumiller 80557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller BasicBlock *bb; 80657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 8079362d4bc0a03860ec386156cf499e855a9c2d2a5Christoph Bumillerprotected: 8089362d4bc0a03860ec386156cf499e855a9c2d2a5Christoph Bumiller std::deque<ValueDef> defs; // no gaps ! 8099362d4bc0a03860ec386156cf499e855a9c2d2a5Christoph Bumiller std::deque<ValueRef> srcs; // no gaps ! 8109362d4bc0a03860ec386156cf499e855a9c2d2a5Christoph Bumiller 81157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller // instruction specific methods: 81257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller // (don't want to subclass, would need more constructors and memory pools) 81357594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerpublic: 81457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline void setInterpolate(unsigned int mode) { ipa = mode; } 81557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 81657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller unsigned int getInterpMode() const { return ipa & 0x3; } 81757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller unsigned int getSampleMode() const { return ipa & 0xc; } 81857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 81957594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerprivate: 82057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller void init(); 82157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller}; 82257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 82357594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerenum TexQuery 82457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller{ 82557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller TXQ_DIMS, 82657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller TXQ_TYPE, 82757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller TXQ_SAMPLE_POSITION, 
82857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller TXQ_FILTER, 82957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller TXQ_LOD, 83057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller TXQ_WRAP, 83157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller TXQ_BORDER_COLOUR 83257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller}; 83357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 83457594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerclass TexInstruction : public Instruction 83557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller{ 83657594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerpublic: 83757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller class Target 83857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller { 83957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller public: 84057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Target(TexTarget targ = TEX_TARGET_2D) : target(targ) { } 84157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 84257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller const char *getName() const { return descTable[target].name; } 84357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller unsigned int getArgCount() const { return descTable[target].argc; } 84457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller unsigned int getDim() const { return descTable[target].dim; } 84557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller int isArray() const { return descTable[target].array ? 1 : 0; } 84657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller int isCube() const { return descTable[target].cube ? 1 : 0; } 84757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller int isShadow() const { return descTable[target].shadow ? 
1 : 0; } 8484da54c91d24da891c56957f29274e7821c8254f6Christoph Bumiller int isMS() const { 8494da54c91d24da891c56957f29274e7821c8254f6Christoph Bumiller return target == TEX_TARGET_2D_MS || target == TEX_TARGET_2D_MS_ARRAY; } 8503bd40073b9803baf62f77ed5ac79979e037d2ed6Ilia Mirkin void clearMS() { 8513bd40073b9803baf62f77ed5ac79979e037d2ed6Ilia Mirkin if (isMS()) { 8523bd40073b9803baf62f77ed5ac79979e037d2ed6Ilia Mirkin if (isArray()) 8533bd40073b9803baf62f77ed5ac79979e037d2ed6Ilia Mirkin target = TEX_TARGET_2D_ARRAY; 8543bd40073b9803baf62f77ed5ac79979e037d2ed6Ilia Mirkin else 8553bd40073b9803baf62f77ed5ac79979e037d2ed6Ilia Mirkin target = TEX_TARGET_2D; 8563bd40073b9803baf62f77ed5ac79979e037d2ed6Ilia Mirkin } 8573bd40073b9803baf62f77ed5ac79979e037d2ed6Ilia Mirkin } 85857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 85957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Target& operator=(TexTarget targ) 86057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller { 86157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller assert(targ < TEX_TARGET_COUNT); 862f7599b2c32185535b4c215de0ba0454129fa523fChristoph Bumiller target = targ; 86357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller return *this; 86457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller } 86557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 86657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline bool operator==(TexTarget targ) const { return target == targ; } 8674506ed28de7f9d76bbc99c0758a7891b84528729Christoph Bumiller inline bool operator!=(TexTarget targ) const { return target != targ; } 8684506ed28de7f9d76bbc99c0758a7891b84528729Christoph Bumiller 8694506ed28de7f9d76bbc99c0758a7891b84528729Christoph Bumiller enum TexTarget getEnum() const { return target; } 87057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 87157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller private: 87257594065c30feec9376be9b2132659f7d87362eeChristoph 
Bumiller struct Desc 87357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller { 87457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller char name[19]; 87557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller uint8_t dim; 87657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller uint8_t argc; 87757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller bool array; 87857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller bool cube; 87957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller bool shadow; 88057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller }; 88157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 88257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller static const struct Desc descTable[TEX_TARGET_COUNT]; 88357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 88457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller private: 88557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller enum TexTarget target; 88657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller }; 88757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 88857594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerpublic: 88957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller TexInstruction(Function *, operation); 89057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller virtual ~TexInstruction(); 89157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 892a05e6a3fa28168d58a13cfb07f7a664e84b925aeFrancisco Jerez virtual TexInstruction *clone(ClonePolicy<Function>&, 893a05e6a3fa28168d58a13cfb07f7a664e84b925aeFrancisco Jerez Instruction * = NULL) const; 89457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 89557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline void setTexture(Target targ, uint8_t r, uint8_t s) 89657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller { 89757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller tex.r = r; 
89857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller tex.s = s; 89957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller tex.target = targ; 90057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller } 90157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 9027a91d3a2a4c4e7851fdb46465224213ce1874c9bChristoph Bumiller void setIndirectR(Value *); 9037a91d3a2a4c4e7851fdb46465224213ce1874c9bChristoph Bumiller void setIndirectS(Value *); 90457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline Value *getIndirectR() const; 90557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline Value *getIndirectS() const; 90657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 90757594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerpublic: 90857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller struct { 90957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Target target; 91057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 911c2dfcd7f0eaf4eda375eb320e0e87793a80ef92dChristoph Bumiller uint16_t r; 912c2dfcd7f0eaf4eda375eb320e0e87793a80ef92dChristoph Bumiller uint16_t s; 91357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller int8_t rIndirectSrc; 91457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller int8_t sIndirectSrc; 91557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 91657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller uint8_t mask; 91757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller uint8_t gatherComp; 91857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 91957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller bool liveOnly; // only execute on live pixels of a quad (optimization) 92057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller bool levelZero; 9219c930639d9f6d713ccfd16b390a41a9f584f348cChristoph Bumiller bool derivAll; 92257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 92357594065c30feec9376be9b2132659f7d87362eeChristoph 
Bumiller int8_t useOffsets; // 0, 1, or 4 for textureGatherOffsets 924f3aa999383074d666d6e3f3506e66b0c937904caIlia Mirkin int8_t offset[3]; // only used on nv50 92557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 92657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller enum TexQuery query; 92757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller } tex; 92857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 92957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller ValueRef dPdx[3]; 93057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller ValueRef dPdy[3]; 931f3aa999383074d666d6e3f3506e66b0c937904caIlia Mirkin ValueRef offset[4][3]; 93257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller}; 93357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 93457594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerclass CmpInstruction : public Instruction 93557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller{ 93657594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerpublic: 93757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CmpInstruction(Function *, operation); 93857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 939a05e6a3fa28168d58a13cfb07f7a664e84b925aeFrancisco Jerez virtual CmpInstruction *clone(ClonePolicy<Function>&, 940a05e6a3fa28168d58a13cfb07f7a664e84b925aeFrancisco Jerez Instruction * = NULL) const; 94157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 94257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller void setCondition(CondCode cond) { setCond = cond; } 94357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CondCode getCondition() const { return setCond; } 94457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 94557594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerpublic: 94657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CondCode setCond; 94757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller}; 
94857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 94957594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerclass FlowInstruction : public Instruction 95057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller{ 95157594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerpublic: 9529bb36d54a2c69ebdc9d1c9c4c71945060de8c860Francisco Jerez FlowInstruction(Function *, operation, void *target); 95357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 954784848a94d621b11020838fc058fc04a7fc57aa9Francisco Jerez virtual FlowInstruction *clone(ClonePolicy<Function>&, 955784848a94d621b11020838fc058fc04a7fc57aa9Francisco Jerez Instruction * = NULL) const; 956784848a94d621b11020838fc058fc04a7fc57aa9Francisco Jerez 95757594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerpublic: 95857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller unsigned allWarp : 1; 95957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller unsigned absolute : 1; 96057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller unsigned limit : 1; 96157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller unsigned builtin : 1; // true for calls to emulation code 962c893b9406060d3735b2c9e307ae89f6d83a4be40Christoph Bumiller unsigned indirect : 1; // target in src(0) 96357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 96457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller union { 96557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller BasicBlock *bb; 96657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller int builtin; 96757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Function *fn; 96857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller } target; 96957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller}; 97057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 97157594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerclass BasicBlock 97257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller{ 
97357594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerpublic: 97457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller BasicBlock(Function *); 97557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller ~BasicBlock(); 97657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 977784848a94d621b11020838fc058fc04a7fc57aa9Francisco Jerez BasicBlock *clone(ClonePolicy<Function>&) const; 978784848a94d621b11020838fc058fc04a7fc57aa9Francisco Jerez 97957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline int getId() const { return id; } 98057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline unsigned int getInsnCount() const { return numInsns; } 98157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline bool isTerminated() const { return exit && exit->terminator; } 98257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 98357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller bool dominatedBy(BasicBlock *bb); 98440c224a573f2b763046001e622aafca90f68c693Christoph Bumiller inline bool reachableBy(const BasicBlock *by, const BasicBlock *term); 98557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 98657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller // returns mask of conditional out blocks 98757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller // e.g. 3 for IF { .. } ELSE { .. } ENDIF, 1 for IF { .. 
} ENDIF 98857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller unsigned int initiatesSimpleConditional() const; 98957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 99057594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerpublic: 99157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Function *getFunction() const { return func; } 99257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Program *getProgram() const { return program; } 99357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 99457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Instruction *getEntry() const { return entry; } // first non-phi instruction 99557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Instruction *getPhi() const { return phi; } 99657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Instruction *getFirst() const { return phi ? phi : entry; } 99757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Instruction *getExit() const { return exit; } 99857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 99957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller void insertHead(Instruction *); 100057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller void insertTail(Instruction *); 100157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller void insertBefore(Instruction *, Instruction *); 100257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller void insertAfter(Instruction *, Instruction *); 100357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller void remove(Instruction *); 100457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller void permuteAdjacent(Instruction *, Instruction *); 100557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 100657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller BasicBlock *idom() const; 100757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 1008c04d6d95e0efb8eea4d788d8d7b629209a3afaeaChristoph Bumiller // NOTE: currently does not rebuild 
the dominator tree 1009c04d6d95e0efb8eea4d788d8d7b629209a3afaeaChristoph Bumiller BasicBlock *splitBefore(Instruction *, bool attach = true); 1010c04d6d95e0efb8eea4d788d8d7b629209a3afaeaChristoph Bumiller BasicBlock *splitAfter(Instruction *, bool attach = true); 1011c04d6d95e0efb8eea4d788d8d7b629209a3afaeaChristoph Bumiller 101257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller DLList& getDF() { return df; } 101357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller DLList::Iterator iterDF() { return df.iterator(); } 101457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 101557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller static inline BasicBlock *get(Iterator&); 101657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller static inline BasicBlock *get(Graph::Node *); 101757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 101857594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerpublic: 101957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Graph::Node cfg; // first edge is branch *taken* (the ELSE branch) 102057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Graph::Node dom; 102157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 102257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller BitSet liveSet; 10233e9150cd961b2399e402e940400deae11ec7852fFrancisco Jerez BitSet defSet; 102457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 102557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller uint32_t binPos; 102657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller uint32_t binSize; 102757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 102857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Instruction *joinAt; // for quick reference 102957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 103057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller bool explicitCont; // loop headers: true if loop contains continue stmts 
103157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 103257594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerprivate: 103357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller int id; 103457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller DLList df; 103557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 103657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Instruction *phi; 103757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Instruction *entry; 103857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Instruction *exit; 103957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 104057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller unsigned int numInsns; 104157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 104257594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerprivate: 104357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Function *func; 104457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Program *program; 1045c04d6d95e0efb8eea4d788d8d7b629209a3afaeaChristoph Bumiller 1046c04d6d95e0efb8eea4d788d8d7b629209a3afaeaChristoph Bumiller void splitCommon(Instruction *, BasicBlock *, bool attach); 104757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller}; 104857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 104957594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerclass Function 105057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller{ 105157594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerpublic: 105298116cc3dc3fc2cd84990cc2c968f05fe2978b4aFrancisco Jerez Function(Program *, const char *name, uint32_t label); 105357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller ~Function(); 105457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 1055d32ebb8c304725fa6bb7ec2d3d40ce828c713917Francisco Jerez static inline Function *get(Graph::Node *node); 1056d32ebb8c304725fa6bb7ec2d3d40ce828c713917Francisco Jerez 
105757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline Program *getProgram() const { return prog; } 105857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline const char *getName() const { return name; } 105957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline int getId() const { return id; } 106098116cc3dc3fc2cd84990cc2c968f05fe2978b4aFrancisco Jerez inline uint32_t getLabel() const { return label; } 106157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 106257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller void print(); 106357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller void printLiveIntervals() const; 106457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller void printCFGraph(const char *filePath); 106557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 106657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller bool setEntry(BasicBlock *); 106757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller bool setExit(BasicBlock *); 106857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 106957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller unsigned int orderInstructions(ArrayList&); 107057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 107157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline void add(BasicBlock *bb, int& id) { allBBlocks.insert(bb, id); } 107257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline void add(Instruction *insn, int& id) { allInsns.insert(insn, id); } 107357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline void add(LValue *lval, int& id) { allLValues.insert(lval, id); } 107457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 107557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline LValue *getLValue(int id); 107657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 1077898b0981b6c90d2f1e446a532b6ac3cbbb49747dFrancisco Jerez void buildLiveSets(); 
10783e9150cd961b2399e402e940400deae11ec7852fFrancisco Jerez void buildDefSets(); 107957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller bool convertToSSA(); 108057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 108157594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerpublic: 1082a3dd45e1c27e4e55dadb9467c2ea428f58083ac1Francisco Jerez std::deque<ValueDef> ins; 1083a3dd45e1c27e4e55dadb9467c2ea428f58083ac1Francisco Jerez std::deque<ValueRef> outs; 1084a3dd45e1c27e4e55dadb9467c2ea428f58083ac1Francisco Jerez std::deque<Value *> clobbers; 1085a3dd45e1c27e4e55dadb9467c2ea428f58083ac1Francisco Jerez 108657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Graph cfg; 108757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Graph::Node *cfgExit; 108857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Graph *domTree; 108957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Graph::Node call; // node in the call graph 109057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 109157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller BasicBlock **bbArray; // BBs in emission order 109257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller int bbCount; 109357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 109457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller unsigned int loopNestingBound; 109557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller int regClobberMax; 109657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 109757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller uint32_t binPos; 109857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller uint32_t binSize; 109957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 1100e43a3a66a9d8a99021d76ff4d07dec7b8cfd62caChristoph Bumiller Value *stackPtr; 1101e43a3a66a9d8a99021d76ff4d07dec7b8cfd62caChristoph Bumiller 1102e43a3a66a9d8a99021d76ff4d07dec7b8cfd62caChristoph Bumiller uint32_t tlsBase; // base address for l[] space (if 
no stack pointer is used) 1103e43a3a66a9d8a99021d76ff4d07dec7b8cfd62caChristoph Bumiller uint32_t tlsSize; 1104e43a3a66a9d8a99021d76ff4d07dec7b8cfd62caChristoph Bumiller 110557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller ArrayList allBBlocks; 110657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller ArrayList allInsns; 110757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller ArrayList allLValues; 110857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 110957594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerprivate: 111057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller void buildLiveSetsPreSSA(BasicBlock *, const int sequence); 11113e9150cd961b2399e402e940400deae11ec7852fFrancisco Jerez void buildDefSetsPreSSA(BasicBlock *bb, const int seq); 111257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 111357594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerprivate: 111498116cc3dc3fc2cd84990cc2c968f05fe2978b4aFrancisco Jerez uint32_t label; 111557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller int id; 111657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller const char *const name; 111757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Program *prog; 111857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller}; 111957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 112057594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerenum CGStage 112157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller{ 112257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CG_STAGE_PRE_SSA, 112357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CG_STAGE_SSA, // expected directly before register allocation 112457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CG_STAGE_POST_RA 112557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller}; 112657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 112757594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerclass Program 
112857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller{ 112957594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerpublic: 113057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller enum Type 113157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller { 113257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller TYPE_VERTEX, 113357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller TYPE_TESSELLATION_CONTROL, 113457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller TYPE_TESSELLATION_EVAL, 113557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller TYPE_GEOMETRY, 113657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller TYPE_FRAGMENT, 113757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller TYPE_COMPUTE 113857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller }; 113957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 114057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Program(Type type, Target *targ); 114157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller ~Program(); 114257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 114357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller void print(); 114457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 114557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Type getType() const { return progType; } 114657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 114757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline void add(Function *fn, int& id) { allFuncs.insert(fn, id); } 11485e4b2a1a47ca9a173f6419ed2f12c9fba80e757cFrancisco Jerez inline void del(Function *fn, int& id) { allFuncs.remove(id); } 114957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline void add(Value *rval, int& id) { allRValues.insert(rval, id); } 115057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 115157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller bool makeFromTGSI(struct nv50_ir_prog_info *); 
115257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller bool makeFromSM4(struct nv50_ir_prog_info *); 115357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller bool convertToSSA(); 115457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller bool optimizeSSA(int level); 115557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller bool optimizePostRA(int level); 115657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller bool registerAllocation(); 115757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller bool emitBinary(struct nv50_ir_prog_info *); 115857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 115957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller const Target *getTarget() const { return target; } 116057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 116157594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerprivate: 116298116cc3dc3fc2cd84990cc2c968f05fe2978b4aFrancisco Jerez void emitSymbolTable(struct nv50_ir_prog_info *); 116398116cc3dc3fc2cd84990cc2c968f05fe2978b4aFrancisco Jerez 116457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Type progType; 116557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Target *target; 116657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 116757594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerpublic: 116857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Function *main; 116957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Graph calls; 117057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 117157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller ArrayList allFuncs; 117257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller ArrayList allRValues; 117357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 117457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller uint32_t *code; 117557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller uint32_t binSize; 
1176e43a3a66a9d8a99021d76ff4d07dec7b8cfd62caChristoph Bumiller uint32_t tlsSize; // size required for FILE_MEMORY_LOCAL 117757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 117857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller int maxGPR; 117957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 118057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller MemoryPool mem_Instruction; 118157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller MemoryPool mem_CmpInstruction; 118257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller MemoryPool mem_TexInstruction; 118357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller MemoryPool mem_FlowInstruction; 118457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller MemoryPool mem_LValue; 118557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller MemoryPool mem_Symbol; 118657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller MemoryPool mem_ImmediateValue; 118757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 118857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller uint32_t dbgFlags; 1189322bc7ed68ed92233c97168c036d0aa50c11a20eChristoph Bumiller uint8_t optLevel; 1190322bc7ed68ed92233c97168c036d0aa50c11a20eChristoph Bumiller 1191322bc7ed68ed92233c97168c036d0aa50c11a20eChristoph Bumiller void *targetPriv; // e.g. 
to carry information between passes 119257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 11934506ed28de7f9d76bbc99c0758a7891b84528729Christoph Bumiller const struct nv50_ir_prog_info *driver; // for driver configuration 11944506ed28de7f9d76bbc99c0758a7891b84528729Christoph Bumiller 119557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller void releaseInstruction(Instruction *); 119657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller void releaseValue(Value *); 119757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller}; 119857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 119957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller// TODO: add const version 120057594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerclass Pass 120157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller{ 120257594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerpublic: 120357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller bool run(Program *, bool ordered = false, bool skipPhi = false); 120457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller bool run(Function *, bool ordered = false, bool skipPhi = false); 120557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 120657594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerprivate: 120757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller // return false to continue with next entity on next higher level 120857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller virtual bool visit(Function *) { return true; } 120957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller virtual bool visit(BasicBlock *) { return true; } 121057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller virtual bool visit(Instruction *) { return false; } 121157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 121257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller bool doRun(Program *, bool ordered, bool skipPhi); 
121357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller bool doRun(Function *, bool ordered, bool skipPhi); 121457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 121557594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerprotected: 121657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller bool err; 121757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Function *func; 121857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Program *prog; 121957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller}; 122057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 122157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller// ============================================================================= 122257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 12235eb7ff1175a644ffe3b0f1a75cb235400355f9fbJohannes Obermayr#include "codegen/nv50_ir_inlines.h" 122457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 122557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller} // namespace nv50_ir 122657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 122757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller#endif // __NV50_IR_H__ 1228