1d2d19ea51fa3575a8d014a69a9b835c335728817Christoph Bumiller/* 2d2d19ea51fa3575a8d014a69a9b835c335728817Christoph Bumiller * Copyright 2011 Christoph Bumiller 3d2d19ea51fa3575a8d014a69a9b835c335728817Christoph Bumiller * 4d2d19ea51fa3575a8d014a69a9b835c335728817Christoph Bumiller * Permission is hereby granted, free of charge, to any person obtaining a 5d2d19ea51fa3575a8d014a69a9b835c335728817Christoph Bumiller * copy of this software and associated documentation files (the "Software"), 6d2d19ea51fa3575a8d014a69a9b835c335728817Christoph Bumiller * to deal in the Software without restriction, including without limitation 7d2d19ea51fa3575a8d014a69a9b835c335728817Christoph Bumiller * the rights to use, copy, modify, merge, publish, distribute, sublicense, 8d2d19ea51fa3575a8d014a69a9b835c335728817Christoph Bumiller * and/or sell copies of the Software, and to permit persons to whom the 9d2d19ea51fa3575a8d014a69a9b835c335728817Christoph Bumiller * Software is furnished to do so, subject to the following conditions: 10d2d19ea51fa3575a8d014a69a9b835c335728817Christoph Bumiller * 11d2d19ea51fa3575a8d014a69a9b835c335728817Christoph Bumiller * The above copyright notice and this permission notice shall be included in 12d2d19ea51fa3575a8d014a69a9b835c335728817Christoph Bumiller * all copies or substantial portions of the Software. 13d2d19ea51fa3575a8d014a69a9b835c335728817Christoph Bumiller * 14d2d19ea51fa3575a8d014a69a9b835c335728817Christoph Bumiller * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR 15d2d19ea51fa3575a8d014a69a9b835c335728817Christoph Bumiller * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, 16d2d19ea51fa3575a8d014a69a9b835c335728817Christoph Bumiller * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL 173d8d5b298a268b119d840bc9bae0ee9e0c9244a9Kenneth Graunke * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR 183d8d5b298a268b119d840bc9bae0ee9e0c9244a9Kenneth Graunke * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, 193d8d5b298a268b119d840bc9bae0ee9e0c9244a9Kenneth Graunke * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR 203d8d5b298a268b119d840bc9bae0ee9e0c9244a9Kenneth Graunke * OTHER DEALINGS IN THE SOFTWARE. 21d2d19ea51fa3575a8d014a69a9b835c335728817Christoph Bumiller */ 2257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 2357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller#ifndef __NV50_IR_H__ 2457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller#define __NV50_IR_H__ 2557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 2657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller#include <stdio.h> 2757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller#include <stdlib.h> 2857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller#include <stdint.h> 298cc2eca5df0116aa7fb8233a9ab6ad1c9e4203cdFrancisco Jerez#include <deque> 308cc2eca5df0116aa7fb8233a9ab6ad1c9e4203cdFrancisco Jerez#include <list> 318cc2eca5df0116aa7fb8233a9ab6ad1c9e4203cdFrancisco Jerez#include <vector> 3257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 332a4af36517333ef61d5f7ca2264fec3f49ee3662Chih-Wei Huang#include "codegen/unordered_set.h" 345eb7ff1175a644ffe3b0f1a75cb235400355f9fbJohannes Obermayr#include "codegen/nv50_ir_util.h" 355eb7ff1175a644ffe3b0f1a75cb235400355f9fbJohannes Obermayr#include "codegen/nv50_ir_graph.h" 3657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 375eb7ff1175a644ffe3b0f1a75cb235400355f9fbJohannes Obermayr#include "codegen/nv50_ir_driver.h" 3857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 3957594065c30feec9376be9b2132659f7d87362eeChristoph Bumillernamespace nv50_ir { 4057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 4157594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerenum operation 4257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller{ 4357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller OP_NOP = 0, 4457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller OP_PHI, 4557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller OP_UNION, // unify a new definition and several source values 4657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller OP_SPLIT, // $r0d -> { $r0, $r1 } ($r0d and $r0/$r1 will be coalesced) 4757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller OP_MERGE, // opposite of split, e.g. combine 2 32 bit into a 64 bit value 4857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller OP_CONSTRAINT, // copy values into consecutive registers 49d6d1f0e4a25c9fbefce7485d77617855a8ea956aFrancisco Jerez OP_MOV, // simple copy, no modifiers allowed 5057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller OP_LOAD, 5157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller OP_STORE, 5299e4eba669f13a0dc80880f4f91e2338377c1667Christoph Bumiller OP_ADD, // NOTE: add u64 + u32 is legal for targets w/o 64-bit integer adds 5357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller OP_SUB, 5457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller OP_MUL, 5557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller OP_DIV, 5657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller OP_MOD, 5757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller OP_MAD, 5857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller OP_FMA, 5957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller OP_SAD, // abs(src0 - src1) + src2 6085132c7453230960f34cfe7b7b7fcaaab158d79fSamuel Pitoiset OP_SHLADD, 6157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller OP_ABS, 6257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller OP_NEG, 6357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller OP_NOT, 6457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller OP_AND, 6557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller OP_OR, 6657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller OP_XOR, 6757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller OP_SHL, 6857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller OP_SHR, 6957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller OP_MAX, 7057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller OP_MIN, 7122b762f9b495b14400f30bd6537f7c5a6d262325Christoph Bumiller OP_SAT, // CLAMP(f32, 0.0, 1.0) 7257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller OP_CEIL, 7357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller OP_FLOOR, 7457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller OP_TRUNC, 7557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller OP_CVT, 7657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller OP_SET_AND, // dst = (src0 CMP src1) & src2 7757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller OP_SET_OR, 7857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller OP_SET_XOR, 7957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller OP_SET, 8057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller OP_SELP, // dst = src2 ? src0 : src1 8157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller OP_SLCT, // dst = (src2 CMP 0) ? src0 : src1 8257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller OP_RCP, 8357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller OP_RSQ, 8457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller OP_LG2, 8557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller OP_SIN, 8657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller OP_COS, 8757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller OP_EX2, 8857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller OP_EXP, // exponential (base M_E) 8957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller OP_LOG, // natural logarithm 9057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller OP_PRESIN, 9157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller OP_PREEX2, 9257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller OP_SQRT, 9357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller OP_POW, 9457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller OP_BRA, 9557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller OP_CALL, 9657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller OP_RET, 9757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller OP_CONT, 9857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller OP_BREAK, 9957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller OP_PRERET, 10057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller OP_PRECONT, 10157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller OP_PREBREAK, 10257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller OP_BRKPT, // breakpoint (not related to loops) 10357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller OP_JOINAT, // push control flow convergence point 10457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller OP_JOIN, // converge 10557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller OP_DISCARD, 10657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller OP_EXIT, 10722b762f9b495b14400f30bd6537f7c5a6d262325Christoph Bumiller OP_MEMBAR, // memory barrier (mfence, lfence, sfence) 10857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller OP_VFETCH, // indirection 0 in attribute space, indirection 1 is vertex base 10957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller OP_PFETCH, // fetch base address of vertex src0 (immediate) [+ src1] 1109d60793a03e40e1d139b78fce0144cad57438741Ilia Mirkin OP_AFETCH, // fetch base address of shader input (a[%r1+0x10]) 11157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller OP_EXPORT, 11257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller OP_LINTERP, 11357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller OP_PINTERP, 11457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller OP_EMIT, // emit vertex 11557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller OP_RESTART, // restart primitive 11657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller OP_TEX, 11757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller OP_TXB, // texture bias 11857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller OP_TXL, // texure lod 11957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller OP_TXF, // texel fetch 12057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller OP_TXQ, // texture size query 12157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller OP_TXD, // texture derivatives 12257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller OP_TXG, // texture gather 123d5faf8e78603a27dbedb2e9e28b58b1b2bc32858Ilia Mirkin OP_TXLQ, // texture query lod 12422b762f9b495b14400f30bd6537f7c5a6d262325Christoph Bumiller OP_TEXCSAA, // texture op for coverage sampling 12522b762f9b495b14400f30bd6537f7c5a6d262325Christoph Bumiller OP_TEXPREP, // turn cube map array into 2d array coordinates 12622b762f9b495b14400f30bd6537f7c5a6d262325Christoph Bumiller OP_SULDB, // surface load (raw) 12722b762f9b495b14400f30bd6537f7c5a6d262325Christoph Bumiller OP_SULDP, // surface load (formatted) 12822b762f9b495b14400f30bd6537f7c5a6d262325Christoph Bumiller OP_SUSTB, // surface store (raw) 12922b762f9b495b14400f30bd6537f7c5a6d262325Christoph Bumiller OP_SUSTP, // surface store (formatted) 13022b762f9b495b14400f30bd6537f7c5a6d262325Christoph Bumiller OP_SUREDB, 13122b762f9b495b14400f30bd6537f7c5a6d262325Christoph Bumiller OP_SUREDP, // surface reduction (atomic op) 13222b762f9b495b14400f30bd6537f7c5a6d262325Christoph Bumiller OP_SULEA, // surface load effective address 13322b762f9b495b14400f30bd6537f7c5a6d262325Christoph Bumiller OP_SUBFM, // surface bitfield manipulation 13422b762f9b495b14400f30bd6537f7c5a6d262325Christoph Bumiller OP_SUCLAMP, // clamp surface coordinates 13522b762f9b495b14400f30bd6537f7c5a6d262325Christoph Bumiller OP_SUEAU, // surface effective address 1362c4eeb0b5cf17caa06cb3fa46d4f64e6a8005d23Ilia Mirkin OP_SUQ, // surface query 13722b762f9b495b14400f30bd6537f7c5a6d262325Christoph Bumiller OP_MADSP, // special integer multiply-add 13822b762f9b495b14400f30bd6537f7c5a6d262325Christoph Bumiller OP_TEXBAR, // texture dependency barrier 13957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller OP_DFDX, 14057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller OP_DFDY, 14157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller OP_RDSV, // read system value 14257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller OP_WRSV, // write system value 143af38ef907c89ecb1125bf258cafa0793f79a5eb7Ilia Mirkin OP_PIXLD, // get info about raster object or surfaces 14457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller OP_QUADOP, 14557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller OP_QUADON, 14657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller OP_QUADPOP, 14757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller OP_POPCNT, // bitcount(src0 & src1) 14857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller OP_INSBF, // insert first src1[8:15] bits of src0 into src2 at src1[0:7] 14922b762f9b495b14400f30bd6537f7c5a6d262325Christoph Bumiller OP_EXTBF, // place bits [K,K+N) of src0 into dst, src1 = 0xNNKK 150b4b20d42f6a8cd5aec3ba529a0b8d6ea22e73305Ilia Mirkin OP_BFIND, // find highest/lowest set bit 15122b762f9b495b14400f30bd6537f7c5a6d262325Christoph Bumiller OP_PERMT, // dst = bytes from src2,src0 selected by src1 (nvc0's src order) 15222b762f9b495b14400f30bd6537f7c5a6d262325Christoph Bumiller OP_ATOM, 15322b762f9b495b14400f30bd6537f7c5a6d262325Christoph Bumiller OP_BAR, // execution barrier, sources = { id, thread count, predicate } 15422b762f9b495b14400f30bd6537f7c5a6d262325Christoph Bumiller OP_VADD, // byte/word vector operations 15522b762f9b495b14400f30bd6537f7c5a6d262325Christoph Bumiller OP_VAVG, 15622b762f9b495b14400f30bd6537f7c5a6d262325Christoph Bumiller OP_VMIN, 15722b762f9b495b14400f30bd6537f7c5a6d262325Christoph Bumiller OP_VMAX, 15822b762f9b495b14400f30bd6537f7c5a6d262325Christoph Bumiller OP_VSAD, 15922b762f9b495b14400f30bd6537f7c5a6d262325Christoph Bumiller OP_VSET, 16022b762f9b495b14400f30bd6537f7c5a6d262325Christoph Bumiller OP_VSHR, 16122b762f9b495b14400f30bd6537f7c5a6d262325Christoph Bumiller OP_VSHL, 16222b762f9b495b14400f30bd6537f7c5a6d262325Christoph Bumiller OP_VSEL, 16318fdfbdc32f204d6728c1ad57a693b1a6ad0aec9Christoph Bumiller OP_CCTL, // cache control 164d548d47edf9f05e6dbf9656abc2f8e78d02cb2f6Ben Skeggs OP_SHFL, // warp shuffle 16507ed003faf3199a3e95852e7a34763aeaf76503dSamuel Pitoiset OP_VOTE, 1667c47db359e193f21be796df3a7b5d037dd42b28fSamuel Pitoiset OP_BUFQ, // buffer query 16757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller OP_LAST 16857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller}; 16957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 17000fe442253744c4c4e7e68da44d6983da053968bChristoph Bumiller// various instruction-specific modifier definitions Instruction::subOp 17100fe442253744c4c4e7e68da44d6983da053968bChristoph Bumiller// MOV_FINAL marks a MOV originating from an EXPORT (used for placing TEXBARs) 17257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller#define NV50_IR_SUBOP_MUL_HIGH 1 17357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller#define NV50_IR_SUBOP_EMIT_RESTART 1 17457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller#define NV50_IR_SUBOP_LDC_IL 1 17557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller#define NV50_IR_SUBOP_LDC_IS 2 17657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller#define NV50_IR_SUBOP_LDC_ISL 3 1770e4e0ca6df52ddecd1bb2fe9a427549d1a82b9f9Christoph Bumiller#define NV50_IR_SUBOP_SHIFT_WRAP 1 178322bc7ed68ed92233c97168c036d0aa50c11a20eChristoph Bumiller#define NV50_IR_SUBOP_EMU_PRERET 1 179e44089b2f79aa2dcaacf348911433d1e21235c0cChristoph Bumiller#define NV50_IR_SUBOP_TEXBAR(n) n 18000fe442253744c4c4e7e68da44d6983da053968bChristoph Bumiller#define NV50_IR_SUBOP_MOV_FINAL 1 18122b762f9b495b14400f30bd6537f7c5a6d262325Christoph Bumiller#define NV50_IR_SUBOP_EXTBF_REV 1 182b4b20d42f6a8cd5aec3ba529a0b8d6ea22e73305Ilia Mirkin#define NV50_IR_SUBOP_BFIND_SAMT 1 183b87b498b88c51fb8c80901b8f581331d3fbcd972Ilia Mirkin#define NV50_IR_SUBOP_RCPRSQ_64H 1 18422b762f9b495b14400f30bd6537f7c5a6d262325Christoph Bumiller#define NV50_IR_SUBOP_PERMT_F4E 1 18522b762f9b495b14400f30bd6537f7c5a6d262325Christoph Bumiller#define NV50_IR_SUBOP_PERMT_B4E 2 18622b762f9b495b14400f30bd6537f7c5a6d262325Christoph Bumiller#define NV50_IR_SUBOP_PERMT_RC8 3 18722b762f9b495b14400f30bd6537f7c5a6d262325Christoph Bumiller#define NV50_IR_SUBOP_PERMT_ECL 4 18822b762f9b495b14400f30bd6537f7c5a6d262325Christoph Bumiller#define NV50_IR_SUBOP_PERMT_ECR 5 18922b762f9b495b14400f30bd6537f7c5a6d262325Christoph Bumiller#define NV50_IR_SUBOP_PERMT_RC16 6 19022b762f9b495b14400f30bd6537f7c5a6d262325Christoph Bumiller#define NV50_IR_SUBOP_BAR_SYNC 0 19122b762f9b495b14400f30bd6537f7c5a6d262325Christoph Bumiller#define NV50_IR_SUBOP_BAR_ARRIVE 1 19222b762f9b495b14400f30bd6537f7c5a6d262325Christoph Bumiller#define NV50_IR_SUBOP_BAR_RED_AND 2 19322b762f9b495b14400f30bd6537f7c5a6d262325Christoph Bumiller#define NV50_IR_SUBOP_BAR_RED_OR 3 19422b762f9b495b14400f30bd6537f7c5a6d262325Christoph Bumiller#define NV50_IR_SUBOP_BAR_RED_POPC 4 19522b762f9b495b14400f30bd6537f7c5a6d262325Christoph Bumiller#define NV50_IR_SUBOP_MEMBAR_L 1 19622b762f9b495b14400f30bd6537f7c5a6d262325Christoph Bumiller#define NV50_IR_SUBOP_MEMBAR_S 2 19722b762f9b495b14400f30bd6537f7c5a6d262325Christoph Bumiller#define NV50_IR_SUBOP_MEMBAR_M 3 19822b762f9b495b14400f30bd6537f7c5a6d262325Christoph Bumiller#define NV50_IR_SUBOP_MEMBAR_CTA (0 << 2) 19922b762f9b495b14400f30bd6537f7c5a6d262325Christoph Bumiller#define NV50_IR_SUBOP_MEMBAR_GL (1 << 2) 20022b762f9b495b14400f30bd6537f7c5a6d262325Christoph Bumiller#define NV50_IR_SUBOP_MEMBAR_SYS (2 << 2) 20122b762f9b495b14400f30bd6537f7c5a6d262325Christoph Bumiller#define NV50_IR_SUBOP_MEMBAR_DIR(m) ((m) & 0x3) 20222b762f9b495b14400f30bd6537f7c5a6d262325Christoph Bumiller#define NV50_IR_SUBOP_MEMBAR_SCOPE(m) ((m) & ~0x3) 20322b762f9b495b14400f30bd6537f7c5a6d262325Christoph Bumiller#define NV50_IR_SUBOP_MEMBAR(d,s) \ 20422b762f9b495b14400f30bd6537f7c5a6d262325Christoph Bumiller (NV50_IR_SUBOP_MEMBAR_##d | NV50_IR_SUBOP_MEMBAR_##s) 20522b762f9b495b14400f30bd6537f7c5a6d262325Christoph Bumiller#define NV50_IR_SUBOP_ATOM_ADD 0 20622b762f9b495b14400f30bd6537f7c5a6d262325Christoph Bumiller#define NV50_IR_SUBOP_ATOM_MIN 1 20722b762f9b495b14400f30bd6537f7c5a6d262325Christoph Bumiller#define NV50_IR_SUBOP_ATOM_MAX 2 20822b762f9b495b14400f30bd6537f7c5a6d262325Christoph Bumiller#define NV50_IR_SUBOP_ATOM_INC 3 20922b762f9b495b14400f30bd6537f7c5a6d262325Christoph Bumiller#define NV50_IR_SUBOP_ATOM_DEC 4 21022b762f9b495b14400f30bd6537f7c5a6d262325Christoph Bumiller#define NV50_IR_SUBOP_ATOM_AND 5 21122b762f9b495b14400f30bd6537f7c5a6d262325Christoph Bumiller#define NV50_IR_SUBOP_ATOM_OR 6 21222b762f9b495b14400f30bd6537f7c5a6d262325Christoph Bumiller#define NV50_IR_SUBOP_ATOM_XOR 7 21322b762f9b495b14400f30bd6537f7c5a6d262325Christoph Bumiller#define NV50_IR_SUBOP_ATOM_CAS 8 21422b762f9b495b14400f30bd6537f7c5a6d262325Christoph Bumiller#define NV50_IR_SUBOP_ATOM_EXCH 9 21518fdfbdc32f204d6728c1ad57a693b1a6ad0aec9Christoph Bumiller#define NV50_IR_SUBOP_CCTL_IV 5 21618fdfbdc32f204d6728c1ad57a693b1a6ad0aec9Christoph Bumiller#define NV50_IR_SUBOP_CCTL_IVALL 6 21722b762f9b495b14400f30bd6537f7c5a6d262325Christoph Bumiller#define NV50_IR_SUBOP_SUST_IGN 0 21822b762f9b495b14400f30bd6537f7c5a6d262325Christoph Bumiller#define NV50_IR_SUBOP_SUST_TRAP 1 21922b762f9b495b14400f30bd6537f7c5a6d262325Christoph Bumiller#define NV50_IR_SUBOP_SUST_SDCL 3 22022b762f9b495b14400f30bd6537f7c5a6d262325Christoph Bumiller#define NV50_IR_SUBOP_SULD_ZERO 0 22122b762f9b495b14400f30bd6537f7c5a6d262325Christoph Bumiller#define NV50_IR_SUBOP_SULD_TRAP 1 22222b762f9b495b14400f30bd6537f7c5a6d262325Christoph Bumiller#define NV50_IR_SUBOP_SULD_SDCL 3 22322b762f9b495b14400f30bd6537f7c5a6d262325Christoph Bumiller#define NV50_IR_SUBOP_SUBFM_3D 1 22422b762f9b495b14400f30bd6537f7c5a6d262325Christoph Bumiller#define NV50_IR_SUBOP_SUCLAMP_2D 0x10 22522b762f9b495b14400f30bd6537f7c5a6d262325Christoph Bumiller#define NV50_IR_SUBOP_SUCLAMP_SD(r, d) (( 0 + (r)) | ((d == 2) ? 0x10 : 0)) 22622b762f9b495b14400f30bd6537f7c5a6d262325Christoph Bumiller#define NV50_IR_SUBOP_SUCLAMP_PL(r, d) (( 5 + (r)) | ((d == 2) ? 0x10 : 0)) 22722b762f9b495b14400f30bd6537f7c5a6d262325Christoph Bumiller#define NV50_IR_SUBOP_SUCLAMP_BL(r, d) ((10 + (r)) | ((d == 2) ? 0x10 : 0)) 228af38ef907c89ecb1125bf258cafa0793f79a5eb7Ilia Mirkin#define NV50_IR_SUBOP_PIXLD_COUNT 0 229af38ef907c89ecb1125bf258cafa0793f79a5eb7Ilia Mirkin#define NV50_IR_SUBOP_PIXLD_COVMASK 1 230af38ef907c89ecb1125bf258cafa0793f79a5eb7Ilia Mirkin#define NV50_IR_SUBOP_PIXLD_COVERED 2 231af38ef907c89ecb1125bf258cafa0793f79a5eb7Ilia Mirkin#define NV50_IR_SUBOP_PIXLD_OFFSET 3 232af38ef907c89ecb1125bf258cafa0793f79a5eb7Ilia Mirkin#define NV50_IR_SUBOP_PIXLD_CENT_OFFSET 4 233af38ef907c89ecb1125bf258cafa0793f79a5eb7Ilia Mirkin#define NV50_IR_SUBOP_PIXLD_SAMPLEID 5 234d548d47edf9f05e6dbf9656abc2f8e78d02cb2f6Ben Skeggs#define NV50_IR_SUBOP_SHFL_IDX 0 235d548d47edf9f05e6dbf9656abc2f8e78d02cb2f6Ben Skeggs#define NV50_IR_SUBOP_SHFL_UP 1 236d548d47edf9f05e6dbf9656abc2f8e78d02cb2f6Ben Skeggs#define NV50_IR_SUBOP_SHFL_DOWN 2 237d548d47edf9f05e6dbf9656abc2f8e78d02cb2f6Ben Skeggs#define NV50_IR_SUBOP_SHFL_BFLY 3 2380c930557bf96721ce50ca95b5201be09da905cb8Samuel Pitoiset#define NV50_IR_SUBOP_LOAD_LOCKED 1 2390c930557bf96721ce50ca95b5201be09da905cb8Samuel Pitoiset#define NV50_IR_SUBOP_STORE_UNLOCKED 2 24022b762f9b495b14400f30bd6537f7c5a6d262325Christoph Bumiller#define NV50_IR_SUBOP_MADSP_SD 0xffff 24122b762f9b495b14400f30bd6537f7c5a6d262325Christoph Bumiller// Yes, we could represent those with DataType. 24222b762f9b495b14400f30bd6537f7c5a6d262325Christoph Bumiller// Or put the type into operation and have a couple 1000 values in that enum. 24322b762f9b495b14400f30bd6537f7c5a6d262325Christoph Bumiller// This will have to do for now. 24422b762f9b495b14400f30bd6537f7c5a6d262325Christoph Bumiller// The bitfields are supposed to correspond to nve4 ISA. 24522b762f9b495b14400f30bd6537f7c5a6d262325Christoph Bumiller#define NV50_IR_SUBOP_MADSP(a,b,c) (((c) << 8) | ((b) << 4) | (a)) 24622b762f9b495b14400f30bd6537f7c5a6d262325Christoph Bumiller#define NV50_IR_SUBOP_V1(d,a,b) (((d) << 10) | ((b) << 5) | (a) | 0x0000) 24722b762f9b495b14400f30bd6537f7c5a6d262325Christoph Bumiller#define NV50_IR_SUBOP_V2(d,a,b) (((d) << 10) | ((b) << 5) | (a) | 0x4000) 24822b762f9b495b14400f30bd6537f7c5a6d262325Christoph Bumiller#define NV50_IR_SUBOP_V4(d,a,b) (((d) << 10) | ((b) << 5) | (a) | 0x8000) 24922b762f9b495b14400f30bd6537f7c5a6d262325Christoph Bumiller#define NV50_IR_SUBOP_Vn(n) ((n) >> 14) 25007ed003faf3199a3e95852e7a34763aeaf76503dSamuel Pitoiset#define NV50_IR_SUBOP_VOTE_ALL 0 25107ed003faf3199a3e95852e7a34763aeaf76503dSamuel Pitoiset#define NV50_IR_SUBOP_VOTE_ANY 1 25207ed003faf3199a3e95852e7a34763aeaf76503dSamuel Pitoiset#define NV50_IR_SUBOP_VOTE_UNI 2 25357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 25457594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerenum DataType 25557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller{ 25657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller TYPE_NONE, 25757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller TYPE_U8, 25857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller TYPE_S8, 25957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller TYPE_U16, 26057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller TYPE_S16, 26157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller TYPE_U32, 26257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller TYPE_S32, 26357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller TYPE_U64, // 64 bit operations are only lowered after register allocation 26457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller TYPE_S64, 26557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller TYPE_F16, 26657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller TYPE_F32, 26757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller TYPE_F64, 26857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller TYPE_B96, 26957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller TYPE_B128 27057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller}; 27157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 27257594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerenum CondCode 27357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller{ 27457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CC_FL = 0, 27557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CC_NEVER = CC_FL, // when used with FILE_FLAGS 27657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CC_LT = 1, 27757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CC_EQ = 2, 27857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CC_NOT_P = CC_EQ, // when used with FILE_PREDICATE 27957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CC_LE = 3, 28057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CC_GT = 4, 28157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CC_NE = 5, 28257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CC_P = CC_NE, 28357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CC_GE = 6, 28457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CC_TR = 7, 28557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CC_ALWAYS = CC_TR, 28657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CC_U = 8, 28757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CC_LTU = 9, 28857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CC_EQU = 10, 28957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CC_LEU = 11, 29057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CC_GTU = 12, 29157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CC_NEU = 13, 29257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CC_GEU = 14, 29357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CC_NO = 0x10, 29457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CC_NC = 0x11, 29557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CC_NS = 0x12, 29657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CC_NA = 0x13, 29757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CC_A = 0x14, 29857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CC_S = 0x15, 29957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CC_C = 0x16, 30057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CC_O = 0x17 30157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller}; 30257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 30357594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerenum RoundMode 30457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller{ 30557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller ROUND_N, // nearest 30657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller ROUND_M, // towards -inf 30757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller ROUND_Z, // towards 0 30857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller ROUND_P, // towards +inf 30957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller ROUND_NI, // nearest integer 31057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller ROUND_MI, // to integer towards -inf 31157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller ROUND_ZI, // to integer towards 0 31257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller ROUND_PI, // to integer towards +inf 31357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller}; 31457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 31557594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerenum CacheMode 31657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller{ 31757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CACHE_CA, // cache at all levels 31857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CACHE_WB = CACHE_CA, // cache write back 31957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CACHE_CG, // cache at global level 32057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CACHE_CS, // cache streaming 32157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CACHE_CV, // cache as volatile 32257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CACHE_WT = CACHE_CV // cache write-through 32357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller}; 32457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 32557594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerenum DataFile 32657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller{ 32757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller FILE_NULL = 0, 32857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller FILE_GPR, 32957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller FILE_PREDICATE, // boolean predicate 33057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller FILE_FLAGS, // zero/sign/carry/overflow bits 33157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller FILE_ADDRESS, 332e43a3a66a9d8a99021d76ff4d07dec7b8cfd62caChristoph Bumiller LAST_REGISTER_FILE = FILE_ADDRESS, 33357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller FILE_IMMEDIATE, 33457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller FILE_MEMORY_CONST, 33557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller FILE_SHADER_INPUT, 33657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller FILE_SHADER_OUTPUT, 33761d52a5fb9379eede3bf68b011f9477176341ee9Hans de Goede FILE_MEMORY_BUFFER, 33857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller FILE_MEMORY_GLOBAL, 33957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller FILE_MEMORY_SHARED, 34057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller FILE_MEMORY_LOCAL, 34157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller FILE_SYSTEM_VALUE, 34257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller DATA_FILE_COUNT 34357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller}; 34457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 34557594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerenum TexTarget 34657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller{ 34757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller TEX_TARGET_1D, 34857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller TEX_TARGET_2D, 34957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller TEX_TARGET_2D_MS, 35057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller TEX_TARGET_3D, 35157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller TEX_TARGET_CUBE, 35257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller TEX_TARGET_1D_SHADOW, 35357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller TEX_TARGET_2D_SHADOW, 35457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller TEX_TARGET_CUBE_SHADOW, 35557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller TEX_TARGET_1D_ARRAY, 35657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller TEX_TARGET_2D_ARRAY, 35757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller TEX_TARGET_2D_MS_ARRAY, 35857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller TEX_TARGET_CUBE_ARRAY, 35957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller TEX_TARGET_1D_ARRAY_SHADOW, 36057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller TEX_TARGET_2D_ARRAY_SHADOW, 36157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller TEX_TARGET_RECT, 36257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller TEX_TARGET_RECT_SHADOW, 36357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller TEX_TARGET_CUBE_ARRAY_SHADOW, 36457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller TEX_TARGET_BUFFER, 36557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller TEX_TARGET_COUNT 36657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller}; 36757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 3683ce80f924d07648040ab08a9cd30588621fb47a1Ilia Mirkinenum ImgFormat 3693ce80f924d07648040ab08a9cd30588621fb47a1Ilia Mirkin{ 3703ce80f924d07648040ab08a9cd30588621fb47a1Ilia Mirkin FMT_NONE, 3713ce80f924d07648040ab08a9cd30588621fb47a1Ilia Mirkin 3723ce80f924d07648040ab08a9cd30588621fb47a1Ilia Mirkin FMT_RGBA32F, 3733ce80f924d07648040ab08a9cd30588621fb47a1Ilia Mirkin FMT_RGBA16F, 3743ce80f924d07648040ab08a9cd30588621fb47a1Ilia Mirkin FMT_RG32F, 3753ce80f924d07648040ab08a9cd30588621fb47a1Ilia Mirkin FMT_RG16F, 3763ce80f924d07648040ab08a9cd30588621fb47a1Ilia Mirkin FMT_R11G11B10F, 3773ce80f924d07648040ab08a9cd30588621fb47a1Ilia Mirkin FMT_R32F, 3783ce80f924d07648040ab08a9cd30588621fb47a1Ilia Mirkin FMT_R16F, 3793ce80f924d07648040ab08a9cd30588621fb47a1Ilia Mirkin 3803ce80f924d07648040ab08a9cd30588621fb47a1Ilia Mirkin FMT_RGBA32UI, 3813ce80f924d07648040ab08a9cd30588621fb47a1Ilia Mirkin FMT_RGBA16UI, 3823ce80f924d07648040ab08a9cd30588621fb47a1Ilia Mirkin FMT_RGB10A2UI, 3833ce80f924d07648040ab08a9cd30588621fb47a1Ilia Mirkin FMT_RGBA8UI, 3843ce80f924d07648040ab08a9cd30588621fb47a1Ilia Mirkin FMT_RG32UI, 3853ce80f924d07648040ab08a9cd30588621fb47a1Ilia Mirkin FMT_RG16UI, 3863ce80f924d07648040ab08a9cd30588621fb47a1Ilia Mirkin FMT_RG8UI, 3873ce80f924d07648040ab08a9cd30588621fb47a1Ilia Mirkin FMT_R32UI, 3883ce80f924d07648040ab08a9cd30588621fb47a1Ilia Mirkin FMT_R16UI, 3893ce80f924d07648040ab08a9cd30588621fb47a1Ilia Mirkin FMT_R8UI, 3903ce80f924d07648040ab08a9cd30588621fb47a1Ilia Mirkin 3913ce80f924d07648040ab08a9cd30588621fb47a1Ilia Mirkin FMT_RGBA32I, 3923ce80f924d07648040ab08a9cd30588621fb47a1Ilia Mirkin FMT_RGBA16I, 3933ce80f924d07648040ab08a9cd30588621fb47a1Ilia Mirkin FMT_RGBA8I, 3943ce80f924d07648040ab08a9cd30588621fb47a1Ilia Mirkin FMT_RG32I, 3953ce80f924d07648040ab08a9cd30588621fb47a1Ilia Mirkin FMT_RG16I, 3963ce80f924d07648040ab08a9cd30588621fb47a1Ilia Mirkin FMT_RG8I, 3973ce80f924d07648040ab08a9cd30588621fb47a1Ilia Mirkin FMT_R32I, 3983ce80f924d07648040ab08a9cd30588621fb47a1Ilia Mirkin FMT_R16I, 3993ce80f924d07648040ab08a9cd30588621fb47a1Ilia Mirkin FMT_R8I, 4003ce80f924d07648040ab08a9cd30588621fb47a1Ilia Mirkin 4013ce80f924d07648040ab08a9cd30588621fb47a1Ilia Mirkin FMT_RGBA16, 4023ce80f924d07648040ab08a9cd30588621fb47a1Ilia Mirkin FMT_RGB10A2, 4033ce80f924d07648040ab08a9cd30588621fb47a1Ilia Mirkin FMT_RGBA8, 4043ce80f924d07648040ab08a9cd30588621fb47a1Ilia Mirkin FMT_RG16, 4053ce80f924d07648040ab08a9cd30588621fb47a1Ilia Mirkin FMT_RG8, 4063ce80f924d07648040ab08a9cd30588621fb47a1Ilia Mirkin FMT_R16, 4073ce80f924d07648040ab08a9cd30588621fb47a1Ilia Mirkin FMT_R8, 4083ce80f924d07648040ab08a9cd30588621fb47a1Ilia Mirkin 4093ce80f924d07648040ab08a9cd30588621fb47a1Ilia Mirkin FMT_RGBA16_SNORM, 4103ce80f924d07648040ab08a9cd30588621fb47a1Ilia Mirkin FMT_RGBA8_SNORM, 4113ce80f924d07648040ab08a9cd30588621fb47a1Ilia Mirkin FMT_RG16_SNORM, 4123ce80f924d07648040ab08a9cd30588621fb47a1Ilia Mirkin FMT_RG8_SNORM, 4133ce80f924d07648040ab08a9cd30588621fb47a1Ilia Mirkin FMT_R16_SNORM, 4143ce80f924d07648040ab08a9cd30588621fb47a1Ilia Mirkin FMT_R8_SNORM, 4153ce80f924d07648040ab08a9cd30588621fb47a1Ilia Mirkin 4168e7893eb53213254997a1a3beb0575be11821f83Ilia Mirkin FMT_BGRA8, 4178e7893eb53213254997a1a3beb0575be11821f83Ilia Mirkin 4183ce80f924d07648040ab08a9cd30588621fb47a1Ilia Mirkin IMG_FORMAT_COUNT, 4193ce80f924d07648040ab08a9cd30588621fb47a1Ilia Mirkin}; 4203ce80f924d07648040ab08a9cd30588621fb47a1Ilia Mirkin 4213ce80f924d07648040ab08a9cd30588621fb47a1Ilia Mirkinenum ImgType { 4223ce80f924d07648040ab08a9cd30588621fb47a1Ilia Mirkin UINT, 4233ce80f924d07648040ab08a9cd30588621fb47a1Ilia Mirkin SINT, 4243ce80f924d07648040ab08a9cd30588621fb47a1Ilia Mirkin UNORM, 4253ce80f924d07648040ab08a9cd30588621fb47a1Ilia Mirkin SNORM, 4263ce80f924d07648040ab08a9cd30588621fb47a1Ilia Mirkin FLOAT, 4273ce80f924d07648040ab08a9cd30588621fb47a1Ilia Mirkin}; 4283ce80f924d07648040ab08a9cd30588621fb47a1Ilia Mirkin 42957594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerenum SVSemantic 43057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller{ 43157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller SV_POSITION, // WPOS 43257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller SV_VERTEX_ID, 43357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller SV_INSTANCE_ID, 43457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller SV_INVOCATION_ID, 43557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller SV_PRIMITIVE_ID, 43657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller SV_VERTEX_COUNT, // gl_PatchVerticesIn 43757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller SV_LAYER, 43857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller SV_VIEWPORT_INDEX, 43957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller SV_YDIR, 44057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller SV_FACE, 44157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller SV_POINT_SIZE, 44257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller SV_POINT_COORD, 44357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller SV_CLIP_DISTANCE, 44457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller SV_SAMPLE_INDEX, 445f715a0a39a0f7f19443e7721ae792878ba504eedIlia Mirkin SV_SAMPLE_POS, 446b3a2398aded19e25124a4a1d228eb3843827f6b2Ilia Mirkin SV_SAMPLE_MASK, 4477e0036a49258326cc2d875f2960d18c6b3665036Ilia Mirkin SV_TESS_OUTER, 4487e0036a49258326cc2d875f2960d18c6b3665036Ilia Mirkin SV_TESS_INNER, 44957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller SV_TESS_COORD, 45057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller SV_TID, 45157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller SV_CTAID, 45257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller SV_NTID, 45357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller SV_GRIDID, 45457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller SV_NCTAID, 45557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller SV_LANEID, 45657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller SV_PHYSID, 45757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller SV_NPHYSID, 45857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller SV_CLOCK, 45957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller SV_LBASE, 46057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller SV_SBASE, 46167250acbaba924ccaab696f2b348dfa898c41d0bChristoph Bumiller SV_VERTEX_STRIDE, 462d548d47edf9f05e6dbf9656abc2f8e78d02cb2f6Ben Skeggs SV_INVOCATION_INFO, 46339f51ec96f00f601b9c4d4e321dacb3af9dc866fIlia Mirkin SV_THREAD_KILL, 464517a93b346e720082e22e358b63b5dbc5c42aa09Ilia Mirkin SV_BASEVERTEX, 465517a93b346e720082e22e358b63b5dbc5c42aa09Ilia Mirkin SV_BASEINSTANCE, 466517a93b346e720082e22e358b63b5dbc5c42aa09Ilia Mirkin SV_DRAWID, 4672aa1197eee442ab960f6ad6b84d4cf58511d6cb7Hans de Goede SV_WORK_DIM, 46857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller SV_UNDEFINED, 46957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller SV_LAST 47057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller}; 47157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 47257594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerclass Program; 47357594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerclass Function; 47457594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerclass BasicBlock; 47557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 47657594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerclass Target; 47757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 47857594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerclass Instruction; 47957594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerclass CmpInstruction; 48057594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerclass TexInstruction; 48157594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerclass FlowInstruction; 48257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 48357594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerclass Value; 48457594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerclass LValue; 48557594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerclass Symbol; 48657594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerclass ImmediateValue; 48757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 48857594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerstruct Storage 48957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller{ 49057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller DataFile file; 49157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller int8_t fileIndex; // signed, may be indirect for CONST[] 49257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller uint8_t size; // this should match the Instruction type's size 49357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller DataType type; // mainly for pretty printing 49457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller union { 49557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller uint64_t u64; // immediate values 49657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller uint32_t u32; 49757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller uint16_t u16; 49857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller uint8_t u8; 49957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller int64_t s64; 50057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller int32_t s32; 50157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller int16_t s16; 50257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller int8_t s8; 50357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller float f32; 50457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller double f64; 50557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller int32_t offset; // offset from 0 (base of address space) 506e43a3a66a9d8a99021d76ff4d07dec7b8cfd62caChristoph Bumiller int32_t id; // register id (< 0 if virtual/unassigned, in units <= 4) 50757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller struct { 50857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller SVSemantic sv; 50957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller int index; 51057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller } sv; 51157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller } data; 51257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller}; 51357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 51457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller// precedence: NOT after SAT after NEG after ABS 51557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller#define NV50_IR_MOD_ABS (1 << 0) 51657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller#define NV50_IR_MOD_NEG (1 << 1) 51757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller#define NV50_IR_MOD_SAT (1 << 2) 51857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller#define NV50_IR_MOD_NOT (1 << 3) 51957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller#define NV50_IR_MOD_NEG_ABS (NV50_IR_MOD_NEG | NV50_IR_MOD_ABS) 52057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 52157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller#define NV50_IR_INTERP_MODE_MASK 0x3 52257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller#define NV50_IR_INTERP_LINEAR (0 << 0) 52357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller#define NV50_IR_INTERP_PERSPECTIVE (1 << 0) 52457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller#define NV50_IR_INTERP_FLAT (2 << 0) 52557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller#define NV50_IR_INTERP_SC (3 << 0) // what exactly is that ? 52657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller#define NV50_IR_INTERP_SAMPLE_MASK 0xc 52757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller#define NV50_IR_INTERP_DEFAULT (0 << 2) 52857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller#define NV50_IR_INTERP_CENTROID (1 << 2) 52957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller#define NV50_IR_INTERP_OFFSET (2 << 2) 53057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller#define NV50_IR_INTERP_SAMPLEID (3 << 2) 53157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 53257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller// do we really want this to be a class ? 53357594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerclass Modifier 53457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller{ 53557594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerpublic: 53657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Modifier() : bits(0) { } 53757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Modifier(unsigned int m) : bits(m) { } 53857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Modifier(operation op); 53957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 54057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller // @return new Modifier applying a after b (asserts if unrepresentable) 54157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Modifier operator*(const Modifier) const; 54214d5f975a65c57830077dabf2f95261afbc51773Francisco Jerez Modifier operator*=(const Modifier m) { *this = *this * m; return *this; } 54357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Modifier operator==(const Modifier m) const { return m.bits == bits; } 54457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Modifier operator!=(const Modifier m) const { return m.bits != bits; } 54557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 54657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline Modifier operator&(const Modifier m) const { return bits & m.bits; } 54757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline Modifier operator|(const Modifier m) const { return bits | m.bits; } 54857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline Modifier operator^(const Modifier m) const { return bits ^ m.bits; } 54957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 55057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller operation getOp() const; 55157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 55257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline int neg() const { return (bits & NV50_IR_MOD_NEG) ? 1 : 0; } 55357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline int abs() const { return (bits & NV50_IR_MOD_ABS) ? 1 : 0; } 55457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 55514d5f975a65c57830077dabf2f95261afbc51773Francisco Jerez inline operator bool() const { return bits ? true : false; } 55657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 55757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller void applyTo(ImmediateValue &imm) const; 55857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 55957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller int print(char *buf, size_t size) const; 56057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 56157594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerprivate: 56257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller uint8_t bits; 56357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller}; 56457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 56557594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerclass ValueRef 56657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller{ 56757594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerpublic: 56814d5f975a65c57830077dabf2f95261afbc51773Francisco Jerez ValueRef(Value * = NULL); 5698cc2eca5df0116aa7fb8233a9ab6ad1c9e4203cdFrancisco Jerez ValueRef(const ValueRef&); 57057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller ~ValueRef(); 57157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 57257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline bool exists() const { return value != NULL; } 57357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 57457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller void set(Value *); 57557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller void set(const ValueRef&); 57657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline Value *get() const { return value; } 57757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline Value *rep() const; 57857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 57957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline Instruction *getInsn() const { return insn; } 58057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline void setInsn(Instruction *inst) { insn = inst; } 58157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 58257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline bool isIndirect(int dim) const { return indirect[dim] >= 0; } 58357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline const ValueRef *getIndirect(int dim) const; 58457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 58557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline DataFile getFile() const; 58657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline unsigned getSize() const; 58757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 58857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller // SSA: return eventual (traverse MOVs) literal value, if it exists 589d6d1f0e4a25c9fbefce7485d77617855a8ea956aFrancisco Jerez bool getImmediate(ImmediateValue&) const; 59057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 59157594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerpublic: 59257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Modifier mod; 5939362d4bc0a03860ec386156cf499e855a9c2d2a5Christoph Bumiller int8_t indirect[2]; // >= 0 if relative to lvalue in insn->src(indirect[i]) 59457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller uint8_t swizzle; 59557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 59657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller bool usedAsPtr; // for printing 59757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 59857594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerprivate: 59957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Value *value; 60057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Instruction *insn; 60157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller}; 60257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 60357594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerclass ValueDef 60457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller{ 60557594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerpublic: 60614d5f975a65c57830077dabf2f95261afbc51773Francisco Jerez ValueDef(Value * = NULL); 6078cc2eca5df0116aa7fb8233a9ab6ad1c9e4203cdFrancisco Jerez ValueDef(const ValueDef&); 60857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller ~ValueDef(); 60957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 61057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline bool exists() const { return value != NULL; } 61157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 61257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline Value *get() const { return value; } 61357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline Value *rep() const; 61457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller void set(Value *); 61514d5f975a65c57830077dabf2f95261afbc51773Francisco Jerez bool mayReplace(const ValueRef &); 61614d5f975a65c57830077dabf2f95261afbc51773Francisco Jerez void replace(const ValueRef &, bool doSet); // replace all uses of the old value 61757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 61857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline Instruction *getInsn() const { return insn; } 61957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline void setInsn(Instruction *inst) { insn = inst; } 62057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 62157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline DataFile getFile() const; 62257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline unsigned getSize() const; 62357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 62457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline void setSSA(LValue *); 62557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline const LValue *preSSA() const; 62657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 62757594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerprivate: 62857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Value *value; // should make this LValue * ... 6298cc2eca5df0116aa7fb8233a9ab6ad1c9e4203cdFrancisco Jerez LValue *origin; // pre SSA value 63057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Instruction *insn; 63157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller}; 63257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 63357594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerclass Value 63457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller{ 63557594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerpublic: 63657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Value(); 637da28ba00d84f59650bf180769d9d9a1609eb6164Francisco Jerez virtual ~Value() { } 63857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 639a05e6a3fa28168d58a13cfb07f7a664e84b925aeFrancisco Jerez virtual Value *clone(ClonePolicy<Function>&) const = 0; 64057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 64157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller virtual int print(char *, size_t, DataType ty = TYPE_NONE) const = 0; 64257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 64357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller virtual bool equals(const Value *, bool strict = false) const; 64457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller virtual bool interfers(const Value *) const; 645a765d7880f80d01be261a5d1f4b356a2b6fcfaadChristoph Bumiller virtual bool isUniform() const { return true; } 64657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 6479362d4bc0a03860ec386156cf499e855a9c2d2a5Christoph Bumiller inline Value *rep() const { return join; } 6489362d4bc0a03860ec386156cf499e855a9c2d2a5Christoph Bumiller 64957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline Instruction *getUniqueInsn() const; 65057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline Instruction *getInsn() const; // use when uniqueness is certain 65157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 6528cc2eca5df0116aa7fb8233a9ab6ad1c9e4203cdFrancisco Jerez inline int refCount() { return uses.size(); } 65357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 65457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline LValue *asLValue(); 65557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline Symbol *asSym(); 65657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline ImmediateValue *asImm(); 65757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline const Symbol *asSym() const; 65857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline const ImmediateValue *asImm() const; 65957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 66057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline bool inFile(DataFile f) { return reg.file == f; } 66157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 66257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller static inline Value *get(Iterator&); 66357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 6642a4af36517333ef61d5f7ca2264fec3f49ee3662Chih-Wei Huang unordered_set<ValueRef *> uses; 6658cc2eca5df0116aa7fb8233a9ab6ad1c9e4203cdFrancisco Jerez std::list<ValueDef *> defs; 6662a4af36517333ef61d5f7ca2264fec3f49ee3662Chih-Wei Huang typedef unordered_set<ValueRef *>::iterator UseIterator; 6672a4af36517333ef61d5f7ca2264fec3f49ee3662Chih-Wei Huang typedef unordered_set<ValueRef *>::const_iterator UseCIterator; 6688cc2eca5df0116aa7fb8233a9ab6ad1c9e4203cdFrancisco Jerez typedef std::list<ValueDef *>::iterator DefIterator; 6698cc2eca5df0116aa7fb8233a9ab6ad1c9e4203cdFrancisco Jerez typedef std::list<ValueDef *>::const_iterator DefCIterator; 67057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 67157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller int id; 67257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Storage reg; 67357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 67457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller // TODO: these should be in LValue: 67557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Interval livei; 67657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Value *join; 67757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller}; 67857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 67957594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerclass LValue : public Value 68057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller{ 68157594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerpublic: 68257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller LValue(Function *, DataFile file); 68357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller LValue(Function *, LValue *); 684da28ba00d84f59650bf180769d9d9a1609eb6164Francisco Jerez ~LValue() { } 68557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 686a765d7880f80d01be261a5d1f4b356a2b6fcfaadChristoph Bumiller virtual bool isUniform() const; 687a765d7880f80d01be261a5d1f4b356a2b6fcfaadChristoph Bumiller 688a05e6a3fa28168d58a13cfb07f7a664e84b925aeFrancisco Jerez virtual LValue *clone(ClonePolicy<Function>&) const; 68957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 69057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller virtual int print(char *, size_t, DataType ty = TYPE_NONE) const; 69157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 69257594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerpublic: 693e43a3a66a9d8a99021d76ff4d07dec7b8cfd62caChristoph Bumiller unsigned compMask : 8; // compound/component mask 694e43a3a66a9d8a99021d76ff4d07dec7b8cfd62caChristoph Bumiller unsigned compound : 1; // used by RA, value involved in split/merge 695e43a3a66a9d8a99021d76ff4d07dec7b8cfd62caChristoph Bumiller unsigned ssa : 1; 696e43a3a66a9d8a99021d76ff4d07dec7b8cfd62caChristoph Bumiller unsigned fixedReg : 1; // set & used by RA, earlier just use (id < 0) 697e43a3a66a9d8a99021d76ff4d07dec7b8cfd62caChristoph Bumiller unsigned noSpill : 1; // do not spill (e.g. if spill temporary already) 69857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller}; 69957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 70057594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerclass Symbol : public Value 70157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller{ 70257594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerpublic: 70357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Symbol(Program *, DataFile file = FILE_MEMORY_CONST, ubyte fileIdx = 0); 704da28ba00d84f59650bf180769d9d9a1609eb6164Francisco Jerez ~Symbol() { } 70557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 706a05e6a3fa28168d58a13cfb07f7a664e84b925aeFrancisco Jerez virtual Symbol *clone(ClonePolicy<Function>&) const; 70757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 70857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller virtual bool equals(const Value *that, bool strict) const; 70957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 710a765d7880f80d01be261a5d1f4b356a2b6fcfaadChristoph Bumiller virtual bool isUniform() const; 711a765d7880f80d01be261a5d1f4b356a2b6fcfaadChristoph Bumiller 71257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller virtual int print(char *, size_t, DataType ty = TYPE_NONE) const; 71357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 71457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller // print with indirect values 71557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller int print(char *, size_t, Value *, Value *, DataType ty = TYPE_NONE) const; 71657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 71757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline void setFile(DataFile file, ubyte fileIndex = 0) 71857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller { 71957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller reg.file = file; 72057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller reg.fileIndex = fileIndex; 72157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller } 72257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 72357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline void setOffset(int32_t offset); 72457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline void setAddress(Symbol *base, int32_t offset); 72557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline void setSV(SVSemantic sv, uint32_t idx = 0); 72657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 72757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline const Symbol *getBase() const { return baseSym; } 72857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 72957594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerprivate: 73057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Symbol *baseSym; // array base for Symbols representing array elements 73157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller}; 73257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 73357594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerclass ImmediateValue : public Value 73457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller{ 73557594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerpublic: 736d6d1f0e4a25c9fbefce7485d77617855a8ea956aFrancisco Jerez ImmediateValue() { } 73757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller ImmediateValue(Program *, uint32_t); 73857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller ImmediateValue(Program *, float); 73957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller ImmediateValue(Program *, double); 74057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller // NOTE: not added to program with 74157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller ImmediateValue(const ImmediateValue *, DataType ty); 742da28ba00d84f59650bf180769d9d9a1609eb6164Francisco Jerez ~ImmediateValue() { }; 74357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 744784848a94d621b11020838fc058fc04a7fc57aa9Francisco Jerez virtual ImmediateValue *clone(ClonePolicy<Function>&) const; 745784848a94d621b11020838fc058fc04a7fc57aa9Francisco Jerez 74657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller virtual bool equals(const Value *that, bool strict) const; 74757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 74857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller // these only work if 'type' is valid (we mostly use untyped literals): 74957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller bool isInteger(const int ival) const; // ival is cast to this' type 75057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller bool isNegative() const; 75157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller bool isPow2() const; 75257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 75357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller void applyLog2(); 75457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 75557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller // for constant folding: 75657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller ImmediateValue operator+(const ImmediateValue&) const; 75757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller ImmediateValue operator-(const ImmediateValue&) const; 75857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller ImmediateValue operator*(const ImmediateValue&) const; 75957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller ImmediateValue operator/(const ImmediateValue&) const; 76057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 761d6d1f0e4a25c9fbefce7485d77617855a8ea956aFrancisco Jerez ImmediateValue& operator=(const ImmediateValue&); // only sets value ! 762d6d1f0e4a25c9fbefce7485d77617855a8ea956aFrancisco Jerez 76357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller bool compare(CondCode cc, float fval) const; 76457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 76557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller virtual int print(char *, size_t, DataType ty = TYPE_NONE) const; 76657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller}; 76757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 76857594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerclass Instruction 76957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller{ 77057594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerpublic: 77157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Instruction(); 77257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Instruction(Function *, operation, DataType); 77357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller virtual ~Instruction(); 77457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 775a05e6a3fa28168d58a13cfb07f7a664e84b925aeFrancisco Jerez virtual Instruction *clone(ClonePolicy<Function>&, 776a05e6a3fa28168d58a13cfb07f7a664e84b925aeFrancisco Jerez Instruction * = NULL) const; 77757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 7788cc2eca5df0116aa7fb8233a9ab6ad1c9e4203cdFrancisco Jerez void setDef(int i, Value *); 7798cc2eca5df0116aa7fb8233a9ab6ad1c9e4203cdFrancisco Jerez void setSrc(int s, Value *); 7808cc2eca5df0116aa7fb8233a9ab6ad1c9e4203cdFrancisco Jerez void setSrc(int s, const ValueRef&); 78157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller void swapSources(int a, int b); 782ce1951daed9a4685bf559b4222f50510cb412301Christoph Bumiller void moveSources(int s, int delta); 78357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller bool setIndirect(int s, int dim, Value *); 78457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 7859362d4bc0a03860ec386156cf499e855a9c2d2a5Christoph Bumiller inline ValueRef& src(int s) { return srcs[s]; } 7869362d4bc0a03860ec386156cf499e855a9c2d2a5Christoph Bumiller inline ValueDef& def(int s) { return defs[s]; } 7879362d4bc0a03860ec386156cf499e855a9c2d2a5Christoph Bumiller inline const ValueRef& src(int s) const { return srcs[s]; } 7889362d4bc0a03860ec386156cf499e855a9c2d2a5Christoph Bumiller inline const ValueDef& def(int s) const { return defs[s]; } 7899362d4bc0a03860ec386156cf499e855a9c2d2a5Christoph Bumiller 7909362d4bc0a03860ec386156cf499e855a9c2d2a5Christoph Bumiller inline Value *getDef(int d) const { return defs[d].get(); } 7919362d4bc0a03860ec386156cf499e855a9c2d2a5Christoph Bumiller inline Value *getSrc(int s) const { return srcs[s].get(); } 79257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline Value *getIndirect(int s, int dim) const; 79357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 7948cc2eca5df0116aa7fb8233a9ab6ad1c9e4203cdFrancisco Jerez inline bool defExists(unsigned d) const 7958cc2eca5df0116aa7fb8233a9ab6ad1c9e4203cdFrancisco Jerez { 7969362d4bc0a03860ec386156cf499e855a9c2d2a5Christoph Bumiller return d < defs.size() && defs[d].exists(); 7978cc2eca5df0116aa7fb8233a9ab6ad1c9e4203cdFrancisco Jerez } 7988cc2eca5df0116aa7fb8233a9ab6ad1c9e4203cdFrancisco Jerez inline bool srcExists(unsigned s) const 7998cc2eca5df0116aa7fb8233a9ab6ad1c9e4203cdFrancisco Jerez { 8009362d4bc0a03860ec386156cf499e855a9c2d2a5Christoph Bumiller return s < srcs.size() && srcs[s].exists(); 8018cc2eca5df0116aa7fb8233a9ab6ad1c9e4203cdFrancisco Jerez } 80257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 803e43a3a66a9d8a99021d76ff4d07dec7b8cfd62caChristoph Bumiller inline bool constrainedDefs() const; 80457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 80557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller bool setPredicate(CondCode ccode, Value *); 80657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline Value *getPredicate() const; 80757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller bool writesPredicate() const; 808ca1fc2b86400e3fc9dd0517863e22721b5e91c77Christoph Bumiller inline bool isPredicated() const { return predSrc >= 0; } 80957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 81056cf2da02226aee6b7476675c0e05ac7c218756eChristoph Bumiller inline void setFlagsSrc(int s, Value *); 81156cf2da02226aee6b7476675c0e05ac7c218756eChristoph Bumiller inline void setFlagsDef(int d, Value *); 81299e4eba669f13a0dc80880f4f91e2338377c1667Christoph Bumiller inline bool usesFlags() const { return flagsSrc >= 0; } 81356cf2da02226aee6b7476675c0e05ac7c218756eChristoph Bumiller 8149362d4bc0a03860ec386156cf499e855a9c2d2a5Christoph Bumiller unsigned int defCount() const { return defs.size(); }; 815e43a3a66a9d8a99021d76ff4d07dec7b8cfd62caChristoph Bumiller unsigned int defCount(unsigned int mask, bool singleFile = false) const; 8169362d4bc0a03860ec386156cf499e855a9c2d2a5Christoph Bumiller unsigned int srcCount() const { return srcs.size(); }; 817e43a3a66a9d8a99021d76ff4d07dec7b8cfd62caChristoph Bumiller unsigned int srcCount(unsigned int mask, bool singleFile = false) const; 81857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 81957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller // save & remove / set indirect[0,1] and predicate source 82057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller void takeExtraSources(int s, Value *[3]); 82157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller void putExtraSources(int s, Value *[3]); 82257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 82357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline void setType(DataType type) { dType = sType = type; } 82457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 82557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline void setType(DataType dtype, DataType stype) 82657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller { 82757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller dType = dtype; 82857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller sType = stype; 82957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller } 83057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 83157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline bool isPseudo() const { return op < OP_MOV; } 83257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller bool isDead() const; 83357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller bool isNop() const; 83457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller bool isCommutationLegal(const Instruction *) const; // must be adjacent ! 83557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller bool isActionEqual(const Instruction *) const; 83657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller bool isResultEqual(const Instruction *) const; 83757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 838d0cf7a6beb4470d945bccb4e753cc7eb6ca5dda8Karol Herbst // check whether the defs interfere with srcs and defs of another instruction 839d0cf7a6beb4470d945bccb4e753cc7eb6ca5dda8Karol Herbst bool canCommuteDefDef(const Instruction *) const; 840d0cf7a6beb4470d945bccb4e753cc7eb6ca5dda8Karol Herbst bool canCommuteDefSrc(const Instruction *) const; 841d0cf7a6beb4470d945bccb4e753cc7eb6ca5dda8Karol Herbst 84257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller void print() const; 84357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 84457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline CmpInstruction *asCmp(); 84557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline TexInstruction *asTex(); 84657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline FlowInstruction *asFlow(); 84757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline const TexInstruction *asTex() const; 84857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline const CmpInstruction *asCmp() const; 84957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline const FlowInstruction *asFlow() const; 85057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 85157594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerpublic: 85257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Instruction *next; 85357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Instruction *prev; 85457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller int id; 85557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller int serial; // CFG order 85657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 85757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller operation op; 85857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller DataType dType; // destination or defining type 85957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller DataType sType; // source or secondary type 86057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CondCode cc; 86157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller RoundMode rnd; 86257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CacheMode cache; 86357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 86422b762f9b495b14400f30bd6537f7c5a6d262325Christoph Bumiller uint16_t subOp; // quadop, 1 for mul-high, etc. 865afcd7b5d1614a8a758ccb4353a9c31a601c9b9b4Christoph Bumiller 86657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller unsigned encSize : 4; // encoding size in bytes 86757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller unsigned saturate : 1; // to [0.0f, 1.0f] 86857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller unsigned join : 1; // converge control flow (use OP_JOIN until end) 86957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller unsigned fixed : 1; // prevent dead code elimination 87057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller unsigned terminator : 1; // end of basic block 87157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller unsigned ftz : 1; // flush denormal to zero 87257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller unsigned dnz : 1; // denormals, NaN are zero 87357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller unsigned ipa : 4; // interpolation mode 87457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller unsigned lanes : 4; 87557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller unsigned perPatch : 1; 87657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller unsigned exit : 1; // terminate program after insn 87722b762f9b495b14400f30bd6537f7c5a6d262325Christoph Bumiller unsigned mask : 4; // for vector ops 87857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 87957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller int8_t postFactor; // MUL/DIV(if < 0) by 1 << postFactor 88057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 88157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller int8_t predSrc; 88257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller int8_t flagsDef; 88357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller int8_t flagsSrc; 88457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 885bede1bdb4828ea673bc7859db4058da7e35c6774Ben Skeggs uint32_t sched; // scheduling data (NOTE: maybe move to separate storage) 88622b762f9b495b14400f30bd6537f7c5a6d262325Christoph Bumiller 88757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller BasicBlock *bb; 88857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 8899362d4bc0a03860ec386156cf499e855a9c2d2a5Christoph Bumillerprotected: 8909362d4bc0a03860ec386156cf499e855a9c2d2a5Christoph Bumiller std::deque<ValueDef> defs; // no gaps ! 8919362d4bc0a03860ec386156cf499e855a9c2d2a5Christoph Bumiller std::deque<ValueRef> srcs; // no gaps ! 8929362d4bc0a03860ec386156cf499e855a9c2d2a5Christoph Bumiller 89357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller // instruction specific methods: 89457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller // (don't want to subclass, would need more constructors and memory pools) 89557594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerpublic: 89657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline void setInterpolate(unsigned int mode) { ipa = mode; } 89757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 89857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller unsigned int getInterpMode() const { return ipa & 0x3; } 89957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller unsigned int getSampleMode() const { return ipa & 0xc; } 90057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 90157594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerprivate: 90257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller void init(); 90357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller}; 90457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 90557594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerenum TexQuery 90657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller{ 9074294db90b1804dd213b0b4b3ff4eb46a5c390c76Ilia Mirkin TXQ_DIMS, /* x, y, z, levels */ 9084294db90b1804dd213b0b4b3ff4eb46a5c390c76Ilia Mirkin TXQ_TYPE, /* ?, ?, samples, ? */ 90957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller TXQ_SAMPLE_POSITION, 91057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller TXQ_FILTER, 91157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller TXQ_LOD, 91257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller TXQ_WRAP, 91357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller TXQ_BORDER_COLOUR 91457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller}; 91557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 91657594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerclass TexInstruction : public Instruction 91757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller{ 91857594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerpublic: 91957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller class Target 92057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller { 92157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller public: 92257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Target(TexTarget targ = TEX_TARGET_2D) : target(targ) { } 92357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 92457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller const char *getName() const { return descTable[target].name; } 92557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller unsigned int getArgCount() const { return descTable[target].argc; } 92657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller unsigned int getDim() const { return descTable[target].dim; } 92757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller int isArray() const { return descTable[target].array ? 1 : 0; } 92857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller int isCube() const { return descTable[target].cube ? 1 : 0; } 92957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller int isShadow() const { return descTable[target].shadow ? 1 : 0; } 9304da54c91d24da891c56957f29274e7821c8254f6Christoph Bumiller int isMS() const { 9314da54c91d24da891c56957f29274e7821c8254f6Christoph Bumiller return target == TEX_TARGET_2D_MS || target == TEX_TARGET_2D_MS_ARRAY; } 9323bd40073b9803baf62f77ed5ac79979e037d2ed6Ilia Mirkin void clearMS() { 9333bd40073b9803baf62f77ed5ac79979e037d2ed6Ilia Mirkin if (isMS()) { 9343bd40073b9803baf62f77ed5ac79979e037d2ed6Ilia Mirkin if (isArray()) 9353bd40073b9803baf62f77ed5ac79979e037d2ed6Ilia Mirkin target = TEX_TARGET_2D_ARRAY; 9363bd40073b9803baf62f77ed5ac79979e037d2ed6Ilia Mirkin else 9373bd40073b9803baf62f77ed5ac79979e037d2ed6Ilia Mirkin target = TEX_TARGET_2D; 9383bd40073b9803baf62f77ed5ac79979e037d2ed6Ilia Mirkin } 9393bd40073b9803baf62f77ed5ac79979e037d2ed6Ilia Mirkin } 94057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 94157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Target& operator=(TexTarget targ) 94257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller { 94357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller assert(targ < TEX_TARGET_COUNT); 944f7599b2c32185535b4c215de0ba0454129fa523fChristoph Bumiller target = targ; 94557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller return *this; 94657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller } 94757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 94857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline bool operator==(TexTarget targ) const { return target == targ; } 9494506ed28de7f9d76bbc99c0758a7891b84528729Christoph Bumiller inline bool operator!=(TexTarget targ) const { return target != targ; } 9504506ed28de7f9d76bbc99c0758a7891b84528729Christoph Bumiller 9514506ed28de7f9d76bbc99c0758a7891b84528729Christoph Bumiller enum TexTarget getEnum() const { return target; } 95257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 95357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller private: 95457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller struct Desc 95557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller { 95657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller char name[19]; 95757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller uint8_t dim; 95857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller uint8_t argc; 95957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller bool array; 96057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller bool cube; 96157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller bool shadow; 96257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller }; 96357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 96457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller static const struct Desc descTable[TEX_TARGET_COUNT]; 96557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 96657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller private: 96757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller enum TexTarget target; 96857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller }; 96957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 97057594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerpublic: 9713ce80f924d07648040ab08a9cd30588621fb47a1Ilia Mirkin struct ImgFormatDesc 9723ce80f924d07648040ab08a9cd30588621fb47a1Ilia Mirkin { 9733ce80f924d07648040ab08a9cd30588621fb47a1Ilia Mirkin char name[19]; 9743ce80f924d07648040ab08a9cd30588621fb47a1Ilia Mirkin uint8_t components; 9753ce80f924d07648040ab08a9cd30588621fb47a1Ilia Mirkin uint8_t bits[4]; 9763ce80f924d07648040ab08a9cd30588621fb47a1Ilia Mirkin ImgType type; 9778e7893eb53213254997a1a3beb0575be11821f83Ilia Mirkin bool bgra; 9783ce80f924d07648040ab08a9cd30588621fb47a1Ilia Mirkin }; 9793ce80f924d07648040ab08a9cd30588621fb47a1Ilia Mirkin 9803ce80f924d07648040ab08a9cd30588621fb47a1Ilia Mirkin static const struct ImgFormatDesc formatTable[IMG_FORMAT_COUNT]; 9813ce80f924d07648040ab08a9cd30588621fb47a1Ilia Mirkin 9823ce80f924d07648040ab08a9cd30588621fb47a1Ilia Mirkinpublic: 98357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller TexInstruction(Function *, operation); 98457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller virtual ~TexInstruction(); 98557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 986a05e6a3fa28168d58a13cfb07f7a664e84b925aeFrancisco Jerez virtual TexInstruction *clone(ClonePolicy<Function>&, 987a05e6a3fa28168d58a13cfb07f7a664e84b925aeFrancisco Jerez Instruction * = NULL) const; 98857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 98957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline void setTexture(Target targ, uint8_t r, uint8_t s) 99057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller { 99157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller tex.r = r; 99257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller tex.s = s; 99357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller tex.target = targ; 99457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller } 99557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 9967a91d3a2a4c4e7851fdb46465224213ce1874c9bChristoph Bumiller void setIndirectR(Value *); 9977a91d3a2a4c4e7851fdb46465224213ce1874c9bChristoph Bumiller void setIndirectS(Value *); 99857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline Value *getIndirectR() const; 99957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline Value *getIndirectS() const; 100057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 100157594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerpublic: 100257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller struct { 100357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Target target; 100457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 1005c2dfcd7f0eaf4eda375eb320e0e87793a80ef92dChristoph Bumiller uint16_t r; 1006c2dfcd7f0eaf4eda375eb320e0e87793a80ef92dChristoph Bumiller uint16_t s; 100757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller int8_t rIndirectSrc; 100857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller int8_t sIndirectSrc; 100957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 101057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller uint8_t mask; 101157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller uint8_t gatherComp; 101257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 101357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller bool liveOnly; // only execute on live pixels of a quad (optimization) 101457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller bool levelZero; 10159c930639d9f6d713ccfd16b390a41a9f584f348cChristoph Bumiller bool derivAll; 101657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 101757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller int8_t useOffsets; // 0, 1, or 4 for textureGatherOffsets 1018f3aa999383074d666d6e3f3506e66b0c937904caIlia Mirkin int8_t offset[3]; // only used on nv50 101957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 102057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller enum TexQuery query; 10213ce80f924d07648040ab08a9cd30588621fb47a1Ilia Mirkin const struct ImgFormatDesc *format; 102257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller } tex; 102357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 102457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller ValueRef dPdx[3]; 102557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller ValueRef dPdy[3]; 1026f3aa999383074d666d6e3f3506e66b0c937904caIlia Mirkin ValueRef offset[4][3]; 102757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller}; 102857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 102957594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerclass CmpInstruction : public Instruction 103057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller{ 103157594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerpublic: 103257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CmpInstruction(Function *, operation); 103357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 1034a05e6a3fa28168d58a13cfb07f7a664e84b925aeFrancisco Jerez virtual CmpInstruction *clone(ClonePolicy<Function>&, 1035a05e6a3fa28168d58a13cfb07f7a664e84b925aeFrancisco Jerez Instruction * = NULL) const; 103657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 103757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller void setCondition(CondCode cond) { setCond = cond; } 103857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CondCode getCondition() const { return setCond; } 103957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 104057594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerpublic: 104157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CondCode setCond; 104257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller}; 104357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 104457594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerclass FlowInstruction : public Instruction 104557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller{ 104657594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerpublic: 10479bb36d54a2c69ebdc9d1c9c4c71945060de8c860Francisco Jerez FlowInstruction(Function *, operation, void *target); 104857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 1049784848a94d621b11020838fc058fc04a7fc57aa9Francisco Jerez virtual FlowInstruction *clone(ClonePolicy<Function>&, 1050784848a94d621b11020838fc058fc04a7fc57aa9Francisco Jerez Instruction * = NULL) const; 1051784848a94d621b11020838fc058fc04a7fc57aa9Francisco Jerez 105257594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerpublic: 105357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller unsigned allWarp : 1; 105457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller unsigned absolute : 1; 105557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller unsigned limit : 1; 105657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller unsigned builtin : 1; // true for calls to emulation code 1057c893b9406060d3735b2c9e307ae89f6d83a4be40Christoph Bumiller unsigned indirect : 1; // target in src(0) 105857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 105957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller union { 106057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller BasicBlock *bb; 106157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller int builtin; 106257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Function *fn; 106357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller } target; 106457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller}; 106557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 106657594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerclass BasicBlock 106757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller{ 106857594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerpublic: 106957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller BasicBlock(Function *); 107057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller ~BasicBlock(); 107157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 1072784848a94d621b11020838fc058fc04a7fc57aa9Francisco Jerez BasicBlock *clone(ClonePolicy<Function>&) const; 1073784848a94d621b11020838fc058fc04a7fc57aa9Francisco Jerez 107457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline int getId() const { return id; } 107557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline unsigned int getInsnCount() const { return numInsns; } 107657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline bool isTerminated() const { return exit && exit->terminator; } 107757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 107857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller bool dominatedBy(BasicBlock *bb); 107940c224a573f2b763046001e622aafca90f68c693Christoph Bumiller inline bool reachableBy(const BasicBlock *by, const BasicBlock *term); 108057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 108157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller // returns mask of conditional out blocks 108257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller // e.g. 3 for IF { .. } ELSE { .. } ENDIF, 1 for IF { .. } ENDIF 108357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller unsigned int initiatesSimpleConditional() const; 108457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 108557594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerpublic: 108657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Function *getFunction() const { return func; } 108757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Program *getProgram() const { return program; } 108857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 108957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Instruction *getEntry() const { return entry; } // first non-phi instruction 109057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Instruction *getPhi() const { return phi; } 109157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Instruction *getFirst() const { return phi ? phi : entry; } 109257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Instruction *getExit() const { return exit; } 109357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 109457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller void insertHead(Instruction *); 109557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller void insertTail(Instruction *); 109657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller void insertBefore(Instruction *, Instruction *); 109757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller void insertAfter(Instruction *, Instruction *); 109857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller void remove(Instruction *); 109957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller void permuteAdjacent(Instruction *, Instruction *); 110057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 110157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller BasicBlock *idom() const; 110257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 1103c04d6d95e0efb8eea4d788d8d7b629209a3afaeaChristoph Bumiller // NOTE: currently does not rebuild the dominator tree 1104c04d6d95e0efb8eea4d788d8d7b629209a3afaeaChristoph Bumiller BasicBlock *splitBefore(Instruction *, bool attach = true); 1105c04d6d95e0efb8eea4d788d8d7b629209a3afaeaChristoph Bumiller BasicBlock *splitAfter(Instruction *, bool attach = true); 1106c04d6d95e0efb8eea4d788d8d7b629209a3afaeaChristoph Bumiller 110757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller DLList& getDF() { return df; } 110857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller DLList::Iterator iterDF() { return df.iterator(); } 110957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 111057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller static inline BasicBlock *get(Iterator&); 111157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller static inline BasicBlock *get(Graph::Node *); 111257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 111357594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerpublic: 111457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Graph::Node cfg; // first edge is branch *taken* (the ELSE branch) 111557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Graph::Node dom; 111657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 111757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller BitSet liveSet; 11183e9150cd961b2399e402e940400deae11ec7852fFrancisco Jerez BitSet defSet; 111957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 112057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller uint32_t binPos; 112157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller uint32_t binSize; 112257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 112357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Instruction *joinAt; // for quick reference 112457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 112557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller bool explicitCont; // loop headers: true if loop contains continue stmts 112657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 112757594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerprivate: 112857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller int id; 112957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller DLList df; 113057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 113157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Instruction *phi; 113257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Instruction *entry; 113357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Instruction *exit; 113457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 113557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller unsigned int numInsns; 113657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 113757594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerprivate: 113857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Function *func; 113957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Program *program; 1140c04d6d95e0efb8eea4d788d8d7b629209a3afaeaChristoph Bumiller 1141c04d6d95e0efb8eea4d788d8d7b629209a3afaeaChristoph Bumiller void splitCommon(Instruction *, BasicBlock *, bool attach); 114257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller}; 114357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 114457594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerclass Function 114557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller{ 114657594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerpublic: 114798116cc3dc3fc2cd84990cc2c968f05fe2978b4aFrancisco Jerez Function(Program *, const char *name, uint32_t label); 114857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller ~Function(); 114957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 1150d32ebb8c304725fa6bb7ec2d3d40ce828c713917Francisco Jerez static inline Function *get(Graph::Node *node); 1151d32ebb8c304725fa6bb7ec2d3d40ce828c713917Francisco Jerez 115257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline Program *getProgram() const { return prog; } 115357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline const char *getName() const { return name; } 115457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline int getId() const { return id; } 115598116cc3dc3fc2cd84990cc2c968f05fe2978b4aFrancisco Jerez inline uint32_t getLabel() const { return label; } 115657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 115757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller void print(); 115857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller void printLiveIntervals() const; 115957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller void printCFGraph(const char *filePath); 116057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 116157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller bool setEntry(BasicBlock *); 116257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller bool setExit(BasicBlock *); 116357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 116457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller unsigned int orderInstructions(ArrayList&); 116557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 116657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline void add(BasicBlock *bb, int& id) { allBBlocks.insert(bb, id); } 116757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline void add(Instruction *insn, int& id) { allInsns.insert(insn, id); } 116857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline void add(LValue *lval, int& id) { allLValues.insert(lval, id); } 116957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 117057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline LValue *getLValue(int id); 117157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 1172898b0981b6c90d2f1e446a532b6ac3cbbb49747dFrancisco Jerez void buildLiveSets(); 11733e9150cd961b2399e402e940400deae11ec7852fFrancisco Jerez void buildDefSets(); 117457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller bool convertToSSA(); 117557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 117657594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerpublic: 1177a3dd45e1c27e4e55dadb9467c2ea428f58083ac1Francisco Jerez std::deque<ValueDef> ins; 1178a3dd45e1c27e4e55dadb9467c2ea428f58083ac1Francisco Jerez std::deque<ValueRef> outs; 1179a3dd45e1c27e4e55dadb9467c2ea428f58083ac1Francisco Jerez std::deque<Value *> clobbers; 1180a3dd45e1c27e4e55dadb9467c2ea428f58083ac1Francisco Jerez 118157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Graph cfg; 118257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Graph::Node *cfgExit; 118357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Graph *domTree; 118457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Graph::Node call; // node in the call graph 118557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 118657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller BasicBlock **bbArray; // BBs in emission order 118757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller int bbCount; 118857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 118957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller unsigned int loopNestingBound; 119057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller int regClobberMax; 119157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 119257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller uint32_t binPos; 119357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller uint32_t binSize; 119457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 1195e43a3a66a9d8a99021d76ff4d07dec7b8cfd62caChristoph Bumiller Value *stackPtr; 1196e43a3a66a9d8a99021d76ff4d07dec7b8cfd62caChristoph Bumiller 1197e43a3a66a9d8a99021d76ff4d07dec7b8cfd62caChristoph Bumiller uint32_t tlsBase; // base address for l[] space (if no stack pointer is used) 1198e43a3a66a9d8a99021d76ff4d07dec7b8cfd62caChristoph Bumiller uint32_t tlsSize; 1199e43a3a66a9d8a99021d76ff4d07dec7b8cfd62caChristoph Bumiller 120057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller ArrayList allBBlocks; 120157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller ArrayList allInsns; 120257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller ArrayList allLValues; 120357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 120457594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerprivate: 120557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller void buildLiveSetsPreSSA(BasicBlock *, const int sequence); 12063e9150cd961b2399e402e940400deae11ec7852fFrancisco Jerez void buildDefSetsPreSSA(BasicBlock *bb, const int seq); 120757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 120857594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerprivate: 120998116cc3dc3fc2cd84990cc2c968f05fe2978b4aFrancisco Jerez uint32_t label; 121057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller int id; 121157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller const char *const name; 121257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Program *prog; 121357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller}; 121457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 121557594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerenum CGStage 121657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller{ 121757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CG_STAGE_PRE_SSA, 121857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CG_STAGE_SSA, // expected directly before register allocation 121957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller CG_STAGE_POST_RA 122057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller}; 122157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 122257594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerclass Program 122357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller{ 122457594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerpublic: 122557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller enum Type 122657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller { 122757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller TYPE_VERTEX, 122857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller TYPE_TESSELLATION_CONTROL, 122957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller TYPE_TESSELLATION_EVAL, 123057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller TYPE_GEOMETRY, 123157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller TYPE_FRAGMENT, 123257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller TYPE_COMPUTE 123357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller }; 123457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 123557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Program(Type type, Target *targ); 123657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller ~Program(); 123757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 123857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller void print(); 123957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 124057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Type getType() const { return progType; } 124157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 124257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline void add(Function *fn, int& id) { allFuncs.insert(fn, id); } 12435e4b2a1a47ca9a173f6419ed2f12c9fba80e757cFrancisco Jerez inline void del(Function *fn, int& id) { allFuncs.remove(id); } 124457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller inline void add(Value *rval, int& id) { allRValues.insert(rval, id); } 124557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 124657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller bool makeFromTGSI(struct nv50_ir_prog_info *); 124757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller bool makeFromSM4(struct nv50_ir_prog_info *); 124857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller bool convertToSSA(); 124957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller bool optimizeSSA(int level); 125057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller bool optimizePostRA(int level); 125157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller bool registerAllocation(); 125257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller bool emitBinary(struct nv50_ir_prog_info *); 125357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 125457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller const Target *getTarget() const { return target; } 125557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 125657594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerprivate: 125798116cc3dc3fc2cd84990cc2c968f05fe2978b4aFrancisco Jerez void emitSymbolTable(struct nv50_ir_prog_info *); 125898116cc3dc3fc2cd84990cc2c968f05fe2978b4aFrancisco Jerez 125957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Type progType; 126057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Target *target; 126157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 126257594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerpublic: 126357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Function *main; 126457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Graph calls; 126557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 126657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller ArrayList allFuncs; 126757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller ArrayList allRValues; 126857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 126957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller uint32_t *code; 127057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller uint32_t binSize; 1271e43a3a66a9d8a99021d76ff4d07dec7b8cfd62caChristoph Bumiller uint32_t tlsSize; // size required for FILE_MEMORY_LOCAL 127257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 127357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller int maxGPR; 127457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 127557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller MemoryPool mem_Instruction; 127657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller MemoryPool mem_CmpInstruction; 127757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller MemoryPool mem_TexInstruction; 127857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller MemoryPool mem_FlowInstruction; 127957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller MemoryPool mem_LValue; 128057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller MemoryPool mem_Symbol; 128157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller MemoryPool mem_ImmediateValue; 128257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 128357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller uint32_t dbgFlags; 1284322bc7ed68ed92233c97168c036d0aa50c11a20eChristoph Bumiller uint8_t optLevel; 1285322bc7ed68ed92233c97168c036d0aa50c11a20eChristoph Bumiller 1286322bc7ed68ed92233c97168c036d0aa50c11a20eChristoph Bumiller void *targetPriv; // e.g. to carry information between passes 128757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 12884506ed28de7f9d76bbc99c0758a7891b84528729Christoph Bumiller const struct nv50_ir_prog_info *driver; // for driver configuration 12894506ed28de7f9d76bbc99c0758a7891b84528729Christoph Bumiller 129057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller void releaseInstruction(Instruction *); 129157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller void releaseValue(Value *); 129257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller}; 129357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 129457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller// TODO: add const version 129557594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerclass Pass 129657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller{ 129757594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerpublic: 129857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller bool run(Program *, bool ordered = false, bool skipPhi = false); 129957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller bool run(Function *, bool ordered = false, bool skipPhi = false); 130057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 130157594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerprivate: 130257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller // return false to continue with next entity on next higher level 130357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller virtual bool visit(Function *) { return true; } 130457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller virtual bool visit(BasicBlock *) { return true; } 130557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller virtual bool visit(Instruction *) { return false; } 130657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 130757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller bool doRun(Program *, bool ordered, bool skipPhi); 130857594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller bool doRun(Function *, bool ordered, bool skipPhi); 130957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 131057594065c30feec9376be9b2132659f7d87362eeChristoph Bumillerprotected: 131157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller bool err; 131257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Function *func; 131357594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller Program *prog; 131457594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller}; 131557594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 131657594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller// ============================================================================= 131757594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 13185eb7ff1175a644ffe3b0f1a75cb235400355f9fbJohannes Obermayr#include "codegen/nv50_ir_inlines.h" 131957594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 132057594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller} // namespace nv50_ir 132157594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller 132257594065c30feec9376be9b2132659f7d87362eeChristoph Bumiller#endif // __NV50_IR_H__ 1323