18cdcfce5cea1a0dd761bdb82a03433f06c83f36bConnor Abbott/* 28cdcfce5cea1a0dd761bdb82a03433f06c83f36bConnor Abbott * Copyright (C) 2005-2007 Brian Paul All Rights Reserved. 38cdcfce5cea1a0dd761bdb82a03433f06c83f36bConnor Abbott * Copyright (C) 2008 VMware, Inc. All Rights Reserved. 48cdcfce5cea1a0dd761bdb82a03433f06c83f36bConnor Abbott * Copyright © 2014 Intel Corporation 58cdcfce5cea1a0dd761bdb82a03433f06c83f36bConnor Abbott * 68cdcfce5cea1a0dd761bdb82a03433f06c83f36bConnor Abbott * Permission is hereby granted, free of charge, to any person obtaining a 78cdcfce5cea1a0dd761bdb82a03433f06c83f36bConnor Abbott * copy of this software and associated documentation files (the "Software"), 88cdcfce5cea1a0dd761bdb82a03433f06c83f36bConnor Abbott * to deal in the Software without restriction, including without limitation 98cdcfce5cea1a0dd761bdb82a03433f06c83f36bConnor Abbott * the rights to use, copy, modify, merge, publish, distribute, sublicense, 108cdcfce5cea1a0dd761bdb82a03433f06c83f36bConnor Abbott * and/or sell copies of the Software, and to permit persons to whom the 118cdcfce5cea1a0dd761bdb82a03433f06c83f36bConnor Abbott * Software is furnished to do so, subject to the following conditions: 128cdcfce5cea1a0dd761bdb82a03433f06c83f36bConnor Abbott * 138cdcfce5cea1a0dd761bdb82a03433f06c83f36bConnor Abbott * The above copyright notice and this permission notice (including the next 148cdcfce5cea1a0dd761bdb82a03433f06c83f36bConnor Abbott * paragraph) shall be included in all copies or substantial portions of the 158cdcfce5cea1a0dd761bdb82a03433f06c83f36bConnor Abbott * Software. 168cdcfce5cea1a0dd761bdb82a03433f06c83f36bConnor Abbott * 178cdcfce5cea1a0dd761bdb82a03433f06c83f36bConnor Abbott * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR 188cdcfce5cea1a0dd761bdb82a03433f06c83f36bConnor Abbott * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, 198cdcfce5cea1a0dd761bdb82a03433f06c83f36bConnor Abbott * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL 208cdcfce5cea1a0dd761bdb82a03433f06c83f36bConnor Abbott * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER 218cdcfce5cea1a0dd761bdb82a03433f06c83f36bConnor Abbott * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING 228cdcfce5cea1a0dd761bdb82a03433f06c83f36bConnor Abbott * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER 238cdcfce5cea1a0dd761bdb82a03433f06c83f36bConnor Abbott * DEALINGS IN THE SOFTWARE. 248cdcfce5cea1a0dd761bdb82a03433f06c83f36bConnor Abbott */ 258cdcfce5cea1a0dd761bdb82a03433f06c83f36bConnor Abbott 268cdcfce5cea1a0dd761bdb82a03433f06c83f36bConnor Abbott#include "nir.h" 27ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri#include "nir_builder.h" 28eb63640c1d38a200a7b1540405051d3ff79d0d8aEmil Velikov#include "compiler/glsl/ir_uniform.h" 298cdcfce5cea1a0dd761bdb82a03433f06c83f36bConnor Abbott 308cdcfce5cea1a0dd761bdb82a03433f06c83f36bConnor Abbott#include "main/compiler.h" 318cdcfce5cea1a0dd761bdb82a03433f06c83f36bConnor Abbott#include "main/mtypes.h" 328cdcfce5cea1a0dd761bdb82a03433f06c83f36bConnor Abbott#include "program/prog_parameter.h" 338cdcfce5cea1a0dd761bdb82a03433f06c83f36bConnor Abbott#include "program/program.h" 348cdcfce5cea1a0dd761bdb82a03433f06c83f36bConnor Abbott 35ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri/* Calculate the sampler index based on array indicies and also 36ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri * calculate the base uniform location for struct members. 37ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri */ 38ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceristatic void 39ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arcericalc_sampler_offsets(nir_deref *tail, nir_tex_instr *instr, 40ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri unsigned *array_elements, nir_ssa_def **indirect, 41ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri nir_builder *b, unsigned *location) 428cdcfce5cea1a0dd761bdb82a03433f06c83f36bConnor Abbott{ 43ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri if (tail->child == NULL) 44ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri return; 45ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri 46ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri switch (tail->child->deref_type) { 47ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri case nir_deref_type_array: { 48ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri nir_deref_array *deref_array = nir_deref_as_array(tail->child); 49ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri 50ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri assert(deref_array->deref_array_type != nir_deref_array_type_wildcard); 51ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri 52ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri calc_sampler_offsets(tail->child, instr, array_elements, 53ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri indirect, b, location); 54ee85014b90af1d94d637ec763a803479e9bac5dcJason Ekstrand instr->texture_index += deref_array->base_offset * *array_elements; 55ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri 56ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri if (deref_array->deref_array_type == nir_deref_array_type_indirect) { 57ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri nir_ssa_def *mul = 58ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri nir_imul(b, nir_imm_int(b, *array_elements), 59ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri nir_ssa_for_src(b, deref_array->indirect, 1)); 60ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri 61ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri nir_instr_rewrite_src(&instr->instr, &deref_array->indirect, 62ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri NIR_SRC_INIT); 63ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri 64ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri if (*indirect) { 65ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri *indirect = nir_iadd(b, *indirect, mul); 66ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri } else { 67ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri *indirect = mul; 68ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri } 69ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri } 70ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri 71ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri *array_elements *= glsl_get_length(tail->type); 72ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri break; 738cdcfce5cea1a0dd761bdb82a03433f06c83f36bConnor Abbott } 748cdcfce5cea1a0dd761bdb82a03433f06c83f36bConnor Abbott 75ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri case nir_deref_type_struct: { 76ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri nir_deref_struct *deref_struct = nir_deref_as_struct(tail->child); 77de7ffdb38343b7f9292184ca827987de9852c80cEmil Velikov *location += glsl_get_record_location_offset(tail->type, deref_struct->index); 78ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri calc_sampler_offsets(tail->child, instr, array_elements, 79ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri indirect, b, location); 80ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri break; 818cdcfce5cea1a0dd761bdb82a03433f06c83f36bConnor Abbott } 828cdcfce5cea1a0dd761bdb82a03433f06c83f36bConnor Abbott 83ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri default: 84ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri unreachable("Invalid deref type"); 85ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri break; 86ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri } 878cdcfce5cea1a0dd761bdb82a03433f06c83f36bConnor Abbott} 888cdcfce5cea1a0dd761bdb82a03433f06c83f36bConnor Abbott 898cdcfce5cea1a0dd761bdb82a03433f06c83f36bConnor Abbottstatic void 90500da98e0b96d211eab27629696ef50c47caaff9Kenneth Graunkelower_sampler(nir_tex_instr *instr, const struct gl_shader_program *shader_program, 9166e137ecf1e6a77374c0278a02246cff3cab0355Jason Ekstrand gl_shader_stage stage, nir_builder *b) 928cdcfce5cea1a0dd761bdb82a03433f06c83f36bConnor Abbott{ 93ee85014b90af1d94d637ec763a803479e9bac5dcJason Ekstrand if (instr->texture == NULL) 9460ec60a600875a6c40a1a90d34d00000c7aa96e7Jason Ekstrand return; 9560ec60a600875a6c40a1a90d34d00000c7aa96e7Jason Ekstrand 965ec456375e4fdd0b6c7d797f99191044e19ead74Jason Ekstrand /* In GLSL, we only fill out the texture field. The sampler is inferred */ 975ec456375e4fdd0b6c7d797f99191044e19ead74Jason Ekstrand assert(instr->sampler == NULL); 985ec456375e4fdd0b6c7d797f99191044e19ead74Jason Ekstrand 99ee85014b90af1d94d637ec763a803479e9bac5dcJason Ekstrand instr->texture_index = 0; 100ee85014b90af1d94d637ec763a803479e9bac5dcJason Ekstrand unsigned location = instr->texture->var->data.location; 101ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri unsigned array_elements = 1; 102ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri nir_ssa_def *indirect = NULL; 103ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri 10466e137ecf1e6a77374c0278a02246cff3cab0355Jason Ekstrand b->cursor = nir_before_instr(&instr->instr); 105ee85014b90af1d94d637ec763a803479e9bac5dcJason Ekstrand calc_sampler_offsets(&instr->texture->deref, instr, &array_elements, 10666e137ecf1e6a77374c0278a02246cff3cab0355Jason Ekstrand &indirect, b, &location); 107ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri 108ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri if (indirect) { 10966e137ecf1e6a77374c0278a02246cff3cab0355Jason Ekstrand assert(array_elements >= 1); 11066e137ecf1e6a77374c0278a02246cff3cab0355Jason Ekstrand indirect = nir_umin(b, indirect, nir_imm_int(b, array_elements - 1)); 11166e137ecf1e6a77374c0278a02246cff3cab0355Jason Ekstrand 112ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri /* First, we have to resize the array of texture sources */ 113ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri nir_tex_src *new_srcs = rzalloc_array(instr, nir_tex_src, 1145ec456375e4fdd0b6c7d797f99191044e19ead74Jason Ekstrand instr->num_srcs + 2); 115ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri 116ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri for (unsigned i = 0; i < instr->num_srcs; i++) { 117ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri new_srcs[i].src_type = instr->src[i].src_type; 118ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri nir_instr_move_src(&instr->instr, &new_srcs[i].src, 119ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri &instr->src[i].src); 120ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri } 12160ec60a600875a6c40a1a90d34d00000c7aa96e7Jason Ekstrand 122ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri ralloc_free(instr->src); 123ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri instr->src = new_srcs; 12460ec60a600875a6c40a1a90d34d00000c7aa96e7Jason Ekstrand 125ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri /* Now we can go ahead and move the source over to being a 126ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri * first-class texture source. 127ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri */ 128ee85014b90af1d94d637ec763a803479e9bac5dcJason Ekstrand instr->src[instr->num_srcs].src_type = nir_tex_src_texture_offset; 129ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri instr->num_srcs++; 130ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri nir_instr_rewrite_src(&instr->instr, 131ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri &instr->src[instr->num_srcs - 1].src, 132ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri nir_src_for_ssa(indirect)); 13395774ca258d216d42877f9a8da7e1bb4212a6500Tapani Pälli 1345ec456375e4fdd0b6c7d797f99191044e19ead74Jason Ekstrand instr->src[instr->num_srcs].src_type = nir_tex_src_sampler_offset; 1355ec456375e4fdd0b6c7d797f99191044e19ead74Jason Ekstrand instr->num_srcs++; 1365ec456375e4fdd0b6c7d797f99191044e19ead74Jason Ekstrand nir_instr_rewrite_src(&instr->instr, 1375ec456375e4fdd0b6c7d797f99191044e19ead74Jason Ekstrand &instr->src[instr->num_srcs - 1].src, 1385ec456375e4fdd0b6c7d797f99191044e19ead74Jason Ekstrand nir_src_for_ssa(indirect)); 1395ec456375e4fdd0b6c7d797f99191044e19ead74Jason Ekstrand 140ee85014b90af1d94d637ec763a803479e9bac5dcJason Ekstrand instr->texture_array_size = array_elements; 141ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri } 14260ec60a600875a6c40a1a90d34d00000c7aa96e7Jason Ekstrand 143203c8794a1debc0e45019fe945d1cc55459e6c6fTimothy Arceri if (location > shader_program->data->NumUniformStorage - 1 || 144203c8794a1debc0e45019fe945d1cc55459e6c6fTimothy Arceri !shader_program->data->UniformStorage[location].opaque[stage].active) { 145ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri assert(!"cannot return a sampler"); 146ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri return; 1478cdcfce5cea1a0dd761bdb82a03433f06c83f36bConnor Abbott } 14860ec60a600875a6c40a1a90d34d00000c7aa96e7Jason Ekstrand 149ee85014b90af1d94d637ec763a803479e9bac5dcJason Ekstrand instr->texture_index += 150203c8794a1debc0e45019fe945d1cc55459e6c6fTimothy Arceri shader_program->data->UniformStorage[location].opaque[stage].index; 15160ec60a600875a6c40a1a90d34d00000c7aa96e7Jason Ekstrand 1525ec456375e4fdd0b6c7d797f99191044e19ead74Jason Ekstrand instr->sampler_index = instr->texture_index; 1535ec456375e4fdd0b6c7d797f99191044e19ead74Jason Ekstrand 154ee85014b90af1d94d637ec763a803479e9bac5dcJason Ekstrand instr->texture = NULL; 1558cdcfce5cea1a0dd761bdb82a03433f06c83f36bConnor Abbott} 1568cdcfce5cea1a0dd761bdb82a03433f06c83f36bConnor Abbott 1578cdcfce5cea1a0dd761bdb82a03433f06c83f36bConnor Abbottstatic void 158500da98e0b96d211eab27629696ef50c47caaff9Kenneth Graunkelower_impl(nir_function_impl *impl, const struct gl_shader_program *shader_program, 15999264b7f37dc92bcb3a9ae226e00c9300414431cKenneth Graunke gl_shader_stage stage) 1608cdcfce5cea1a0dd761bdb82a03433f06c83f36bConnor Abbott{ 16126b4c9ee159a8cb87b29eec0a1b8701c1750a29dConnor Abbott nir_builder b; 16226b4c9ee159a8cb87b29eec0a1b8701c1750a29dConnor Abbott nir_builder_init(&b, impl); 16360ec60a600875a6c40a1a90d34d00000c7aa96e7Jason Ekstrand 16426b4c9ee159a8cb87b29eec0a1b8701c1750a29dConnor Abbott nir_foreach_block(block, impl) { 165707e72f13bb78869ee95d3286980bf1709cba6cfJason Ekstrand nir_foreach_instr(instr, block) { 16626b4c9ee159a8cb87b29eec0a1b8701c1750a29dConnor Abbott if (instr->type == nir_instr_type_tex) 16726b4c9ee159a8cb87b29eec0a1b8701c1750a29dConnor Abbott lower_sampler(nir_instr_as_tex(instr), shader_program, stage, &b); 16826b4c9ee159a8cb87b29eec0a1b8701c1750a29dConnor Abbott } 16926b4c9ee159a8cb87b29eec0a1b8701c1750a29dConnor Abbott } 1708cdcfce5cea1a0dd761bdb82a03433f06c83f36bConnor Abbott} 1718cdcfce5cea1a0dd761bdb82a03433f06c83f36bConnor Abbott 172de7ffdb38343b7f9292184ca827987de9852c80cEmil Velikovvoid 1735f14c417c86ced1847746c64d4db54c7e5ddc187Kenneth Graunkenir_lower_samplers(nir_shader *shader, 1745f14c417c86ced1847746c64d4db54c7e5ddc187Kenneth Graunke const struct gl_shader_program *shader_program) 1758cdcfce5cea1a0dd761bdb82a03433f06c83f36bConnor Abbott{ 1769464d8c49813aba77285e7465b96e92a91ed327cJason Ekstrand nir_foreach_function(function, shader) { 177237f2f2d8b45d9d956102eec6f9be63193e5269bJason Ekstrand if (function->impl) 178237f2f2d8b45d9d956102eec6f9be63193e5269bJason Ekstrand lower_impl(function->impl, shader_program, shader->stage); 1798cdcfce5cea1a0dd761bdb82a03433f06c83f36bConnor Abbott } 1808cdcfce5cea1a0dd761bdb82a03433f06c83f36bConnor Abbott} 181