18cdcfce5cea1a0dd761bdb82a03433f06c83f36bConnor Abbott/*
28cdcfce5cea1a0dd761bdb82a03433f06c83f36bConnor Abbott * Copyright (C) 2005-2007  Brian Paul   All Rights Reserved.
38cdcfce5cea1a0dd761bdb82a03433f06c83f36bConnor Abbott * Copyright (C) 2008  VMware, Inc.   All Rights Reserved.
48cdcfce5cea1a0dd761bdb82a03433f06c83f36bConnor Abbott * Copyright © 2014 Intel Corporation
58cdcfce5cea1a0dd761bdb82a03433f06c83f36bConnor Abbott *
68cdcfce5cea1a0dd761bdb82a03433f06c83f36bConnor Abbott * Permission is hereby granted, free of charge, to any person obtaining a
78cdcfce5cea1a0dd761bdb82a03433f06c83f36bConnor Abbott * copy of this software and associated documentation files (the "Software"),
88cdcfce5cea1a0dd761bdb82a03433f06c83f36bConnor Abbott * to deal in the Software without restriction, including without limitation
98cdcfce5cea1a0dd761bdb82a03433f06c83f36bConnor Abbott * the rights to use, copy, modify, merge, publish, distribute, sublicense,
108cdcfce5cea1a0dd761bdb82a03433f06c83f36bConnor Abbott * and/or sell copies of the Software, and to permit persons to whom the
118cdcfce5cea1a0dd761bdb82a03433f06c83f36bConnor Abbott * Software is furnished to do so, subject to the following conditions:
128cdcfce5cea1a0dd761bdb82a03433f06c83f36bConnor Abbott *
138cdcfce5cea1a0dd761bdb82a03433f06c83f36bConnor Abbott * The above copyright notice and this permission notice (including the next
148cdcfce5cea1a0dd761bdb82a03433f06c83f36bConnor Abbott * paragraph) shall be included in all copies or substantial portions of the
158cdcfce5cea1a0dd761bdb82a03433f06c83f36bConnor Abbott * Software.
168cdcfce5cea1a0dd761bdb82a03433f06c83f36bConnor Abbott *
178cdcfce5cea1a0dd761bdb82a03433f06c83f36bConnor Abbott * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
188cdcfce5cea1a0dd761bdb82a03433f06c83f36bConnor Abbott * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
198cdcfce5cea1a0dd761bdb82a03433f06c83f36bConnor Abbott * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
208cdcfce5cea1a0dd761bdb82a03433f06c83f36bConnor Abbott * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
218cdcfce5cea1a0dd761bdb82a03433f06c83f36bConnor Abbott * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
228cdcfce5cea1a0dd761bdb82a03433f06c83f36bConnor Abbott * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
238cdcfce5cea1a0dd761bdb82a03433f06c83f36bConnor Abbott * DEALINGS IN THE SOFTWARE.
248cdcfce5cea1a0dd761bdb82a03433f06c83f36bConnor Abbott */
258cdcfce5cea1a0dd761bdb82a03433f06c83f36bConnor Abbott
268cdcfce5cea1a0dd761bdb82a03433f06c83f36bConnor Abbott#include "nir.h"
27ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri#include "nir_builder.h"
28eb63640c1d38a200a7b1540405051d3ff79d0d8aEmil Velikov#include "compiler/glsl/ir_uniform.h"
298cdcfce5cea1a0dd761bdb82a03433f06c83f36bConnor Abbott
308cdcfce5cea1a0dd761bdb82a03433f06c83f36bConnor Abbott#include "main/compiler.h"
318cdcfce5cea1a0dd761bdb82a03433f06c83f36bConnor Abbott#include "main/mtypes.h"
328cdcfce5cea1a0dd761bdb82a03433f06c83f36bConnor Abbott#include "program/prog_parameter.h"
338cdcfce5cea1a0dd761bdb82a03433f06c83f36bConnor Abbott#include "program/program.h"
348cdcfce5cea1a0dd761bdb82a03433f06c83f36bConnor Abbott
35ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri/* Calculate the sampler index based on array indicies and also
36ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri * calculate the base uniform location for struct members.
37ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri */
38ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceristatic void
39ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arcericalc_sampler_offsets(nir_deref *tail, nir_tex_instr *instr,
40ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri                     unsigned *array_elements, nir_ssa_def **indirect,
41ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri                     nir_builder *b, unsigned *location)
428cdcfce5cea1a0dd761bdb82a03433f06c83f36bConnor Abbott{
43ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri   if (tail->child == NULL)
44ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri      return;
45ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri
46ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri   switch (tail->child->deref_type) {
47ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri   case nir_deref_type_array: {
48ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri      nir_deref_array *deref_array = nir_deref_as_array(tail->child);
49ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri
50ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri      assert(deref_array->deref_array_type != nir_deref_array_type_wildcard);
51ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri
52ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri      calc_sampler_offsets(tail->child, instr, array_elements,
53ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri                           indirect, b, location);
54ee85014b90af1d94d637ec763a803479e9bac5dcJason Ekstrand      instr->texture_index += deref_array->base_offset * *array_elements;
55ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri
56ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri      if (deref_array->deref_array_type == nir_deref_array_type_indirect) {
57ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri         nir_ssa_def *mul =
58ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri            nir_imul(b, nir_imm_int(b, *array_elements),
59ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri                     nir_ssa_for_src(b, deref_array->indirect, 1));
60ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri
61ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri         nir_instr_rewrite_src(&instr->instr, &deref_array->indirect,
62ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri                               NIR_SRC_INIT);
63ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri
64ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri         if (*indirect) {
65ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri            *indirect = nir_iadd(b, *indirect, mul);
66ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri         } else {
67ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri            *indirect = mul;
68ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri         }
69ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri      }
70ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri
71ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri      *array_elements *= glsl_get_length(tail->type);
72ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri       break;
738cdcfce5cea1a0dd761bdb82a03433f06c83f36bConnor Abbott   }
748cdcfce5cea1a0dd761bdb82a03433f06c83f36bConnor Abbott
75ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri   case nir_deref_type_struct: {
76ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri      nir_deref_struct *deref_struct = nir_deref_as_struct(tail->child);
77de7ffdb38343b7f9292184ca827987de9852c80cEmil Velikov      *location += glsl_get_record_location_offset(tail->type, deref_struct->index);
78ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri      calc_sampler_offsets(tail->child, instr, array_elements,
79ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri                           indirect, b, location);
80ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri      break;
818cdcfce5cea1a0dd761bdb82a03433f06c83f36bConnor Abbott   }
828cdcfce5cea1a0dd761bdb82a03433f06c83f36bConnor Abbott
83ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri   default:
84ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri      unreachable("Invalid deref type");
85ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri      break;
86ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri   }
878cdcfce5cea1a0dd761bdb82a03433f06c83f36bConnor Abbott}
888cdcfce5cea1a0dd761bdb82a03433f06c83f36bConnor Abbott
898cdcfce5cea1a0dd761bdb82a03433f06c83f36bConnor Abbottstatic void
90500da98e0b96d211eab27629696ef50c47caaff9Kenneth Graunkelower_sampler(nir_tex_instr *instr, const struct gl_shader_program *shader_program,
9166e137ecf1e6a77374c0278a02246cff3cab0355Jason Ekstrand              gl_shader_stage stage, nir_builder *b)
928cdcfce5cea1a0dd761bdb82a03433f06c83f36bConnor Abbott{
93ee85014b90af1d94d637ec763a803479e9bac5dcJason Ekstrand   if (instr->texture == NULL)
9460ec60a600875a6c40a1a90d34d00000c7aa96e7Jason Ekstrand      return;
9560ec60a600875a6c40a1a90d34d00000c7aa96e7Jason Ekstrand
965ec456375e4fdd0b6c7d797f99191044e19ead74Jason Ekstrand   /* In GLSL, we only fill out the texture field.  The sampler is inferred */
975ec456375e4fdd0b6c7d797f99191044e19ead74Jason Ekstrand   assert(instr->sampler == NULL);
985ec456375e4fdd0b6c7d797f99191044e19ead74Jason Ekstrand
99ee85014b90af1d94d637ec763a803479e9bac5dcJason Ekstrand   instr->texture_index = 0;
100ee85014b90af1d94d637ec763a803479e9bac5dcJason Ekstrand   unsigned location = instr->texture->var->data.location;
101ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri   unsigned array_elements = 1;
102ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri   nir_ssa_def *indirect = NULL;
103ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri
10466e137ecf1e6a77374c0278a02246cff3cab0355Jason Ekstrand   b->cursor = nir_before_instr(&instr->instr);
105ee85014b90af1d94d637ec763a803479e9bac5dcJason Ekstrand   calc_sampler_offsets(&instr->texture->deref, instr, &array_elements,
10666e137ecf1e6a77374c0278a02246cff3cab0355Jason Ekstrand                        &indirect, b, &location);
107ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri
108ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri   if (indirect) {
10966e137ecf1e6a77374c0278a02246cff3cab0355Jason Ekstrand      assert(array_elements >= 1);
11066e137ecf1e6a77374c0278a02246cff3cab0355Jason Ekstrand      indirect = nir_umin(b, indirect, nir_imm_int(b, array_elements - 1));
11166e137ecf1e6a77374c0278a02246cff3cab0355Jason Ekstrand
112ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri      /* First, we have to resize the array of texture sources */
113ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri      nir_tex_src *new_srcs = rzalloc_array(instr, nir_tex_src,
1145ec456375e4fdd0b6c7d797f99191044e19ead74Jason Ekstrand                                            instr->num_srcs + 2);
115ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri
116ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri      for (unsigned i = 0; i < instr->num_srcs; i++) {
117ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri         new_srcs[i].src_type = instr->src[i].src_type;
118ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri         nir_instr_move_src(&instr->instr, &new_srcs[i].src,
119ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri                            &instr->src[i].src);
120ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri      }
12160ec60a600875a6c40a1a90d34d00000c7aa96e7Jason Ekstrand
122ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri      ralloc_free(instr->src);
123ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri      instr->src = new_srcs;
12460ec60a600875a6c40a1a90d34d00000c7aa96e7Jason Ekstrand
125ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri      /* Now we can go ahead and move the source over to being a
126ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri       * first-class texture source.
127ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri       */
128ee85014b90af1d94d637ec763a803479e9bac5dcJason Ekstrand      instr->src[instr->num_srcs].src_type = nir_tex_src_texture_offset;
129ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri      instr->num_srcs++;
130ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri      nir_instr_rewrite_src(&instr->instr,
131ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri                            &instr->src[instr->num_srcs - 1].src,
132ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri                            nir_src_for_ssa(indirect));
13395774ca258d216d42877f9a8da7e1bb4212a6500Tapani Pälli
1345ec456375e4fdd0b6c7d797f99191044e19ead74Jason Ekstrand      instr->src[instr->num_srcs].src_type = nir_tex_src_sampler_offset;
1355ec456375e4fdd0b6c7d797f99191044e19ead74Jason Ekstrand      instr->num_srcs++;
1365ec456375e4fdd0b6c7d797f99191044e19ead74Jason Ekstrand      nir_instr_rewrite_src(&instr->instr,
1375ec456375e4fdd0b6c7d797f99191044e19ead74Jason Ekstrand                            &instr->src[instr->num_srcs - 1].src,
1385ec456375e4fdd0b6c7d797f99191044e19ead74Jason Ekstrand                            nir_src_for_ssa(indirect));
1395ec456375e4fdd0b6c7d797f99191044e19ead74Jason Ekstrand
140ee85014b90af1d94d637ec763a803479e9bac5dcJason Ekstrand      instr->texture_array_size = array_elements;
141ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri   }
14260ec60a600875a6c40a1a90d34d00000c7aa96e7Jason Ekstrand
143203c8794a1debc0e45019fe945d1cc55459e6c6fTimothy Arceri   if (location > shader_program->data->NumUniformStorage - 1 ||
144203c8794a1debc0e45019fe945d1cc55459e6c6fTimothy Arceri       !shader_program->data->UniformStorage[location].opaque[stage].active) {
145ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri      assert(!"cannot return a sampler");
146ef8eebc6ad5d86e524426f0755c0f7d0b4c0cd3eTimothy Arceri      return;
1478cdcfce5cea1a0dd761bdb82a03433f06c83f36bConnor Abbott   }
14860ec60a600875a6c40a1a90d34d00000c7aa96e7Jason Ekstrand
149ee85014b90af1d94d637ec763a803479e9bac5dcJason Ekstrand   instr->texture_index +=
150203c8794a1debc0e45019fe945d1cc55459e6c6fTimothy Arceri      shader_program->data->UniformStorage[location].opaque[stage].index;
15160ec60a600875a6c40a1a90d34d00000c7aa96e7Jason Ekstrand
1525ec456375e4fdd0b6c7d797f99191044e19ead74Jason Ekstrand   instr->sampler_index = instr->texture_index;
1535ec456375e4fdd0b6c7d797f99191044e19ead74Jason Ekstrand
154ee85014b90af1d94d637ec763a803479e9bac5dcJason Ekstrand   instr->texture = NULL;
1558cdcfce5cea1a0dd761bdb82a03433f06c83f36bConnor Abbott}
1568cdcfce5cea1a0dd761bdb82a03433f06c83f36bConnor Abbott
1578cdcfce5cea1a0dd761bdb82a03433f06c83f36bConnor Abbottstatic void
158500da98e0b96d211eab27629696ef50c47caaff9Kenneth Graunkelower_impl(nir_function_impl *impl, const struct gl_shader_program *shader_program,
15999264b7f37dc92bcb3a9ae226e00c9300414431cKenneth Graunke           gl_shader_stage stage)
1608cdcfce5cea1a0dd761bdb82a03433f06c83f36bConnor Abbott{
16126b4c9ee159a8cb87b29eec0a1b8701c1750a29dConnor Abbott   nir_builder b;
16226b4c9ee159a8cb87b29eec0a1b8701c1750a29dConnor Abbott   nir_builder_init(&b, impl);
16360ec60a600875a6c40a1a90d34d00000c7aa96e7Jason Ekstrand
16426b4c9ee159a8cb87b29eec0a1b8701c1750a29dConnor Abbott   nir_foreach_block(block, impl) {
165707e72f13bb78869ee95d3286980bf1709cba6cfJason Ekstrand      nir_foreach_instr(instr, block) {
16626b4c9ee159a8cb87b29eec0a1b8701c1750a29dConnor Abbott         if (instr->type == nir_instr_type_tex)
16726b4c9ee159a8cb87b29eec0a1b8701c1750a29dConnor Abbott            lower_sampler(nir_instr_as_tex(instr), shader_program, stage, &b);
16826b4c9ee159a8cb87b29eec0a1b8701c1750a29dConnor Abbott      }
16926b4c9ee159a8cb87b29eec0a1b8701c1750a29dConnor Abbott   }
1708cdcfce5cea1a0dd761bdb82a03433f06c83f36bConnor Abbott}
1718cdcfce5cea1a0dd761bdb82a03433f06c83f36bConnor Abbott
172de7ffdb38343b7f9292184ca827987de9852c80cEmil Velikovvoid
1735f14c417c86ced1847746c64d4db54c7e5ddc187Kenneth Graunkenir_lower_samplers(nir_shader *shader,
1745f14c417c86ced1847746c64d4db54c7e5ddc187Kenneth Graunke                   const struct gl_shader_program *shader_program)
1758cdcfce5cea1a0dd761bdb82a03433f06c83f36bConnor Abbott{
1769464d8c49813aba77285e7465b96e92a91ed327cJason Ekstrand   nir_foreach_function(function, shader) {
177237f2f2d8b45d9d956102eec6f9be63193e5269bJason Ekstrand      if (function->impl)
178237f2f2d8b45d9d956102eec6f9be63193e5269bJason Ekstrand         lower_impl(function->impl, shader_program, shader->stage);
1798cdcfce5cea1a0dd761bdb82a03433f06c83f36bConnor Abbott   }
1808cdcfce5cea1a0dd761bdb82a03433f06c83f36bConnor Abbott}
181