brw_shader.h revision 6e3f6097c995a74d4ce52f542413b01ff819c203
1/*
2 * Copyright © 2010 Intel Corporation
3 *
4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8 * and/or sell copies of the Software, and to permit persons to whom the
9 * Software is furnished to do so, subject to the following conditions:
10 *
11 * The above copyright notice and this permission notice (including the next
12 * paragraph) shall be included in all copies or substantial portions of the
13 * Software.
14 *
15 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
18 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
20 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
21 * IN THE SOFTWARE.
22 */
23
24#pragma once
25
26#include <stdint.h>
27#include "brw_reg.h"
28#include "brw_defines.h"
29#include "brw_context.h"
30#include "compiler/nir/nir.h"
31
32#ifdef __cplusplus
33#include "brw_ir_allocator.h"
34#endif
35
36#define MAX_SAMPLER_MESSAGE_SIZE 11
37#define MAX_VGRF_SIZE 16
38
39#ifdef __cplusplus
40struct backend_reg : private brw_reg
41{
42   backend_reg() {}
43   backend_reg(const struct brw_reg &reg) : brw_reg(reg) {}
44
45   const brw_reg &as_brw_reg() const
46   {
47      assert(file == ARF || file == FIXED_GRF || file == MRF || file == IMM);
48      assert(offset == 0);
49      return static_cast<const brw_reg &>(*this);
50   }
51
52   brw_reg &as_brw_reg()
53   {
54      assert(file == ARF || file == FIXED_GRF || file == MRF || file == IMM);
55      assert(offset == 0);
56      return static_cast<brw_reg &>(*this);
57   }
58
59   bool equals(const backend_reg &r) const;
60
61   bool is_zero() const;
62   bool is_one() const;
63   bool is_negative_one() const;
64   bool is_null() const;
65   bool is_accumulator() const;
66
67   /** Offset from the start of the (virtual) register in bytes. */
68   uint16_t offset;
69
70   using brw_reg::type;
71   using brw_reg::file;
72   using brw_reg::negate;
73   using brw_reg::abs;
74   using brw_reg::address_mode;
75   using brw_reg::subnr;
76   using brw_reg::nr;
77
78   using brw_reg::swizzle;
79   using brw_reg::writemask;
80   using brw_reg::indirect_offset;
81   using brw_reg::vstride;
82   using brw_reg::width;
83   using brw_reg::hstride;
84
85   using brw_reg::df;
86   using brw_reg::f;
87   using brw_reg::d;
88   using brw_reg::ud;
89};
90#endif
91
92struct cfg_t;
93struct bblock_t;
94
95#ifdef __cplusplus
96struct backend_instruction : public exec_node {
97   bool is_3src(const struct gen_device_info *devinfo) const;
98   bool is_tex() const;
99   bool is_math() const;
100   bool is_control_flow() const;
101   bool is_commutative() const;
102   bool can_do_source_mods() const;
103   bool can_do_saturate() const;
104   bool can_do_cmod() const;
105   bool reads_accumulator_implicitly() const;
106   bool writes_accumulator_implicitly(const struct gen_device_info *devinfo) const;
107
108   void remove(bblock_t *block);
109   void insert_after(bblock_t *block, backend_instruction *inst);
110   void insert_before(bblock_t *block, backend_instruction *inst);
111   void insert_before(bblock_t *block, exec_list *list);
112
113   /**
114    * True if the instruction has side effects other than writing to
115    * its destination registers.  You are expected not to reorder or
116    * optimize these out unless you know what you are doing.
117    */
118   bool has_side_effects() const;
119
120   /**
121    * True if the instruction might be affected by side effects of other
122    * instructions.
123    */
124   bool is_volatile() const;
125#else
126struct backend_instruction {
127   struct exec_node link;
128#endif
129   /** @{
130    * Annotation for the generated IR.  One of the two can be set.
131    */
132   const void *ir;
133   const char *annotation;
134   /** @} */
135
136   /**
137    * Execution size of the instruction.  This is used by the generator to
138    * generate the correct binary for the given instruction.  Current valid
139    * values are 1, 4, 8, 16, 32.
140    */
141   uint8_t exec_size;
142
143   /**
144    * Channel group from the hardware execution and predication mask that
145    * should be applied to the instruction.  The subset of channel enable
146    * signals (calculated from the EU control flow and predication state)
147    * given by [group, group + exec_size) will be used to mask GRF writes and
148    * any other side effects of the instruction.
149    */
150   uint8_t group;
151
152   uint32_t offset; /**< spill/unspill offset or texture offset bitfield */
153   uint8_t mlen; /**< SEND message length */
154   int8_t base_mrf; /**< First MRF in the SEND message, if mlen is nonzero. */
155   uint8_t target; /**< MRT target. */
156   unsigned size_written; /**< Data written to the destination register in bytes. */
157
158   enum opcode opcode; /* BRW_OPCODE_* or FS_OPCODE_* */
159   enum brw_conditional_mod conditional_mod; /**< BRW_CONDITIONAL_* */
160   enum brw_predicate predicate;
161   bool predicate_inverse:1;
162   bool writes_accumulator:1; /**< instruction implicitly writes accumulator */
163   bool force_writemask_all:1;
164   bool no_dd_clear:1;
165   bool no_dd_check:1;
166   bool saturate:1;
167   bool shadow_compare:1;
168
169   /* Chooses which flag subregister (f0.0 or f0.1) is used for conditional
170    * mod and predication.
171    */
172   unsigned flag_subreg:1;
173
174   /** The number of hardware registers used for a message header. */
175   uint8_t header_size;
176};
177
178#ifdef __cplusplus
179
180enum instruction_scheduler_mode {
181   SCHEDULE_PRE,
182   SCHEDULE_PRE_NON_LIFO,
183   SCHEDULE_PRE_LIFO,
184   SCHEDULE_POST,
185};
186
187struct backend_shader {
188protected:
189
190   backend_shader(const struct brw_compiler *compiler,
191                  void *log_data,
192                  void *mem_ctx,
193                  const nir_shader *shader,
194                  struct brw_stage_prog_data *stage_prog_data);
195
196public:
197
198   const struct brw_compiler *compiler;
199   void *log_data; /* Passed to compiler->*_log functions */
200
201   const struct gen_device_info * const devinfo;
202   const nir_shader *nir;
203   struct brw_stage_prog_data * const stage_prog_data;
204
205   /** ralloc context for temporary data used during compile */
206   void *mem_ctx;
207
208   /**
209    * List of either fs_inst or vec4_instruction (inheriting from
210    * backend_instruction)
211    */
212   exec_list instructions;
213
214   cfg_t *cfg;
215
216   gl_shader_stage stage;
217   bool debug_enabled;
218   const char *stage_name;
219   const char *stage_abbrev;
220   bool is_passthrough_shader;
221
222   brw::simple_allocator alloc;
223
224   virtual void dump_instruction(backend_instruction *inst) = 0;
225   virtual void dump_instruction(backend_instruction *inst, FILE *file) = 0;
226   virtual void dump_instructions();
227   virtual void dump_instructions(const char *name);
228
229   void calculate_cfg();
230
231   virtual void invalidate_live_intervals() = 0;
232};
233
234bool brw_texture_offset(int *offsets,
235                        unsigned num_components,
236                        uint32_t *offset_bits);
237
238void brw_setup_image_uniform_values(gl_shader_stage stage,
239                                    struct brw_stage_prog_data *stage_prog_data,
240                                    unsigned param_start_index,
241                                    const gl_uniform_storage *storage);
242
243#else
244struct backend_shader;
245#endif /* __cplusplus */
246
247enum brw_reg_type brw_type_for_base_type(const struct glsl_type *type);
248enum brw_conditional_mod brw_conditional_for_comparison(unsigned int op);
249uint32_t brw_math_function(enum opcode op);
250const char *brw_instruction_name(const struct gen_device_info *devinfo,
251                                 enum opcode op);
252bool brw_saturate_immediate(enum brw_reg_type type, struct brw_reg *reg);
253bool brw_negate_immediate(enum brw_reg_type type, struct brw_reg *reg);
254bool brw_abs_immediate(enum brw_reg_type type, struct brw_reg *reg);
255
256bool opt_predicated_break(struct backend_shader *s);
257
258#ifdef __cplusplus
259extern "C" {
260#endif
261
262/**
263 * Scratch data used when compiling a GLSL geometry shader.
264 */
265struct brw_gs_compile
266{
267   struct brw_gs_prog_key key;
268   struct brw_vue_map input_vue_map;
269
270   unsigned control_data_bits_per_vertex;
271   unsigned control_data_header_size_bits;
272};
273
274uint32_t
275brw_assign_common_binding_table_offsets(const struct gen_device_info *devinfo,
276                                        const struct gl_program *prog,
277                                        struct brw_stage_prog_data *stage_prog_data,
278                                        uint32_t next_binding_table_offset);
279
280bool brw_vs_precompile(struct gl_context *ctx, struct gl_program *prog);
281bool brw_tcs_precompile(struct gl_context *ctx,
282                        struct gl_shader_program *shader_prog,
283                        struct gl_program *prog);
284bool brw_tes_precompile(struct gl_context *ctx,
285                        struct gl_shader_program *shader_prog,
286                        struct gl_program *prog);
287bool brw_gs_precompile(struct gl_context *ctx, struct gl_program *prog);
288bool brw_fs_precompile(struct gl_context *ctx, struct gl_program *prog);
289bool brw_cs_precompile(struct gl_context *ctx, struct gl_program *prog);
290
291GLboolean brw_link_shader(struct gl_context *ctx, struct gl_shader_program *prog);
292struct gl_linked_shader *brw_new_shader(gl_shader_stage stage);
293
294unsigned tesslevel_outer_components(GLenum tes_primitive_mode);
295unsigned tesslevel_inner_components(GLenum tes_primitive_mode);
296unsigned writemask_for_backwards_vector(unsigned mask);
297
298unsigned get_atomic_counter_op(nir_intrinsic_op op);
299
300#ifdef __cplusplus
301}
302#endif
303