/* ir_optimization.h revision a75f2681d26aecad185895c1c2f13dd542281ff9 */
/*
 * Copyright © 2010 Intel Corporation
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the "Software"),
 * to deal in the Software without restriction, including without limitation
 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
 * and/or sell copies of the Software, and to permit persons to whom the
 * Software is furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice (including the next
 * paragraph) shall be included in all copies or substantial portions of the
 * Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
 * DEALINGS IN THE SOFTWARE.
 */


/**
 * \file ir_optimization.h
 *
 * Prototypes for optimization passes to be called by the compiler and drivers.
 */

/**
 * Operations for lower_instructions().
 *
 * Every flag occupies a distinct single bit (0x01 through 0x40), so several
 * flags can be combined with bitwise OR into one mask.
 *
 * NOTE(review): presumably the combined mask is what callers pass as the
 * what_to_lower argument of lower_instructions(); the exact transformation
 * selected by each flag is defined by that function's implementation, not by
 * this header -- confirm there.
 */
#define SUB_TO_ADD_NEG     0x01
#define DIV_TO_MUL_RCP     0x02
#define EXP_TO_EXP2        0x04
#define POW_TO_EXP2        0x08
#define LOG_TO_LOG2        0x10
#define MOD_TO_FRACT       0x20
#define INT_DIV_TO_MUL_RCP 0x40

40bool do_common_optimization(exec_list *ir, bool linked,
41			    bool uniform_locations_assigned,
42			    unsigned max_unroll_iterations);
43
44bool do_algebraic(exec_list *instructions);
45bool do_constant_folding(exec_list *instructions);
46bool do_constant_variable(exec_list *instructions);
47bool do_constant_variable_unlinked(exec_list *instructions);
48bool do_copy_propagation(exec_list *instructions);
49bool do_copy_propagation_elements(exec_list *instructions);
50bool do_constant_propagation(exec_list *instructions);
51bool do_dead_code(exec_list *instructions, bool uniform_locations_assigned);
52bool do_dead_code_local(exec_list *instructions);
53bool do_dead_code_unlinked(exec_list *instructions);
54bool do_dead_functions(exec_list *instructions);
55bool do_function_inlining(exec_list *instructions);
56bool do_lower_jumps(exec_list *instructions, bool pull_out_jumps = true, bool lower_sub_return = true, bool lower_main_return = false, bool lower_continue = false, bool lower_break = false);
57bool do_lower_texture_projection(exec_list *instructions);
58bool do_if_simplification(exec_list *instructions);
59bool do_discard_simplification(exec_list *instructions);
60bool lower_if_to_cond_assign(exec_list *instructions, unsigned max_depth = 0);
61bool do_mat_op_to_vec(exec_list *instructions);
62bool do_noop_swizzle(exec_list *instructions);
63bool do_structure_splitting(exec_list *instructions);
64bool do_swizzle_swizzle(exec_list *instructions);
65bool do_tree_grafting(exec_list *instructions);
66bool do_vec_index_to_cond_assign(exec_list *instructions);
67bool do_vec_index_to_swizzle(exec_list *instructions);
68bool lower_discard(exec_list *instructions);
69void lower_discard_flow(exec_list *instructions);
70bool lower_instructions(exec_list *instructions, unsigned what_to_lower);
71bool lower_noise(exec_list *instructions);
72bool lower_variable_index_to_cond_assign(exec_list *instructions,
73    bool lower_input, bool lower_output, bool lower_temp, bool lower_uniform);
74bool lower_quadop_vector(exec_list *instructions, bool dont_lower_swz);
75bool lower_clip_distance(exec_list *instructions);
76void lower_output_reads(exec_list *instructions);
77void lower_ubo_reference(struct gl_shader *shader, exec_list *instructions);
78bool optimize_redundant_jumps(exec_list *instructions);
79bool optimize_split_arrays(exec_list *instructions, bool linked);
80
81ir_rvalue *
82compare_index_block(exec_list *instructions, ir_variable *index,
83		    unsigned base, unsigned components, void *mem_ctx);
84