11c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák/* 21c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák * Copyright 2009 Nicolai Hähnle <nhaehnle@gmail.com> 31c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák * 41c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák * Permission is hereby granted, free of charge, to any person obtaining a 51c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák * copy of this software and associated documentation files (the "Software"), 61c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák * to deal in the Software without restriction, including without limitation 71c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák * on the rights to use, copy, modify, merge, publish, distribute, sub 81c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák * license, and/or sell copies of the Software, and to permit persons to whom 91c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák * the Software is furnished to do so, subject to the following conditions: 101c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák * 111c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák * The above copyright notice and this permission notice (including the next 121c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák * paragraph) shall be included in all copies or substantial portions of the 131c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák * Software. 141c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák * 151c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR 161c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, 171c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák * FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. IN NO EVENT SHALL 181c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák * THE AUTHOR(S) AND/OR THEIR SUPPLIERS BE LIABLE FOR ANY CLAIM, 191c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák * DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR 201c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák * OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE 211c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák * USE OR OTHER DEALINGS IN THE SOFTWARE. */ 221c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák 231c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák#ifndef RADEON_COMPILER_H 241c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák#define RADEON_COMPILER_H 251c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák 261c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák#include "main/compiler.h" 271c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák 281c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák#include "memory_pool.h" 291c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák#include "radeon_code.h" 301c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák#include "radeon_program.h" 311c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák#include "radeon_emulate_loops.h" 321c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák 331c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák#define RC_DBG_LOG (1 << 0) 341c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák#define RC_DBG_STATS (1 << 1) 351c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák 361c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšákstruct rc_swizzle_caps; 371c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák 381c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšákenum rc_program_type { 391c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák RC_VERTEX_PROGRAM, 401c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák RC_FRAGMENT_PROGRAM, 411c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák RC_NUM_PROGRAM_TYPES 421c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák}; 431c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák 441c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšákstruct radeon_compiler { 451c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák struct memory_pool Pool; 461c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák struct rc_program Program; 471c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák enum rc_program_type type; 481c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák unsigned Debug:2; 491c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák unsigned Error:1; 501c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák char * ErrorMsg; 511c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák 521c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák /* Hardware specification. */ 531c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák unsigned is_r400:1; 541c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák unsigned is_r500:1; 551c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák unsigned has_half_swizzles:1; 561c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák unsigned has_presub:1; 57e945fb04d04c33da5e77d22d739c5740a522a61eTom Stellard unsigned has_omod:1; 581c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák unsigned disable_optimizations:1; 591c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák unsigned max_temp_regs; 601c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák unsigned max_constants; 611c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák int max_alu_insts; 621c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák unsigned max_tex_insts; 631c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák 641c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák /* Whether to remove unused constants and empty holes in constant space. */ 651c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák unsigned remove_unused_constants:1; 661c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák 671c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák /** 681c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák * Variables used internally, not be touched by callers 691c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák * of the compiler 701c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák */ 711c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák /*@{*/ 721c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák struct rc_swizzle_caps * SwizzleCaps; 731c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák /*@}*/ 741c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák 751c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák struct emulate_loop_state loop_state; 761c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák 771c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák unsigned initial_num_insts; /* Number of instructions at start. */ 781c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák}; 791c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák 801c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšákvoid rc_init(struct radeon_compiler * c); 811c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšákvoid rc_destroy(struct radeon_compiler * c); 821c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák 831c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšákvoid rc_debug(struct radeon_compiler * c, const char * fmt, ...); 841c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšákvoid rc_error(struct radeon_compiler * c, const char * fmt, ...); 851c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák 861c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšákint rc_if_fail_helper(struct radeon_compiler * c, const char * file, int line, const char * assertion); 871c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák 881c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák/** 891c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák * This macro acts like an if-statement that can be used to implement 901c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák * non-aborting assertions in the compiler. 911c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák * 921c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák * It checks whether \p cond is true. If not, an internal compiler error is 931c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák * flagged and the if-clause is run. 941c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák * 951c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák * A typical use-case would be: 961c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák * 971c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák * if (rc_assert(c, condition-that-must-be-true)) 981c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák * return; 991c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák */ 1001c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák#define rc_assert(c, cond) \ 1011c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák (!(cond) && rc_if_fail_helper(c, __FILE__, __LINE__, #cond)) 1021c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák 1031c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšákvoid rc_calculate_inputs_outputs(struct radeon_compiler * c); 1041c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák 1051c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšákvoid rc_move_input(struct radeon_compiler * c, unsigned input, struct rc_src_register new_input); 1061c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšákvoid rc_move_output(struct radeon_compiler * c, unsigned output, unsigned new_output, unsigned writemask); 1071c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšákvoid rc_copy_output(struct radeon_compiler * c, unsigned output, unsigned dup_output); 1081c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšákvoid rc_transform_fragment_wpos(struct radeon_compiler * c, unsigned wpos, unsigned new_input, 1091c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák int full_vtransform); 1101c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšákvoid rc_transform_fragment_face(struct radeon_compiler *c, unsigned face); 1111c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák 1121c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšákstruct r300_fragment_program_compiler { 1131c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák struct radeon_compiler Base; 1141c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák struct rX00_fragment_program_code *code; 1151c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák /* Optional transformations and features. */ 1161c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák struct r300_fragment_program_external_state state; 1171c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák /* Register corresponding to the depthbuffer. */ 1181c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák unsigned OutputDepth; 1191c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák /* Registers corresponding to the four colorbuffers. */ 1201c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák unsigned OutputColor[4]; 1211c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák 1221c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák void * UserData; 1231c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák void (*AllocateHwInputs)( 1241c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák struct r300_fragment_program_compiler * c, 1251c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák void (*allocate)(void * data, unsigned input, unsigned hwreg), 1261c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák void * mydata); 1271c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák}; 1281c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák 1291c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšákvoid r3xx_compile_fragment_program(struct r300_fragment_program_compiler* c); 1301c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák 1311c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšákstruct r300_vertex_program_compiler { 1321c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák struct radeon_compiler Base; 1331c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák struct r300_vertex_program_code *code; 1341c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák uint32_t RequiredOutputs; 1351c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák 1361c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák void * UserData; 1371c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák void (*SetHwInputOutput)(struct r300_vertex_program_compiler * c); 1381c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák 1391c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák}; 1401c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák 1411c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšákvoid r3xx_compile_vertex_program(struct r300_vertex_program_compiler* c); 142b2df031a959f36743527b9abc89913ce4f895de3Tom Stellardvoid rc_vert_fc(struct radeon_compiler *compiler, void *user); 1431c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšákvoid r300_vertex_program_dump(struct radeon_compiler *compiler, void *user); 1441c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák 1451c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšákstruct radeon_compiler_pass { 1461c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák const char *name; /* Name of the pass. */ 1471c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák int dump; /* Dump the program if Debug == 1? */ 1481c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák int predicate; /* Run this pass? */ 1491c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák void (*run)(struct radeon_compiler *c, void *user); /* The main entrypoint. */ 1501c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák void *user; /* Optional parameter which is passed to the run function. */ 1511c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák}; 1521c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák 1531c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšákstruct rc_program_stats { 1541c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák unsigned num_insts; 1551c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák unsigned num_fc_insts; 1561c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák unsigned num_tex_insts; 1571c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák unsigned num_rgb_insts; 1581c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák unsigned num_alpha_insts; 1591c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák unsigned num_presub_ops; 1601c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák unsigned num_temp_regs; 161e945fb04d04c33da5e77d22d739c5740a522a61eTom Stellard unsigned num_omod_ops; 162befcce264c8bf8fdac233e6a01cadc595a1d11d3Tom Stellard unsigned num_inline_literals; 1631c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák}; 1641c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák 1651c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšákvoid rc_get_stats(struct radeon_compiler *c, struct rc_program_stats *s); 1661c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák 1671c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák/* Executes a list of compiler passes given in the parameter 'list'. */ 1681c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšákvoid rc_run_compiler_passes(struct radeon_compiler *c, struct radeon_compiler_pass *list); 1691c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšákvoid rc_run_compiler(struct radeon_compiler *c, struct radeon_compiler_pass *list); 1701c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšákvoid rc_validate_final_shader(struct radeon_compiler *c, void *user); 1711c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák 1721c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák#endif /* RADEON_COMPILER_H */ 173