/*
 * Copyright 2009 Nicolai Hähnle <nhaehnle@gmail.com>
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the "Software"),
 * to deal in the Software without restriction, including without limitation
 * on the rights to use, copy, modify, merge, publish, distribute, sub
 * license, and/or sell copies of the Software, and to permit persons to whom
 * the Software is furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice (including the next
 * paragraph) shall be included in all copies or substantial portions of the
 * Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. IN NO EVENT SHALL
 * THE AUTHOR(S) AND/OR THEIR SUPPLIERS BE LIABLE FOR ANY CLAIM,
 * DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR
 * OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE
 * USE OR OTHER DEALINGS IN THE SOFTWARE. */
221c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák
231c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák#ifndef RADEON_COMPILER_H
241c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák#define RADEON_COMPILER_H
251c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák
261c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák#include "main/compiler.h"
271c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák
281c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák#include "memory_pool.h"
291c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák#include "radeon_code.h"
301c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák#include "radeon_program.h"
311c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák#include "radeon_emulate_loops.h"
321c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák
/*
 * Debug flag bits. They are distinct single bits, so they can be OR-ed
 * together; both fit in the 2-bit radeon_compiler::Debug field.
 */
#define RC_DBG_LOG        (1 << 0)
#define RC_DBG_STATS      (1 << 1)
351c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák
/* Forward declaration: this header only stores a pointer to it. */
struct rc_swizzle_caps;
371c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák
/**
 * Kind of program being compiled.
 *
 * RC_NUM_PROGRAM_TYPES is not a program type; it is the number of
 * enumerators that precede it.
 */
enum rc_program_type {
	RC_VERTEX_PROGRAM,
	RC_FRAGMENT_PROGRAM,
	RC_NUM_PROGRAM_TYPES
};
431c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák
441c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšákstruct radeon_compiler {
451c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák	struct memory_pool Pool;
461c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák	struct rc_program Program;
471c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák	enum rc_program_type type;
481c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák	unsigned Debug:2;
491c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák	unsigned Error:1;
501c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák	char * ErrorMsg;
511c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák
521c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák	/* Hardware specification. */
531c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák	unsigned is_r400:1;
541c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák	unsigned is_r500:1;
551c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák	unsigned has_half_swizzles:1;
561c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák	unsigned has_presub:1;
57e945fb04d04c33da5e77d22d739c5740a522a61eTom Stellard	unsigned has_omod:1;
581c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák	unsigned disable_optimizations:1;
591c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák	unsigned max_temp_regs;
601c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák	unsigned max_constants;
611c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák	int max_alu_insts;
621c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák	unsigned max_tex_insts;
631c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák
641c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák	/* Whether to remove unused constants and empty holes in constant space. */
651c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák	unsigned remove_unused_constants:1;
661c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák
671c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák	/**
681c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák	 * Variables used internally, not be touched by callers
691c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák	 * of the compiler
701c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák	 */
711c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák	/*@{*/
721c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák	struct rc_swizzle_caps * SwizzleCaps;
731c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák	/*@}*/
741c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák
751c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák	struct emulate_loop_state loop_state;
761c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák
771c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák	unsigned initial_num_insts; /* Number of instructions at start. */
781c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák};
791c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák
/*
 * Set-up and tear-down of a compiler instance. Only declared here; what is
 * initialised or released is defined by the implementations.
 */
void rc_init(struct radeon_compiler * c);
void rc_destroy(struct radeon_compiler * c);
821c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák
/*
 * Ask the compiler to type-check the variadic arguments against the format
 * string where the attribute is available; expands to nothing elsewhere.
 */
#ifndef RC_PRINTFLIKE
#if defined(__GNUC__)
#define RC_PRINTFLIKE(fmt_idx, va_idx) \
	__attribute__((format(printf, fmt_idx, va_idx)))
#else
#define RC_PRINTFLIKE(fmt_idx, va_idx)
#endif
#endif

/*
 * Variadic reporting functions. "fmt" is the second parameter and the
 * variadic arguments start at the third, hence (2, 3) below.
 * NOTE(review): the attribute assumes "fmt" is a printf-style format
 * string -- confirm against the implementations.
 */
void rc_debug(struct radeon_compiler * c, const char * fmt, ...) RC_PRINTFLIKE(2, 3);
void rc_error(struct radeon_compiler * c, const char * fmt, ...) RC_PRINTFLIKE(2, 3);
851c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák
/*
 * Helper called by rc_assert() when its condition is false. It receives the
 * source location and the stringified condition; its return value decides
 * whether rc_assert() evaluates to true.
 */
int rc_if_fail_helper(struct radeon_compiler * c, const char * file, int line, const char * assertion);

/**
 * This macro acts like an if-statement that can be used to implement
 * non-aborting assertions in the compiler.
 *
 * It checks whether \p cond is true. If it is, rc_if_fail_helper is not
 * called and the macro evaluates to 0. If it is not, an internal compiler
 * error is flagged through rc_if_fail_helper, and the if-clause is run when
 * that helper returns non-zero.
 *
 * A typical use-case would be:
 *
 *  if (rc_assert(c, condition-that-must-be-true))
 *  	return;
 */
#define rc_assert(c, cond) \
	(!(cond) && rc_if_fail_helper((c), __FILE__, __LINE__, #cond))
1021c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák
/*
 * Helpers that operate on the program's inputs and outputs. Only declared
 * here; their exact semantics are defined by the implementations.
 */
void rc_calculate_inputs_outputs(struct radeon_compiler * c);

void rc_move_input(struct radeon_compiler * c, unsigned input, struct rc_src_register new_input);
void rc_move_output(struct radeon_compiler * c, unsigned output, unsigned new_output, unsigned writemask);
void rc_copy_output(struct radeon_compiler * c, unsigned output, unsigned dup_output);
void rc_transform_fragment_wpos(struct radeon_compiler * c, unsigned wpos, unsigned new_input,
                                int full_vtransform);
void rc_transform_fragment_face(struct radeon_compiler *c, unsigned face);
1111c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák
1121c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšákstruct r300_fragment_program_compiler {
1131c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák	struct radeon_compiler Base;
1141c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák	struct rX00_fragment_program_code *code;
1151c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák	/* Optional transformations and features. */
1161c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák	struct r300_fragment_program_external_state state;
1171c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák	/* Register corresponding to the depthbuffer. */
1181c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák	unsigned OutputDepth;
1191c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák	/* Registers corresponding to the four colorbuffers. */
1201c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák	unsigned OutputColor[4];
1211c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák
1221c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák	void * UserData;
1231c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák	void (*AllocateHwInputs)(
1241c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák		struct r300_fragment_program_compiler * c,
1251c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák		void (*allocate)(void * data, unsigned input, unsigned hwreg),
1261c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák		void * mydata);
1271c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák};
1281c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák
/* Fragment program compile entry point; implemented outside this header. */
void r3xx_compile_fragment_program(struct r300_fragment_program_compiler* c);
1301c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák
1311c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšákstruct r300_vertex_program_compiler {
1321c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák	struct radeon_compiler Base;
1331c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák	struct r300_vertex_program_code *code;
1341c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák	uint32_t RequiredOutputs;
1351c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák
1361c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák	void * UserData;
1371c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák	void (*SetHwInputOutput)(struct r300_vertex_program_compiler * c);
1381c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák
1391c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák};
1401c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák
/* Vertex program compile entry point; implemented outside this header. */
void r3xx_compile_vertex_program(struct r300_vertex_program_compiler* c);
/*
 * These two have the same signature as radeon_compiler_pass::run, so they
 * are presumably meant to be used as pass entry points -- confirm.
 */
void rc_vert_fc(struct radeon_compiler *compiler, void *user);
void r300_vertex_program_dump(struct radeon_compiler *compiler, void *user);
1441c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák
/** Description of a single compiler pass. */
struct radeon_compiler_pass {
	const char *name;	/* Name of the pass. */
	/*
	 * Dump the program when debugging is enabled?
	 * NOTE(review): this used to read "if Debug == 1", but
	 * radeon_compiler::Debug is a 2-bit flag field; presumably the test is
	 * against RC_DBG_LOG -- confirm in the pass runner.
	 */
	int dump;
	int predicate;		/* Run this pass? */
	void (*run)(struct radeon_compiler *c, void *user); /* The main entrypoint. */
	void *user;		/* Optional parameter which is passed to the run function. */
};
1521c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák
/**
 * Per-program counters; rc_get_stats() takes a pointer to one of these.
 * All fields are plain unsigned counts.
 */
struct rc_program_stats {
	unsigned num_insts;
	unsigned num_fc_insts;
	unsigned num_tex_insts;
	unsigned num_rgb_insts;
	unsigned num_alpha_insts;
	unsigned num_presub_ops;
	unsigned num_temp_regs;
	unsigned num_omod_ops;
	unsigned num_inline_literals;
};
1641c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák
/* Takes the compiler and a stats structure; presumably fills in 's' -- confirm. */
void rc_get_stats(struct radeon_compiler *c, struct rc_program_stats *s);

/*
 * Executes a list of compiler passes given in the parameter 'list'.
 * NOTE(review): how the end of 'list' is marked is not visible in this
 * header -- check the implementation before building a list.
 */
void rc_run_compiler_passes(struct radeon_compiler *c, struct radeon_compiler_pass *list);
/* Also takes a pass list; how it differs from the above is not visible here. */
void rc_run_compiler(struct radeon_compiler *c, struct radeon_compiler_pass *list);
/* Same signature as radeon_compiler_pass::run. */
void rc_validate_final_shader(struct radeon_compiler *c, void *user);
1711c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák
1721c2c4ddbd1e97bfd13430521e5c09cb5ce8e36e6Marek Olšák#endif /* RADEON_COMPILER_H */
173