1/* 2 * Copyright 2009 Nicolai Hähnle <nhaehnle@gmail.com> 3 * 4 * Permission is hereby granted, free of charge, to any person obtaining a 5 * copy of this software and associated documentation files (the "Software"), 6 * to deal in the Software without restriction, including without limitation 7 * on the rights to use, copy, modify, merge, publish, distribute, sub 8 * license, and/or sell copies of the Software, and to permit persons to whom 9 * the Software is furnished to do so, subject to the following conditions: 10 * 11 * The above copyright notice and this permission notice (including the next 12 * paragraph) shall be included in all copies or substantial portions of the 13 * Software. 14 * 15 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR 16 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, 17 * FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. IN NO EVENT SHALL 18 * THE AUTHOR(S) AND/OR THEIR SUPPLIERS BE LIABLE FOR ANY CLAIM, 19 * DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR 20 * OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE 21 * USE OR OTHER DEALINGS IN THE SOFTWARE. */ 22 23#include "radeon_compiler.h" 24 25#include <stdio.h> 26 27#include "radeon_compiler_util.h" 28#include "radeon_dataflow.h" 29#include "radeon_emulate_branches.h" 30#include "radeon_emulate_loops.h" 31#include "radeon_program_alu.h" 32#include "radeon_program_tex.h" 33#include "radeon_rename_regs.h" 34#include "radeon_remove_constants.h" 35#include "r300_fragprog.h" 36#include "r300_fragprog_swizzle.h" 37#include "r500_fragprog.h" 38 39 40static void dataflow_outputs_mark_use(void * userdata, void * data, 41 void (*callback)(void *, unsigned int, unsigned int)) 42{ 43 struct r300_fragment_program_compiler * c = userdata; 44 callback(data, c->OutputColor[0], RC_MASK_XYZW); 45 callback(data, c->OutputColor[1], RC_MASK_XYZW); 46 callback(data, c->OutputColor[2], RC_MASK_XYZW); 47 callback(data, c->OutputColor[3], RC_MASK_XYZW); 48 callback(data, c->OutputDepth, RC_MASK_W); 49} 50 51static void rc_rewrite_depth_out(struct radeon_compiler *cc, void *user) 52{ 53 struct r300_fragment_program_compiler *c = (struct r300_fragment_program_compiler*)cc; 54 struct rc_instruction *rci; 55 56 for (rci = c->Base.Program.Instructions.Next; rci != &c->Base.Program.Instructions; rci = rci->Next) { 57 struct rc_sub_instruction * inst = &rci->U.I; 58 unsigned i; 59 const struct rc_opcode_info *info = rc_get_opcode_info(inst->Opcode); 60 61 if (inst->DstReg.File != RC_FILE_OUTPUT || inst->DstReg.Index != c->OutputDepth) 62 continue; 63 64 if (inst->DstReg.WriteMask & RC_MASK_Z) { 65 inst->DstReg.WriteMask = RC_MASK_W; 66 } else { 67 inst->DstReg.WriteMask = 0; 68 continue; 69 } 70 71 if (!info->IsComponentwise) { 72 continue; 73 } 74 75 for (i = 0; i < info->NumSrcRegs; i++) { 76 inst->SrcReg[i] = lmul_swizzle(RC_SWIZZLE_ZZZZ, inst->SrcReg[i]); 77 } 78 } 79} 80 81void r3xx_compile_fragment_program(struct r300_fragment_program_compiler* c) 82{ 83 int is_r500 = c->Base.is_r500; 84 int opt = !c->Base.disable_optimizations; 85 86 /* Lists of instruction transformations. */ 87 struct radeon_program_transformation rewrite_tex[] = { 88 { &radeonTransformTEX, c }, 89 { 0, 0 } 90 }; 91 92 struct radeon_program_transformation rewrite_if[] = { 93 { &r500_transform_IF, 0 }, 94 {0, 0} 95 }; 96 97 struct radeon_program_transformation native_rewrite_r500[] = { 98 { &radeonTransformALU, 0 }, 99 { &radeonTransformDeriv, 0 }, 100 { &radeonTransformTrigScale, 0 }, 101 { 0, 0 } 102 }; 103 104 struct radeon_program_transformation native_rewrite_r300[] = { 105 { &radeonTransformALU, 0 }, 106 { &r300_transform_trig_simple, 0 }, 107 { 0, 0 } 108 }; 109 110 /* List of compiler passes. */ 111 struct radeon_compiler_pass fs_list[] = { 112 /* NAME DUMP PREDICATE FUNCTION PARAM */ 113 {"rewrite depth out", 1, 1, rc_rewrite_depth_out, NULL}, 114 /* This transformation needs to be done before any of the IF 115 * instructions are modified. */ 116 {"transform KILP", 1, 1, rc_transform_KILP, NULL}, 117 {"unroll loops", 1, is_r500, rc_unroll_loops, NULL}, 118 {"transform loops", 1, !is_r500, rc_transform_loops, NULL}, 119 {"emulate branches", 1, !is_r500, rc_emulate_branches, NULL}, 120 {"transform TEX", 1, 1, rc_local_transform, rewrite_tex}, 121 {"transform IF", 1, is_r500, rc_local_transform, rewrite_if}, 122 {"native rewrite", 1, is_r500, rc_local_transform, native_rewrite_r500}, 123 {"native rewrite", 1, !is_r500, rc_local_transform, native_rewrite_r300}, 124 {"deadcode", 1, opt, rc_dataflow_deadcode, dataflow_outputs_mark_use}, 125 {"emulate loops", 1, !is_r500, rc_emulate_loops, NULL}, 126 {"register rename", 1, !is_r500 || opt, rc_rename_regs, NULL}, 127 {"dataflow optimize", 1, opt, rc_optimize, NULL}, 128 {"inline literals", 1, is_r500 && opt, rc_inline_literals, NULL}, 129 {"dataflow swizzles", 1, 1, rc_dataflow_swizzles, NULL}, 130 {"dead constants", 1, 1, rc_remove_unused_constants, &c->code->constants_remap_table}, 131 {"pair translate", 1, 1, rc_pair_translate, NULL}, 132 {"pair scheduling", 1, 1, rc_pair_schedule, &opt}, 133 {"dead sources", 1, 1, rc_pair_remove_dead_sources, NULL}, 134 {"register allocation", 1, 1, rc_pair_regalloc, &opt}, 135 {"final code validation", 0, 1, rc_validate_final_shader, NULL}, 136 {"machine code generation", 0, is_r500, r500BuildFragmentProgramHwCode, NULL}, 137 {"machine code generation", 0, !is_r500, r300BuildFragmentProgramHwCode, NULL}, 138 {"dump machine code", 0, is_r500 && (c->Base.Debug & RC_DBG_LOG), r500FragmentProgramDump, NULL}, 139 {"dump machine code", 0, !is_r500 && (c->Base.Debug & RC_DBG_LOG), r300FragmentProgramDump, NULL}, 140 {NULL, 0, 0, NULL, NULL} 141 }; 142 143 c->Base.type = RC_FRAGMENT_PROGRAM; 144 c->Base.SwizzleCaps = c->Base.is_r500 ? &r500_swizzle_caps : &r300_swizzle_caps; 145 146 rc_run_compiler(&c->Base, fs_list); 147 148 rc_constants_copy(&c->code->constants, &c->Base.Program.Constants); 149} 150