111d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick/* 211d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick * Copyright © 2010 Intel Corporation 311d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick * 411d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick * Permission is hereby granted, free of charge, to any person obtaining a 511d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick * copy of this software and associated documentation files (the "Software"), 611d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick * to deal in the Software without restriction, including without limitation 711d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick * the rights to use, copy, modify, merge, publish, distribute, sublicense, 811d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick * and/or sell copies of the Software, and to permit persons to whom the 911d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick * Software is furnished to do so, subject to the following conditions: 1011d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick * 1111d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick * The above copyright notice and this permission notice (including the next 1211d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick * paragraph) shall be included in all copies or substantial portions of the 1311d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick * Software. 1411d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick * 1511d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR 1611d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, 1711d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL 1811d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER 1911d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING 2011d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER 2111d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick * DEALINGS IN THE SOFTWARE. 2211d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick */ 2311d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick 2411d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick/** 2511d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick * \file lower_vector.cpp 2611d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick * IR lowering pass to remove some types of ir_quadop_vector 2711d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick * 2811d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick * \author Ian Romanick <ian.d.romanick@intel.com> 2911d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick */ 3011d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick 3111d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick#include "ir.h" 3211d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick#include "ir_rvalue_visitor.h" 3311d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick 3411d6f1c69871d0b7edc28f639256460839fccd2dIan Romanickclass lower_vector_visitor : public ir_rvalue_visitor { 3511d6f1c69871d0b7edc28f639256460839fccd2dIan Romanickpublic: 3611d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick lower_vector_visitor() : progress(false) 3711d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick { 3811d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick /* empty */ 3911d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick } 4011d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick 4111d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick void handle_rvalue(ir_rvalue **rvalue); 4211d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick 4311d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick /** 4411d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick * Should SWZ-like expressions be lowered? 4511d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick */ 4611d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick bool dont_lower_swz; 4711d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick 4811d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick bool progress; 4911d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick}; 5011d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick 5111d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick/** 5211d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick * Determine if an IR expression tree looks like an extended swizzle 5311d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick * 5411d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick * Extended swizzles consist of access of a single vector source (with possible 5511d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick * per component negation) and the constants -1, 0, or 1. 5611d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick */ 5711d6f1c69871d0b7edc28f639256460839fccd2dIan Romanickbool 5811d6f1c69871d0b7edc28f639256460839fccd2dIan Romanickis_extended_swizzle(ir_expression *ir) 5911d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick{ 6011d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick /* Track any variables that are accessed by this expression. 6111d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick */ 6211d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick ir_variable *var = NULL; 6311d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick 6411d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick assert(ir->operation == ir_quadop_vector); 6511d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick 6611d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick for (unsigned i = 0; i < ir->type->vector_elements; i++) { 6711d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick ir_rvalue *op = ir->operands[i]; 6811d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick 6911d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick while (op != NULL) { 7011d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick switch (op->ir_type) { 7111d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick case ir_type_constant: { 7211d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick const ir_constant *const c = op->as_constant(); 7311d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick 7411d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick if (!c->is_one() && !c->is_zero() && !c->is_negative_one()) 7511d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick return false; 7611d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick 7711d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick op = NULL; 7811d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick break; 7911d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick } 8011d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick 8111d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick case ir_type_dereference_variable: { 8211d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick ir_dereference_variable *const d = (ir_dereference_variable *) op; 8311d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick 8411d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick if ((var != NULL) && (var != d->var)) 8511d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick return false; 8611d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick 8711d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick var = d->var; 8811d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick op = NULL; 8911d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick break; 9011d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick } 9111d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick 9211d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick case ir_type_expression: { 9311d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick ir_expression *const ex = (ir_expression *) op; 9411d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick 9511d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick if (ex->operation != ir_unop_neg) 9611d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick return false; 9711d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick 9811d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick op = ex->operands[0]; 9911d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick break; 10011d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick } 10111d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick 10211d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick case ir_type_swizzle: 10311d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick op = ((ir_swizzle *) op)->val; 10411d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick break; 10511d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick 10611d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick default: 10711d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick return false; 10811d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick } 10911d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick } 11011d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick } 11111d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick 11211d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick return true; 11311d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick} 11411d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick 11511d6f1c69871d0b7edc28f639256460839fccd2dIan Romanickvoid 11611d6f1c69871d0b7edc28f639256460839fccd2dIan Romanicklower_vector_visitor::handle_rvalue(ir_rvalue **rvalue) 11711d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick{ 11811d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick if (!*rvalue) 11911d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick return; 12011d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick 12111d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick ir_expression *expr = (*rvalue)->as_expression(); 12211d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick if ((expr == NULL) || (expr->operation != ir_quadop_vector)) 12311d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick return; 12411d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick 12511d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick if (this->dont_lower_swz && is_extended_swizzle(expr)) 12611d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick return; 12711d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick 128d3073f58c17d8675a2ecdd5dfa83e5520c78e1a8Kenneth Graunke /* FINISHME: Is this the right thing to use for the ralloc context? 12911d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick */ 13011d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick void *const mem_ctx = expr; 13111d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick 13211d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick assert(expr->type->vector_elements == expr->get_num_operands()); 13311d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick 13411d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick /* Generate a temporary with the same type as the ir_quadop_operation. 13511d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick */ 13611d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick ir_variable *const temp = 13711d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick new(mem_ctx) ir_variable(expr->type, "vecop_tmp", ir_var_temporary); 13811d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick 13911d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick this->base_ir->insert_before(temp); 14011d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick 14111d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick /* Counter of the number of components collected so far. 14211d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick */ 14311d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick unsigned assigned; 14411d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick 14511d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick /* Write-mask in the destination that receives counted by 'assigned'. 14611d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick */ 14711d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick unsigned write_mask; 14811d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick 14911d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick 15011d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick /* Generate upto four assignments to that variable. Try to group component 15111d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick * assignments together: 15211d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick * 15311d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick * - All constant components can be assigned at once. 15411d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick * - All assigments of components from a single variable with the same 15511d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick * unary operator can be assigned at once. 15611d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick */ 15711d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick ir_constant_data d = { { 0 } }; 15811d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick 15911d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick assigned = 0; 16011d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick write_mask = 0; 16111d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick for (unsigned i = 0; i < expr->type->vector_elements; i++) { 16211d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick const ir_constant *const c = expr->operands[i]->as_constant(); 16311d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick 16411d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick if (c == NULL) 16511d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick continue; 16611d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick 16711d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick switch (expr->type->base_type) { 16811d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick case GLSL_TYPE_UINT: d.u[assigned] = c->value.u[0]; break; 16911d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick case GLSL_TYPE_INT: d.i[assigned] = c->value.i[0]; break; 17011d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick case GLSL_TYPE_FLOAT: d.f[assigned] = c->value.f[0]; break; 17111d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick case GLSL_TYPE_BOOL: d.b[assigned] = c->value.b[0]; break; 172a172368ef1500fd2c7c1e55133e8e098b73d97a5Vinson Lee default: assert(!"Should not get here."); break; 17311d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick } 17411d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick 17511d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick write_mask |= (1U << i); 17611d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick assigned++; 17711d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick } 17811d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick 17911d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick assert((write_mask == 0) == (assigned == 0)); 18011d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick 18111d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick /* If there were constant values, generate an assignment. 18211d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick */ 18311d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick if (assigned > 0) { 18411d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick ir_constant *const c = 18511d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick new(mem_ctx) ir_constant(glsl_type::get_instance(expr->type->base_type, 1869d998a2a592ed688c90b408604b9dbec26b752ffIan Romanick assigned, 1), 18711d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick &d); 18811d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick ir_dereference *const lhs = new(mem_ctx) ir_dereference_variable(temp); 18911d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick ir_assignment *const assign = 19011d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick new(mem_ctx) ir_assignment(lhs, c, NULL, write_mask); 19111d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick 19211d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick this->base_ir->insert_before(assign); 19311d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick } 19411d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick 19511d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick /* FINISHME: This should try to coalesce assignments. 19611d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick */ 19711d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick for (unsigned i = 0; i < expr->type->vector_elements; i++) { 19811d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick if (expr->operands[i]->ir_type == ir_type_constant) 19911d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick continue; 20011d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick 20111d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick ir_dereference *const lhs = new(mem_ctx) ir_dereference_variable(temp); 20211d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick ir_assignment *const assign = 20311d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick new(mem_ctx) ir_assignment(lhs, expr->operands[i], NULL, (1U << i)); 20411d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick 20511d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick this->base_ir->insert_before(assign); 20611d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick assigned++; 20711d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick } 20811d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick 20911d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick assert(assigned == expr->type->vector_elements); 21011d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick 21111d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick *rvalue = new(mem_ctx) ir_dereference_variable(temp); 21211d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick this->progress = true; 21311d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick} 21411d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick 21511d6f1c69871d0b7edc28f639256460839fccd2dIan Romanickbool 21611d6f1c69871d0b7edc28f639256460839fccd2dIan Romanicklower_quadop_vector(exec_list *instructions, bool dont_lower_swz) 21711d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick{ 21811d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick lower_vector_visitor v; 21911d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick 22011d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick v.dont_lower_swz = dont_lower_swz; 22111d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick visit_list_elements(&v, instructions); 22211d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick 22311d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick return v.progress; 22411d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick} 225