/*
 * Copyright © 2010 Intel Corporation
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the "Software"),
 * to deal in the Software without restriction, including without limitation
 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
 * and/or sell copies of the Software, and to permit persons to whom the
 * Software is furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice (including the next
 * paragraph) shall be included in all copies or substantial portions of the
 * Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
 * DEALINGS IN THE SOFTWARE.
 */
2311d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick
/**
 * \file lower_vector.cpp
 * IR lowering pass to remove some types of ir_quadop_vector
 *
 * \author Ian Romanick <ian.d.romanick@intel.com>
 */
3011d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick
3111d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick#include "ir.h"
3211d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick#include "ir_rvalue_visitor.h"
3311d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick
3411d6f1c69871d0b7edc28f639256460839fccd2dIan Romanickclass lower_vector_visitor : public ir_rvalue_visitor {
3511d6f1c69871d0b7edc28f639256460839fccd2dIan Romanickpublic:
3611d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick   lower_vector_visitor() : progress(false)
3711d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick   {
3811d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick      /* empty */
3911d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick   }
4011d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick
4111d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick   void handle_rvalue(ir_rvalue **rvalue);
4211d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick
4311d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick   /**
4411d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick    * Should SWZ-like expressions be lowered?
4511d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick    */
4611d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick   bool dont_lower_swz;
4711d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick
4811d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick   bool progress;
4911d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick};
5011d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick
5111d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick/**
5211d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick * Determine if an IR expression tree looks like an extended swizzle
5311d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick *
5411d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick * Extended swizzles consist of access of a single vector source (with possible
5511d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick * per component negation) and the constants -1, 0, or 1.
5611d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick */
5711d6f1c69871d0b7edc28f639256460839fccd2dIan Romanickbool
5811d6f1c69871d0b7edc28f639256460839fccd2dIan Romanickis_extended_swizzle(ir_expression *ir)
5911d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick{
6011d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick   /* Track any variables that are accessed by this expression.
6111d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick    */
6211d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick   ir_variable *var = NULL;
6311d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick
6411d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick   assert(ir->operation == ir_quadop_vector);
6511d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick
6611d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick   for (unsigned i = 0; i < ir->type->vector_elements; i++) {
6711d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick      ir_rvalue *op = ir->operands[i];
6811d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick
6911d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick      while (op != NULL) {
7011d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick	 switch (op->ir_type) {
7111d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick	 case ir_type_constant: {
7211d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick	    const ir_constant *const c = op->as_constant();
7311d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick
7411d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick	    if (!c->is_one() && !c->is_zero() && !c->is_negative_one())
7511d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick	       return false;
7611d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick
7711d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick	    op = NULL;
7811d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick	    break;
7911d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick	 }
8011d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick
8111d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick	 case ir_type_dereference_variable: {
8211d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick	    ir_dereference_variable *const d = (ir_dereference_variable *) op;
8311d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick
8411d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick	    if ((var != NULL) && (var != d->var))
8511d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick	       return false;
8611d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick
8711d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick	    var = d->var;
8811d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick	    op = NULL;
8911d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick	    break;
9011d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick	 }
9111d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick
9211d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick	 case ir_type_expression: {
9311d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick	    ir_expression *const ex = (ir_expression *) op;
9411d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick
9511d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick	    if (ex->operation != ir_unop_neg)
9611d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick	       return false;
9711d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick
9811d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick	    op = ex->operands[0];
9911d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick	    break;
10011d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick	 }
10111d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick
10211d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick	 case ir_type_swizzle:
10311d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick	    op = ((ir_swizzle *) op)->val;
10411d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick	    break;
10511d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick
10611d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick	 default:
10711d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick	    return false;
10811d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick	 }
10911d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick      }
11011d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick   }
11111d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick
11211d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick   return true;
11311d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick}
11411d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick
11511d6f1c69871d0b7edc28f639256460839fccd2dIan Romanickvoid
11611d6f1c69871d0b7edc28f639256460839fccd2dIan Romanicklower_vector_visitor::handle_rvalue(ir_rvalue **rvalue)
11711d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick{
11811d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick   if (!*rvalue)
11911d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick      return;
12011d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick
12111d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick   ir_expression *expr = (*rvalue)->as_expression();
12211d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick   if ((expr == NULL) || (expr->operation != ir_quadop_vector))
12311d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick      return;
12411d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick
12511d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick   if (this->dont_lower_swz && is_extended_swizzle(expr))
12611d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick      return;
12711d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick
128d3073f58c17d8675a2ecdd5dfa83e5520c78e1a8Kenneth Graunke   /* FINISHME: Is this the right thing to use for the ralloc context?
12911d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick    */
13011d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick   void *const mem_ctx = expr;
13111d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick
13211d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick   assert(expr->type->vector_elements == expr->get_num_operands());
13311d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick
13411d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick   /* Generate a temporary with the same type as the ir_quadop_operation.
13511d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick    */
13611d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick   ir_variable *const temp =
13711d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick      new(mem_ctx) ir_variable(expr->type, "vecop_tmp", ir_var_temporary);
13811d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick
13911d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick   this->base_ir->insert_before(temp);
14011d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick
14111d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick   /* Counter of the number of components collected so far.
14211d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick    */
14311d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick   unsigned assigned;
14411d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick
14511d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick   /* Write-mask in the destination that receives counted by 'assigned'.
14611d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick    */
14711d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick   unsigned write_mask;
14811d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick
14911d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick
15011d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick   /* Generate upto four assignments to that variable.  Try to group component
15111d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick    * assignments together:
15211d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick    *
15311d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick    * - All constant components can be assigned at once.
15411d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick    * - All assigments of components from a single variable with the same
15511d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick    *   unary operator can be assigned at once.
15611d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick    */
15711d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick   ir_constant_data d = { { 0 } };
15811d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick
15911d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick   assigned = 0;
16011d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick   write_mask = 0;
16111d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick   for (unsigned i = 0; i < expr->type->vector_elements; i++) {
16211d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick      const ir_constant *const c = expr->operands[i]->as_constant();
16311d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick
16411d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick      if (c == NULL)
16511d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick	 continue;
16611d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick
16711d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick      switch (expr->type->base_type) {
16811d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick      case GLSL_TYPE_UINT:  d.u[assigned] = c->value.u[0]; break;
16911d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick      case GLSL_TYPE_INT:   d.i[assigned] = c->value.i[0]; break;
17011d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick      case GLSL_TYPE_FLOAT: d.f[assigned] = c->value.f[0]; break;
17111d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick      case GLSL_TYPE_BOOL:  d.b[assigned] = c->value.b[0]; break;
172a172368ef1500fd2c7c1e55133e8e098b73d97a5Vinson Lee      default:              assert(!"Should not get here."); break;
17311d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick      }
17411d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick
17511d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick      write_mask |= (1U << i);
17611d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick      assigned++;
17711d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick   }
17811d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick
17911d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick   assert((write_mask == 0) == (assigned == 0));
18011d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick
18111d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick   /* If there were constant values, generate an assignment.
18211d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick    */
18311d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick   if (assigned > 0) {
18411d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick      ir_constant *const c =
18511d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick	 new(mem_ctx) ir_constant(glsl_type::get_instance(expr->type->base_type,
1869d998a2a592ed688c90b408604b9dbec26b752ffIan Romanick							  assigned, 1),
18711d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick				  &d);
18811d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick      ir_dereference *const lhs = new(mem_ctx) ir_dereference_variable(temp);
18911d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick      ir_assignment *const assign =
19011d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick	 new(mem_ctx) ir_assignment(lhs, c, NULL, write_mask);
19111d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick
19211d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick      this->base_ir->insert_before(assign);
19311d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick   }
19411d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick
19511d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick   /* FINISHME: This should try to coalesce assignments.
19611d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick    */
19711d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick   for (unsigned i = 0; i < expr->type->vector_elements; i++) {
19811d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick      if (expr->operands[i]->ir_type == ir_type_constant)
19911d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick	 continue;
20011d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick
20111d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick      ir_dereference *const lhs = new(mem_ctx) ir_dereference_variable(temp);
20211d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick      ir_assignment *const assign =
20311d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick	 new(mem_ctx) ir_assignment(lhs, expr->operands[i], NULL, (1U << i));
20411d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick
20511d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick      this->base_ir->insert_before(assign);
20611d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick      assigned++;
20711d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick   }
20811d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick
20911d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick   assert(assigned == expr->type->vector_elements);
21011d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick
21111d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick   *rvalue = new(mem_ctx) ir_dereference_variable(temp);
21211d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick   this->progress = true;
21311d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick}
21411d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick
21511d6f1c69871d0b7edc28f639256460839fccd2dIan Romanickbool
21611d6f1c69871d0b7edc28f639256460839fccd2dIan Romanicklower_quadop_vector(exec_list *instructions, bool dont_lower_swz)
21711d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick{
21811d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick   lower_vector_visitor v;
21911d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick
22011d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick   v.dont_lower_swz = dont_lower_swz;
22111d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick   visit_list_elements(&v, instructions);
22211d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick
22311d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick   return v.progress;
22411d6f1c69871d0b7edc28f639256460839fccd2dIan Romanick}
225