1f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org/**************************************************************************
2f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org *
3f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * Copyright 2009 VMware, Inc.
4f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * All Rights Reserved.
5f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org *
6f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * Permission is hereby granted, free of charge, to any person obtaining a
7f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * copy of this software and associated documentation files (the
8f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * "Software"), to deal in the Software without restriction, including
9f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * without limitation the rights to use, copy, modify, merge, publish,
10f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * distribute, sub license, and/or sell copies of the Software, and to
11f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * permit persons to whom the Software is furnished to do so, subject to
12f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * the following conditions:
13f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org *
14f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * The above copyright notice and this permission notice (including the
15f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * next paragraph) shall be included in all copies or substantial portions
16f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * of the Software.
17f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org *
18f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
19f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
20f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT.
21f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * IN NO EVENT SHALL VMWARE AND/OR ITS SUPPLIERS BE LIABLE FOR
22f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
23f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
24f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
25f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org *
26f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org **************************************************************************/
27f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org
28f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org
29f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org/**
30f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * @file
 * Helpers for emitting intrinsic calls.
32f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org *
 * LLVM vanilla IR doesn't represent all basic arithmetic operations we care
 * about, and it is often necessary to resort to target-specific intrinsics
 * for performance or convenience.
36f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org *
37f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * Ideally we would like to stay away from target specific intrinsics and
38f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * move all the instruction selection logic into upstream LLVM where it belongs.
39f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org *
40f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * These functions are also used for calling C functions provided by us from
41f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * generated LLVM code.
42f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org *
43f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * @author Jose Fonseca <jfonseca@vmware.com>
44f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org */
45f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org
46f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org
47f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org#include "util/u_debug.h"
48f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org
49f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org#include "lp_bld_const.h"
50f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org#include "lp_bld_intr.h"
51f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org#include "lp_bld_type.h"
52f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org#include "lp_bld_pack.h"
53f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org
54f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org
55f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.orgLLVMValueRef
56f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.orglp_declare_intrinsic(LLVMModuleRef module,
57f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org                     const char *name,
58f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org                     LLVMTypeRef ret_type,
59f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org                     LLVMTypeRef *arg_types,
60f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org                     unsigned num_args)
61f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org{
62f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   LLVMTypeRef function_type;
63f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   LLVMValueRef function;
64f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org
65f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   assert(!LLVMGetNamedFunction(module, name));
66f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org
67f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   function_type = LLVMFunctionType(ret_type, arg_types, num_args, 0);
68f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   function = LLVMAddFunction(module, name, function_type);
69f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org
70f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   LLVMSetFunctionCallConv(function, LLVMCCallConv);
71f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   LLVMSetLinkage(function, LLVMExternalLinkage);
72f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org
73f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   assert(LLVMIsDeclaration(function));
74f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org
75f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   return function;
76f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org}
77f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org
78f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org
79f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.orgLLVMValueRef
80f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.orglp_build_intrinsic(LLVMBuilderRef builder,
81f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org                   const char *name,
82f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org                   LLVMTypeRef ret_type,
83f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org                   LLVMValueRef *args,
84f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org                   unsigned num_args)
85f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org{
86f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   LLVMModuleRef module = LLVMGetGlobalParent(LLVMGetBasicBlockParent(LLVMGetInsertBlock(builder)));
87f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   LLVMValueRef function;
88f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org
89f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   function = LLVMGetNamedFunction(module, name);
90f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   if(!function) {
91f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org      LLVMTypeRef arg_types[LP_MAX_FUNC_ARGS];
92f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org      unsigned i;
93f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org
94f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org      assert(num_args <= LP_MAX_FUNC_ARGS);
95f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org
96f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org      for(i = 0; i < num_args; ++i) {
97f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org         assert(args[i]);
98f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org         arg_types[i] = LLVMTypeOf(args[i]);
99f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org      }
100f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org
101f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org      function = lp_declare_intrinsic(module, name, ret_type, arg_types, num_args);
102f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   }
103f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org
104f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   return LLVMBuildCall(builder, function, args, num_args, "");
105f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org}
106f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org
107f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org
108f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.orgLLVMValueRef
109f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.orglp_build_intrinsic_unary(LLVMBuilderRef builder,
110f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org                         const char *name,
111f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org                         LLVMTypeRef ret_type,
112f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org                         LLVMValueRef a)
113f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org{
114f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   return lp_build_intrinsic(builder, name, ret_type, &a, 1);
115f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org}
116f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org
117f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org
118f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.orgLLVMValueRef
119f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.orglp_build_intrinsic_binary(LLVMBuilderRef builder,
120f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org                          const char *name,
121f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org                          LLVMTypeRef ret_type,
122f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org                          LLVMValueRef a,
123f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org                          LLVMValueRef b)
124f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org{
125f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   LLVMValueRef args[2];
126f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org
127f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   args[0] = a;
128f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   args[1] = b;
129f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org
130f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   return lp_build_intrinsic(builder, name, ret_type, args, 2);
131f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org}
132f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org
133f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org
134f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org/**
135f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * Call intrinsic with arguments adapted to intrinsic vector length.
136f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org *
137f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * Split vectors which are too large for the hw, or expand them if they
138f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * are too small, so a caller calling a function which might use intrinsics
139f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * doesn't need to do splitting/expansion on its own.
140f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * This only supports intrinsics where src and dst types match.
141f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org */
142f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.orgLLVMValueRef
143f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.orglp_build_intrinsic_binary_anylength(struct gallivm_state *gallivm,
144f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org                                    const char *name,
145f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org                                    struct lp_type src_type,
146f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org                                    unsigned intr_size,
147f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org                                    LLVMValueRef a,
148f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org                                    LLVMValueRef b)
149f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org{
150f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   unsigned i;
151f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   struct lp_type intrin_type = src_type;
152f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   LLVMBuilderRef builder = gallivm->builder;
153f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   LLVMValueRef i32undef = LLVMGetUndef(LLVMInt32TypeInContext(gallivm->context));
154f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   LLVMValueRef anative, bnative;
155f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   unsigned intrin_length = intr_size / src_type.width;
156f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org
157f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   intrin_type.length = intrin_length;
158f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org
159f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   if (intrin_length > src_type.length) {
160f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org      LLVMValueRef elems[LP_MAX_VECTOR_LENGTH];
161f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org      LLVMValueRef constvec, tmp;
162f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org
163f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org      for (i = 0; i < src_type.length; i++) {
164f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org         elems[i] = lp_build_const_int32(gallivm, i);
165f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org      }
166f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org      for (; i < intrin_length; i++) {
167f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org         elems[i] = i32undef;
168f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org      }
169f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org      if (src_type.length == 1) {
170f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org         LLVMTypeRef elem_type = lp_build_elem_type(gallivm, intrin_type);
171f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org         a = LLVMBuildBitCast(builder, a, LLVMVectorType(elem_type, 1), "");
172f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org         b = LLVMBuildBitCast(builder, b, LLVMVectorType(elem_type, 1), "");
173f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org      }
174f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org      constvec = LLVMConstVector(elems, intrin_length);
175f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org      anative = LLVMBuildShuffleVector(builder, a, a, constvec, "");
176f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org      bnative = LLVMBuildShuffleVector(builder, b, b, constvec, "");
177f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org      tmp = lp_build_intrinsic_binary(builder, name,
178f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org                                      lp_build_vec_type(gallivm, intrin_type),
179f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org                                      anative, bnative);
180f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org      if (src_type.length > 1) {
181f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org         constvec = LLVMConstVector(elems, src_type.length);
182f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org         return LLVMBuildShuffleVector(builder, tmp, tmp, constvec, "");
183f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org      }
184f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org      else {
185f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org         return LLVMBuildExtractElement(builder, tmp, elems[0], "");
186f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org      }
187f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   }
188f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   else if (intrin_length < src_type.length) {
189f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org      unsigned num_vec = src_type.length / intrin_length;
190f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org      LLVMValueRef tmp[LP_MAX_VECTOR_LENGTH];
191f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org
192f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org      /* don't support arbitrary size here as this is so yuck */
193f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org      if (src_type.length % intrin_length) {
194f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org         /* FIXME: This is something which should be supported
195f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org          * but there doesn't seem to be any need for it currently
196f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org          * so crash and burn.
197f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org          */
198f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org         debug_printf("%s: should handle arbitrary vector size\n",
199f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org                      __FUNCTION__);
200f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org         assert(0);
201f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org         return NULL;
202f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org      }
203f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org
204f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org      for (i = 0; i < num_vec; i++) {
205f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org         anative = lp_build_extract_range(gallivm, a, i*intrin_length,
206f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org                                        intrin_length);
207f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org         bnative = lp_build_extract_range(gallivm, b, i*intrin_length,
208f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org                                        intrin_length);
209f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org         tmp[i] = lp_build_intrinsic_binary(builder, name,
210f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org                                            lp_build_vec_type(gallivm, intrin_type),
211f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org                                            anative, bnative);
212f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org      }
213f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org      return lp_build_concat(gallivm, tmp, intrin_type, num_vec);
214f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   }
215f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   else {
216f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org      return lp_build_intrinsic_binary(builder, name,
217f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org                                       lp_build_vec_type(gallivm, src_type),
218f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org                                       a, b);
219f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   }
220f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org}
221f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org
222f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org
223f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.orgLLVMValueRef
224f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.orglp_build_intrinsic_map(struct gallivm_state *gallivm,
225f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org                       const char *name,
226f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org                       LLVMTypeRef ret_type,
227f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org                       LLVMValueRef *args,
228f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org                       unsigned num_args)
229f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org{
230f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   LLVMBuilderRef builder = gallivm->builder;
231f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   LLVMTypeRef ret_elem_type = LLVMGetElementType(ret_type);
232f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   unsigned n = LLVMGetVectorSize(ret_type);
233f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   unsigned i, j;
234f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   LLVMValueRef res;
235f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org
236f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   assert(num_args <= LP_MAX_FUNC_ARGS);
237f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org
238f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   res = LLVMGetUndef(ret_type);
239f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   for(i = 0; i < n; ++i) {
240f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org      LLVMValueRef index = lp_build_const_int32(gallivm, i);
241f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org      LLVMValueRef arg_elems[LP_MAX_FUNC_ARGS];
242f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org      LLVMValueRef res_elem;
243f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org      for(j = 0; j < num_args; ++j)
244f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org         arg_elems[j] = LLVMBuildExtractElement(builder, args[j], index, "");
245f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org      res_elem = lp_build_intrinsic(builder, name, ret_elem_type, arg_elems, num_args);
246f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org      res = LLVMBuildInsertElement(builder, res, res_elem, index, "");
247f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   }
248f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org
249f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   return res;
250f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org}
251f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org
252f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org
253f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.orgLLVMValueRef
254f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.orglp_build_intrinsic_map_unary(struct gallivm_state *gallivm,
255f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org                             const char *name,
256f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org                             LLVMTypeRef ret_type,
257f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org                             LLVMValueRef a)
258f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org{
259f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   return lp_build_intrinsic_map(gallivm, name, ret_type, &a, 1);
260f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org}
261f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org
262f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org
263f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.orgLLVMValueRef
264f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.orglp_build_intrinsic_map_binary(struct gallivm_state *gallivm,
265f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org                              const char *name,
266f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org                              LLVMTypeRef ret_type,
267f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org                              LLVMValueRef a,
268f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org                              LLVMValueRef b)
269f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org{
270f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   LLVMValueRef args[2];
271f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org
272f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   args[0] = a;
273f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   args[1] = b;
274f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org
275f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org   return lp_build_intrinsic_map(gallivm, name, ret_type, args, 2);
276f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org}
277f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org
278f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org
279