1f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org/************************************************************************** 2f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * 3f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * Copyright 2009 VMware, Inc. 4f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * All Rights Reserved. 5f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * 6f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * Permission is hereby granted, free of charge, to any person obtaining a 7f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * copy of this software and associated documentation files (the 8f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * "Software"), to deal in the Software without restriction, including 9f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * without limitation the rights to use, copy, modify, merge, publish, 10f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * distribute, sub license, and/or sell copies of the Software, and to 11f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * permit persons to whom the Software is furnished to do so, subject to 12f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * the following conditions: 13f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * 14f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * The above copyright notice and this permission notice (including the 15f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * next paragraph) shall be included in all copies or substantial portions 16f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * of the Software. 17f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * 18f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS 19f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF 20f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. 21f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * IN NO EVENT SHALL VMWARE AND/OR ITS SUPPLIERS BE LIABLE FOR 22f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, 23f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE 24f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE. 25f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * 26f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org **************************************************************************/ 27f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org 28f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org 29f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org/** 30f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * @file 31f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * Helpers for emiting intrinsic calls. 32f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * 33f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * LLVM vanilla IR doesn't represent all basic arithmetic operations we care 34f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * about, and it is often necessary to resort target-specific intrinsics for 35f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * performance, convenience. 36f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * 37f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * Ideally we would like to stay away from target specific intrinsics and 38f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * move all the instruction selection logic into upstream LLVM where it belongs. 39f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * 40f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * These functions are also used for calling C functions provided by us from 41f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * generated LLVM code. 42f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * 43f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * @author Jose Fonseca <jfonseca@vmware.com> 44f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org */ 45f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org 46f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org 47f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org#include "util/u_debug.h" 48f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org 49f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org#include "lp_bld_const.h" 50f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org#include "lp_bld_intr.h" 51f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org#include "lp_bld_type.h" 52f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org#include "lp_bld_pack.h" 53f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org 54f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org 55f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.orgLLVMValueRef 56f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.orglp_declare_intrinsic(LLVMModuleRef module, 57f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org const char *name, 58f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org LLVMTypeRef ret_type, 59f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org LLVMTypeRef *arg_types, 60f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org unsigned num_args) 61f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org{ 62f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org LLVMTypeRef function_type; 63f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org LLVMValueRef function; 64f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org 65f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org assert(!LLVMGetNamedFunction(module, name)); 66f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org 67f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org function_type = LLVMFunctionType(ret_type, arg_types, num_args, 0); 68f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org function = LLVMAddFunction(module, name, function_type); 69f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org 70f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org LLVMSetFunctionCallConv(function, LLVMCCallConv); 71f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org LLVMSetLinkage(function, LLVMExternalLinkage); 72f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org 73f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org assert(LLVMIsDeclaration(function)); 74f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org 75f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org return function; 76f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org} 77f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org 78f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org 79f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.orgLLVMValueRef 80f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.orglp_build_intrinsic(LLVMBuilderRef builder, 81f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org const char *name, 82f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org LLVMTypeRef ret_type, 83f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org LLVMValueRef *args, 84f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org unsigned num_args) 85f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org{ 86f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org LLVMModuleRef module = LLVMGetGlobalParent(LLVMGetBasicBlockParent(LLVMGetInsertBlock(builder))); 87f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org LLVMValueRef function; 88f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org 89f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org function = LLVMGetNamedFunction(module, name); 90f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org if(!function) { 91f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org LLVMTypeRef arg_types[LP_MAX_FUNC_ARGS]; 92f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org unsigned i; 93f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org 94f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org assert(num_args <= LP_MAX_FUNC_ARGS); 95f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org 96f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org for(i = 0; i < num_args; ++i) { 97f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org assert(args[i]); 98f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org arg_types[i] = LLVMTypeOf(args[i]); 99f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org } 100f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org 101f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org function = lp_declare_intrinsic(module, name, ret_type, arg_types, num_args); 102f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org } 103f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org 104f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org return LLVMBuildCall(builder, function, args, num_args, ""); 105f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org} 106f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org 107f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org 108f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.orgLLVMValueRef 109f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.orglp_build_intrinsic_unary(LLVMBuilderRef builder, 110f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org const char *name, 111f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org LLVMTypeRef ret_type, 112f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org LLVMValueRef a) 113f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org{ 114f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org return lp_build_intrinsic(builder, name, ret_type, &a, 1); 115f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org} 116f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org 117f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org 118f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.orgLLVMValueRef 119f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.orglp_build_intrinsic_binary(LLVMBuilderRef builder, 120f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org const char *name, 121f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org LLVMTypeRef ret_type, 122f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org LLVMValueRef a, 123f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org LLVMValueRef b) 124f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org{ 125f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org LLVMValueRef args[2]; 126f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org 127f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org args[0] = a; 128f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org args[1] = b; 129f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org 130f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org return lp_build_intrinsic(builder, name, ret_type, args, 2); 131f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org} 132f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org 133f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org 134f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org/** 135f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * Call intrinsic with arguments adapted to intrinsic vector length. 136f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * 137f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * Split vectors which are too large for the hw, or expand them if they 138f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * are too small, so a caller calling a function which might use intrinsics 139f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * doesn't need to do splitting/expansion on its own. 140f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * This only supports intrinsics where src and dst types match. 141f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org */ 142f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.orgLLVMValueRef 143f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.orglp_build_intrinsic_binary_anylength(struct gallivm_state *gallivm, 144f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org const char *name, 145f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org struct lp_type src_type, 146f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org unsigned intr_size, 147f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org LLVMValueRef a, 148f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org LLVMValueRef b) 149f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org{ 150f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org unsigned i; 151f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org struct lp_type intrin_type = src_type; 152f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org LLVMBuilderRef builder = gallivm->builder; 153f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org LLVMValueRef i32undef = LLVMGetUndef(LLVMInt32TypeInContext(gallivm->context)); 154f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org LLVMValueRef anative, bnative; 155f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org unsigned intrin_length = intr_size / src_type.width; 156f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org 157f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org intrin_type.length = intrin_length; 158f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org 159f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org if (intrin_length > src_type.length) { 160f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org LLVMValueRef elems[LP_MAX_VECTOR_LENGTH]; 161f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org LLVMValueRef constvec, tmp; 162f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org 163f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org for (i = 0; i < src_type.length; i++) { 164f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org elems[i] = lp_build_const_int32(gallivm, i); 165f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org } 166f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org for (; i < intrin_length; i++) { 167f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org elems[i] = i32undef; 168f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org } 169f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org if (src_type.length == 1) { 170f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org LLVMTypeRef elem_type = lp_build_elem_type(gallivm, intrin_type); 171f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org a = LLVMBuildBitCast(builder, a, LLVMVectorType(elem_type, 1), ""); 172f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org b = LLVMBuildBitCast(builder, b, LLVMVectorType(elem_type, 1), ""); 173f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org } 174f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org constvec = LLVMConstVector(elems, intrin_length); 175f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org anative = LLVMBuildShuffleVector(builder, a, a, constvec, ""); 176f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org bnative = LLVMBuildShuffleVector(builder, b, b, constvec, ""); 177f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org tmp = lp_build_intrinsic_binary(builder, name, 178f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org lp_build_vec_type(gallivm, intrin_type), 179f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org anative, bnative); 180f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org if (src_type.length > 1) { 181f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org constvec = LLVMConstVector(elems, src_type.length); 182f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org return LLVMBuildShuffleVector(builder, tmp, tmp, constvec, ""); 183f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org } 184f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org else { 185f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org return LLVMBuildExtractElement(builder, tmp, elems[0], ""); 186f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org } 187f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org } 188f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org else if (intrin_length < src_type.length) { 189f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org unsigned num_vec = src_type.length / intrin_length; 190f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org LLVMValueRef tmp[LP_MAX_VECTOR_LENGTH]; 191f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org 192f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org /* don't support arbitrary size here as this is so yuck */ 193f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org if (src_type.length % intrin_length) { 194f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org /* FIXME: This is something which should be supported 195f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * but there doesn't seem to be any need for it currently 196f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org * so crash and burn. 197f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org */ 198f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org debug_printf("%s: should handle arbitrary vector size\n", 199f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org __FUNCTION__); 200f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org assert(0); 201f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org return NULL; 202f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org } 203f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org 204f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org for (i = 0; i < num_vec; i++) { 205f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org anative = lp_build_extract_range(gallivm, a, i*intrin_length, 206f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org intrin_length); 207f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org bnative = lp_build_extract_range(gallivm, b, i*intrin_length, 208f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org intrin_length); 209f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org tmp[i] = lp_build_intrinsic_binary(builder, name, 210f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org lp_build_vec_type(gallivm, intrin_type), 211f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org anative, bnative); 212f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org } 213f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org return lp_build_concat(gallivm, tmp, intrin_type, num_vec); 214f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org } 215f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org else { 216f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org return lp_build_intrinsic_binary(builder, name, 217f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org lp_build_vec_type(gallivm, src_type), 218f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org a, b); 219f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org } 220f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org} 221f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org 222f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org 223f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.orgLLVMValueRef 224f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.orglp_build_intrinsic_map(struct gallivm_state *gallivm, 225f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org const char *name, 226f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org LLVMTypeRef ret_type, 227f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org LLVMValueRef *args, 228f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org unsigned num_args) 229f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org{ 230f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org LLVMBuilderRef builder = gallivm->builder; 231f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org LLVMTypeRef ret_elem_type = LLVMGetElementType(ret_type); 232f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org unsigned n = LLVMGetVectorSize(ret_type); 233f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org unsigned i, j; 234f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org LLVMValueRef res; 235f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org 236f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org assert(num_args <= LP_MAX_FUNC_ARGS); 237f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org 238f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org res = LLVMGetUndef(ret_type); 239f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org for(i = 0; i < n; ++i) { 240f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org LLVMValueRef index = lp_build_const_int32(gallivm, i); 241f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org LLVMValueRef arg_elems[LP_MAX_FUNC_ARGS]; 242f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org LLVMValueRef res_elem; 243f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org for(j = 0; j < num_args; ++j) 244f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org arg_elems[j] = LLVMBuildExtractElement(builder, args[j], index, ""); 245f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org res_elem = lp_build_intrinsic(builder, name, ret_elem_type, arg_elems, num_args); 246f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org res = LLVMBuildInsertElement(builder, res, res_elem, index, ""); 247f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org } 248f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org 249f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org return res; 250f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org} 251f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org 252f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org 253f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.orgLLVMValueRef 254f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.orglp_build_intrinsic_map_unary(struct gallivm_state *gallivm, 255f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org const char *name, 256f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org LLVMTypeRef ret_type, 257f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org LLVMValueRef a) 258f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org{ 259f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org return lp_build_intrinsic_map(gallivm, name, ret_type, &a, 1); 260f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org} 261f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org 262f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org 263f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.orgLLVMValueRef 264f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.orglp_build_intrinsic_map_binary(struct gallivm_state *gallivm, 265f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org const char *name, 266f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org LLVMTypeRef ret_type, 267f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org LLVMValueRef a, 268f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org LLVMValueRef b) 269f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org{ 270f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org LLVMValueRef args[2]; 271f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org 272f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org args[0] = a; 273f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org args[1] = b; 274f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org 275f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org return lp_build_intrinsic_map(gallivm, name, ret_type, args, 2); 276f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org} 277f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org 278f2ba7591b1407a7ee9209f842c50696914dc2dedkbr@chromium.org 279