1 /**************************************************************************
3 * Copyright 2009 VMware, Inc.
6 * Permission is hereby granted, free of charge, to any person obtaining a
7 * copy of this software and associated documentation files (the
8 * "Software"), to deal in the Software without restriction, including
9 * without limitation the rights to use, copy, modify, merge, publish,
10 * distribute, sub license, and/or sell copies of the Software, and to
11 * permit persons to whom the Software is furnished to do so, subject to
12 * the following conditions:
14 * The above copyright notice and this permission notice (including the
15 * next paragraph) shall be included in all copies or substantial portions
18 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
19 * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
20 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT.
21 * IN NO EVENT SHALL VMWARE AND/OR ITS SUPPLIERS BE LIABLE FOR
22 * ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
23 * TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
24 * SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
26 **************************************************************************/
31 * Helpers for emitting intrinsic calls.
33 * LLVM vanilla IR doesn't represent all basic arithmetic operations we care
34 * about, and it is often necessary to resort to target-specific intrinsics for
35 * performance or convenience.
37 * Ideally we would like to stay away from target specific intrinsics and
38 * move all the instruction selection logic into upstream LLVM where it belongs.
40 * These functions are also used for calling C functions provided by us from
41 * generated LLVM code.
43 * @author Jose Fonseca <jfonseca@vmware.com>
47 #include "util/u_debug.h"
49 #include "lp_bld_const.h"
50 #include "lp_bld_intr.h"
51 #include "lp_bld_type.h"
52 #include "lp_bld_pack.h"
/*
 * Declare the external function `name` in `module`.
 *
 * Builds a function type from ret_type, arg_types and num_args (the final
 * 0 passed to LLVMFunctionType marks it as non-variadic), adds a function
 * of that type to the module, and gives it the C calling convention and
 * external linkage.
 *
 * The name must not be in use yet: this is asserted up front. Afterwards
 * the new function is asserted to be a declaration (i.e. it has no body).
 *
 * NOTE(review): this listing is incomplete -- the declarations of the
 * name, ret_type and num_args parameters and the end of the function are
 * not visible here. lp_build_intrinsic() stores the result of this call in
 * an LLVMValueRef, so presumably the new function value is returned;
 * confirm against the full source.
 */
56 lp_declare_intrinsic(LLVMModuleRef module
,
59 LLVMTypeRef
*arg_types
,
62 LLVMTypeRef function_type
;
63 LLVMValueRef function
;
/* Declaring a name that already exists in the module is a caller error. */
65 assert(!LLVMGetNamedFunction(module
, name
));
67 function_type
= LLVMFunctionType(ret_type
, arg_types
, num_args
, 0);
68 function
= LLVMAddFunction(module
, name
, function_type
);
70 LLVMSetFunctionCallConv(function
, LLVMCCallConv
);
71 LLVMSetLinkage(function
, LLVMExternalLinkage
);
/* Only a prototype was added; no body is ever attached here. */
73 assert(LLVMIsDeclaration(function
));
/*
 * Emit a call to the function called `name`, passing args[0..num_args-1].
 *
 * The module is found by walking up from the builder's current insert
 * block (block -> parent function -> parent module), and the callee is
 * looked up there by name.
 *
 * The declaration path derives the parameter types from the actual
 * arguments with LLVMTypeOf() and registers the function through
 * lp_declare_intrinsic() with ret_type as the return type. num_args is
 * asserted not to exceed LP_MAX_FUNC_ARGS, the size of the local
 * arg_types array.
 *
 * The result of LLVMBuildCall() (with an empty value name) is returned.
 *
 * NOTE(review): this listing is incomplete -- the condition guarding the
 * declaration path is not visible. Since lp_declare_intrinsic() asserts
 * that the name is not yet present in the module, that path is presumably
 * taken only when the lookup found nothing; confirm against the full
 * source. The declaration of `i` and the name/ret_type/args/num_args
 * parameters are likewise not visible.
 */
80 lp_build_intrinsic(LLVMBuilderRef builder
,
86 LLVMModuleRef module
= LLVMGetGlobalParent(LLVMGetBasicBlockParent(LLVMGetInsertBlock(builder
)));
87 LLVMValueRef function
;
89 function
= LLVMGetNamedFunction(module
, name
);
91 LLVMTypeRef arg_types
[LP_MAX_FUNC_ARGS
];
/* arg_types is a fixed-size stack array; refuse to overrun it. */
94 assert(num_args
<= LP_MAX_FUNC_ARGS
);
/* The prototype is inferred from the values actually being passed. */
96 for(i
= 0; i
< num_args
; ++i
) {
98 arg_types
[i
] = LLVMTypeOf(args
[i
]);
101 function
= lp_declare_intrinsic(module
, name
, ret_type
, arg_types
, num_args
);
104 return LLVMBuildCall(builder
, function
, args
, num_args
, "");
/*
 * Convenience wrapper around lp_build_intrinsic() for one operand.
 *
 * The operand `a` is passed by address as a one-element argument array;
 * builder, name and ret_type are forwarded unchanged and the result of
 * lp_build_intrinsic() is returned.
 *
 * NOTE(review): the declarations of the name and a parameters are not
 * visible in this listing.
 */
109 lp_build_intrinsic_unary(LLVMBuilderRef builder
,
111 LLVMTypeRef ret_type
,
114 return lp_build_intrinsic(builder
, name
, ret_type
, &a
, 1);
/*
 * Convenience wrapper around lp_build_intrinsic() for two operands.
 *
 * A local two-element array is handed to lp_build_intrinsic() together
 * with builder, name and ret_type; its result is returned.
 *
 * NOTE(review): the statements that fill args[] and the declarations of
 * the name and operand parameters are not visible in this listing.
 * lp_build_intrinsic_binary_anylength() calls this function with
 * (builder, name, type, ...), so presumably the two operands are stored in
 * call order; confirm against the full source.
 */
119 lp_build_intrinsic_binary(LLVMBuilderRef builder
,
121 LLVMTypeRef ret_type
,
125 LLVMValueRef args
[2];
130 return lp_build_intrinsic(builder
, name
, ret_type
, args
, 2);
135 * Call intrinsic with arguments adapted to intrinsic vector length.
137 * Split vectors which are too large for the hw, or expand them if they
138 * are too small, so a caller calling a function which might use intrinsics
139 * doesn't need to do splitting/expansion on its own.
140 * This only supports intrinsics where src and dst types match.
/*
 * Call the binary intrinsic `name` on a and b, adapting the operands to
 * the vector length the intrinsic works on.
 *
 * intrin_length is computed as intr_size / src_type.width, and intrin_type
 * is src_type with its length replaced by intrin_length. Three cases
 * follow:
 *
 *  - intrin_length > src_type.length: a and b are widened to intrin_length
 *    by shuffling each with itself through a constant mask, the intrinsic
 *    is called on the widened vectors, and the result is narrowed again:
 *    by a shuffle using the first src_type.length mask entries when
 *    src_type.length > 1, otherwise by extracting the element at index
 *    elems[0].
 *
 *  - intrin_length < src_type.length: the operands are cut into
 *    num_vec = src_type.length / intrin_length ranges starting at
 *    i * intrin_length, the intrinsic is called once per range, and the
 *    partial results are joined with lp_build_concat(). A source length
 *    that is not a multiple of intrin_length is not supported; the visible
 *    code reports it with debug_printf().
 *
 *  - otherwise the intrinsic is called once with the vector type of
 *    src_type.
 *
 * NOTE(review): this listing is incomplete. Not visible here: the name,
 * intr_size, a and b parameter declarations, the declaration of `i`, the
 * body of the second mask-filling loop, the trailing operand arguments of
 * the lp_build_intrinsic_binary()/lp_build_extract_range() calls, the else
 * branches, and whatever follows the debug_printf(). i32undef is declared
 * but not used in any visible line, so the padding mask entries are
 * presumably set to it; confirm against the full source.
 */
143 lp_build_intrinsic_binary_anylength(struct gallivm_state
*gallivm
,
145 struct lp_type src_type
,
151 struct lp_type intrin_type
= src_type
;
152 LLVMBuilderRef builder
= gallivm
->builder
;
153 LLVMValueRef i32undef
= LLVMGetUndef(LLVMInt32TypeInContext(gallivm
->context
));
154 LLVMValueRef anative
, bnative
;
/* Number of src_type-width elements the intrinsic operates on. */
155 unsigned intrin_length
= intr_size
/ src_type
.width
;
157 intrin_type
.length
= intrin_length
;
/* Case 1: the intrinsic is wider than the source, so pad the operands. */
159 if (intrin_length
> src_type
.length
) {
160 LLVMValueRef elems
[LP_MAX_VECTOR_LENGTH
];
161 LLVMValueRef constvec
, tmp
;
/* Shuffle mask: the leading entries pick the source lanes in order. */
163 for (i
= 0; i
< src_type
.length
; i
++) {
164 elems
[i
] = lp_build_const_int32(gallivm
, i
);
/* Remaining mask entries up to intrin_length (loop body not visible). */
166 for (; i
< intrin_length
; i
++) {
/* A length-1 source is recast as a 1-element vector before shuffling. */
169 if (src_type
.length
== 1) {
170 LLVMTypeRef elem_type
= lp_build_elem_type(gallivm
, intrin_type
);
171 a
= LLVMBuildBitCast(builder
, a
, LLVMVectorType(elem_type
, 1), "");
172 b
= LLVMBuildBitCast(builder
, b
, LLVMVectorType(elem_type
, 1), "");
174 constvec
= LLVMConstVector(elems
, intrin_length
);
175 anative
= LLVMBuildShuffleVector(builder
, a
, a
, constvec
, "");
176 bnative
= LLVMBuildShuffleVector(builder
, b
, b
, constvec
, "");
177 tmp
= lp_build_intrinsic_binary(builder
, name
,
178 lp_build_vec_type(gallivm
, intrin_type
),
/* Narrow the intrinsic result back down to the source length. */
180 if (src_type
.length
> 1) {
181 constvec
= LLVMConstVector(elems
, src_type
.length
);
182 return LLVMBuildShuffleVector(builder
, tmp
, tmp
, constvec
, "");
185 return LLVMBuildExtractElement(builder
, tmp
, elems
[0], "");
/* Case 2: the intrinsic is narrower than the source, so work in pieces. */
188 else if (intrin_length
< src_type
.length
) {
189 unsigned num_vec
= src_type
.length
/ intrin_length
;
190 LLVMValueRef tmp
[LP_MAX_VECTOR_LENGTH
];
192 /* don't support arbitrary size here as this is so yuck */
193 if (src_type
.length
% intrin_length
) {
194 /* FIXME: This is something which should be supported
195 * but there doesn't seem to be any need for it currently
198 debug_printf("%s: should handle arbitrary vector size\n",
204 for (i
= 0; i
< num_vec
; i
++) {
205 anative
= lp_build_extract_range(gallivm
, a
, i
*intrin_length
,
207 bnative
= lp_build_extract_range(gallivm
, b
, i
*intrin_length
,
209 tmp
[i
] = lp_build_intrinsic_binary(builder
, name
,
210 lp_build_vec_type(gallivm
, intrin_type
),
213 return lp_build_concat(gallivm
, tmp
, intrin_type
, num_vec
);
216 return lp_build_intrinsic_binary(builder
, name
,
217 lp_build_vec_type(gallivm
, src_type
),
// Apply the intrinsic `name` to vector arguments one element at a time.
//
// ret_type is treated as a vector type: its element type becomes the
// return type of each individual call and its vector size n is the number
// of iterations. For every index i in [0, n), element i is extracted from
// each of the num_args arguments, lp_build_intrinsic() is called on those
// elements, and the result is inserted at index i of `res`, which starts
// out as an undef value of ret_type.
//
// num_args is asserted not to exceed LP_MAX_FUNC_ARGS, the size of the
// per-iteration arg_elems array.
//
// NOTE(review): this listing is incomplete -- the name, args and num_args
// parameter declarations, the declarations of i, j and res, and the end
// of the function are not visible. Presumably the assembled `res` vector
// is returned; confirm against the full source.
224 lp_build_intrinsic_map(struct gallivm_state
*gallivm
,
226 LLVMTypeRef ret_type
,
230 LLVMBuilderRef builder
= gallivm
->builder
;
231 LLVMTypeRef ret_elem_type
= LLVMGetElementType(ret_type
);
232 unsigned n
= LLVMGetVectorSize(ret_type
);
// arg_elems below is a fixed-size stack array; refuse to overrun it.
236 assert(num_args
<= LP_MAX_FUNC_ARGS
);
// Start from undef and fill in one element per iteration.
238 res
= LLVMGetUndef(ret_type
);
239 for(i
= 0; i
< n
; ++i
) {
240 LLVMValueRef index
= lp_build_const_int32(gallivm
, i
);
241 LLVMValueRef arg_elems
[LP_MAX_FUNC_ARGS
];
242 LLVMValueRef res_elem
;
// Gather element `index` of every argument vector.
243 for(j
= 0; j
< num_args
; ++j
)
244 arg_elems
[j
] = LLVMBuildExtractElement(builder
, args
[j
], index
, "");
245 res_elem
= lp_build_intrinsic(builder
, name
, ret_elem_type
, arg_elems
, num_args
);
246 res
= LLVMBuildInsertElement(builder
, res
, res_elem
, index
, "");
// Convenience wrapper around lp_build_intrinsic_map() for one operand.
//
// The operand `a` is passed by address as a one-element argument array;
// gallivm, name and ret_type are forwarded unchanged and the result of
// lp_build_intrinsic_map() is returned.
//
// NOTE(review): the declarations of the name and a parameters are not
// visible in this listing.
254 lp_build_intrinsic_map_unary(struct gallivm_state
*gallivm
,
256 LLVMTypeRef ret_type
,
259 return lp_build_intrinsic_map(gallivm
, name
, ret_type
, &a
, 1);
// Convenience wrapper around lp_build_intrinsic_map() for two operands.
//
// A local two-element array is handed to lp_build_intrinsic_map() together
// with gallivm, name and ret_type; its result is returned.
//
// NOTE(review): the statements that fill args[] and the declarations of
// the name and operand parameters are not visible in this listing;
// presumably the two operands are stored in call order. Confirm against
// the full source.
264 lp_build_intrinsic_map_binary(struct gallivm_state
*gallivm
,
266 LLVMTypeRef ret_type
,
270 LLVMValueRef args
[2];
275 return lp_build_intrinsic_map(gallivm
, name
, ret_type
, args
, 2);