1 /**************************************************************************
2 *
3 * Copyright 2009 VMware, Inc.
4 * All Rights Reserved.
5 *
6 * Permission is hereby granted, free of charge, to any person obtaining a
7 * copy of this software and associated documentation files (the
8 * "Software"), to deal in the Software without restriction, including
9 * without limitation the rights to use, copy, modify, merge, publish,
10 * distribute, sub license, and/or sell copies of the Software, and to
11 * permit persons to whom the Software is furnished to do so, subject to
12 * the following conditions:
13 *
14 * The above copyright notice and this permission notice (including the
15 * next paragraph) shall be included in all copies or substantial portions
16 * of the Software.
17 *
18 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
19 * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
20 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT.
21 * IN NO EVENT SHALL VMWARE AND/OR ITS SUPPLIERS BE LIABLE FOR
22 * ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
23 * TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
24 * SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
25 *
26 **************************************************************************/
27
28
29 /**
30 * @file
 * Helpers for emitting intrinsic calls.
32 *
 * LLVM vanilla IR doesn't represent all basic arithmetic operations we care
 * about, and it is often necessary to resort to target-specific intrinsics
 * for performance or convenience.
36 *
37 * Ideally we would like to stay away from target specific intrinsics and
38 * move all the instruction selection logic into upstream LLVM where it belongs.
39 *
40 * These functions are also used for calling C functions provided by us from
41 * generated LLVM code.
42 *
43 * @author Jose Fonseca <jfonseca@vmware.com>
44 */
45
46 #include <llvm/Config/llvm-config.h>
47
48 #include "util/u_debug.h"
49 #include "util/u_string.h"
50 #include "util/bitscan.h"
51
52 #include "lp_bld_const.h"
53 #include "lp_bld_intr.h"
54 #include "lp_bld_type.h"
55 #include "lp_bld_pack.h"
56 #include "lp_bld_debug.h"
57
58
59 void
lp_format_intrinsic(char * name,size_t size,const char * name_root,LLVMTypeRef type)60 lp_format_intrinsic(char *name,
61 size_t size,
62 const char *name_root,
63 LLVMTypeRef type)
64 {
65 unsigned length = 0;
66 unsigned width;
67 char c;
68
69 LLVMTypeKind kind = LLVMGetTypeKind(type);
70 if (kind == LLVMVectorTypeKind) {
71 length = LLVMGetVectorSize(type);
72 type = LLVMGetElementType(type);
73 kind = LLVMGetTypeKind(type);
74 }
75
76 switch (kind) {
77 case LLVMIntegerTypeKind:
78 c = 'i';
79 width = LLVMGetIntTypeWidth(type);
80 break;
81 case LLVMFloatTypeKind:
82 c = 'f';
83 width = 32;
84 break;
85 case LLVMDoubleTypeKind:
86 c = 'f';
87 width = 64;
88 break;
89 default:
90 unreachable("unexpected LLVMTypeKind");
91 }
92
93 if (length) {
94 snprintf(name, size, "%s.v%u%c%u", name_root, length, c, width);
95 } else {
96 snprintf(name, size, "%s.%c%u", name_root, c, width);
97 }
98 }
99
100
101 LLVMValueRef
lp_declare_intrinsic(LLVMModuleRef module,const char * name,LLVMTypeRef ret_type,LLVMTypeRef * arg_types,unsigned num_args)102 lp_declare_intrinsic(LLVMModuleRef module,
103 const char *name,
104 LLVMTypeRef ret_type,
105 LLVMTypeRef *arg_types,
106 unsigned num_args)
107 {
108 LLVMTypeRef function_type;
109 LLVMValueRef function;
110
111 assert(!LLVMGetNamedFunction(module, name));
112
113 function_type = LLVMFunctionType(ret_type, arg_types, num_args, 0);
114 function = LLVMAddFunction(module, name, function_type);
115
116 LLVMSetFunctionCallConv(function, LLVMCCallConv);
117 LLVMSetLinkage(function, LLVMExternalLinkage);
118
119 assert(LLVMIsDeclaration(function));
120
121 return function;
122 }
123
124
125 #if LLVM_VERSION_MAJOR < 4
lp_attr_to_llvm_attr(enum lp_func_attr attr)126 static LLVMAttribute lp_attr_to_llvm_attr(enum lp_func_attr attr)
127 {
128 switch (attr) {
129 case LP_FUNC_ATTR_ALWAYSINLINE: return LLVMAlwaysInlineAttribute;
130 case LP_FUNC_ATTR_INREG: return LLVMInRegAttribute;
131 case LP_FUNC_ATTR_NOALIAS: return LLVMNoAliasAttribute;
132 case LP_FUNC_ATTR_NOUNWIND: return LLVMNoUnwindAttribute;
133 case LP_FUNC_ATTR_READNONE: return LLVMReadNoneAttribute;
134 case LP_FUNC_ATTR_READONLY: return LLVMReadOnlyAttribute;
135 default:
136 _debug_printf("Unhandled function attribute: %x\n", attr);
137 return 0;
138 }
139 }
140
141 #else
142
attr_to_str(enum lp_func_attr attr)143 static const char *attr_to_str(enum lp_func_attr attr)
144 {
145 switch (attr) {
146 case LP_FUNC_ATTR_ALWAYSINLINE: return "alwaysinline";
147 case LP_FUNC_ATTR_INREG: return "inreg";
148 case LP_FUNC_ATTR_NOALIAS: return "noalias";
149 case LP_FUNC_ATTR_NOUNWIND: return "nounwind";
150 case LP_FUNC_ATTR_READNONE: return "readnone";
151 case LP_FUNC_ATTR_READONLY: return "readonly";
152 case LP_FUNC_ATTR_WRITEONLY: return "writeonly";
153 case LP_FUNC_ATTR_INACCESSIBLE_MEM_ONLY: return "inaccessiblememonly";
154 case LP_FUNC_ATTR_CONVERGENT: return "convergent";
155 default:
156 _debug_printf("Unhandled function attribute: %x\n", attr);
157 return 0;
158 }
159 }
160
161 #endif
162
163 void
lp_add_function_attr(LLVMValueRef function_or_call,int attr_idx,enum lp_func_attr attr)164 lp_add_function_attr(LLVMValueRef function_or_call,
165 int attr_idx, enum lp_func_attr attr)
166 {
167
168 #if LLVM_VERSION_MAJOR < 4
169 LLVMAttribute llvm_attr = lp_attr_to_llvm_attr(attr);
170 if (LLVMIsAFunction(function_or_call)) {
171 if (attr_idx == -1) {
172 LLVMAddFunctionAttr(function_or_call, llvm_attr);
173 } else {
174 LLVMAddAttribute(LLVMGetParam(function_or_call, attr_idx - 1), llvm_attr);
175 }
176 } else {
177 LLVMAddInstrAttribute(function_or_call, attr_idx, llvm_attr);
178 }
179 #else
180
181 LLVMModuleRef module;
182 if (LLVMIsAFunction(function_or_call)) {
183 module = LLVMGetGlobalParent(function_or_call);
184 } else {
185 LLVMBasicBlockRef bb = LLVMGetInstructionParent(function_or_call);
186 LLVMValueRef function = LLVMGetBasicBlockParent(bb);
187 module = LLVMGetGlobalParent(function);
188 }
189 LLVMContextRef ctx = LLVMGetModuleContext(module);
190
191 const char *attr_name = attr_to_str(attr);
192 unsigned kind_id = LLVMGetEnumAttributeKindForName(attr_name,
193 strlen(attr_name));
194 LLVMAttributeRef llvm_attr = LLVMCreateEnumAttribute(ctx, kind_id, 0);
195
196 if (LLVMIsAFunction(function_or_call))
197 LLVMAddAttributeAtIndex(function_or_call, attr_idx, llvm_attr);
198 else
199 LLVMAddCallSiteAttribute(function_or_call, attr_idx, llvm_attr);
200 #endif
201 }
202
203 static void
lp_add_func_attributes(LLVMValueRef function,unsigned attrib_mask)204 lp_add_func_attributes(LLVMValueRef function, unsigned attrib_mask)
205 {
206 /* NoUnwind indicates that the intrinsic never raises a C++ exception.
207 * Set it for all intrinsics.
208 */
209 attrib_mask |= LP_FUNC_ATTR_NOUNWIND;
210 attrib_mask &= ~LP_FUNC_ATTR_LEGACY;
211
212 while (attrib_mask) {
213 enum lp_func_attr attr = 1u << u_bit_scan(&attrib_mask);
214 lp_add_function_attr(function, -1, attr);
215 }
216 }
217
218 LLVMValueRef
lp_build_intrinsic(LLVMBuilderRef builder,const char * name,LLVMTypeRef ret_type,LLVMValueRef * args,unsigned num_args,unsigned attr_mask)219 lp_build_intrinsic(LLVMBuilderRef builder,
220 const char *name,
221 LLVMTypeRef ret_type,
222 LLVMValueRef *args,
223 unsigned num_args,
224 unsigned attr_mask)
225 {
226 LLVMModuleRef module = LLVMGetGlobalParent(LLVMGetBasicBlockParent(LLVMGetInsertBlock(builder)));
227 LLVMValueRef function, call;
228 bool set_callsite_attrs = LLVM_VERSION_MAJOR >= 4 &&
229 !(attr_mask & LP_FUNC_ATTR_LEGACY);
230
231 function = LLVMGetNamedFunction(module, name);
232 if(!function) {
233 LLVMTypeRef arg_types[LP_MAX_FUNC_ARGS];
234 unsigned i;
235
236 assert(num_args <= LP_MAX_FUNC_ARGS);
237
238 for(i = 0; i < num_args; ++i) {
239 assert(args[i]);
240 arg_types[i] = LLVMTypeOf(args[i]);
241 }
242
243 function = lp_declare_intrinsic(module, name, ret_type, arg_types, num_args);
244
245 /*
246 * If llvm removes an intrinsic we use, we'll hit this abort (rather
247 * than a call to address zero in the jited code).
248 */
249 if (LLVMGetIntrinsicID(function) == 0) {
250 _debug_printf("llvm (version " MESA_LLVM_VERSION_STRING
251 ") found no intrinsic for %s, going to crash...\n",
252 name);
253 abort();
254 }
255
256 if (!set_callsite_attrs)
257 lp_add_func_attributes(function, attr_mask);
258
259 if (gallivm_debug & GALLIVM_DEBUG_IR) {
260 lp_debug_dump_value(function);
261 }
262 }
263
264 call = LLVMBuildCall(builder, function, args, num_args, "");
265 if (set_callsite_attrs)
266 lp_add_func_attributes(call, attr_mask);
267 return call;
268 }
269
270
271 LLVMValueRef
lp_build_intrinsic_unary(LLVMBuilderRef builder,const char * name,LLVMTypeRef ret_type,LLVMValueRef a)272 lp_build_intrinsic_unary(LLVMBuilderRef builder,
273 const char *name,
274 LLVMTypeRef ret_type,
275 LLVMValueRef a)
276 {
277 return lp_build_intrinsic(builder, name, ret_type, &a, 1, 0);
278 }
279
280
281 LLVMValueRef
lp_build_intrinsic_binary(LLVMBuilderRef builder,const char * name,LLVMTypeRef ret_type,LLVMValueRef a,LLVMValueRef b)282 lp_build_intrinsic_binary(LLVMBuilderRef builder,
283 const char *name,
284 LLVMTypeRef ret_type,
285 LLVMValueRef a,
286 LLVMValueRef b)
287 {
288 LLVMValueRef args[2];
289
290 args[0] = a;
291 args[1] = b;
292
293 return lp_build_intrinsic(builder, name, ret_type, args, 2, 0);
294 }
295
296
297 /**
298 * Call intrinsic with arguments adapted to intrinsic vector length.
299 *
300 * Split vectors which are too large for the hw, or expand them if they
301 * are too small, so a caller calling a function which might use intrinsics
302 * doesn't need to do splitting/expansion on its own.
303 * This only supports intrinsics where src and dst types match.
304 */
305 LLVMValueRef
lp_build_intrinsic_binary_anylength(struct gallivm_state * gallivm,const char * name,struct lp_type src_type,unsigned intr_size,LLVMValueRef a,LLVMValueRef b)306 lp_build_intrinsic_binary_anylength(struct gallivm_state *gallivm,
307 const char *name,
308 struct lp_type src_type,
309 unsigned intr_size,
310 LLVMValueRef a,
311 LLVMValueRef b)
312 {
313 unsigned i;
314 struct lp_type intrin_type = src_type;
315 LLVMBuilderRef builder = gallivm->builder;
316 LLVMValueRef i32undef = LLVMGetUndef(LLVMInt32TypeInContext(gallivm->context));
317 LLVMValueRef anative, bnative;
318 unsigned intrin_length = intr_size / src_type.width;
319
320 intrin_type.length = intrin_length;
321
322 if (intrin_length > src_type.length) {
323 LLVMValueRef elems[LP_MAX_VECTOR_LENGTH];
324 LLVMValueRef constvec, tmp;
325
326 for (i = 0; i < src_type.length; i++) {
327 elems[i] = lp_build_const_int32(gallivm, i);
328 }
329 for (; i < intrin_length; i++) {
330 elems[i] = i32undef;
331 }
332 if (src_type.length == 1) {
333 LLVMTypeRef elem_type = lp_build_elem_type(gallivm, intrin_type);
334 a = LLVMBuildBitCast(builder, a, LLVMVectorType(elem_type, 1), "");
335 b = LLVMBuildBitCast(builder, b, LLVMVectorType(elem_type, 1), "");
336 }
337 constvec = LLVMConstVector(elems, intrin_length);
338 anative = LLVMBuildShuffleVector(builder, a, a, constvec, "");
339 bnative = LLVMBuildShuffleVector(builder, b, b, constvec, "");
340 tmp = lp_build_intrinsic_binary(builder, name,
341 lp_build_vec_type(gallivm, intrin_type),
342 anative, bnative);
343 if (src_type.length > 1) {
344 constvec = LLVMConstVector(elems, src_type.length);
345 return LLVMBuildShuffleVector(builder, tmp, tmp, constvec, "");
346 }
347 else {
348 return LLVMBuildExtractElement(builder, tmp, elems[0], "");
349 }
350 }
351 else if (intrin_length < src_type.length) {
352 unsigned num_vec = src_type.length / intrin_length;
353 LLVMValueRef tmp[LP_MAX_VECTOR_LENGTH];
354
355 /* don't support arbitrary size here as this is so yuck */
356 if (src_type.length % intrin_length) {
357 /* FIXME: This is something which should be supported
358 * but there doesn't seem to be any need for it currently
359 * so crash and burn.
360 */
361 debug_printf("%s: should handle arbitrary vector size\n",
362 __FUNCTION__);
363 assert(0);
364 return NULL;
365 }
366
367 for (i = 0; i < num_vec; i++) {
368 anative = lp_build_extract_range(gallivm, a, i*intrin_length,
369 intrin_length);
370 bnative = lp_build_extract_range(gallivm, b, i*intrin_length,
371 intrin_length);
372 tmp[i] = lp_build_intrinsic_binary(builder, name,
373 lp_build_vec_type(gallivm, intrin_type),
374 anative, bnative);
375 }
376 return lp_build_concat(gallivm, tmp, intrin_type, num_vec);
377 }
378 else {
379 return lp_build_intrinsic_binary(builder, name,
380 lp_build_vec_type(gallivm, src_type),
381 a, b);
382 }
383 }
384
385
386 LLVMValueRef
lp_build_intrinsic_map(struct gallivm_state * gallivm,const char * name,LLVMTypeRef ret_type,LLVMValueRef * args,unsigned num_args)387 lp_build_intrinsic_map(struct gallivm_state *gallivm,
388 const char *name,
389 LLVMTypeRef ret_type,
390 LLVMValueRef *args,
391 unsigned num_args)
392 {
393 LLVMBuilderRef builder = gallivm->builder;
394 LLVMTypeRef ret_elem_type = LLVMGetElementType(ret_type);
395 unsigned n = LLVMGetVectorSize(ret_type);
396 unsigned i, j;
397 LLVMValueRef res;
398
399 assert(num_args <= LP_MAX_FUNC_ARGS);
400
401 res = LLVMGetUndef(ret_type);
402 for(i = 0; i < n; ++i) {
403 LLVMValueRef index = lp_build_const_int32(gallivm, i);
404 LLVMValueRef arg_elems[LP_MAX_FUNC_ARGS];
405 LLVMValueRef res_elem;
406 for(j = 0; j < num_args; ++j)
407 arg_elems[j] = LLVMBuildExtractElement(builder, args[j], index, "");
408 res_elem = lp_build_intrinsic(builder, name, ret_elem_type, arg_elems, num_args, 0);
409 res = LLVMBuildInsertElement(builder, res, res_elem, index, "");
410 }
411
412 return res;
413 }
414
415
416 LLVMValueRef
lp_build_intrinsic_map_unary(struct gallivm_state * gallivm,const char * name,LLVMTypeRef ret_type,LLVMValueRef a)417 lp_build_intrinsic_map_unary(struct gallivm_state *gallivm,
418 const char *name,
419 LLVMTypeRef ret_type,
420 LLVMValueRef a)
421 {
422 return lp_build_intrinsic_map(gallivm, name, ret_type, &a, 1);
423 }
424
425
426 LLVMValueRef
lp_build_intrinsic_map_binary(struct gallivm_state * gallivm,const char * name,LLVMTypeRef ret_type,LLVMValueRef a,LLVMValueRef b)427 lp_build_intrinsic_map_binary(struct gallivm_state *gallivm,
428 const char *name,
429 LLVMTypeRef ret_type,
430 LLVMValueRef a,
431 LLVMValueRef b)
432 {
433 LLVMValueRef args[2];
434
435 args[0] = a;
436 args[1] = b;
437
438 return lp_build_intrinsic_map(gallivm, name, ret_type, args, 2);
439 }
440
441
442