1 /**************************************************************************
3 * Copyright 2011-2012 Advanced Micro Devices, Inc.
4 * Copyright 2009 VMware, Inc.
5 * Copyright 2007-2008 Tungsten Graphics, Inc., Cedar Park, Texas.
8 * Permission is hereby granted, free of charge, to any person obtaining a
9 * copy of this software and associated documentation files (the
10 * "Software"), to deal in the Software without restriction, including
11 * without limitation the rights to use, copy, modify, merge, publish,
12 * distribute, sub license, and/or sell copies of the Software, and to
13 * permit persons to whom the Software is furnished to do so, subject to
14 * the following conditions:
16 * The above copyright notice and this permission notice (including the
17 * next paragraph) shall be included in all copies or substantial portions
20 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
21 * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
22 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT.
23 * IN NO EVENT SHALL TUNGSTEN GRAPHICS AND/OR ITS SUPPLIERS BE LIABLE FOR
24 * ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
25 * TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
26 * SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
28 **************************************************************************/
32 * TGSI to LLVM IR translation.
34 * @author Jose Fonseca <jfonseca@vmware.com>
35 * @author Tom Stellard <thomas.stellard@amd.com>
37 * Based on tgsi_sse2.c code written by Michal Krol, Keith Whitwell,
38 * Brian Paul, and others.
42 #include "lp_bld_tgsi_action.h"
44 #include "lp_bld_tgsi.h"
45 #include "lp_bld_arit.h"
46 #include "lp_bld_bitarit.h"
47 #include "lp_bld_const.h"
48 #include "lp_bld_gather.h"
49 #include "lp_bld_logic.h"
51 #include "tgsi/tgsi_exec.h"
/* XXX: The CPU only defaults should be replaced by generic ones.  In most
 * cases, the CPU defaults are just wrappers around a function in
 * lp_bld_arit.c and these functions should be inlined here and the CPU
 * generic code should be removed and placed elsewhere.
 */
61 /* Generic fetch_arg functions */
63 static void scalar_unary_fetch_args(
64 struct lp_build_tgsi_context
* bld_base
,
65 struct lp_build_emit_data
* emit_data
)
68 emit_data
->args
[0] = lp_build_emit_fetch(bld_base
, emit_data
->inst
, 0, 0);
69 emit_data
->arg_count
= 1;
70 emit_data
->dst_type
= LLVMTypeOf(emit_data
->args
[0]);
73 static void scalar_binary_fetch_args(
74 struct lp_build_tgsi_context
* bld_base
,
75 struct lp_build_emit_data
* emit_data
)
78 emit_data
->args
[0] = lp_build_emit_fetch(bld_base
, emit_data
->inst
,
81 emit_data
->args
[1] = lp_build_emit_fetch(bld_base
, emit_data
->inst
,
83 emit_data
->arg_count
= 2;
84 emit_data
->dst_type
= LLVMTypeOf(emit_data
->args
[0]);
90 const struct lp_build_tgsi_action
* action
,
91 struct lp_build_tgsi_context
* bld_base
,
92 struct lp_build_emit_data
* emit_data
)
94 emit_data
->output
[emit_data
->chan
] = LLVMBuildFAdd(
95 bld_base
->base
.gallivm
->builder
,
96 emit_data
->args
[0], emit_data
->args
[1], "");
102 const struct lp_build_tgsi_action
* action
,
103 struct lp_build_tgsi_context
* bld_base
,
104 struct lp_build_emit_data
* emit_data
)
106 LLVMValueRef tmp
= lp_build_emit_llvm_unary(bld_base
, TGSI_OPCODE_ROUND
, emit_data
->args
[0]);
107 emit_data
->output
[emit_data
->chan
] = LLVMBuildFPToSI(bld_base
->base
.gallivm
->builder
, tmp
,
108 bld_base
->uint_bld
.vec_type
, "");
111 /* TGSI_OPCODE_CLAMP */
114 const struct lp_build_tgsi_action
* action
,
115 struct lp_build_tgsi_context
* bld_base
,
116 struct lp_build_emit_data
* emit_data
)
119 tmp
= lp_build_emit_llvm_binary(bld_base
, TGSI_OPCODE_MAX
,
122 emit_data
->output
[emit_data
->chan
] = lp_build_emit_llvm_binary(bld_base
,
123 TGSI_OPCODE_MIN
, tmp
, emit_data
->args
[2]);
130 struct lp_build_tgsi_context
* bld_base
,
131 struct lp_build_emit_data
* emit_data
,
132 unsigned dp_components
)
135 for (src
= 0; src
< 2; src
++) {
136 for (chan
= 0; chan
< dp_components
; chan
++) {
137 emit_data
->args
[(src
* dp_components
) + chan
] =
138 lp_build_emit_fetch(bld_base
, emit_data
->inst
, src
, chan
);
141 emit_data
->dst_type
= bld_base
->base
.elem_type
;
144 /* TGSI_OPCODE_DP2 */
147 struct lp_build_tgsi_context
* bld_base
,
148 struct lp_build_emit_data
* emit_data
)
150 dp_fetch_args(bld_base
, emit_data
, 2);
155 const struct lp_build_tgsi_action
* action
,
156 struct lp_build_tgsi_context
* bld_base
,
157 struct lp_build_emit_data
* emit_data
)
159 LLVMValueRef tmp0
, tmp1
;
160 tmp0
= lp_build_emit_llvm_binary(bld_base
, TGSI_OPCODE_MUL
,
161 emit_data
->args
[0] /* src0.x */,
162 emit_data
->args
[2] /* src1.x */);
163 tmp1
= lp_build_emit_llvm_binary(bld_base
, TGSI_OPCODE_MUL
,
164 emit_data
->args
[1] /* src0.y */,
165 emit_data
->args
[3] /* src1.y */);
166 emit_data
->output
[emit_data
->chan
] = lp_build_emit_llvm_binary(bld_base
,
167 TGSI_OPCODE_ADD
, tmp0
, tmp1
);
170 static struct lp_build_tgsi_action dp2_action
= {
171 dp2_fetch_args
, /* fetch_args */
175 /* TGSI_OPCODE_DP2A */
178 struct lp_build_tgsi_context
* bld_base
,
179 struct lp_build_emit_data
* emit_data
)
181 dp_fetch_args(bld_base
, emit_data
, 2);
182 emit_data
->args
[5] = lp_build_emit_fetch(bld_base
, emit_data
->inst
,
188 const struct lp_build_tgsi_action
* action
,
189 struct lp_build_tgsi_context
* bld_base
,
190 struct lp_build_emit_data
* emit_data
)
193 tmp
= lp_build_emit_llvm(bld_base
, TGSI_OPCODE_DP2
, emit_data
);
194 emit_data
->output
[emit_data
->chan
] = lp_build_emit_llvm_binary(bld_base
, TGSI_OPCODE_ADD
,
195 emit_data
->args
[5], tmp
);
198 static struct lp_build_tgsi_action dp2a_action
= {
199 dp2a_fetch_args
, /* fetch_args */
203 /* TGSI_OPCODE_DP3 */
206 struct lp_build_tgsi_context
* bld_base
,
207 struct lp_build_emit_data
* emit_data
)
209 dp_fetch_args(bld_base
, emit_data
, 3);
214 const struct lp_build_tgsi_action
* action
,
215 struct lp_build_tgsi_context
* bld_base
,
216 struct lp_build_emit_data
* emit_data
)
218 LLVMValueRef tmp0
, tmp1
;
219 tmp0
= lp_build_emit_llvm_binary(bld_base
, TGSI_OPCODE_MUL
,
220 emit_data
->args
[0] /* src0.x */,
221 emit_data
->args
[3] /* src1.x */);
222 tmp1
= lp_build_emit_llvm_binary(bld_base
, TGSI_OPCODE_MUL
,
223 emit_data
->args
[1] /* src0.y */,
224 emit_data
->args
[4] /* src1.y */);
225 tmp0
= lp_build_emit_llvm_binary(bld_base
, TGSI_OPCODE_ADD
, tmp1
, tmp0
);
226 tmp1
= lp_build_emit_llvm_binary(bld_base
, TGSI_OPCODE_MUL
,
227 emit_data
->args
[2] /* src0.z */,
228 emit_data
->args
[5] /* src1.z */);
229 emit_data
->output
[emit_data
->chan
] = lp_build_emit_llvm_binary(bld_base
,
230 TGSI_OPCODE_ADD
, tmp0
, tmp1
);
233 static struct lp_build_tgsi_action dp3_action
= {
234 dp3_fetch_args
, /* fetch_args */
/* TGSI_OPCODE_DP4 */
242 struct lp_build_tgsi_context
* bld_base
,
243 struct lp_build_emit_data
* emit_data
)
245 dp_fetch_args(bld_base
, emit_data
, 4);
250 const struct lp_build_tgsi_action
* action
,
251 struct lp_build_tgsi_context
* bld_base
,
252 struct lp_build_emit_data
* emit_data
)
254 LLVMValueRef tmp0
, tmp1
;
255 tmp0
= lp_build_emit_llvm_binary(bld_base
, TGSI_OPCODE_MUL
,
256 emit_data
->args
[0] /* src0.x */,
257 emit_data
->args
[4] /* src1.x */);
258 tmp1
= lp_build_emit_llvm_binary(bld_base
, TGSI_OPCODE_MUL
,
259 emit_data
->args
[1] /* src0.y */,
260 emit_data
->args
[5] /* src1.y */);
261 tmp0
= lp_build_emit_llvm_binary(bld_base
, TGSI_OPCODE_ADD
, tmp0
, tmp1
);
262 tmp1
= lp_build_emit_llvm_binary(bld_base
, TGSI_OPCODE_MUL
,
263 emit_data
->args
[2] /* src0.z */,
264 emit_data
->args
[6] /* src1.z */);
265 tmp0
= lp_build_emit_llvm_binary(bld_base
, TGSI_OPCODE_ADD
, tmp0
, tmp1
);
266 tmp1
= lp_build_emit_llvm_binary(bld_base
, TGSI_OPCODE_MUL
,
267 emit_data
->args
[3] /* src0.w */,
268 emit_data
->args
[7] /* src1.w */);
269 emit_data
->output
[emit_data
->chan
] = lp_build_emit_llvm_binary(bld_base
,
270 TGSI_OPCODE_ADD
, tmp0
, tmp1
);
273 static struct lp_build_tgsi_action dp4_action
= {
274 dp4_fetch_args
, /* fetch_args */
278 /* TGSI_OPCODE_DPH */
281 struct lp_build_tgsi_context
* bld_base
,
282 struct lp_build_emit_data
* emit_data
)
284 dp_fetch_args(bld_base
, emit_data
, 4);
286 emit_data
->args
[3] = bld_base
->base
.one
;
289 const struct lp_build_tgsi_action dph_action
= {
290 dph_fetch_args
, /* fetch_args */
294 /* TGSI_OPCODE_DST */
297 struct lp_build_tgsi_context
* bld_base
,
298 struct lp_build_emit_data
* emit_data
)
301 emit_data
->args
[0] = lp_build_emit_fetch(bld_base
, emit_data
->inst
,
304 emit_data
->args
[1] = lp_build_emit_fetch(bld_base
, emit_data
->inst
,
307 emit_data
->args
[2] = lp_build_emit_fetch(bld_base
, emit_data
->inst
,
310 emit_data
->args
[3] = lp_build_emit_fetch(bld_base
, emit_data
->inst
,
316 const struct lp_build_tgsi_action
* action
,
317 struct lp_build_tgsi_context
* bld_base
,
318 struct lp_build_emit_data
* emit_data
)
321 emit_data
->output
[TGSI_CHAN_X
] = bld_base
->base
.one
;
324 emit_data
->output
[TGSI_CHAN_Y
] = lp_build_emit_llvm_binary(bld_base
,
326 emit_data
->args
[0] /* src0.y */,
327 emit_data
->args
[2] /* src1.y */);
329 emit_data
->output
[TGSI_CHAN_Z
] = emit_data
->args
[1]; /* src0.z */
332 emit_data
->output
[TGSI_CHAN_W
] = emit_data
->args
[3]; /* src1.w */
335 static struct lp_build_tgsi_action dst_action
= {
336 dst_fetch_args
, /* fetch_args */
340 /* TGSI_OPCODE_END */
343 const struct lp_build_tgsi_action
* action
,
344 struct lp_build_tgsi_context
* bld_base
,
345 struct lp_build_emit_data
* emit_data
)
350 /* TGSI_OPCODE_EXP */
354 const struct lp_build_tgsi_action
* action
,
355 struct lp_build_tgsi_context
* bld_base
,
356 struct lp_build_emit_data
* emit_data
)
358 LLVMValueRef floor_x
;
360 /* floor( src0.x ) */
361 floor_x
= lp_build_emit_llvm_unary(bld_base
, TGSI_OPCODE_FLR
,
364 /* 2 ^ floor( src0.x ) */
365 emit_data
->output
[TGSI_CHAN_X
] = lp_build_emit_llvm_unary(bld_base
,
366 TGSI_OPCODE_EX2
, floor_x
);
368 /* src0.x - floor( src0.x ) */
369 emit_data
->output
[TGSI_CHAN_Y
] = lp_build_emit_llvm_binary(bld_base
,
370 TGSI_OPCODE_SUB
, emit_data
->args
[0] /* src0.x */, floor_x
);
373 emit_data
->output
[TGSI_CHAN_Z
] = lp_build_emit_llvm_unary(bld_base
,
374 TGSI_OPCODE_EX2
, emit_data
->args
[0] /* src0.x */);
376 emit_data
->output
[TGSI_CHAN_W
] = bld_base
->base
.one
;
379 const struct lp_build_tgsi_action exp_action
= {
380 scalar_unary_fetch_args
, /* fetch_args */
384 /* TGSI_OPCODE_FRC */
388 const struct lp_build_tgsi_action
* action
,
389 struct lp_build_tgsi_context
* bld_base
,
390 struct lp_build_emit_data
* emit_data
)
393 tmp
= lp_build_emit_llvm_unary(bld_base
, TGSI_OPCODE_FLR
,
395 emit_data
->output
[emit_data
->chan
] = lp_build_emit_llvm_binary(bld_base
,
396 TGSI_OPCODE_SUB
, emit_data
->args
[0], tmp
);
399 /* TGSI_OPCODE_KIL */
403 struct lp_build_tgsi_context
* bld_base
,
404 struct lp_build_emit_data
* emit_data
)
407 emit_data
->args
[0] = lp_build_emit_fetch(bld_base
, emit_data
->inst
,
410 emit_data
->args
[1] = lp_build_emit_fetch(bld_base
, emit_data
->inst
,
413 emit_data
->args
[2] = lp_build_emit_fetch(bld_base
, emit_data
->inst
,
416 emit_data
->args
[3] = lp_build_emit_fetch(bld_base
, emit_data
->inst
,
418 emit_data
->arg_count
= 4;
419 emit_data
->dst_type
= LLVMVoidTypeInContext(bld_base
->base
.gallivm
->context
);
422 /* TGSI_OPCODE_KILP */
426 struct lp_build_tgsi_context
* bld_base
,
427 struct lp_build_emit_data
* emit_data
)
429 emit_data
->dst_type
= LLVMVoidTypeInContext(bld_base
->base
.gallivm
->context
);
432 /* TGSI_OPCODE_LIT */
436 struct lp_build_tgsi_context
* bld_base
,
437 struct lp_build_emit_data
* emit_data
)
440 emit_data
->args
[0] = lp_build_emit_fetch(bld_base
, emit_data
->inst
, 0, TGSI_CHAN_X
);
442 emit_data
->args
[1] = lp_build_emit_fetch(bld_base
, emit_data
->inst
, 0, TGSI_CHAN_Y
);
444 emit_data
->args
[2] = lp_build_emit_fetch(bld_base
, emit_data
->inst
, 0, TGSI_CHAN_W
);
445 emit_data
->arg_count
= 3;
450 const struct lp_build_tgsi_action
* action
,
451 struct lp_build_tgsi_context
* bld_base
,
452 struct lp_build_emit_data
* emit_data
)
454 LLVMValueRef tmp0
, tmp1
, tmp2
;
457 emit_data
->output
[TGSI_CHAN_X
] = bld_base
->base
.one
;
460 emit_data
->output
[TGSI_CHAN_Y
] = lp_build_emit_llvm_binary(bld_base
,
462 emit_data
->args
[0] /* src0.x */,
463 bld_base
->base
.zero
);
466 /* XMM[1] = SrcReg[0].yyyy */
467 tmp1
= emit_data
->args
[1];
468 /* XMM[1] = max(XMM[1], 0) */
469 tmp1
= lp_build_emit_llvm_binary(bld_base
, TGSI_OPCODE_MAX
,
470 tmp1
, bld_base
->base
.zero
);
471 /* XMM[2] = SrcReg[0].wwww */
472 tmp2
= emit_data
->args
[2];
473 tmp1
= lp_build_emit_llvm_binary(bld_base
, TGSI_OPCODE_POW
,
475 tmp0
= emit_data
->args
[0];
476 emit_data
->output
[TGSI_CHAN_Z
] = lp_build_emit_llvm_ternary(bld_base
,
478 tmp0
, bld_base
->base
.zero
, tmp1
);
480 emit_data
->output
[TGSI_CHAN_W
] = bld_base
->base
.one
;
483 static struct lp_build_tgsi_action lit_action
= {
484 lit_fetch_args
, /* fetch_args */
488 /* TGSI_OPCODE_LOG */
492 const struct lp_build_tgsi_action
* action
,
493 struct lp_build_tgsi_context
* bld_base
,
494 struct lp_build_emit_data
* emit_data
)
497 LLVMValueRef abs_x
, log_abs_x
, flr_log_abs_x
, ex2_flr_log_abs_x
;
500 abs_x
= lp_build_emit_llvm_unary(bld_base
, TGSI_OPCODE_ABS
,
501 emit_data
->args
[0] /* src0.x */);
503 /* log( abs( src0.x ) ) */
504 log_abs_x
= lp_build_emit_llvm_unary(bld_base
, TGSI_OPCODE_LG2
,
507 /* floor( log( abs( src0.x ) ) ) */
508 flr_log_abs_x
= lp_build_emit_llvm_unary(bld_base
, TGSI_OPCODE_FLR
,
511 emit_data
->output
[TGSI_CHAN_X
] = flr_log_abs_x
;
514 ex2_flr_log_abs_x
= lp_build_emit_llvm_unary(bld_base
, TGSI_OPCODE_EX2
,
517 /* abs( src0.x ) / 2^( floor( lg2( abs( src0.x ) ) ) ) */
518 emit_data
->output
[TGSI_CHAN_Y
] = lp_build_emit_llvm_binary(bld_base
,
519 TGSI_OPCODE_DIV
, abs_x
, ex2_flr_log_abs_x
);
522 emit_data
->output
[TGSI_CHAN_Z
] = log_abs_x
;
525 emit_data
->output
[TGSI_CHAN_W
] = bld_base
->base
.one
;
528 static struct lp_build_tgsi_action log_action
= {
529 scalar_unary_fetch_args
, /* fetch_args */
533 /* TGSI_OPCODE_LRP */
537 const struct lp_build_tgsi_action
* action
,
538 struct lp_build_tgsi_context
* bld_base
,
539 struct lp_build_emit_data
* emit_data
)
542 tmp
= lp_build_emit_llvm_binary(bld_base
, TGSI_OPCODE_SUB
,
545 emit_data
->output
[emit_data
->chan
] = lp_build_emit_llvm_ternary(bld_base
,
546 TGSI_OPCODE_MAD
, emit_data
->args
[0], tmp
, emit_data
->args
[2]);
549 /* TGSI_OPCODE_MAD */
553 const struct lp_build_tgsi_action
* action
,
554 struct lp_build_tgsi_context
* bld_base
,
555 struct lp_build_emit_data
* emit_data
)
558 tmp
= lp_build_emit_llvm_binary(bld_base
, TGSI_OPCODE_MUL
,
561 emit_data
->output
[emit_data
->chan
] = lp_build_emit_llvm_binary(bld_base
,
562 TGSI_OPCODE_ADD
, tmp
, emit_data
->args
[2]);
565 /* TGSI_OPCODE_MOV */
569 const struct lp_build_tgsi_action
* action
,
570 struct lp_build_tgsi_context
* bld_base
,
571 struct lp_build_emit_data
* emit_data
)
573 emit_data
->output
[emit_data
->chan
] = emit_data
->args
[0];
576 /* TGSI_OPCODE_MUL */
579 const struct lp_build_tgsi_action
* action
,
580 struct lp_build_tgsi_context
* bld_base
,
581 struct lp_build_emit_data
* emit_data
)
583 emit_data
->output
[emit_data
->chan
] = lp_build_mul(&bld_base
->base
,
584 emit_data
->args
[0], emit_data
->args
[1]);
587 /*.TGSI_OPCODE_DIV.*/
588 static void fdiv_emit(
589 const struct lp_build_tgsi_action
* action
,
590 struct lp_build_tgsi_context
* bld_base
,
591 struct lp_build_emit_data
* emit_data
)
593 emit_data
->output
[emit_data
->chan
] = LLVMBuildFDiv(
594 bld_base
->base
.gallivm
->builder
,
595 emit_data
->args
[0], emit_data
->args
[1], "");
598 /*.TGSI_OPCODE_RCP.*/
599 static void rcp_emit(
600 const struct lp_build_tgsi_action
* action
,
601 struct lp_build_tgsi_context
* bld_base
,
602 struct lp_build_emit_data
* emit_data
)
605 one
= lp_build_const_float(bld_base
->base
.gallivm
, 1.0f
);
606 emit_data
->output
[emit_data
->chan
] = lp_build_emit_llvm_binary(bld_base
,
607 TGSI_OPCODE_DIV
, one
, emit_data
->args
[0]);
610 /* TGSI_OPCODE_POW */
614 const struct lp_build_tgsi_action
* action
,
615 struct lp_build_tgsi_context
* bld_base
,
616 struct lp_build_emit_data
* emit_data
)
618 emit_data
->output
[emit_data
->chan
] = lp_build_pow(&bld_base
->base
,
619 emit_data
->args
[0], emit_data
->args
[1]);
622 static struct lp_build_tgsi_action pow_action
= {
623 scalar_binary_fetch_args
, /* fetch_args */
627 /* TGSI_OPCODE_RSQ */
631 const struct lp_build_tgsi_action
* action
,
632 struct lp_build_tgsi_context
* bld_base
,
633 struct lp_build_emit_data
* emit_data
)
635 emit_data
->args
[0] = lp_build_emit_llvm_unary(bld_base
, TGSI_OPCODE_ABS
,
637 if (bld_base
->rsq_action
.emit
) {
638 bld_base
->rsq_action
.emit(&bld_base
->rsq_action
, bld_base
, emit_data
);
640 emit_data
->output
[emit_data
->chan
] = bld_base
->base
.undef
;
644 const struct lp_build_tgsi_action rsq_action
= {
645 scalar_unary_fetch_args
, /* fetch_args */
650 /* TGSI_OPCODE_SCS */
653 const struct lp_build_tgsi_action
* action
,
654 struct lp_build_tgsi_context
* bld_base
,
655 struct lp_build_emit_data
* emit_data
)
658 emit_data
->output
[TGSI_CHAN_X
] = lp_build_emit_llvm_unary(bld_base
,
659 TGSI_OPCODE_COS
, emit_data
->args
[0]);
661 emit_data
->output
[TGSI_CHAN_Y
] = lp_build_emit_llvm_unary(bld_base
,
662 TGSI_OPCODE_SIN
, emit_data
->args
[0]);
664 emit_data
->output
[TGSI_CHAN_Z
] = bld_base
->base
.zero
;
667 emit_data
->output
[TGSI_CHAN_W
] = bld_base
->base
.one
;
670 const struct lp_build_tgsi_action scs_action
= {
671 scalar_unary_fetch_args
, /* fetch_args */
675 /* TGSI_OPCODE_SFL */
679 const struct lp_build_tgsi_action
* action
,
680 struct lp_build_tgsi_context
* bld_base
,
681 struct lp_build_emit_data
* emit_data
)
683 emit_data
->output
[emit_data
->chan
] = bld_base
->base
.zero
;
686 /* TGSI_OPCODE_STR */
690 const struct lp_build_tgsi_action
* action
,
691 struct lp_build_tgsi_context
* bld_base
,
692 struct lp_build_emit_data
* emit_data
)
694 emit_data
->output
[emit_data
->chan
] = bld_base
->base
.one
;
697 /* TGSI_OPCODE_SUB */
700 const struct lp_build_tgsi_action
* action
,
701 struct lp_build_tgsi_context
* bld_base
,
702 struct lp_build_emit_data
* emit_data
)
704 emit_data
->output
[emit_data
->chan
] = LLVMBuildFSub(
705 bld_base
->base
.gallivm
->builder
,
707 emit_data
->args
[1], "");
710 /* TGSI_OPCODE_U2F */
713 const struct lp_build_tgsi_action
* action
,
714 struct lp_build_tgsi_context
* bld_base
,
715 struct lp_build_emit_data
* emit_data
)
717 emit_data
->output
[emit_data
->chan
] = LLVMBuildUIToFP(bld_base
->base
.gallivm
->builder
,
719 bld_base
->base
.vec_type
, "");
724 const struct lp_build_tgsi_action
* action
,
725 struct lp_build_tgsi_context
* bld_base
,
726 struct lp_build_emit_data
* emit_data
)
729 tmp
= lp_build_emit_llvm_binary(bld_base
, TGSI_OPCODE_UMUL
,
732 emit_data
->output
[emit_data
->chan
] = lp_build_emit_llvm_binary(bld_base
,
733 TGSI_OPCODE_UADD
, tmp
, emit_data
->args
[2]);
736 /* TGSI_OPCODE_UMUL */
739 const struct lp_build_tgsi_action
* action
,
740 struct lp_build_tgsi_context
* bld_base
,
741 struct lp_build_emit_data
* emit_data
)
743 emit_data
->output
[emit_data
->chan
] = lp_build_mul(&bld_base
->uint_bld
,
744 emit_data
->args
[0], emit_data
->args
[1]);
747 /* TGSI_OPCODE_XPD */
751 struct lp_build_tgsi_context
* bld_base
,
752 struct lp_build_emit_data
* emit_data
)
754 dp_fetch_args(bld_base
, emit_data
, 3);
762 struct lp_build_tgsi_context
* bld_base
,
768 LLVMValueRef tmp0
, tmp1
;
770 tmp0
= lp_build_emit_llvm_binary(bld_base
, TGSI_OPCODE_MUL
, a
, b
);
771 tmp1
= lp_build_emit_llvm_binary(bld_base
, TGSI_OPCODE_MUL
, c
, d
);
773 return lp_build_emit_llvm_binary(bld_base
, TGSI_OPCODE_SUB
, tmp0
, tmp1
);
778 const struct lp_build_tgsi_action
* action
,
779 struct lp_build_tgsi_context
* bld_base
,
780 struct lp_build_emit_data
* emit_data
)
782 emit_data
->output
[TGSI_CHAN_X
] = xpd_helper(bld_base
,
783 emit_data
->args
[1] /* src0.y */, emit_data
->args
[5] /* src1.z */,
784 emit_data
->args
[4] /* src1.y */, emit_data
->args
[2] /* src0.z */);
786 emit_data
->output
[TGSI_CHAN_Y
] = xpd_helper(bld_base
,
787 emit_data
->args
[2] /* src0.z */, emit_data
->args
[3] /* src1.x */,
788 emit_data
->args
[5] /* src1.z */, emit_data
->args
[0] /* src0.x */);
790 emit_data
->output
[TGSI_CHAN_Z
] = xpd_helper(bld_base
,
791 emit_data
->args
[0] /* src0.x */, emit_data
->args
[4] /* src1.y */,
792 emit_data
->args
[3] /* src1.x */, emit_data
->args
[1] /* src0.y */);
794 emit_data
->output
[TGSI_CHAN_W
] = bld_base
->base
.one
;
797 const struct lp_build_tgsi_action xpd_action
= {
798 xpd_fetch_args
, /* fetch_args */
803 lp_set_default_actions(struct lp_build_tgsi_context
* bld_base
)
805 bld_base
->op_actions
[TGSI_OPCODE_DP2
] = dp2_action
;
806 bld_base
->op_actions
[TGSI_OPCODE_DP3
] = dp3_action
;
807 bld_base
->op_actions
[TGSI_OPCODE_DP4
] = dp4_action
;
808 bld_base
->op_actions
[TGSI_OPCODE_DP2A
] = dp2a_action
;
809 bld_base
->op_actions
[TGSI_OPCODE_DPH
] = dph_action
;
810 bld_base
->op_actions
[TGSI_OPCODE_DST
] = dst_action
;
811 bld_base
->op_actions
[TGSI_OPCODE_EXP
] = exp_action
;
812 bld_base
->op_actions
[TGSI_OPCODE_LIT
] = lit_action
;
813 bld_base
->op_actions
[TGSI_OPCODE_LOG
] = log_action
;
814 bld_base
->op_actions
[TGSI_OPCODE_RSQ
] = rsq_action
;
815 bld_base
->op_actions
[TGSI_OPCODE_POW
] = pow_action
;
816 bld_base
->op_actions
[TGSI_OPCODE_SCS
] = scs_action
;
817 bld_base
->op_actions
[TGSI_OPCODE_XPD
] = xpd_action
;
819 bld_base
->op_actions
[TGSI_OPCODE_COS
].fetch_args
= scalar_unary_fetch_args
;
820 bld_base
->op_actions
[TGSI_OPCODE_EX2
].fetch_args
= scalar_unary_fetch_args
;
821 bld_base
->op_actions
[TGSI_OPCODE_IF
].fetch_args
= scalar_unary_fetch_args
;
822 bld_base
->op_actions
[TGSI_OPCODE_KIL
].fetch_args
= kil_fetch_args
;
823 bld_base
->op_actions
[TGSI_OPCODE_KILP
].fetch_args
= kilp_fetch_args
;
824 bld_base
->op_actions
[TGSI_OPCODE_RCP
].fetch_args
= scalar_unary_fetch_args
;
825 bld_base
->op_actions
[TGSI_OPCODE_SIN
].fetch_args
= scalar_unary_fetch_args
;
826 bld_base
->op_actions
[TGSI_OPCODE_LG2
].fetch_args
= scalar_unary_fetch_args
;
828 bld_base
->op_actions
[TGSI_OPCODE_ADD
].emit
= add_emit
;
829 bld_base
->op_actions
[TGSI_OPCODE_ARR
].emit
= arr_emit
;
830 bld_base
->op_actions
[TGSI_OPCODE_CLAMP
].emit
= clamp_emit
;
831 bld_base
->op_actions
[TGSI_OPCODE_END
].emit
= end_emit
;
832 bld_base
->op_actions
[TGSI_OPCODE_FRC
].emit
= frc_emit
;
833 bld_base
->op_actions
[TGSI_OPCODE_LRP
].emit
= lrp_emit
;
834 bld_base
->op_actions
[TGSI_OPCODE_MAD
].emit
= mad_emit
;
835 bld_base
->op_actions
[TGSI_OPCODE_MOV
].emit
= mov_emit
;
836 bld_base
->op_actions
[TGSI_OPCODE_MUL
].emit
= mul_emit
;
837 bld_base
->op_actions
[TGSI_OPCODE_DIV
].emit
= fdiv_emit
;
838 bld_base
->op_actions
[TGSI_OPCODE_RCP
].emit
= rcp_emit
;
839 bld_base
->op_actions
[TGSI_OPCODE_SFL
].emit
= sfl_emit
;
840 bld_base
->op_actions
[TGSI_OPCODE_STR
].emit
= str_emit
;
841 bld_base
->op_actions
[TGSI_OPCODE_SUB
].emit
= sub_emit
;
843 bld_base
->op_actions
[TGSI_OPCODE_UARL
].emit
= mov_emit
;
844 bld_base
->op_actions
[TGSI_OPCODE_U2F
].emit
= u2f_emit
;
845 bld_base
->op_actions
[TGSI_OPCODE_UMAD
].emit
= umad_emit
;
846 bld_base
->op_actions
[TGSI_OPCODE_UMUL
].emit
= umul_emit
;
849 /* CPU Only default actions */
851 /* These actions are CPU only, because they could potentially output SSE
855 /* TGSI_OPCODE_ABS (CPU Only)*/
859 const struct lp_build_tgsi_action
* action
,
860 struct lp_build_tgsi_context
* bld_base
,
861 struct lp_build_emit_data
* emit_data
)
863 emit_data
->output
[emit_data
->chan
] = lp_build_abs(&bld_base
->base
,
867 /* TGSI_OPCODE_ADD (CPU Only) */
870 const struct lp_build_tgsi_action
* action
,
871 struct lp_build_tgsi_context
* bld_base
,
872 struct lp_build_emit_data
* emit_data
)
874 emit_data
->output
[emit_data
->chan
] = lp_build_add(&bld_base
->base
,
875 emit_data
->args
[0], emit_data
->args
[1]);
878 /* TGSI_OPCODE_AND (CPU Only) */
881 const struct lp_build_tgsi_action
* action
,
882 struct lp_build_tgsi_context
* bld_base
,
883 struct lp_build_emit_data
* emit_data
)
885 emit_data
->output
[emit_data
->chan
] = lp_build_and(&bld_base
->uint_bld
,
886 emit_data
->args
[0], emit_data
->args
[1]);
889 /* TGSI_OPCODE_ARL (CPU Only) */
892 const struct lp_build_tgsi_action
* action
,
893 struct lp_build_tgsi_context
* bld_base
,
894 struct lp_build_emit_data
* emit_data
)
897 tmp
= lp_build_floor(&bld_base
->base
,
899 emit_data
->output
[emit_data
->chan
] = LLVMBuildFPToSI(bld_base
->base
.gallivm
->builder
, tmp
,
900 bld_base
->uint_bld
.vec_type
, "");
903 /* TGSI_OPCODE_ARR (CPU Only) */
906 const struct lp_build_tgsi_action
* action
,
907 struct lp_build_tgsi_context
* bld_base
,
908 struct lp_build_emit_data
* emit_data
)
910 emit_data
->output
[emit_data
->chan
] = lp_build_iround(&bld_base
->base
, emit_data
->args
[0]);
913 /* TGSI_OPCODE_CEIL (CPU Only) */
916 const struct lp_build_tgsi_action
* action
,
917 struct lp_build_tgsi_context
* bld_base
,
918 struct lp_build_emit_data
* emit_data
)
920 emit_data
->output
[emit_data
->chan
] = lp_build_ceil(&bld_base
->base
,
924 /* TGSI_OPCODE_CMP (CPU Only) */
927 const struct lp_build_tgsi_action
* action
,
928 struct lp_build_tgsi_context
* bld_base
,
929 struct lp_build_emit_data
* emit_data
)
931 LLVMValueRef cond
= lp_build_cmp(&bld_base
->base
, PIPE_FUNC_LESS
,
932 emit_data
->args
[0], bld_base
->base
.zero
);
933 emit_data
->output
[emit_data
->chan
] = lp_build_select(&bld_base
->base
,
934 cond
, emit_data
->args
[1], emit_data
->args
[2]);
937 /* TGSI_OPCODE_CND (CPU Only) */
940 const struct lp_build_tgsi_action
* action
,
941 struct lp_build_tgsi_context
* bld_base
,
942 struct lp_build_emit_data
* emit_data
)
944 LLVMValueRef half
, tmp
;
945 half
= lp_build_const_vec(bld_base
->base
.gallivm
, bld_base
->base
.type
, 0.5);
946 tmp
= lp_build_cmp(&bld_base
->base
, PIPE_FUNC_GREATER
,
947 emit_data
->args
[2], half
);
948 emit_data
->output
[emit_data
->chan
] = lp_build_select(&bld_base
->base
,
954 /* TGSI_OPCODE_COS (CPU Only) */
957 const struct lp_build_tgsi_action
* action
,
958 struct lp_build_tgsi_context
* bld_base
,
959 struct lp_build_emit_data
* emit_data
)
961 emit_data
->output
[emit_data
->chan
] = lp_build_cos(&bld_base
->base
,
965 /* TGSI_OPCODE_DIV (CPU Only) */
968 const struct lp_build_tgsi_action
* action
,
969 struct lp_build_tgsi_context
* bld_base
,
970 struct lp_build_emit_data
* emit_data
)
972 emit_data
->output
[emit_data
->chan
] = lp_build_div(&bld_base
->base
,
973 emit_data
->args
[0], emit_data
->args
[1]);
976 /* TGSI_OPCODE_EX2 (CPU Only) */
979 const struct lp_build_tgsi_action
* action
,
980 struct lp_build_tgsi_context
* bld_base
,
981 struct lp_build_emit_data
* emit_data
)
983 emit_data
->output
[emit_data
->chan
] = lp_build_exp2(&bld_base
->base
,
987 /* TGSI_OPCODE_EXP (CPU Only) */
990 const struct lp_build_tgsi_action
* action
,
991 struct lp_build_tgsi_context
* bld_base
,
992 struct lp_build_emit_data
* emit_data
)
994 lp_build_exp2_approx(&bld_base
->base
, emit_data
->args
[0],
995 &emit_data
->output
[TGSI_CHAN_X
],
996 &emit_data
->output
[TGSI_CHAN_Y
],
997 &emit_data
->output
[TGSI_CHAN_Z
]);
998 emit_data
->output
[TGSI_CHAN_W
] = bld_base
->base
.one
;
1001 /* TGSI_OPCODE_F2I (CPU Only) */
1004 const struct lp_build_tgsi_action
* action
,
1005 struct lp_build_tgsi_context
* bld_base
,
1006 struct lp_build_emit_data
* emit_data
)
1008 emit_data
->output
[emit_data
->chan
] = lp_build_itrunc(&bld_base
->base
,
1009 emit_data
->args
[0]);
1012 /* TGSI_OPCODE_F2U (CPU Only) */
1015 const struct lp_build_tgsi_action
* action
,
1016 struct lp_build_tgsi_context
* bld_base
,
1017 struct lp_build_emit_data
* emit_data
)
1019 /* FIXME: implement and use lp_build_utrunc() */
1020 emit_data
->output
[emit_data
->chan
] = lp_build_itrunc(&bld_base
->base
,
1021 emit_data
->args
[0]);
1024 /* TGSI_OPCODE_FLR (CPU Only) */
1028 const struct lp_build_tgsi_action
* action
,
1029 struct lp_build_tgsi_context
* bld_base
,
1030 struct lp_build_emit_data
* emit_data
)
1032 emit_data
->output
[emit_data
->chan
] = lp_build_floor(&bld_base
->base
,
1033 emit_data
->args
[0]);
1036 /* TGSI_OPCODE_I2F (CPU Only) */
1039 const struct lp_build_tgsi_action
* action
,
1040 struct lp_build_tgsi_context
* bld_base
,
1041 struct lp_build_emit_data
* emit_data
)
1043 emit_data
->output
[emit_data
->chan
] = lp_build_int_to_float(&bld_base
->base
,
1044 emit_data
->args
[0]);
1047 /* TGSI_OPCODE_IABS (CPU Only) */
1050 const struct lp_build_tgsi_action
* action
,
1051 struct lp_build_tgsi_context
* bld_base
,
1052 struct lp_build_emit_data
* emit_data
)
1054 emit_data
->output
[emit_data
->chan
] = lp_build_abs(&bld_base
->int_bld
,
1055 emit_data
->args
[0]);
1058 /* TGSI_OPCODE_IDIV (CPU Only) */
1061 const struct lp_build_tgsi_action
* action
,
1062 struct lp_build_tgsi_context
* bld_base
,
1063 struct lp_build_emit_data
* emit_data
)
1065 emit_data
->output
[emit_data
->chan
] = lp_build_div(&bld_base
->int_bld
,
1066 emit_data
->args
[0], emit_data
->args
[1]);
1069 /* TGSI_OPCODE_INEG (CPU Only) */
1072 const struct lp_build_tgsi_action
* action
,
1073 struct lp_build_tgsi_context
* bld_base
,
1074 struct lp_build_emit_data
* emit_data
)
1076 emit_data
->output
[emit_data
->chan
] = lp_build_sub(&bld_base
->int_bld
,
1077 bld_base
->int_bld
.zero
,
1078 emit_data
->args
[0]);
1081 /* TGSI_OPCODE_ISET Helper (CPU Only) */
1084 const struct lp_build_tgsi_action
* action
,
1085 struct lp_build_tgsi_context
* bld_base
,
1086 struct lp_build_emit_data
* emit_data
,
1089 LLVMValueRef nz
= lp_build_const_vec(bld_base
->base
.gallivm
,
1090 bld_base
->int_bld
.type
, ~0U);
1091 LLVMValueRef cond
= lp_build_cmp(&bld_base
->int_bld
, pipe_func
,
1092 emit_data
->args
[0], emit_data
->args
[1]);
1093 emit_data
->output
[emit_data
->chan
] = lp_build_select(&bld_base
->int_bld
,
1096 bld_base
->int_bld
.zero
);
1099 /* TGSI_OPCODE_IMAX (CPU Only) */
1102 const struct lp_build_tgsi_action
* action
,
1103 struct lp_build_tgsi_context
* bld_base
,
1104 struct lp_build_emit_data
* emit_data
)
1106 emit_data
->output
[emit_data
->chan
] = lp_build_max(&bld_base
->int_bld
,
1107 emit_data
->args
[0], emit_data
->args
[1]);
1110 /* TGSI_OPCODE_IMIN (CPU Only) */
1113 const struct lp_build_tgsi_action
* action
,
1114 struct lp_build_tgsi_context
* bld_base
,
1115 struct lp_build_emit_data
* emit_data
)
1117 emit_data
->output
[emit_data
->chan
] = lp_build_min(&bld_base
->int_bld
,
1118 emit_data
->args
[0], emit_data
->args
[1]);
1121 /* TGSI_OPCODE_ISGE (CPU Only) */
1124 const struct lp_build_tgsi_action
* action
,
1125 struct lp_build_tgsi_context
* bld_base
,
1126 struct lp_build_emit_data
* emit_data
)
1128 iset_emit_cpu(action
, bld_base
, emit_data
, PIPE_FUNC_GEQUAL
);
1131 /* TGSI_OPCODE_ISHR (CPU Only) */
1134 const struct lp_build_tgsi_action
* action
,
1135 struct lp_build_tgsi_context
* bld_base
,
1136 struct lp_build_emit_data
* emit_data
)
1138 emit_data
->output
[emit_data
->chan
] = lp_build_shr(&bld_base
->int_bld
,
1139 emit_data
->args
[0], emit_data
->args
[1]);
1142 /* TGSI_OPCODE_ISLT (CPU Only) */
1145 const struct lp_build_tgsi_action
* action
,
1146 struct lp_build_tgsi_context
* bld_base
,
1147 struct lp_build_emit_data
* emit_data
)
1149 iset_emit_cpu(action
, bld_base
, emit_data
, PIPE_FUNC_LESS
);
1153 /* TGSI_OPCODE_ISSG (CPU Only) */
1156 const struct lp_build_tgsi_action
* action
,
1157 struct lp_build_tgsi_context
* bld_base
,
1158 struct lp_build_emit_data
* emit_data
)
1160 emit_data
->output
[emit_data
->chan
] = lp_build_sgn(&bld_base
->int_bld
,
1161 emit_data
->args
[0]);
1164 /* TGSI_OPCODE_LG2 (CPU Only) */
1167 const struct lp_build_tgsi_action
* action
,
1168 struct lp_build_tgsi_context
* bld_base
,
1169 struct lp_build_emit_data
* emit_data
)
1171 emit_data
->output
[emit_data
->chan
] = lp_build_log2(&bld_base
->base
,
1172 emit_data
->args
[0]);
1175 /* TGSI_OPCODE_LOG (CPU Only) */
/*
 * Writes all four output channels rather than only emit_data->chan.
 * lp_build_log2_approx() is run once on args[0] and hands back three
 * values through &p_exp, &p_floor_log2 and &p_log2:
 *   X <- p_floor_log2
 *   Y <- result of lp_build_emit_llvm_binary(bld_base, ...)
 *   Z <- p_log2
 *   W <- bld_base->base.one
 *
 * NOTE(review): the declaration of p_exp and the remaining arguments of
 * the lp_build_emit_llvm_binary() call are not present in this excerpt;
 * verify them against the complete file before changing this function.
 */
1178 const struct lp_build_tgsi_action
* action
,
1179 struct lp_build_tgsi_context
* bld_base
,
1180 struct lp_build_emit_data
* emit_data
)
1182 LLVMValueRef p_floor_log2
;
1184 LLVMValueRef p_log2
;
1185 LLVMValueRef src0
= emit_data
->args
[0];
1187 lp_build_log2_approx(&bld_base
->base
, src0
,
1188 &p_exp
, &p_floor_log2
, &p_log2
);
1190 emit_data
->output
[TGSI_CHAN_X
] = p_floor_log2
;
1192 emit_data
->output
[TGSI_CHAN_Y
] = lp_build_emit_llvm_binary(bld_base
,
1195 emit_data
->output
[TGSI_CHAN_Z
] = p_log2
;
1197 emit_data
->output
[TGSI_CHAN_W
] = bld_base
->base
.one
;
1201 /* TGSI_OPCODE_MAX (CPU Only) */
1205 const struct lp_build_tgsi_action
* action
,
1206 struct lp_build_tgsi_context
* bld_base
,
1207 struct lp_build_emit_data
* emit_data
)
1209 emit_data
->output
[emit_data
->chan
] = lp_build_max(&bld_base
->base
,
1210 emit_data
->args
[0], emit_data
->args
[1]);
1213 /* TGSI_OPCODE_MIN (CPU Only) */
1216 const struct lp_build_tgsi_action
* action
,
1217 struct lp_build_tgsi_context
* bld_base
,
1218 struct lp_build_emit_data
* emit_data
)
1220 emit_data
->output
[emit_data
->chan
] = lp_build_min(&bld_base
->base
,
1221 emit_data
->args
[0], emit_data
->args
[1]);
1224 /* TGSI_OPCODE_MOD (CPU Only) */
1227 const struct lp_build_tgsi_action
* action
,
1228 struct lp_build_tgsi_context
* bld_base
,
1229 struct lp_build_emit_data
* emit_data
)
1231 emit_data
->output
[emit_data
->chan
] = lp_build_mod(&bld_base
->int_bld
,
1232 emit_data
->args
[0], emit_data
->args
[1]);
1235 /* TGSI_OPCODE_NOT */
1238 const struct lp_build_tgsi_action
* action
,
1239 struct lp_build_tgsi_context
* bld_base
,
1240 struct lp_build_emit_data
* emit_data
)
1242 emit_data
->output
[emit_data
->chan
] = lp_build_not(&bld_base
->base
,
1243 emit_data
->args
[0]);
1246 /* TGSI_OPCODE_OR (CPU Only) */
1249 const struct lp_build_tgsi_action
* action
,
1250 struct lp_build_tgsi_context
* bld_base
,
1251 struct lp_build_emit_data
* emit_data
)
1253 emit_data
->output
[emit_data
->chan
] = lp_build_or(&bld_base
->uint_bld
,
1254 emit_data
->args
[0], emit_data
->args
[1]);
1257 /* TGSI_OPCODE_POW (CPU Only) */
1260 const struct lp_build_tgsi_action
* action
,
1261 struct lp_build_tgsi_context
* bld_base
,
1262 struct lp_build_emit_data
* emit_data
)
1264 emit_data
->output
[emit_data
->chan
] = lp_build_pow(&bld_base
->base
,
1265 emit_data
->args
[0], emit_data
->args
[1]);
1269 /* TGSI_OPCODE_RCP (CPU Only) */
1273 const struct lp_build_tgsi_action
* action
,
1274 struct lp_build_tgsi_context
* bld_base
,
1275 struct lp_build_emit_data
* emit_data
)
1277 emit_data
->output
[emit_data
->chan
] = lp_build_rcp(&bld_base
->base
,
1278 emit_data
->args
[0]);
1281 /* Reciprical squareroot (CPU Only) */
1283 /* This is not the same as TGSI_OPCODE_RSQ, which requres the argument to be
1284 * greater than or equal to 0 */
1286 recip_sqrt_emit_cpu(
1287 const struct lp_build_tgsi_action
* action
,
1288 struct lp_build_tgsi_context
* bld_base
,
1289 struct lp_build_emit_data
* emit_data
)
1291 emit_data
->output
[emit_data
->chan
] = lp_build_rsqrt(&bld_base
->base
,
1292 emit_data
->args
[0]);
1295 /* TGSI_OPCODE_ROUND (CPU Only) */
1298 const struct lp_build_tgsi_action
* action
,
1299 struct lp_build_tgsi_context
* bld_base
,
1300 struct lp_build_emit_data
* emit_data
)
1302 emit_data
->output
[emit_data
->chan
] = lp_build_round(&bld_base
->base
,
1303 emit_data
->args
[0]);
1306 /* TGSI_OPCODE_SET Helper (CPU Only) */
/*
 * Shared body of the SEQ/SGE/SGT/SLE/SLT/SNE emitters, which call it with
 * a PIPE_FUNC_* value.  It compares args[0] with args[1] through
 * lp_build_cmp() on the base context using pipe_func, then feeds the
 * result to lp_build_select() on the same context; the select result is
 * stored in the output slot of the current channel.  The last select
 * operand is bld_base->base.zero.
 *
 * NOTE(review): the declaration of the pipe_func parameter and the first
 * two select operands are not present in this excerpt; verify them against
 * the complete file before changing this function.
 */
1310 const struct lp_build_tgsi_action
* action
,
1311 struct lp_build_tgsi_context
* bld_base
,
1312 struct lp_build_emit_data
* emit_data
,
1315 LLVMValueRef cond
= lp_build_cmp(&bld_base
->base
, pipe_func
,
1316 emit_data
->args
[0], emit_data
->args
[1]);
1317 emit_data
->output
[emit_data
->chan
] = lp_build_select(&bld_base
->base
,
1320 bld_base
->base
.zero
);
1323 /* TGSI_OPCODE_SEQ (CPU Only) */
1327 const struct lp_build_tgsi_action
* action
,
1328 struct lp_build_tgsi_context
* bld_base
,
1329 struct lp_build_emit_data
* emit_data
)
1331 set_emit_cpu(action
, bld_base
, emit_data
, PIPE_FUNC_EQUAL
);
1334 /* TGSI_OPCODE_SGE (CPU Only) */
1337 const struct lp_build_tgsi_action
* action
,
1338 struct lp_build_tgsi_context
* bld_base
,
1339 struct lp_build_emit_data
* emit_data
)
1341 set_emit_cpu(action
, bld_base
, emit_data
, PIPE_FUNC_GEQUAL
);
1344 /* TGSI_OPCODE_SGT (CPU Only)*/
1348 const struct lp_build_tgsi_action
* action
,
1349 struct lp_build_tgsi_context
* bld_base
,
1350 struct lp_build_emit_data
* emit_data
)
1352 set_emit_cpu(action
, bld_base
, emit_data
, PIPE_FUNC_GREATER
);
1355 /* TGSI_OPCODE_SHL (CPU Only) */
1358 const struct lp_build_tgsi_action
* action
,
1359 struct lp_build_tgsi_context
* bld_base
,
1360 struct lp_build_emit_data
* emit_data
)
1362 emit_data
->output
[emit_data
->chan
] = lp_build_shl(&bld_base
->uint_bld
,
1363 emit_data
->args
[0], emit_data
->args
[1]);
1366 /* TGSI_OPCODE_SIN (CPU Only) */
1369 const struct lp_build_tgsi_action
* action
,
1370 struct lp_build_tgsi_context
* bld_base
,
1371 struct lp_build_emit_data
* emit_data
)
1373 emit_data
->output
[emit_data
->chan
] = lp_build_sin(&bld_base
->base
,
1374 emit_data
->args
[0]);
1377 /* TGSI_OPCODE_SLE (CPU Only) */
1380 const struct lp_build_tgsi_action
* action
,
1381 struct lp_build_tgsi_context
* bld_base
,
1382 struct lp_build_emit_data
* emit_data
)
1384 set_emit_cpu(action
, bld_base
, emit_data
, PIPE_FUNC_LEQUAL
);
1387 /* TGSI_OPCODE_SLT (CPU Only) */
1390 const struct lp_build_tgsi_action
* action
,
1391 struct lp_build_tgsi_context
* bld_base
,
1392 struct lp_build_emit_data
* emit_data
)
1394 set_emit_cpu(action
, bld_base
, emit_data
, PIPE_FUNC_LESS
);
1397 /* TGSI_OPCODE_SNE (CPU Only) */
1401 const struct lp_build_tgsi_action
* action
,
1402 struct lp_build_tgsi_context
* bld_base
,
1403 struct lp_build_emit_data
* emit_data
)
1405 set_emit_cpu(action
, bld_base
, emit_data
, PIPE_FUNC_NOTEQUAL
);
1408 /* TGSI_OPCODE_SSG (CPU Only) */
1412 const struct lp_build_tgsi_action
* action
,
1413 struct lp_build_tgsi_context
* bld_base
,
1414 struct lp_build_emit_data
* emit_data
)
1416 emit_data
->output
[emit_data
->chan
] = lp_build_sgn(&bld_base
->base
,
1417 emit_data
->args
[0]);
1420 /* TGSI_OPCODE_SUB (CPU Only) */
1424 const struct lp_build_tgsi_action
* action
,
1425 struct lp_build_tgsi_context
* bld_base
,
1426 struct lp_build_emit_data
* emit_data
)
1428 emit_data
->output
[emit_data
->chan
] = lp_build_sub(&bld_base
->base
,
1430 emit_data
->args
[1]);
1433 /* TGSI_OPCODE_TRUNC (CPU Only) */
1437 const struct lp_build_tgsi_action
* action
,
1438 struct lp_build_tgsi_context
* bld_base
,
1439 struct lp_build_emit_data
* emit_data
)
1441 emit_data
->output
[emit_data
->chan
] = lp_build_trunc(&bld_base
->base
,
1442 emit_data
->args
[0]);
1445 /* TGSI_OPCODE_UADD (CPU Only) */
1448 const struct lp_build_tgsi_action
* action
,
1449 struct lp_build_tgsi_context
* bld_base
,
1450 struct lp_build_emit_data
* emit_data
)
1452 emit_data
->output
[emit_data
->chan
] = lp_build_add(&bld_base
->uint_bld
,
1453 emit_data
->args
[0], emit_data
->args
[1]);
1456 /* TGSI_OPCODE_UDIV (CPU Only) */
1459 const struct lp_build_tgsi_action
* action
,
1460 struct lp_build_tgsi_context
* bld_base
,
1461 struct lp_build_emit_data
* emit_data
)
1463 emit_data
->output
[emit_data
->chan
] = lp_build_div(&bld_base
->uint_bld
,
1464 emit_data
->args
[0], emit_data
->args
[1]);
1467 /* TGSI_OPCODE_UMAX (CPU Only) */
1470 const struct lp_build_tgsi_action
* action
,
1471 struct lp_build_tgsi_context
* bld_base
,
1472 struct lp_build_emit_data
* emit_data
)
1474 emit_data
->output
[emit_data
->chan
] = lp_build_max(&bld_base
->uint_bld
,
1475 emit_data
->args
[0], emit_data
->args
[1]);
1478 /* TGSI_OPCODE_UMIN (CPU Only) */
1481 const struct lp_build_tgsi_action
* action
,
1482 struct lp_build_tgsi_context
* bld_base
,
1483 struct lp_build_emit_data
* emit_data
)
1485 emit_data
->output
[emit_data
->chan
] = lp_build_min(&bld_base
->uint_bld
,
1486 emit_data
->args
[0], emit_data
->args
[1]);
1489 /* TGSI_OPCODE_UMOD (CPU Only) */
1492 const struct lp_build_tgsi_action
* action
,
1493 struct lp_build_tgsi_context
* bld_base
,
1494 struct lp_build_emit_data
* emit_data
)
1496 emit_data
->output
[emit_data
->chan
] = lp_build_mod(&bld_base
->uint_bld
,
1497 emit_data
->args
[0], emit_data
->args
[1]);
1500 /* TGSI_OPCODE_USET Helper (CPU Only) */
/*
 * Shared body of the USEQ/USGE/USLT/USNE emitters, which call it with a
 * PIPE_FUNC_* value.  It builds `nz`, a constant vector of the uint_bld
 * type initialised from ~0U, compares args[0] with args[1] through
 * lp_build_cmp() on the uint_bld context using pipe_func, and stores the
 * result of lp_build_select() in the output slot of the current channel.
 * The last select operand is bld_base->uint_bld.zero.
 *
 * NOTE(review): the declaration of the pipe_func parameter and the first
 * two select operands are not present in this excerpt (presumably `cond`
 * and `nz`, the only locals defined here); verify against the complete
 * file before changing this function.
 */
1503 const struct lp_build_tgsi_action
* action
,
1504 struct lp_build_tgsi_context
* bld_base
,
1505 struct lp_build_emit_data
* emit_data
,
1508 LLVMValueRef nz
= lp_build_const_vec(bld_base
->base
.gallivm
,
1509 bld_base
->uint_bld
.type
, ~0U);
1510 LLVMValueRef cond
= lp_build_cmp(&bld_base
->uint_bld
, pipe_func
,
1511 emit_data
->args
[0], emit_data
->args
[1]);
1512 emit_data
->output
[emit_data
->chan
] = lp_build_select(&bld_base
->uint_bld
,
1515 bld_base
->uint_bld
.zero
);
1519 /* TGSI_OPCODE_USEQ (CPU Only) */
1522 const struct lp_build_tgsi_action
* action
,
1523 struct lp_build_tgsi_context
* bld_base
,
1524 struct lp_build_emit_data
* emit_data
)
1526 uset_emit_cpu(action
, bld_base
, emit_data
, PIPE_FUNC_EQUAL
);
1529 /* TGSI_OPCODE_ISGE (CPU Only) */
1532 const struct lp_build_tgsi_action
* action
,
1533 struct lp_build_tgsi_context
* bld_base
,
1534 struct lp_build_emit_data
* emit_data
)
1536 uset_emit_cpu(action
, bld_base
, emit_data
, PIPE_FUNC_GEQUAL
);
1539 /* TGSI_OPCODE_USHR (CPU Only) */
1542 const struct lp_build_tgsi_action
* action
,
1543 struct lp_build_tgsi_context
* bld_base
,
1544 struct lp_build_emit_data
* emit_data
)
1546 emit_data
->output
[emit_data
->chan
] = lp_build_shr(&bld_base
->uint_bld
,
1547 emit_data
->args
[0], emit_data
->args
[1]);
1550 /* TGSI_OPCODE_ISLT (CPU Only) */
1553 const struct lp_build_tgsi_action
* action
,
1554 struct lp_build_tgsi_context
* bld_base
,
1555 struct lp_build_emit_data
* emit_data
)
1557 uset_emit_cpu(action
, bld_base
, emit_data
, PIPE_FUNC_LESS
);
1560 /* TGSI_OPCODE_USNE (CPU Only) */
1564 const struct lp_build_tgsi_action
* action
,
1565 struct lp_build_tgsi_context
* bld_base
,
1566 struct lp_build_emit_data
* emit_data
)
1568 uset_emit_cpu(action
, bld_base
, emit_data
, PIPE_FUNC_NOTEQUAL
);
1571 /* TGSI_OPCODE_XOR */
1574 const struct lp_build_tgsi_action
* action
,
1575 struct lp_build_tgsi_context
* bld_base
,
1576 struct lp_build_emit_data
* emit_data
)
1578 emit_data
->output
[emit_data
->chan
] = lp_build_xor(&bld_base
->uint_bld
,
1580 emit_data
->args
[1]);
1584 lp_set_default_actions_cpu(
1585 struct lp_build_tgsi_context
* bld_base
)
1587 lp_set_default_actions(bld_base
);
1588 bld_base
->op_actions
[TGSI_OPCODE_ABS
].emit
= abs_emit_cpu
;
1589 bld_base
->op_actions
[TGSI_OPCODE_ADD
].emit
= add_emit_cpu
;
1590 bld_base
->op_actions
[TGSI_OPCODE_AND
].emit
= and_emit_cpu
;
1591 bld_base
->op_actions
[TGSI_OPCODE_ARL
].emit
= arl_emit_cpu
;
1592 bld_base
->op_actions
[TGSI_OPCODE_ARR
].emit
= arr_emit_cpu
;
1593 bld_base
->op_actions
[TGSI_OPCODE_CEIL
].emit
= ceil_emit_cpu
;
1594 bld_base
->op_actions
[TGSI_OPCODE_CND
].emit
= cnd_emit_cpu
;
1595 bld_base
->op_actions
[TGSI_OPCODE_COS
].emit
= cos_emit_cpu
;
1596 bld_base
->op_actions
[TGSI_OPCODE_CMP
].emit
= cmp_emit_cpu
;
1597 bld_base
->op_actions
[TGSI_OPCODE_DIV
].emit
= div_emit_cpu
;
1598 bld_base
->op_actions
[TGSI_OPCODE_EX2
].emit
= ex2_emit_cpu
;
1599 bld_base
->op_actions
[TGSI_OPCODE_EXP
].emit
= exp_emit_cpu
;
1600 bld_base
->op_actions
[TGSI_OPCODE_F2I
].emit
= f2i_emit_cpu
;
1601 bld_base
->op_actions
[TGSI_OPCODE_F2U
].emit
= f2u_emit_cpu
;
1602 bld_base
->op_actions
[TGSI_OPCODE_FLR
].emit
= flr_emit_cpu
;
1604 bld_base
->op_actions
[TGSI_OPCODE_I2F
].emit
= i2f_emit_cpu
;
1605 bld_base
->op_actions
[TGSI_OPCODE_IABS
].emit
= iabs_emit_cpu
;
1606 bld_base
->op_actions
[TGSI_OPCODE_IDIV
].emit
= idiv_emit_cpu
;
1607 bld_base
->op_actions
[TGSI_OPCODE_INEG
].emit
= ineg_emit_cpu
;
1608 bld_base
->op_actions
[TGSI_OPCODE_IMAX
].emit
= imax_emit_cpu
;
1609 bld_base
->op_actions
[TGSI_OPCODE_IMIN
].emit
= imin_emit_cpu
;
1610 bld_base
->op_actions
[TGSI_OPCODE_ISGE
].emit
= isge_emit_cpu
;
1611 bld_base
->op_actions
[TGSI_OPCODE_ISHR
].emit
= ishr_emit_cpu
;
1612 bld_base
->op_actions
[TGSI_OPCODE_ISLT
].emit
= islt_emit_cpu
;
1613 bld_base
->op_actions
[TGSI_OPCODE_ISSG
].emit
= issg_emit_cpu
;
1615 bld_base
->op_actions
[TGSI_OPCODE_LG2
].emit
= lg2_emit_cpu
;
1616 bld_base
->op_actions
[TGSI_OPCODE_LOG
].emit
= log_emit_cpu
;
1617 bld_base
->op_actions
[TGSI_OPCODE_MAX
].emit
= max_emit_cpu
;
1618 bld_base
->op_actions
[TGSI_OPCODE_MIN
].emit
= min_emit_cpu
;
1619 bld_base
->op_actions
[TGSI_OPCODE_MOD
].emit
= mod_emit_cpu
;
1620 bld_base
->op_actions
[TGSI_OPCODE_NOT
].emit
= not_emit_cpu
;
1621 bld_base
->op_actions
[TGSI_OPCODE_OR
].emit
= or_emit_cpu
;
1622 bld_base
->op_actions
[TGSI_OPCODE_POW
].emit
= pow_emit_cpu
;
1623 bld_base
->op_actions
[TGSI_OPCODE_RCP
].emit
= rcp_emit_cpu
;
1624 bld_base
->op_actions
[TGSI_OPCODE_ROUND
].emit
= round_emit_cpu
;
1625 bld_base
->op_actions
[TGSI_OPCODE_SEQ
].emit
= seq_emit_cpu
;
1626 bld_base
->op_actions
[TGSI_OPCODE_SGE
].emit
= sge_emit_cpu
;
1627 bld_base
->op_actions
[TGSI_OPCODE_SGT
].emit
= sgt_emit_cpu
;
1628 bld_base
->op_actions
[TGSI_OPCODE_SIN
].emit
= sin_emit_cpu
;
1629 bld_base
->op_actions
[TGSI_OPCODE_SHL
].emit
= shl_emit_cpu
;
1630 bld_base
->op_actions
[TGSI_OPCODE_SLE
].emit
= sle_emit_cpu
;
1631 bld_base
->op_actions
[TGSI_OPCODE_SLT
].emit
= slt_emit_cpu
;
1632 bld_base
->op_actions
[TGSI_OPCODE_SNE
].emit
= sne_emit_cpu
;
1633 bld_base
->op_actions
[TGSI_OPCODE_SSG
].emit
= ssg_emit_cpu
;
1634 bld_base
->op_actions
[TGSI_OPCODE_SUB
].emit
= sub_emit_cpu
;
1635 bld_base
->op_actions
[TGSI_OPCODE_TRUNC
].emit
= trunc_emit_cpu
;
1637 bld_base
->rsq_action
.emit
= recip_sqrt_emit_cpu
;
1639 bld_base
->op_actions
[TGSI_OPCODE_UADD
].emit
= uadd_emit_cpu
;
1640 bld_base
->op_actions
[TGSI_OPCODE_UDIV
].emit
= udiv_emit_cpu
;
1641 bld_base
->op_actions
[TGSI_OPCODE_UMAX
].emit
= umax_emit_cpu
;
1642 bld_base
->op_actions
[TGSI_OPCODE_UMIN
].emit
= umin_emit_cpu
;
1643 bld_base
->op_actions
[TGSI_OPCODE_UMOD
].emit
= umod_emit_cpu
;
1644 bld_base
->op_actions
[TGSI_OPCODE_USEQ
].emit
= useq_emit_cpu
;
1645 bld_base
->op_actions
[TGSI_OPCODE_USGE
].emit
= usge_emit_cpu
;
1646 bld_base
->op_actions
[TGSI_OPCODE_USHR
].emit
= ushr_emit_cpu
;
1647 bld_base
->op_actions
[TGSI_OPCODE_USLT
].emit
= uslt_emit_cpu
;
1648 bld_base
->op_actions
[TGSI_OPCODE_USNE
].emit
= usne_emit_cpu
;
1650 bld_base
->op_actions
[TGSI_OPCODE_XOR
].emit
= xor_emit_cpu
;