1 /**************************************************************************
3 * Copyright 2010 VMware, Inc.
6 * Permission is hereby granted, free of charge, to any person obtaining a
7 * copy of this software and associated documentation files (the
8 * "Software"), to deal in the Software without restriction, including
9 * without limitation the rights to use, copy, modify, merge, publish,
10 * distribute, sub license, and/or sell copies of the Software, and to
11 * permit persons to whom the Software is furnished to do so, subject to
12 * the following conditions:
14 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
15 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
16 * FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. IN NO EVENT SHALL
17 * THE COPYRIGHT HOLDERS, AUTHORS AND/OR ITS SUPPLIERS BE LIABLE FOR ANY CLAIM,
18 * DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR
19 * OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE
20 * USE OR OTHER DEALINGS IN THE SOFTWARE.
22 * The above copyright notice and this permission notice (including the
23 * next paragraph) shall be included in all copies or substantial portions of the Software.
26 **************************************************************************/
29 #include "lp_bld_type.h"
30 #include "lp_bld_arit.h"
31 #include "lp_bld_const.h"
32 #include "lp_bld_swizzle.h"
33 #include "lp_bld_quad.h"
34 #include "lp_bld_pack.h"
/*
 * Four-entry swizzle table: entries 0 and 1 select LP_BLD_QUAD_TOP_LEFT,
 * entries 2 and 3 select LP_BLD_QUAD_BOTTOM_LEFT.
 * NOTE(review): the declarator line is not visible in this view; presumably
 * this is the swizzle_left table read by lp_build_ddx -- confirm.
 */
37 static const unsigned char
39 LP_BLD_QUAD_TOP_LEFT
, LP_BLD_QUAD_TOP_LEFT
,
40 LP_BLD_QUAD_BOTTOM_LEFT
, LP_BLD_QUAD_BOTTOM_LEFT
/*
 * Four-entry swizzle table: entries 0 and 1 select LP_BLD_QUAD_TOP_RIGHT,
 * entries 2 and 3 select LP_BLD_QUAD_BOTTOM_RIGHT.
 * NOTE(review): the declarator line is not visible in this view; presumably
 * this is the swizzle_right table read by lp_build_ddx -- confirm.
 */
43 static const unsigned char
45 LP_BLD_QUAD_TOP_RIGHT
, LP_BLD_QUAD_TOP_RIGHT
,
46 LP_BLD_QUAD_BOTTOM_RIGHT
, LP_BLD_QUAD_BOTTOM_RIGHT
/*
 * Four-entry swizzle table: entries 0 and 2 select LP_BLD_QUAD_TOP_LEFT,
 * entries 1 and 3 select LP_BLD_QUAD_TOP_RIGHT.
 * NOTE(review): the declarator line is not visible in this view; presumably
 * this is the swizzle_top table read by lp_build_ddy -- confirm.
 */
49 static const unsigned char
51 LP_BLD_QUAD_TOP_LEFT
, LP_BLD_QUAD_TOP_RIGHT
,
52 LP_BLD_QUAD_TOP_LEFT
, LP_BLD_QUAD_TOP_RIGHT
/*
 * Four-entry swizzle table: entries 0 and 2 select LP_BLD_QUAD_BOTTOM_LEFT,
 * entries 1 and 3 select LP_BLD_QUAD_BOTTOM_RIGHT.
 * NOTE(review): the declarator line is not visible in this view; presumably
 * this is the swizzle_bottom table read by lp_build_ddy -- confirm.
 */
55 static const unsigned char
57 LP_BLD_QUAD_BOTTOM_LEFT
, LP_BLD_QUAD_BOTTOM_RIGHT
,
58 LP_BLD_QUAD_BOTTOM_LEFT
, LP_BLD_QUAD_BOTTOM_RIGHT
/*
 * Build the left-to-right difference of `a`.
 *
 * `a` is swizzled twice with lp_build_swizzle_aos(), once with swizzle_left
 * and once with swizzle_right, and the result of
 * lp_build_sub(bld, a_right, a_left) (right minus left) is returned.
 *
 * NOTE(review): the return type, the declaration of `a` and the function
 * braces are not visible in this view; the body implies `a` is an
 * LLVMValueRef -- confirm against the header.
 */
63 lp_build_ddx(struct lp_build_context
*bld
,
66 LLVMValueRef a_left
= lp_build_swizzle_aos(bld
, a
, swizzle_left
);
67 LLVMValueRef a_right
= lp_build_swizzle_aos(bld
, a
, swizzle_right
);
68 return lp_build_sub(bld
, a_right
, a_left
);
/*
 * Build the top-to-bottom difference of `a`.
 *
 * `a` is swizzled twice with lp_build_swizzle_aos(), once with swizzle_top
 * and once with swizzle_bottom, and the result of
 * lp_build_sub(bld, a_bottom, a_top) (bottom minus top) is returned.
 *
 * NOTE(review): the return type, the declaration of `a` and the function
 * braces are not visible in this view; the body implies `a` is an
 * LLVMValueRef -- confirm against the header.
 */
73 lp_build_ddy(struct lp_build_context
*bld
,
76 LLVMValueRef a_top
= lp_build_swizzle_aos(bld
, a
, swizzle_top
);
77 LLVMValueRef a_bottom
= lp_build_swizzle_aos(bld
, a
, swizzle_bottom
);
78 return lp_build_sub(bld
, a_bottom
, a_top
);
82 * Helper for building packed ddx/ddy vector for one coord (scalar per quad
83 * values). The vector will look like this (8-wide):
84 * dr1dx _____ -dr1dy _____ dr2dx _____ -dr2dy _____
85 * This only requires one shuffle instead of two for more straightforward packing.
88 lp_build_packed_ddx_ddy_onecoord(struct lp_build_context
*bld
,
91 struct gallivm_state
*gallivm
= bld
->gallivm
;
92 LLVMBuilderRef builder
= gallivm
->builder
;
93 LLVMValueRef vec1
, vec2
;
95 /* use aos swizzle helper */
/*
 * swizzle1 keeps TOP_LEFT in entry 0 and BOTTOM_LEFT in entry 2;
 * swizzle2 puts TOP_RIGHT in entry 0 and TOP_LEFT in entry 2.
 * Entries 1 and 3 are LP_BLD_SWIZZLE_DONTCARE in both tables.
 */
97 static const unsigned char swizzle1
[] = { /* no-op swizzle */
98 LP_BLD_QUAD_TOP_LEFT
, LP_BLD_SWIZZLE_DONTCARE
,
99 LP_BLD_QUAD_BOTTOM_LEFT
, LP_BLD_SWIZZLE_DONTCARE
101 static const unsigned char swizzle2
[] = {
102 LP_BLD_QUAD_TOP_RIGHT
, LP_BLD_SWIZZLE_DONTCARE
,
103 LP_BLD_QUAD_TOP_LEFT
, LP_BLD_SWIZZLE_DONTCARE
106 vec1
= lp_build_swizzle_aos(bld
, a
, swizzle1
);
107 vec2
= lp_build_swizzle_aos(bld
, a
, swizzle2
);
/*
 * vec2 - vec1: entry 0 becomes TOP_RIGHT - TOP_LEFT and entry 2 becomes
 * TOP_LEFT - BOTTOM_LEFT; entries 1 and 3 are don't-care.
 * LLVMBuildFSub is used when bld->type.floating is set, LLVMBuildSub
 * otherwise.
 */
109 if (bld
->type
.floating
)
110 return LLVMBuildFSub(builder
, vec2
, vec1
, "ddxddy");
112 return LLVMBuildSub(builder
, vec2
, vec1
, "ddxddy");
117 * Helper for building packed ddx/ddy vector for two coords (scalar per quad
118 * values). The vector will look like this (8-wide):
119 * ds1dx ds1dy dt1dx dt1dy ds2dx ds2dy dt2dx dt2dy
120 * This only needs 2 (v)shufps.
123 lp_build_packed_ddx_ddy_twocoord(struct lp_build_context
*bld
,
124 LLVMValueRef a
, LLVMValueRef b
)
126 struct gallivm_state
*gallivm
= bld
->gallivm
;
127 LLVMBuilderRef builder
= gallivm
->builder
;
/*
 * Shuffle index tables, filled four entries per quad by the loop below.
 * NOTE(review): the arrays hold LP_MAX_VECTOR_LENGTH/4 entries while the
 * loop writes `length` entries in total, so this relies on
 * bld->type.length <= LP_MAX_VECTOR_LENGTH/4 -- confirm that callers
 * guarantee it.
 */
128 LLVMValueRef shuffles1
[LP_MAX_VECTOR_LENGTH
/4];
129 LLVMValueRef shuffles2
[LP_MAX_VECTOR_LENGTH
/4];
130 LLVMValueRef vec1
, vec2
;
131 unsigned length
, num_quads
, i
;
133 /* XXX: do hsub version */
134 length
= bld
->type
.length
;
135 num_quads
= length
/ 4;
136 for (i
= 0; i
< num_quads
; i
++) {
/*
 * s2 is this quad's base index offset by `length`; in an LLVM
 * shufflevector mask, indices >= length pick from the second operand (b).
 * NOTE(review): the declaration of s1 is not visible in this view;
 * presumably it is the quad's base index within the first operand (a)
 * -- confirm.
 */
138 unsigned s2
= 4 * i
+ length
;
/* shuffles1, per quad: TOP_LEFT at s1 twice, then TOP_LEFT at s2 twice. */
139 shuffles1
[4*i
+ 0] = lp_build_const_int32(gallivm
, LP_BLD_QUAD_TOP_LEFT
+ s1
);
140 shuffles1
[4*i
+ 1] = lp_build_const_int32(gallivm
, LP_BLD_QUAD_TOP_LEFT
+ s1
);
141 shuffles1
[4*i
+ 2] = lp_build_const_int32(gallivm
, LP_BLD_QUAD_TOP_LEFT
+ s2
);
142 shuffles1
[4*i
+ 3] = lp_build_const_int32(gallivm
, LP_BLD_QUAD_TOP_LEFT
+ s2
);
/*
 * shuffles2, per quad: TOP_RIGHT and BOTTOM_LEFT at s1, then TOP_RIGHT and
 * BOTTOM_LEFT at s2.
 */
143 shuffles2
[4*i
+ 0] = lp_build_const_int32(gallivm
, LP_BLD_QUAD_TOP_RIGHT
+ s1
);
144 shuffles2
[4*i
+ 1] = lp_build_const_int32(gallivm
, LP_BLD_QUAD_BOTTOM_LEFT
+ s1
);
145 shuffles2
[4*i
+ 2] = lp_build_const_int32(gallivm
, LP_BLD_QUAD_TOP_RIGHT
+ s2
);
146 shuffles2
[4*i
+ 3] = lp_build_const_int32(gallivm
, LP_BLD_QUAD_BOTTOM_LEFT
+ s2
);
/*
 * Two shuffles over (a, b) using the first `length` entries of each index
 * table, followed by one subtraction vec2 - vec1. Per quad this yields
 * (TOP_RIGHT - TOP_LEFT, BOTTOM_LEFT - TOP_LEFT) for the s1 source and the
 * same pair for the s2 source.
 */
148 vec1
= LLVMBuildShuffleVector(builder
, a
, b
,
149 LLVMConstVector(shuffles1
, length
), "");
150 vec2
= LLVMBuildShuffleVector(builder
, a
, b
,
151 LLVMConstVector(shuffles2
, length
), "");
/* LLVMBuildFSub when bld->type.floating is set, LLVMBuildSub otherwise. */
152 if (bld
->type
.floating
)
153 return LLVMBuildFSub(builder
, vec2
, vec1
, "ddxddyddxddy");
155 return LLVMBuildSub(builder
, vec2
, vec1
, "ddxddyddxddy");
160 * Twiddle from quad format to row format
163 * ######### ######### #################
164 * # 0 | 1 # # 4 | 5 # # 0 | 1 | 4 | 5 # src0
165 * #---+---# #---+---# -> #################
166 * # 2 | 3 # # 6 | 7 # # 2 | 3 | 6 | 7 # src1
167 * ######### ######### #################
171 lp_bld_quad_twiddle(struct gallivm_state
*gallivm
,
172 struct lp_type lp_dst_type
,
173 const LLVMValueRef
* src
,
/*
 * NOTE(review): the remaining parameters (the body uses `src_count` and
 * `dst`), the declaration of `i` and the function braces are not visible
 * in this view.
 */
177 LLVMBuilderRef builder
= gallivm
->builder
;
178 LLVMTypeRef dst_type_ref
;
179 LLVMTypeRef type2_ref
;
180 struct lp_type type2
;
/* Sources are consumed in pairs (src[i], src[i + 1]), so the count must be even. */
183 assert((src_count
% 2) == 0);
185 /* Create a type with only 2 elements */
/*
 * Each type2 element is as wide as half of the destination vector's total
 * bits (width * length / 2).
 * NOTE(review): the rest of type2's initialisation (e.g. its length) is not
 * visible in this view -- confirm before relying on other fields.
 */
187 type2
.width
= (lp_dst_type
.width
* lp_dst_type
.length
) / 2;
191 type2_ref
= lp_build_vec_type(gallivm
, type2
);
192 dst_type_ref
= lp_build_vec_type(gallivm
, lp_dst_type
);
194 for (i
= 0; i
< src_count
; i
+= 2) {
195 LLVMValueRef src0
, src1
;
/* Reinterpret both sources of the pair as type2 vectors. */
197 src0
= LLVMBuildBitCast(builder
, src
[i
+ 0], type2_ref
, "");
198 src1
= LLVMBuildBitCast(builder
, src
[i
+ 1], type2_ref
, "");
/*
 * Interleave the pair twice, with final argument 0 and then 1.
 * NOTE(review): that argument presumably selects the low/high half of the
 * interleave -- confirm against lp_build_interleave2.
 */
200 dst
[i
+ 0] = lp_build_interleave2(gallivm
, type2
, src0
, src1
, 0);
201 dst
[i
+ 1] = lp_build_interleave2(gallivm
, type2
, src0
, src1
, 1);
/* Cast the interleaved results back to the destination vector type. */
203 dst
[i
+ 0] = LLVMBuildBitCast(builder
, dst
[i
+ 0], dst_type_ref
, "");
204 dst
[i
+ 1] = LLVMBuildBitCast(builder
, dst
[i
+ 1], dst_type_ref
, "");