1 /**************************************************************************
3 * Copyright 2009 VMware, Inc.
6 * Permission is hereby granted, free of charge, to any person obtaining a
7 * copy of this software and associated documentation files (the
8 * "Software"), to deal in the Software without restriction, including
9 * without limitation the rights to use, copy, modify, merge, publish,
10 * distribute, sub license, and/or sell copies of the Software, and to
11 * permit persons to whom the Software is furnished to do so, subject to
12 * the following conditions:
14 * The above copyright notice and this permission notice (including the
15 * next paragraph) shall be included in all copies or substantial portions
18 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
19 * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
20 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT.
21 * IN NO EVENT SHALL VMWARE AND/OR ITS SUPPLIERS BE LIABLE FOR
22 * ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
23 * TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
24 * SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
26 **************************************************************************/
/**
 * @file
 * Texture sampling -- common code.
 *
 * @author Jose Fonseca <jfonseca@vmware.com>
 */
35 #include "pipe/p_defines.h"
36 #include "pipe/p_state.h"
37 #include "util/u_format.h"
38 #include "util/u_math.h"
39 #include "lp_bld_debug.h"
40 #include "lp_bld_const.h"
41 #include "lp_bld_arit.h"
42 #include "lp_bld_type.h"
43 #include "lp_bld_format.h"
44 #include "lp_bld_sample.h"
48 * Initialize lp_sampler_static_state object with the gallium sampler
50 * The former is considered to be static and the later dynamic.
53 lp_sampler_static_state(struct lp_sampler_static_state
*state
,
54 const struct pipe_texture
*texture
,
55 const struct pipe_sampler_state
*sampler
)
57 memset(state
, 0, sizeof *state
);
66 * We don't copy sampler state over unless it is actually enabled, to avoid
67 * spurious recompiles, as the sampler static state is part of the shader
70 * Ideally the state tracker or cso_cache module would make all state
71 * canonical, but until that happens it's better to be safe than sorry here.
73 * XXX: Actually there's much more than can be done here, especially
74 * regarding 1D/2D/3D/CUBE textures, wrap modes, etc.
77 state
->format
= texture
->format
;
78 state
->target
= texture
->target
;
79 state
->pot_width
= util_is_pot(texture
->width0
);
80 state
->pot_height
= util_is_pot(texture
->height0
);
81 state
->pot_depth
= util_is_pot(texture
->depth0
);
83 state
->wrap_s
= sampler
->wrap_s
;
84 state
->wrap_t
= sampler
->wrap_t
;
85 state
->wrap_r
= sampler
->wrap_r
;
86 state
->min_img_filter
= sampler
->min_img_filter
;
87 state
->min_mip_filter
= sampler
->min_mip_filter
;
88 state
->mag_img_filter
= sampler
->mag_img_filter
;
90 state
->compare_mode
= sampler
->compare_mode
;
91 if (sampler
->compare_mode
!= PIPE_TEX_COMPARE_NONE
) {
92 state
->compare_func
= sampler
->compare_func
;
95 state
->normalized_coords
= sampler
->normalized_coords
;
96 state
->lod_bias
= sampler
->lod_bias
;
97 state
->min_lod
= sampler
->min_lod
;
98 state
->max_lod
= sampler
->max_lod
;
99 state
->border_color
[0] = sampler
->border_color
[0];
100 state
->border_color
[1] = sampler
->border_color
[1];
101 state
->border_color
[2] = sampler
->border_color
[2];
102 state
->border_color
[3] = sampler
->border_color
[3];
107 * Gather elements from scatter positions in memory into a single vector.
109 * @param src_width src element width
110 * @param dst_width result element width (source will be expanded to fit)
111 * @param length length of the offsets,
112 * @param base_ptr base pointer, should be a i8 pointer type.
113 * @param offsets vector with offsets
116 lp_build_gather(LLVMBuilderRef builder
,
120 LLVMValueRef base_ptr
,
121 LLVMValueRef offsets
)
123 LLVMTypeRef src_type
= LLVMIntType(src_width
);
124 LLVMTypeRef src_ptr_type
= LLVMPointerType(src_type
, 0);
125 LLVMTypeRef dst_elem_type
= LLVMIntType(dst_width
);
126 LLVMTypeRef dst_vec_type
= LLVMVectorType(dst_elem_type
, length
);
130 res
= LLVMGetUndef(dst_vec_type
);
131 for(i
= 0; i
< length
; ++i
) {
132 LLVMValueRef index
= LLVMConstInt(LLVMInt32Type(), i
, 0);
133 LLVMValueRef elem_offset
;
134 LLVMValueRef elem_ptr
;
137 elem_offset
= LLVMBuildExtractElement(builder
, offsets
, index
, "");
138 elem_ptr
= LLVMBuildGEP(builder
, base_ptr
, &elem_offset
, 1, "");
139 elem_ptr
= LLVMBuildBitCast(builder
, elem_ptr
, src_ptr_type
, "");
140 elem
= LLVMBuildLoad(builder
, elem_ptr
, "");
142 assert(src_width
<= dst_width
);
143 if(src_width
> dst_width
)
144 elem
= LLVMBuildTrunc(builder
, elem
, dst_elem_type
, "");
145 if(src_width
< dst_width
)
146 elem
= LLVMBuildZExt(builder
, elem
, dst_elem_type
, "");
148 res
= LLVMBuildInsertElement(builder
, res
, elem
, index
, "");
156 * Compute the offset of a pixel.
158 * x, y, y_stride are vectors
161 lp_build_sample_offset(struct lp_build_context
*bld
,
162 const struct util_format_description
*format_desc
,
165 LLVMValueRef y_stride
)
167 LLVMValueRef x_stride
;
170 x_stride
= lp_build_const_scalar(bld
->type
, format_desc
->block
.bits
/8);
172 if(format_desc
->colorspace
== UTIL_FORMAT_COLORSPACE_ZS
) {
173 LLVMValueRef x_lo
, x_hi
;
174 LLVMValueRef y_lo
, y_hi
;
175 LLVMValueRef x_stride_lo
, x_stride_hi
;
176 LLVMValueRef y_stride_lo
, y_stride_hi
;
177 LLVMValueRef x_offset_lo
, x_offset_hi
;
178 LLVMValueRef y_offset_lo
, y_offset_hi
;
179 LLVMValueRef offset_lo
, offset_hi
;
181 x_lo
= LLVMBuildAnd(bld
->builder
, x
, bld
->one
, "");
182 y_lo
= LLVMBuildAnd(bld
->builder
, y
, bld
->one
, "");
184 x_hi
= LLVMBuildLShr(bld
->builder
, x
, bld
->one
, "");
185 y_hi
= LLVMBuildLShr(bld
->builder
, y
, bld
->one
, "");
187 x_stride_lo
= x_stride
;
188 y_stride_lo
= lp_build_const_scalar(bld
->type
, 2*format_desc
->block
.bits
/8);
190 x_stride_hi
= lp_build_const_scalar(bld
->type
, 4*format_desc
->block
.bits
/8);
191 y_stride_hi
= LLVMBuildShl(bld
->builder
, y_stride
, bld
->one
, "");
193 x_offset_lo
= lp_build_mul(bld
, x_lo
, x_stride_lo
);
194 y_offset_lo
= lp_build_mul(bld
, y_lo
, y_stride_lo
);
195 offset_lo
= lp_build_add(bld
, x_offset_lo
, y_offset_lo
);
197 x_offset_hi
= lp_build_mul(bld
, x_hi
, x_stride_hi
);
198 y_offset_hi
= lp_build_mul(bld
, y_hi
, y_stride_hi
);
199 offset_hi
= lp_build_add(bld
, x_offset_hi
, y_offset_hi
);
201 offset
= lp_build_add(bld
, offset_hi
, offset_lo
);
204 LLVMValueRef x_offset
;
205 LLVMValueRef y_offset
;
207 x_offset
= lp_build_mul(bld
, x
, x_stride
);
208 y_offset
= lp_build_mul(bld
, y
, y_stride
);
210 offset
= lp_build_add(bld
, x_offset
, y_offset
);