Merge branch '7.8'
[mesa.git] / src / gallium / auxiliary / gallivm / lp_bld_sample.c
1 /**************************************************************************
2 *
3 * Copyright 2009 VMware, Inc.
4 * All Rights Reserved.
5 *
6 * Permission is hereby granted, free of charge, to any person obtaining a
7 * copy of this software and associated documentation files (the
8 * "Software"), to deal in the Software without restriction, including
9 * without limitation the rights to use, copy, modify, merge, publish,
10 * distribute, sub license, and/or sell copies of the Software, and to
11 * permit persons to whom the Software is furnished to do so, subject to
12 * the following conditions:
13 *
14 * The above copyright notice and this permission notice (including the
15 * next paragraph) shall be included in all copies or substantial portions
16 * of the Software.
17 *
18 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
19 * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
20 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT.
21 * IN NO EVENT SHALL VMWARE AND/OR ITS SUPPLIERS BE LIABLE FOR
22 * ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
23 * TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
24 * SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
25 *
26 **************************************************************************/
27
28 /**
29 * @file
30 * Texture sampling -- common code.
31 *
32 * @author Jose Fonseca <jfonseca@vmware.com>
33 */
34
35 #include "pipe/p_defines.h"
36 #include "pipe/p_state.h"
37 #include "util/u_format.h"
38 #include "util/u_math.h"
39 #include "lp_bld_debug.h"
40 #include "lp_bld_const.h"
41 #include "lp_bld_arit.h"
42 #include "lp_bld_type.h"
43 #include "lp_bld_format.h"
44 #include "lp_bld_sample.h"
45
46
47 /**
48 * Initialize lp_sampler_static_state object with the gallium sampler
49 * and texture state.
50 * The former is considered to be static and the later dynamic.
51 */
52 void
53 lp_sampler_static_state(struct lp_sampler_static_state *state,
54 const struct pipe_texture *texture,
55 const struct pipe_sampler_state *sampler)
56 {
57 memset(state, 0, sizeof *state);
58
59 if(!texture)
60 return;
61
62 if(!sampler)
63 return;
64
65 /*
66 * We don't copy sampler state over unless it is actually enabled, to avoid
67 * spurious recompiles, as the sampler static state is part of the shader
68 * key.
69 *
70 * Ideally the state tracker or cso_cache module would make all state
71 * canonical, but until that happens it's better to be safe than sorry here.
72 *
73 * XXX: Actually there's much more than can be done here, especially
74 * regarding 1D/2D/3D/CUBE textures, wrap modes, etc.
75 */
76
77 state->format = texture->format;
78 state->target = texture->target;
79 state->pot_width = util_is_pot(texture->width0);
80 state->pot_height = util_is_pot(texture->height0);
81 state->pot_depth = util_is_pot(texture->depth0);
82
83 state->wrap_s = sampler->wrap_s;
84 state->wrap_t = sampler->wrap_t;
85 state->wrap_r = sampler->wrap_r;
86 state->min_img_filter = sampler->min_img_filter;
87 state->min_mip_filter = sampler->min_mip_filter;
88 state->mag_img_filter = sampler->mag_img_filter;
89
90 state->compare_mode = sampler->compare_mode;
91 if (sampler->compare_mode != PIPE_TEX_COMPARE_NONE) {
92 state->compare_func = sampler->compare_func;
93 }
94
95 state->normalized_coords = sampler->normalized_coords;
96 state->lod_bias = sampler->lod_bias;
97 state->min_lod = sampler->min_lod;
98 state->max_lod = sampler->max_lod;
99 state->border_color[0] = sampler->border_color[0];
100 state->border_color[1] = sampler->border_color[1];
101 state->border_color[2] = sampler->border_color[2];
102 state->border_color[3] = sampler->border_color[3];
103 }
104
105
106 /**
107 * Gather elements from scatter positions in memory into a single vector.
108 *
109 * @param src_width src element width
110 * @param dst_width result element width (source will be expanded to fit)
111 * @param length length of the offsets,
112 * @param base_ptr base pointer, should be a i8 pointer type.
113 * @param offsets vector with offsets
114 */
115 LLVMValueRef
116 lp_build_gather(LLVMBuilderRef builder,
117 unsigned length,
118 unsigned src_width,
119 unsigned dst_width,
120 LLVMValueRef base_ptr,
121 LLVMValueRef offsets)
122 {
123 LLVMTypeRef src_type = LLVMIntType(src_width);
124 LLVMTypeRef src_ptr_type = LLVMPointerType(src_type, 0);
125 LLVMTypeRef dst_elem_type = LLVMIntType(dst_width);
126 LLVMTypeRef dst_vec_type = LLVMVectorType(dst_elem_type, length);
127 LLVMValueRef res;
128 unsigned i;
129
130 res = LLVMGetUndef(dst_vec_type);
131 for(i = 0; i < length; ++i) {
132 LLVMValueRef index = LLVMConstInt(LLVMInt32Type(), i, 0);
133 LLVMValueRef elem_offset;
134 LLVMValueRef elem_ptr;
135 LLVMValueRef elem;
136
137 elem_offset = LLVMBuildExtractElement(builder, offsets, index, "");
138 elem_ptr = LLVMBuildGEP(builder, base_ptr, &elem_offset, 1, "");
139 elem_ptr = LLVMBuildBitCast(builder, elem_ptr, src_ptr_type, "");
140 elem = LLVMBuildLoad(builder, elem_ptr, "");
141
142 assert(src_width <= dst_width);
143 if(src_width > dst_width)
144 elem = LLVMBuildTrunc(builder, elem, dst_elem_type, "");
145 if(src_width < dst_width)
146 elem = LLVMBuildZExt(builder, elem, dst_elem_type, "");
147
148 res = LLVMBuildInsertElement(builder, res, elem, index, "");
149 }
150
151 return res;
152 }
153
154
155 /**
156 * Compute the offset of a pixel.
157 *
158 * x, y, y_stride are vectors
159 */
160 LLVMValueRef
161 lp_build_sample_offset(struct lp_build_context *bld,
162 const struct util_format_description *format_desc,
163 LLVMValueRef x,
164 LLVMValueRef y,
165 LLVMValueRef y_stride)
166 {
167 LLVMValueRef x_stride;
168 LLVMValueRef offset;
169
170 x_stride = lp_build_const_scalar(bld->type, format_desc->block.bits/8);
171
172 if(format_desc->colorspace == UTIL_FORMAT_COLORSPACE_ZS) {
173 LLVMValueRef x_lo, x_hi;
174 LLVMValueRef y_lo, y_hi;
175 LLVMValueRef x_stride_lo, x_stride_hi;
176 LLVMValueRef y_stride_lo, y_stride_hi;
177 LLVMValueRef x_offset_lo, x_offset_hi;
178 LLVMValueRef y_offset_lo, y_offset_hi;
179 LLVMValueRef offset_lo, offset_hi;
180
181 x_lo = LLVMBuildAnd(bld->builder, x, bld->one, "");
182 y_lo = LLVMBuildAnd(bld->builder, y, bld->one, "");
183
184 x_hi = LLVMBuildLShr(bld->builder, x, bld->one, "");
185 y_hi = LLVMBuildLShr(bld->builder, y, bld->one, "");
186
187 x_stride_lo = x_stride;
188 y_stride_lo = lp_build_const_scalar(bld->type, 2*format_desc->block.bits/8);
189
190 x_stride_hi = lp_build_const_scalar(bld->type, 4*format_desc->block.bits/8);
191 y_stride_hi = LLVMBuildShl(bld->builder, y_stride, bld->one, "");
192
193 x_offset_lo = lp_build_mul(bld, x_lo, x_stride_lo);
194 y_offset_lo = lp_build_mul(bld, y_lo, y_stride_lo);
195 offset_lo = lp_build_add(bld, x_offset_lo, y_offset_lo);
196
197 x_offset_hi = lp_build_mul(bld, x_hi, x_stride_hi);
198 y_offset_hi = lp_build_mul(bld, y_hi, y_stride_hi);
199 offset_hi = lp_build_add(bld, x_offset_hi, y_offset_hi);
200
201 offset = lp_build_add(bld, offset_hi, offset_lo);
202 }
203 else {
204 LLVMValueRef x_offset;
205 LLVMValueRef y_offset;
206
207 x_offset = lp_build_mul(bld, x, x_stride);
208 y_offset = lp_build_mul(bld, y, y_stride);
209
210 offset = lp_build_add(bld, x_offset, y_offset);
211 }
212
213 return offset;
214 }