gallivm: Vectorize the rho computation.
[mesa.git] / src / gallium / auxiliary / gallivm / lp_bld_sample.h
1 /**************************************************************************
2 *
3 * Copyright 2009 VMware, Inc.
4 * All Rights Reserved.
5 *
6 * Permission is hereby granted, free of charge, to any person obtaining a
7 * copy of this software and associated documentation files (the
8 * "Software"), to deal in the Software without restriction, including
9 * without limitation the rights to use, copy, modify, merge, publish,
10 * distribute, sub license, and/or sell copies of the Software, and to
11 * permit persons to whom the Software is furnished to do so, subject to
12 * the following conditions:
13 *
14 * The above copyright notice and this permission notice (including the
15 * next paragraph) shall be included in all copies or substantial portions
16 * of the Software.
17 *
18 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
19 * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
20 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT.
21 * IN NO EVENT SHALL VMWARE AND/OR ITS SUPPLIERS BE LIABLE FOR
22 * ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
23 * TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
24 * SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
25 *
26 **************************************************************************/
27
28 /**
29 * @file
30 * Texture sampling.
31 *
32 * @author Jose Fonseca <jfonseca@vmware.com>
33 */
34
35 #ifndef LP_BLD_SAMPLE_H
36 #define LP_BLD_SAMPLE_H
37
38
39 #include "pipe/p_format.h"
40 #include "util/u_debug.h"
41 #include "gallivm/lp_bld.h"
42 #include "gallivm/lp_bld_type.h"
43 #include "gallivm/lp_bld_swizzle.h"
44
45
46 struct pipe_resource;
47 struct pipe_sampler_view;
48 struct pipe_sampler_state;
49 struct util_format_description;
50 struct lp_type;
51 struct lp_build_context;
52
53
54 /**
55 * Sampler static state.
56 *
57 * These are the bits of state from pipe_resource and pipe_sampler_state that
58 * are embedded in the generated code.
59 */
60 struct lp_sampler_static_state
61 {
62 /* pipe_sampler_view's state */
63 enum pipe_format format;
64 unsigned swizzle_r:3; /**< PIPE_SWIZZLE_* */
65 unsigned swizzle_g:3;
66 unsigned swizzle_b:3;
67 unsigned swizzle_a:3;
68
69 /* pipe_texture's state */
70 unsigned target:3; /**< PIPE_TEXTURE_* */
71 unsigned pot_width:1; /**< is the width a power of two? */
72 unsigned pot_height:1;
73 unsigned pot_depth:1;
74
75 /* pipe_sampler_state's state */
76 unsigned wrap_s:3;
77 unsigned wrap_t:3;
78 unsigned wrap_r:3;
79 unsigned min_img_filter:2;
80 unsigned min_mip_filter:2;
81 unsigned mag_img_filter:2;
82 unsigned compare_mode:1;
83 unsigned compare_func:3;
84 unsigned normalized_coords:1;
85 unsigned min_max_lod_equal:1; /**< min_lod == max_lod ? */
86 unsigned lod_bias_non_zero:1;
87 unsigned apply_min_lod:1; /**< min_lod > 0 ? */
88 unsigned apply_max_lod:1; /**< max_lod < last_level ? */
89 };
90
91
92 /**
93 * Sampler dynamic state.
94 *
95 * These are the bits of state from pipe_resource and pipe_sampler_state that
96 * are computed in runtime.
97 *
98 * There are obtained through callbacks, as we don't want to tie the texture
99 * sampling code generation logic to any particular texture layout or pipe
100 * driver.
101 */
102 struct lp_sampler_dynamic_state
103 {
104
105 /** Obtain the base texture width (returns int32) */
106 LLVMValueRef
107 (*width)( const struct lp_sampler_dynamic_state *state,
108 LLVMBuilderRef builder,
109 unsigned unit);
110
111 /** Obtain the base texture height (returns int32) */
112 LLVMValueRef
113 (*height)( const struct lp_sampler_dynamic_state *state,
114 LLVMBuilderRef builder,
115 unsigned unit);
116
117 /** Obtain the base texture depth (returns int32) */
118 LLVMValueRef
119 (*depth)( const struct lp_sampler_dynamic_state *state,
120 LLVMBuilderRef builder,
121 unsigned unit);
122
123 /** Obtain the number of mipmap levels minus one (returns int32) */
124 LLVMValueRef
125 (*last_level)( const struct lp_sampler_dynamic_state *state,
126 LLVMBuilderRef builder,
127 unsigned unit);
128
129 /** Obtain stride in bytes between image rows/blocks (returns int32) */
130 LLVMValueRef
131 (*row_stride)( const struct lp_sampler_dynamic_state *state,
132 LLVMBuilderRef builder,
133 unsigned unit);
134
135 /** Obtain stride in bytes between image slices (returns int32) */
136 LLVMValueRef
137 (*img_stride)( const struct lp_sampler_dynamic_state *state,
138 LLVMBuilderRef builder,
139 unsigned unit);
140
141 /** Obtain pointer to array of pointers to mimpap levels */
142 LLVMValueRef
143 (*data_ptr)( const struct lp_sampler_dynamic_state *state,
144 LLVMBuilderRef builder,
145 unsigned unit);
146
147 /** Obtain texture min lod (returns float) */
148 LLVMValueRef
149 (*min_lod)(const struct lp_sampler_dynamic_state *state,
150 LLVMBuilderRef builder, unsigned unit);
151
152 /** Obtain texture max lod (returns float) */
153 LLVMValueRef
154 (*max_lod)(const struct lp_sampler_dynamic_state *state,
155 LLVMBuilderRef builder, unsigned unit);
156
157 /** Obtain texture lod bias (returns float) */
158 LLVMValueRef
159 (*lod_bias)(const struct lp_sampler_dynamic_state *state,
160 LLVMBuilderRef builder, unsigned unit);
161
162 /** Obtain texture border color (returns ptr to float[4]) */
163 LLVMValueRef
164 (*border_color)(const struct lp_sampler_dynamic_state *state,
165 LLVMBuilderRef builder, unsigned unit);
166 };
167
168
169 /**
170 * Keep all information for sampling code generation in a single place.
171 */
172 struct lp_build_sample_context
173 {
174 LLVMBuilderRef builder;
175
176 const struct lp_sampler_static_state *static_state;
177
178 struct lp_sampler_dynamic_state *dynamic_state;
179
180 const struct util_format_description *format_desc;
181
182 /** regular scalar float type */
183 struct lp_type float_type;
184 struct lp_build_context float_bld;
185
186 /** float vector type */
187 struct lp_build_context float_vec_bld;
188
189 /** regular scalar float type */
190 struct lp_type int_type;
191 struct lp_build_context int_bld;
192
193 /** Incoming coordinates type and build context */
194 struct lp_type coord_type;
195 struct lp_build_context coord_bld;
196
197 /** Unsigned integer coordinates */
198 struct lp_type uint_coord_type;
199 struct lp_build_context uint_coord_bld;
200
201 /** Signed integer coordinates */
202 struct lp_type int_coord_type;
203 struct lp_build_context int_coord_bld;
204
205 /** Unsigned integer texture size */
206 struct lp_type uint_size_type;
207 struct lp_build_context uint_size_bld;
208
209 /** Unsigned integer texture size */
210 struct lp_type float_size_type;
211 struct lp_build_context float_size_bld;
212
213 /** Output texels type and build context */
214 struct lp_type texel_type;
215 struct lp_build_context texel_bld;
216
217 /** Unsigned vector with texture width, height, depth */
218 LLVMValueRef uint_size;
219 };
220
221
222
223 /**
224 * We only support a few wrap modes in lp_build_sample_wrap_linear_int() at
225 * this time. Return whether the given mode is supported by that function.
226 */
227 static INLINE boolean
228 lp_is_simple_wrap_mode(unsigned mode)
229 {
230 switch (mode) {
231 case PIPE_TEX_WRAP_REPEAT:
232 case PIPE_TEX_WRAP_CLAMP_TO_EDGE:
233 return TRUE;
234 default:
235 return FALSE;
236 }
237 }
238
239
240 static INLINE void
241 apply_sampler_swizzle(struct lp_build_sample_context *bld,
242 LLVMValueRef *texel)
243 {
244 unsigned char swizzles[4];
245
246 swizzles[0] = bld->static_state->swizzle_r;
247 swizzles[1] = bld->static_state->swizzle_g;
248 swizzles[2] = bld->static_state->swizzle_b;
249 swizzles[3] = bld->static_state->swizzle_a;
250
251 lp_build_swizzle_soa_inplace(&bld->texel_bld, texel, swizzles);
252 }
253
254
255 static INLINE unsigned
256 texture_dims(enum pipe_texture_target tex)
257 {
258 switch (tex) {
259 case PIPE_TEXTURE_1D:
260 return 1;
261 case PIPE_TEXTURE_2D:
262 case PIPE_TEXTURE_RECT:
263 case PIPE_TEXTURE_CUBE:
264 return 2;
265 case PIPE_TEXTURE_3D:
266 return 3;
267 default:
268 assert(0 && "bad texture target in texture_dims()");
269 return 2;
270 }
271 }
272
273
274 boolean
275 lp_sampler_wrap_mode_uses_border_color(unsigned mode,
276 unsigned min_img_filter,
277 unsigned mag_img_filter);
278
/**
 * Derive the sampler static state.
 *
 * @param state    destination static state
 * @param view     sampler view to derive from
 * @param sampler  sampler state to derive from
 */
void
lp_sampler_static_state(struct lp_sampler_static_state *state,
                        const struct pipe_sampler_view *view,
                        const struct pipe_sampler_state *sampler);
286
287
288 void
289 lp_build_lod_selector(struct lp_build_sample_context *bld,
290 unsigned unit,
291 const LLVMValueRef ddx[4],
292 const LLVMValueRef ddy[4],
293 LLVMValueRef lod_bias, /* optional */
294 LLVMValueRef explicit_lod, /* optional */
295 LLVMValueRef width,
296 LLVMValueRef height,
297 LLVMValueRef depth,
298 unsigned mip_filter,
299 LLVMValueRef *out_lod_ipart,
300 LLVMValueRef *out_lod_fpart);
301
302 void
303 lp_build_nearest_mip_level(struct lp_build_sample_context *bld,
304 unsigned unit,
305 LLVMValueRef lod,
306 LLVMValueRef *level_out);
307
308 void
309 lp_build_linear_mip_levels(struct lp_build_sample_context *bld,
310 unsigned unit,
311 LLVMValueRef lod_ipart,
312 LLVMValueRef *level0_out,
313 LLVMValueRef *level1_out);
314
315 LLVMValueRef
316 lp_build_get_mipmap_level(struct lp_build_sample_context *bld,
317 LLVMValueRef data_array, LLVMValueRef level);
318
319 LLVMValueRef
320 lp_build_get_const_mipmap_level(struct lp_build_sample_context *bld,
321 LLVMValueRef data_array, int level);
322
323
324 void
325 lp_build_mipmap_level_sizes(struct lp_build_sample_context *bld,
326 unsigned dims,
327 LLVMValueRef width_vec,
328 LLVMValueRef height_vec,
329 LLVMValueRef depth_vec,
330 LLVMValueRef ilevel0,
331 LLVMValueRef ilevel1,
332 LLVMValueRef row_stride_array,
333 LLVMValueRef img_stride_array,
334 LLVMValueRef *width0_vec,
335 LLVMValueRef *width1_vec,
336 LLVMValueRef *height0_vec,
337 LLVMValueRef *height1_vec,
338 LLVMValueRef *depth0_vec,
339 LLVMValueRef *depth1_vec,
340 LLVMValueRef *row_stride0_vec,
341 LLVMValueRef *row_stride1_vec,
342 LLVMValueRef *img_stride0_vec,
343 LLVMValueRef *img_stride1_vec);
344
345
346 void
347 lp_build_cube_lookup(struct lp_build_sample_context *bld,
348 LLVMValueRef s,
349 LLVMValueRef t,
350 LLVMValueRef r,
351 LLVMValueRef *face,
352 LLVMValueRef *face_s,
353 LLVMValueRef *face_t);
354
355
356 void
357 lp_build_sample_partial_offset(struct lp_build_context *bld,
358 unsigned block_length,
359 LLVMValueRef coord,
360 LLVMValueRef stride,
361 LLVMValueRef *out_offset,
362 LLVMValueRef *out_i);
363
364
365 void
366 lp_build_sample_offset(struct lp_build_context *bld,
367 const struct util_format_description *format_desc,
368 LLVMValueRef x,
369 LLVMValueRef y,
370 LLVMValueRef z,
371 LLVMValueRef y_stride,
372 LLVMValueRef z_stride,
373 LLVMValueRef *out_offset,
374 LLVMValueRef *out_i,
375 LLVMValueRef *out_j);
376
377
378 void
379 lp_build_sample_soa(LLVMBuilderRef builder,
380 const struct lp_sampler_static_state *static_state,
381 struct lp_sampler_dynamic_state *dynamic_state,
382 struct lp_type fp_type,
383 unsigned unit,
384 unsigned num_coords,
385 const LLVMValueRef *coords,
386 const LLVMValueRef *ddx,
387 const LLVMValueRef *ddy,
388 LLVMValueRef lod_bias,
389 LLVMValueRef explicit_lod,
390 LLVMValueRef texel_out[4]);
391
392 void
393 lp_build_sample_nop(struct lp_type type,
394 LLVMValueRef texel_out[4]);
395
396
397 #endif /* LP_BLD_SAMPLE_H */