gallivm,llvmpipe: handle TXF (texelFetch) instruction, including offsets
[mesa.git] / src / gallium / drivers / llvmpipe / lp_screen.c
1 /**************************************************************************
2 *
3 * Copyright 2008 Tungsten Graphics, Inc., Cedar Park, Texas.
4 * All Rights Reserved.
5 *
6 * Permission is hereby granted, free of charge, to any person obtaining a
7 * copy of this software and associated documentation files (the
8 * "Software"), to deal in the Software without restriction, including
9 * without limitation the rights to use, copy, modify, merge, publish,
10 * distribute, sub license, and/or sell copies of the Software, and to
11 * permit persons to whom the Software is furnished to do so, subject to
12 * the following conditions:
13 *
14 * The above copyright notice and this permission notice (including the
15 * next paragraph) shall be included in all copies or substantial portions
16 * of the Software.
17 *
18 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
19 * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
20 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT.
21 * IN NO EVENT SHALL TUNGSTEN GRAPHICS AND/OR ITS SUPPLIERS BE LIABLE FOR
22 * ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
23 * TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
24 * SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
25 *
26 **************************************************************************/
27
28
29 #include "util/u_memory.h"
30 #include "util/u_math.h"
31 #include "util/u_cpu_detect.h"
32 #include "util/u_format.h"
33 #include "util/u_string.h"
34 #include "util/u_format_s3tc.h"
35 #include "pipe/p_defines.h"
36 #include "pipe/p_screen.h"
37 #include "draw/draw_context.h"
38 #include "gallivm/lp_bld_type.h"
39
40 #include "lp_texture.h"
41 #include "lp_fence.h"
42 #include "lp_jit.h"
43 #include "lp_screen.h"
44 #include "lp_context.h"
45 #include "lp_debug.h"
46 #include "lp_public.h"
47 #include "lp_limits.h"
48 #include "lp_rast.h"
49
50 #include "state_tracker/sw_winsys.h"
51
#ifdef DEBUG
/*
 * Debug flag mask for the driver.  Starts out as 0 and is assigned from
 * the LP_DEBUG option in llvmpipe_create_screen().
 */
int LP_DEBUG = 0;

/*
 * Names accepted by the LP_DEBUG option, each paired with the DEBUG_x
 * value it selects.  No description strings are provided (NULL).
 */
static const struct debug_named_value lp_debug_flags[] = {
   { "pipe",          DEBUG_PIPE,          NULL },
   { "tgsi",          DEBUG_TGSI,          NULL },
   { "tex",           DEBUG_TEX,           NULL },
   { "setup",         DEBUG_SETUP,         NULL },
   { "rast",          DEBUG_RAST,          NULL },
   { "query",         DEBUG_QUERY,         NULL },
   { "screen",        DEBUG_SCREEN,        NULL },
   { "show_tiles",    DEBUG_SHOW_TILES,    NULL },
   { "show_subtiles", DEBUG_SHOW_SUBTILES, NULL },
   { "counters",      DEBUG_COUNTERS,      NULL },
   { "scene",         DEBUG_SCENE,         NULL },
   { "fence",         DEBUG_FENCE,         NULL },
   { "mem",           DEBUG_MEM,           NULL },
   { "fs",            DEBUG_FS,            NULL },
   DEBUG_NAMED_VALUE_END
};
#endif
73
74 int LP_PERF = 0;
75 static const struct debug_named_value lp_perf_flags[] = {
76 { "texmem", PERF_TEX_MEM, NULL },
77 { "no_mipmap", PERF_NO_MIPMAPS, NULL },
78 { "no_linear", PERF_NO_LINEAR, NULL },
79 { "no_mip_linear", PERF_NO_MIP_LINEAR, NULL },
80 { "no_tex", PERF_NO_TEX, NULL },
81 { "no_blend", PERF_NO_BLEND, NULL },
82 { "no_depth", PERF_NO_DEPTH, NULL },
83 { "no_alphatest", PERF_NO_ALPHATEST, NULL },
84 DEBUG_NAMED_VALUE_END
85 };
86
87
/**
 * Report the vendor string for this driver.
 *
 * \param screen  unused
 * \return a constant, NUL-terminated string; the caller must not free it
 */
static const char *
llvmpipe_get_vendor(struct pipe_screen *screen)
{
   static const char vendor[] = "VMware, Inc.";

   return vendor;
}
93
94
95 static const char *
96 llvmpipe_get_name(struct pipe_screen *screen)
97 {
98 static char buf[100];
99 util_snprintf(buf, sizeof(buf), "llvmpipe (LLVM %u.%u, %u bits)",
100 HAVE_LLVM >> 8, HAVE_LLVM & 0xff,
101 lp_native_vector_width );
102 return buf;
103 }
104
105
106 static int
107 llvmpipe_get_param(struct pipe_screen *screen, enum pipe_cap param)
108 {
109 switch (param) {
110 case PIPE_CAP_MAX_COMBINED_SAMPLERS:
111 return 2 * PIPE_MAX_SAMPLERS; /* VS + FS samplers */
112 case PIPE_CAP_NPOT_TEXTURES:
113 return 1;
114 case PIPE_CAP_TWO_SIDED_STENCIL:
115 return 1;
116 case PIPE_CAP_SM3:
117 return 1;
118 case PIPE_CAP_MAX_DUAL_SOURCE_RENDER_TARGETS:
119 return 0;
120 case PIPE_CAP_MAX_STREAM_OUTPUT_BUFFERS:
121 return 0;
122 case PIPE_CAP_ANISOTROPIC_FILTER:
123 return 0;
124 case PIPE_CAP_POINT_SPRITE:
125 return 1;
126 case PIPE_CAP_MAX_RENDER_TARGETS:
127 return PIPE_MAX_COLOR_BUFS;
128 case PIPE_CAP_OCCLUSION_QUERY:
129 return 1;
130 case PIPE_CAP_TIMER_QUERY:
131 return 0;
132 case PIPE_CAP_TEXTURE_MIRROR_CLAMP:
133 return 1;
134 case PIPE_CAP_TEXTURE_SHADOW_MAP:
135 return 1;
136 case PIPE_CAP_TEXTURE_SWIZZLE:
137 return 1;
138 case PIPE_CAP_MAX_TEXTURE_2D_LEVELS:
139 return LP_MAX_TEXTURE_2D_LEVELS;
140 case PIPE_CAP_MAX_TEXTURE_3D_LEVELS:
141 return LP_MAX_TEXTURE_3D_LEVELS;
142 case PIPE_CAP_MAX_TEXTURE_CUBE_LEVELS:
143 return LP_MAX_TEXTURE_CUBE_LEVELS;
144 case PIPE_CAP_BLEND_EQUATION_SEPARATE:
145 return 1;
146 case PIPE_CAP_INDEP_BLEND_ENABLE:
147 return 1;
148 case PIPE_CAP_INDEP_BLEND_FUNC:
149 return 1;
150 case PIPE_CAP_TGSI_FS_COORD_ORIGIN_UPPER_LEFT:
151 case PIPE_CAP_TGSI_FS_COORD_PIXEL_CENTER_INTEGER:
152 return 1;
153 case PIPE_CAP_TGSI_FS_COORD_ORIGIN_LOWER_LEFT:
154 case PIPE_CAP_TGSI_FS_COORD_PIXEL_CENTER_HALF_INTEGER:
155 return 0;
156 case PIPE_CAP_PRIMITIVE_RESTART:
157 return 1;
158 case PIPE_CAP_DEPTHSTENCIL_CLEAR_SEPARATE:
159 return 1;
160 case PIPE_CAP_MAX_TEXTURE_ARRAY_LAYERS:
161 return 0;
162 case PIPE_CAP_DEPTH_CLIP_DISABLE:
163 return 0;
164 case PIPE_CAP_SHADER_STENCIL_EXPORT:
165 return 0;
166 case PIPE_CAP_TGSI_INSTANCEID:
167 case PIPE_CAP_VERTEX_ELEMENT_INSTANCE_DIVISOR:
168 return 1;
169 case PIPE_CAP_FRAGMENT_COLOR_CLAMPED:
170 return 0;
171 case PIPE_CAP_MIXED_COLORBUFFER_FORMATS:
172 return 1;
173 case PIPE_CAP_SEAMLESS_CUBE_MAP:
174 case PIPE_CAP_SEAMLESS_CUBE_MAP_PER_TEXTURE:
175 return 0;
176 case PIPE_CAP_SCALED_RESOLVE:
177 return 0;
178 /* this is a lie could support arbitrary large offsets */
179 case PIPE_CAP_MIN_TEXEL_OFFSET:
180 return -8;
181 case PIPE_CAP_MAX_TEXEL_OFFSET:
182 return 7;
183 case PIPE_CAP_CONDITIONAL_RENDER:
184 return 1;
185 case PIPE_CAP_TEXTURE_BARRIER:
186 return 0;
187 case PIPE_CAP_MAX_STREAM_OUTPUT_SEPARATE_COMPONENTS:
188 case PIPE_CAP_MAX_STREAM_OUTPUT_INTERLEAVED_COMPONENTS:
189 case PIPE_CAP_STREAM_OUTPUT_PAUSE_RESUME:
190 return 0;
191 case PIPE_CAP_TGSI_CAN_COMPACT_VARYINGS:
192 case PIPE_CAP_TGSI_CAN_COMPACT_CONSTANTS:
193 return 0;
194 case PIPE_CAP_VERTEX_COLOR_UNCLAMPED:
195 case PIPE_CAP_VERTEX_COLOR_CLAMPED:
196 return 0;
197 case PIPE_CAP_GLSL_FEATURE_LEVEL:
198 return 120;
199 case PIPE_CAP_QUADS_FOLLOW_PROVOKING_VERTEX_CONVENTION:
200 return 0;
201 case PIPE_CAP_COMPUTE:
202 return 0;
203 case PIPE_CAP_USER_VERTEX_BUFFERS:
204 case PIPE_CAP_USER_INDEX_BUFFERS:
205 case PIPE_CAP_USER_CONSTANT_BUFFERS:
206 return 1;
207 case PIPE_CAP_VERTEX_BUFFER_OFFSET_4BYTE_ALIGNED_ONLY:
208 case PIPE_CAP_VERTEX_BUFFER_STRIDE_4BYTE_ALIGNED_ONLY:
209 case PIPE_CAP_VERTEX_ELEMENT_SRC_OFFSET_4BYTE_ALIGNED_ONLY:
210 return 0;
211
212 case PIPE_CAP_CONSTANT_BUFFER_OFFSET_ALIGNMENT:
213 return 16;
214 case PIPE_CAP_START_INSTANCE:
215 case PIPE_CAP_QUERY_TIMESTAMP:
216 case PIPE_CAP_TEXTURE_MULTISAMPLE:
217 case PIPE_CAP_MIN_MAP_BUFFER_ALIGNMENT:
218 case PIPE_CAP_CUBE_MAP_ARRAY:
219 return 0;
220 }
221 /* should only get here on unhandled cases */
222 debug_printf("Unexpected PIPE_CAP %d query\n", param);
223 return 0;
224 }
225
226 static int
227 llvmpipe_get_shader_param(struct pipe_screen *screen, unsigned shader, enum pipe_shader_cap param)
228 {
229 switch(shader)
230 {
231 case PIPE_SHADER_FRAGMENT:
232 switch (param) {
233 default:
234 return gallivm_get_shader_param(param);
235 }
236 case PIPE_SHADER_VERTEX:
237 case PIPE_SHADER_GEOMETRY:
238 switch (param) {
239 case PIPE_SHADER_CAP_MAX_TEXTURE_SAMPLERS:
240 /* At this time, the draw module and llvmpipe driver only
241 * support vertex shader texture lookups when LLVM is enabled in
242 * the draw module.
243 */
244 if (debug_get_bool_option("DRAW_USE_LLVM", TRUE))
245 return PIPE_MAX_SAMPLERS;
246 else
247 return 0;
248 default:
249 return draw_get_shader_param(shader, param);
250 }
251 default:
252 return 0;
253 }
254 }
255
256 static float
257 llvmpipe_get_paramf(struct pipe_screen *screen, enum pipe_capf param)
258 {
259 switch (param) {
260 case PIPE_CAPF_MAX_LINE_WIDTH:
261 /* fall-through */
262 case PIPE_CAPF_MAX_LINE_WIDTH_AA:
263 return 255.0; /* arbitrary */
264 case PIPE_CAPF_MAX_POINT_WIDTH:
265 /* fall-through */
266 case PIPE_CAPF_MAX_POINT_WIDTH_AA:
267 return 255.0; /* arbitrary */
268 case PIPE_CAPF_MAX_TEXTURE_ANISOTROPY:
269 return 16.0; /* not actually signficant at this time */
270 case PIPE_CAPF_MAX_TEXTURE_LOD_BIAS:
271 return 16.0; /* arbitrary */
272 case PIPE_CAPF_GUARD_BAND_LEFT:
273 case PIPE_CAPF_GUARD_BAND_TOP:
274 case PIPE_CAPF_GUARD_BAND_RIGHT:
275 case PIPE_CAPF_GUARD_BAND_BOTTOM:
276 return 0.0;
277 }
278 /* should only get here on unhandled cases */
279 debug_printf("Unexpected PIPE_CAP %d query\n", param);
280 return 0.0;
281 }
282
283
284 /**
285 * Query format support for creating a texture, drawing surface, etc.
286 * \param format the format to test
287 * \param type one of PIPE_TEXTURE, PIPE_SURFACE
288 */
289 static boolean
290 llvmpipe_is_format_supported( struct pipe_screen *_screen,
291 enum pipe_format format,
292 enum pipe_texture_target target,
293 unsigned sample_count,
294 unsigned bind)
295 {
296 struct llvmpipe_screen *screen = llvmpipe_screen(_screen);
297 struct sw_winsys *winsys = screen->winsys;
298 const struct util_format_description *format_desc;
299
300 format_desc = util_format_description(format);
301 if (!format_desc)
302 return FALSE;
303
304 /* Z16 support is missing, which breaks the blit */
305 if (format == PIPE_FORMAT_Z16_UNORM)
306 return FALSE;
307
308 assert(target == PIPE_BUFFER ||
309 target == PIPE_TEXTURE_1D ||
310 target == PIPE_TEXTURE_2D ||
311 target == PIPE_TEXTURE_RECT ||
312 target == PIPE_TEXTURE_3D ||
313 target == PIPE_TEXTURE_CUBE);
314
315 if (sample_count > 1)
316 return FALSE;
317
318 if (format_desc->format == PIPE_FORMAT_R11G11B10_FLOAT ||
319 format_desc->format == PIPE_FORMAT_R9G9B9E5_FLOAT)
320 return TRUE;
321
322 if (bind & PIPE_BIND_RENDER_TARGET) {
323 if (format_desc->colorspace == UTIL_FORMAT_COLORSPACE_ZS ||
324 format_desc->colorspace == UTIL_FORMAT_COLORSPACE_SRGB)
325 return FALSE;
326
327 if (format_desc->layout != UTIL_FORMAT_LAYOUT_PLAIN)
328 return FALSE;
329
330 if (format_desc->block.width != 1 ||
331 format_desc->block.height != 1)
332 return FALSE;
333 }
334
335 if (bind & PIPE_BIND_DISPLAY_TARGET) {
336 if(!winsys->is_displaytarget_format_supported(winsys, bind, format))
337 return FALSE;
338 }
339
340 if (bind & PIPE_BIND_DEPTH_STENCIL) {
341 if (format_desc->layout != UTIL_FORMAT_LAYOUT_PLAIN)
342 return FALSE;
343
344 if (format_desc->colorspace != UTIL_FORMAT_COLORSPACE_ZS)
345 return FALSE;
346
347 /* FIXME: Temporary restriction. See lp_state_fs.c. */
348 if (format_desc->block.bits != 32)
349 return FALSE;
350 }
351
352 if (format_desc->layout == UTIL_FORMAT_LAYOUT_S3TC) {
353 return util_format_s3tc_enabled;
354 }
355
356 /*
357 * Everything can be supported by u_format.
358 */
359
360 if (format_desc->colorspace != UTIL_FORMAT_COLORSPACE_ZS &&
361 !format_desc->fetch_rgba_float) {
362 return FALSE;
363 }
364
365 return TRUE;
366 }
367
368
369
370
371 static void
372 llvmpipe_flush_frontbuffer(struct pipe_screen *_screen,
373 struct pipe_resource *resource,
374 unsigned level, unsigned layer,
375 void *context_private)
376 {
377 struct llvmpipe_screen *screen = llvmpipe_screen(_screen);
378 struct sw_winsys *winsys = screen->winsys;
379 struct llvmpipe_resource *texture = llvmpipe_resource(resource);
380
381 assert(texture->dt);
382 if (texture->dt)
383 winsys->displaytarget_display(winsys, texture->dt, context_private);
384 }
385
386
387 static void
388 llvmpipe_destroy_screen( struct pipe_screen *_screen )
389 {
390 struct llvmpipe_screen *screen = llvmpipe_screen(_screen);
391 struct sw_winsys *winsys = screen->winsys;
392
393 if (screen->rast)
394 lp_rast_destroy(screen->rast);
395
396 lp_jit_screen_cleanup(screen);
397
398 if(winsys->destroy)
399 winsys->destroy(winsys);
400
401 pipe_mutex_destroy(screen->rast_mutex);
402
403 FREE(screen);
404 }
405
406
407
408
/**
 * Fence reference counting.
 *
 * Casts the generic fence handles to lp_fence and forwards to
 * lp_fence_reference().
 *
 * \param screen  unused
 * \param ptr     location of the fence reference to update
 * \param fence   the fence to reference
 */
static void
llvmpipe_fence_reference(struct pipe_screen *screen,
                         struct pipe_fence_handle **ptr,
                         struct pipe_fence_handle *fence)
{
   lp_fence_reference((struct lp_fence **) ptr, (struct lp_fence *) fence);
}
422
423
424 /**
425 * Has the fence been executed/finished?
426 */
427 static boolean
428 llvmpipe_fence_signalled(struct pipe_screen *screen,
429 struct pipe_fence_handle *fence)
430 {
431 struct lp_fence *f = (struct lp_fence *) fence;
432 return lp_fence_signalled(f);
433 }
434
435
436 /**
437 * Wait for the fence to finish.
438 */
439 static boolean
440 llvmpipe_fence_finish(struct pipe_screen *screen,
441 struct pipe_fence_handle *fence_handle,
442 uint64_t timeout)
443 {
444 struct lp_fence *f = (struct lp_fence *) fence_handle;
445
446 lp_fence_wait(f);
447 return TRUE;
448 }
449
450
451
452 /**
453 * Create a new pipe_screen object
454 * Note: we're not presently subclassing pipe_screen (no llvmpipe_screen).
455 */
456 struct pipe_screen *
457 llvmpipe_create_screen(struct sw_winsys *winsys)
458 {
459 struct llvmpipe_screen *screen;
460
461 #ifdef PIPE_ARCH_X86
462 /* require SSE2 due to LLVM PR6960. */
463 util_cpu_detect();
464 if (!util_cpu_caps.has_sse2)
465 return NULL;
466 #endif
467
468 #ifdef DEBUG
469 LP_DEBUG = debug_get_flags_option("LP_DEBUG", lp_debug_flags, 0 );
470 #endif
471
472 LP_PERF = debug_get_flags_option("LP_PERF", lp_perf_flags, 0 );
473
474 screen = CALLOC_STRUCT(llvmpipe_screen);
475 if (!screen)
476 return NULL;
477
478 screen->winsys = winsys;
479
480 screen->base.destroy = llvmpipe_destroy_screen;
481
482 screen->base.get_name = llvmpipe_get_name;
483 screen->base.get_vendor = llvmpipe_get_vendor;
484 screen->base.get_param = llvmpipe_get_param;
485 screen->base.get_shader_param = llvmpipe_get_shader_param;
486 screen->base.get_paramf = llvmpipe_get_paramf;
487 screen->base.is_format_supported = llvmpipe_is_format_supported;
488
489 screen->base.context_create = llvmpipe_create_context;
490 screen->base.flush_frontbuffer = llvmpipe_flush_frontbuffer;
491 screen->base.fence_reference = llvmpipe_fence_reference;
492 screen->base.fence_signalled = llvmpipe_fence_signalled;
493 screen->base.fence_finish = llvmpipe_fence_finish;
494
495 llvmpipe_init_screen_resource_funcs(&screen->base);
496
497 lp_jit_screen_init(screen);
498
499 screen->num_threads = util_cpu_caps.nr_cpus > 1 ? util_cpu_caps.nr_cpus : 0;
500 #ifdef PIPE_SUBSYSTEM_EMBEDDED
501 screen->num_threads = 0;
502 #endif
503 screen->num_threads = debug_get_num_option("LP_NUM_THREADS", screen->num_threads);
504 screen->num_threads = MIN2(screen->num_threads, LP_MAX_THREADS);
505
506 screen->rast = lp_rast_create(screen->num_threads);
507 if (!screen->rast) {
508 lp_jit_screen_cleanup(screen);
509 FREE(screen);
510 return NULL;
511 }
512 pipe_mutex_init(screen->rast_mutex);
513
514 util_format_s3tc_init();
515
516 return &screen->base;
517 }