gallium: add facilities for indirect drawing
[mesa.git] / src / gallium / drivers / llvmpipe / lp_screen.c
1 /**************************************************************************
2 *
3 * Copyright 2008 VMware, Inc.
4 * All Rights Reserved.
5 *
6 * Permission is hereby granted, free of charge, to any person obtaining a
7 * copy of this software and associated documentation files (the
8 * "Software"), to deal in the Software without restriction, including
9 * without limitation the rights to use, copy, modify, merge, publish,
10 * distribute, sub license, and/or sell copies of the Software, and to
11 * permit persons to whom the Software is furnished to do so, subject to
12 * the following conditions:
13 *
14 * The above copyright notice and this permission notice (including the
15 * next paragraph) shall be included in all copies or substantial portions
16 * of the Software.
17 *
18 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
19 * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
20 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT.
21 * IN NO EVENT SHALL VMWARE AND/OR ITS SUPPLIERS BE LIABLE FOR
22 * ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
23 * TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
24 * SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
25 *
26 **************************************************************************/
27
28
29 #include "util/u_memory.h"
30 #include "util/u_math.h"
31 #include "util/u_cpu_detect.h"
32 #include "util/u_format.h"
33 #include "util/u_string.h"
34 #include "util/u_format_s3tc.h"
35 #include "pipe/p_defines.h"
36 #include "pipe/p_screen.h"
37 #include "draw/draw_context.h"
38 #include "gallivm/lp_bld_type.h"
39
40 #include "os/os_time.h"
41 #include "lp_texture.h"
42 #include "lp_fence.h"
43 #include "lp_jit.h"
44 #include "lp_screen.h"
45 #include "lp_context.h"
46 #include "lp_debug.h"
47 #include "lp_public.h"
48 #include "lp_limits.h"
49 #include "lp_rast.h"
50
51 #include "state_tracker/sw_winsys.h"
52
#ifdef DEBUG
/* Bitmask of enabled debug categories; filled in from the LP_DEBUG
 * option when the screen is created.
 */
int LP_DEBUG = 0;

/* Option names accepted by LP_DEBUG and the flag bit each one selects. */
static const struct debug_named_value lp_debug_flags[] = {
   { "pipe",     DEBUG_PIPE,     NULL },
   { "tgsi",     DEBUG_TGSI,     NULL },
   { "tex",      DEBUG_TEX,      NULL },
   { "setup",    DEBUG_SETUP,    NULL },
   { "rast",     DEBUG_RAST,     NULL },
   { "query",    DEBUG_QUERY,    NULL },
   { "screen",   DEBUG_SCREEN,   NULL },
   { "counters", DEBUG_COUNTERS, NULL },
   { "scene",    DEBUG_SCENE,    NULL },
   { "fence",    DEBUG_FENCE,    NULL },
   { "mem",      DEBUG_MEM,      NULL },
   { "fs",       DEBUG_FS,       NULL },
   DEBUG_NAMED_VALUE_END
};
#endif
72
73 int LP_PERF = 0;
74 static const struct debug_named_value lp_perf_flags[] = {
75 { "texmem", PERF_TEX_MEM, NULL },
76 { "no_mipmap", PERF_NO_MIPMAPS, NULL },
77 { "no_linear", PERF_NO_LINEAR, NULL },
78 { "no_mip_linear", PERF_NO_MIP_LINEAR, NULL },
79 { "no_tex", PERF_NO_TEX, NULL },
80 { "no_blend", PERF_NO_BLEND, NULL },
81 { "no_depth", PERF_NO_DEPTH, NULL },
82 { "no_alphatest", PERF_NO_ALPHATEST, NULL },
83 DEBUG_NAMED_VALUE_END
84 };
85
86
/**
 * Return the vendor string reported for this screen.
 * The screen argument is not consulted; the string is a constant.
 */
static const char *
llvmpipe_get_vendor(struct pipe_screen *screen)
{
   static const char vendor[] = "VMware, Inc.";

   (void) screen;
   return vendor;
}
92
93
94 static const char *
95 llvmpipe_get_name(struct pipe_screen *screen)
96 {
97 static char buf[100];
98 util_snprintf(buf, sizeof(buf), "llvmpipe (LLVM %u.%u, %u bits)",
99 HAVE_LLVM >> 8, HAVE_LLVM & 0xff,
100 lp_native_vector_width );
101 return buf;
102 }
103
104
105 static int
106 llvmpipe_get_param(struct pipe_screen *screen, enum pipe_cap param)
107 {
108 switch (param) {
109 case PIPE_CAP_NPOT_TEXTURES:
110 case PIPE_CAP_MIXED_FRAMEBUFFER_SIZES:
111 return 1;
112 case PIPE_CAP_TWO_SIDED_STENCIL:
113 return 1;
114 case PIPE_CAP_SM3:
115 return 1;
116 case PIPE_CAP_MAX_DUAL_SOURCE_RENDER_TARGETS:
117 return 1;
118 case PIPE_CAP_MAX_STREAM_OUTPUT_BUFFERS:
119 return PIPE_MAX_SO_BUFFERS;
120 case PIPE_CAP_ANISOTROPIC_FILTER:
121 return 0;
122 case PIPE_CAP_POINT_SPRITE:
123 return 1;
124 case PIPE_CAP_MAX_RENDER_TARGETS:
125 return PIPE_MAX_COLOR_BUFS;
126 case PIPE_CAP_OCCLUSION_QUERY:
127 return 1;
128 case PIPE_CAP_QUERY_TIME_ELAPSED:
129 return 0;
130 case PIPE_CAP_QUERY_TIMESTAMP:
131 return 1;
132 case PIPE_CAP_QUERY_PIPELINE_STATISTICS:
133 return 0;
134 case PIPE_CAP_TEXTURE_MIRROR_CLAMP:
135 return 1;
136 case PIPE_CAP_TEXTURE_SHADOW_MAP:
137 return 1;
138 case PIPE_CAP_TEXTURE_SWIZZLE:
139 return 1;
140 case PIPE_CAP_TEXTURE_BORDER_COLOR_QUIRK:
141 return 0;
142 case PIPE_CAP_MAX_TEXTURE_2D_LEVELS:
143 return LP_MAX_TEXTURE_2D_LEVELS;
144 case PIPE_CAP_MAX_TEXTURE_3D_LEVELS:
145 return LP_MAX_TEXTURE_3D_LEVELS;
146 case PIPE_CAP_MAX_TEXTURE_CUBE_LEVELS:
147 return LP_MAX_TEXTURE_CUBE_LEVELS;
148 case PIPE_CAP_MAX_TEXTURE_ARRAY_LAYERS:
149 return LP_MAX_TEXTURE_ARRAY_LAYERS;
150 case PIPE_CAP_BLEND_EQUATION_SEPARATE:
151 return 1;
152 case PIPE_CAP_INDEP_BLEND_ENABLE:
153 return 1;
154 case PIPE_CAP_INDEP_BLEND_FUNC:
155 return 1;
156 case PIPE_CAP_TGSI_FS_COORD_ORIGIN_UPPER_LEFT:
157 case PIPE_CAP_TGSI_FS_COORD_PIXEL_CENTER_INTEGER:
158 case PIPE_CAP_TGSI_FS_COORD_PIXEL_CENTER_HALF_INTEGER:
159 return 1;
160 case PIPE_CAP_TGSI_FS_COORD_ORIGIN_LOWER_LEFT:
161 return 0;
162 case PIPE_CAP_PRIMITIVE_RESTART:
163 return 1;
164 case PIPE_CAP_DEPTH_CLIP_DISABLE:
165 return 1;
166 case PIPE_CAP_SHADER_STENCIL_EXPORT:
167 return 0;
168 case PIPE_CAP_TGSI_INSTANCEID:
169 case PIPE_CAP_VERTEX_ELEMENT_INSTANCE_DIVISOR:
170 return 1;
171 case PIPE_CAP_FRAGMENT_COLOR_CLAMPED:
172 return 0;
173 case PIPE_CAP_MIXED_COLORBUFFER_FORMATS:
174 return 1;
175 case PIPE_CAP_SEAMLESS_CUBE_MAP:
176 case PIPE_CAP_SEAMLESS_CUBE_MAP_PER_TEXTURE:
177 return 1;
178 /* this is a lie could support arbitrary large offsets */
179 case PIPE_CAP_MIN_TEXTURE_GATHER_OFFSET:
180 case PIPE_CAP_MIN_TEXEL_OFFSET:
181 return -8;
182 case PIPE_CAP_MAX_TEXTURE_GATHER_OFFSET:
183 case PIPE_CAP_MAX_TEXEL_OFFSET:
184 return 7;
185 case PIPE_CAP_CONDITIONAL_RENDER:
186 return 1;
187 case PIPE_CAP_TEXTURE_BARRIER:
188 return 0;
189 case PIPE_CAP_MAX_STREAM_OUTPUT_SEPARATE_COMPONENTS:
190 case PIPE_CAP_MAX_STREAM_OUTPUT_INTERLEAVED_COMPONENTS:
191 return 16*4;
192 case PIPE_CAP_MAX_GEOMETRY_OUTPUT_VERTICES:
193 case PIPE_CAP_MAX_GEOMETRY_TOTAL_OUTPUT_COMPONENTS:
194 return 1024;
195 case PIPE_CAP_MAX_VERTEX_STREAMS:
196 return 1;
197 case PIPE_CAP_STREAM_OUTPUT_PAUSE_RESUME:
198 return 1;
199 case PIPE_CAP_TGSI_CAN_COMPACT_CONSTANTS:
200 return 0;
201 case PIPE_CAP_VERTEX_COLOR_UNCLAMPED:
202 case PIPE_CAP_VERTEX_COLOR_CLAMPED:
203 return 1;
204 case PIPE_CAP_GLSL_FEATURE_LEVEL:
205 return 330;
206 case PIPE_CAP_QUADS_FOLLOW_PROVOKING_VERTEX_CONVENTION:
207 return 0;
208 case PIPE_CAP_COMPUTE:
209 return 0;
210 case PIPE_CAP_USER_VERTEX_BUFFERS:
211 case PIPE_CAP_USER_INDEX_BUFFERS:
212 return 1;
213 case PIPE_CAP_USER_CONSTANT_BUFFERS:
214 return 0;
215 case PIPE_CAP_VERTEX_BUFFER_OFFSET_4BYTE_ALIGNED_ONLY:
216 case PIPE_CAP_VERTEX_BUFFER_STRIDE_4BYTE_ALIGNED_ONLY:
217 case PIPE_CAP_VERTEX_ELEMENT_SRC_OFFSET_4BYTE_ALIGNED_ONLY:
218 case PIPE_CAP_TGSI_TEXCOORD:
219 return 0;
220 case PIPE_CAP_DRAW_INDIRECT:
221 return 1;
222
223 case PIPE_CAP_CONSTANT_BUFFER_OFFSET_ALIGNMENT:
224 return 16;
225 case PIPE_CAP_START_INSTANCE:
226 case PIPE_CAP_TEXTURE_MULTISAMPLE:
227 case PIPE_CAP_CUBE_MAP_ARRAY:
228 return 0;
229 case PIPE_CAP_MIN_MAP_BUFFER_ALIGNMENT:
230 return 64;
231 case PIPE_CAP_TEXTURE_BUFFER_OBJECTS:
232 return 1;
233 case PIPE_CAP_MAX_TEXTURE_BUFFER_SIZE:
234 return 65536;
235 case PIPE_CAP_TEXTURE_BUFFER_OFFSET_ALIGNMENT:
236 return 1;
237 case PIPE_CAP_PREFER_BLIT_BASED_TEXTURE_TRANSFER:
238 return 0;
239 case PIPE_CAP_MAX_VIEWPORTS:
240 return PIPE_MAX_VIEWPORTS;
241 case PIPE_CAP_ENDIANNESS:
242 return PIPE_ENDIAN_NATIVE;
243 case PIPE_CAP_TGSI_VS_LAYER:
244 case PIPE_CAP_MAX_TEXTURE_GATHER_COMPONENTS:
245 case PIPE_CAP_TEXTURE_GATHER_SM5:
246 case PIPE_CAP_BUFFER_MAP_PERSISTENT_COHERENT:
247 case PIPE_CAP_TEXTURE_QUERY_LOD:
248 case PIPE_CAP_SAMPLE_SHADING:
249 case PIPE_CAP_TEXTURE_GATHER_OFFSETS:
250 case PIPE_CAP_TGSI_VS_WINDOW_SPACE_POSITION:
251 return 0;
252 case PIPE_CAP_FAKE_SW_MSAA:
253 return 1;
254 }
255 /* should only get here on unhandled cases */
256 debug_printf("Unexpected PIPE_CAP %d query\n", param);
257 return 0;
258 }
259
260 static int
261 llvmpipe_get_shader_param(struct pipe_screen *screen, unsigned shader, enum pipe_shader_cap param)
262 {
263 switch(shader)
264 {
265 case PIPE_SHADER_FRAGMENT:
266 switch (param) {
267 default:
268 return gallivm_get_shader_param(param);
269 }
270 case PIPE_SHADER_VERTEX:
271 case PIPE_SHADER_GEOMETRY:
272 switch (param) {
273 case PIPE_SHADER_CAP_MAX_TEXTURE_SAMPLERS:
274 /* At this time, the draw module and llvmpipe driver only
275 * support vertex shader texture lookups when LLVM is enabled in
276 * the draw module.
277 */
278 if (debug_get_bool_option("DRAW_USE_LLVM", TRUE))
279 return PIPE_MAX_SAMPLERS;
280 else
281 return 0;
282 case PIPE_SHADER_CAP_MAX_SAMPLER_VIEWS:
283 if (debug_get_bool_option("DRAW_USE_LLVM", TRUE))
284 return PIPE_MAX_SHADER_SAMPLER_VIEWS;
285 else
286 return 0;
287 default:
288 return draw_get_shader_param(shader, param);
289 }
290 default:
291 return 0;
292 }
293 }
294
295 static float
296 llvmpipe_get_paramf(struct pipe_screen *screen, enum pipe_capf param)
297 {
298 switch (param) {
299 case PIPE_CAPF_MAX_LINE_WIDTH:
300 /* fall-through */
301 case PIPE_CAPF_MAX_LINE_WIDTH_AA:
302 return 255.0; /* arbitrary */
303 case PIPE_CAPF_MAX_POINT_WIDTH:
304 /* fall-through */
305 case PIPE_CAPF_MAX_POINT_WIDTH_AA:
306 return 255.0; /* arbitrary */
307 case PIPE_CAPF_MAX_TEXTURE_ANISOTROPY:
308 return 16.0; /* not actually signficant at this time */
309 case PIPE_CAPF_MAX_TEXTURE_LOD_BIAS:
310 return 16.0; /* arbitrary */
311 case PIPE_CAPF_GUARD_BAND_LEFT:
312 case PIPE_CAPF_GUARD_BAND_TOP:
313 case PIPE_CAPF_GUARD_BAND_RIGHT:
314 case PIPE_CAPF_GUARD_BAND_BOTTOM:
315 return 0.0;
316 }
317 /* should only get here on unhandled cases */
318 debug_printf("Unexpected PIPE_CAP %d query\n", param);
319 return 0.0;
320 }
321
322
323 /**
324 * Query format support for creating a texture, drawing surface, etc.
325 * \param format the format to test
326 * \param type one of PIPE_TEXTURE, PIPE_SURFACE
327 */
328 static boolean
329 llvmpipe_is_format_supported( struct pipe_screen *_screen,
330 enum pipe_format format,
331 enum pipe_texture_target target,
332 unsigned sample_count,
333 unsigned bind)
334 {
335 struct llvmpipe_screen *screen = llvmpipe_screen(_screen);
336 struct sw_winsys *winsys = screen->winsys;
337 const struct util_format_description *format_desc;
338
339 format_desc = util_format_description(format);
340 if (!format_desc)
341 return FALSE;
342
343 assert(target == PIPE_BUFFER ||
344 target == PIPE_TEXTURE_1D ||
345 target == PIPE_TEXTURE_1D_ARRAY ||
346 target == PIPE_TEXTURE_2D ||
347 target == PIPE_TEXTURE_2D_ARRAY ||
348 target == PIPE_TEXTURE_RECT ||
349 target == PIPE_TEXTURE_3D ||
350 target == PIPE_TEXTURE_CUBE);
351
352 if (sample_count > 1)
353 return FALSE;
354
355 if (bind & PIPE_BIND_RENDER_TARGET) {
356 if (format_desc->colorspace == UTIL_FORMAT_COLORSPACE_SRGB) {
357 /* this is a lie actually other formats COULD exist where we would fail */
358 if (format_desc->nr_channels < 3)
359 return FALSE;
360 }
361 else if (format_desc->colorspace != UTIL_FORMAT_COLORSPACE_RGB)
362 return FALSE;
363
364 if (format_desc->layout != UTIL_FORMAT_LAYOUT_PLAIN &&
365 format != PIPE_FORMAT_R11G11B10_FLOAT)
366 return FALSE;
367
368 assert(format_desc->block.width == 1);
369 assert(format_desc->block.height == 1);
370
371 if (format_desc->is_mixed)
372 return FALSE;
373
374 if (!format_desc->is_array && !format_desc->is_bitmask &&
375 format != PIPE_FORMAT_R11G11B10_FLOAT)
376 return FALSE;
377
378 /*
379 * XXX refuse formats known to crash in generate_unswizzled_blend().
380 * These include all 3-channel 24bit RGB8 variants, plus 48bit
381 * (except those using floats) 3-channel RGB16 variants (the latter
382 * seems to be more of a llvm bug though).
383 * The mesa state tracker only seems to use these for SINT/UINT formats.
384 */
385 if (format_desc->is_array && format_desc->nr_channels == 3) {
386 if (format_desc->block.bits == 24 || (format_desc->block.bits == 48 &&
387 !util_format_is_float(format))) {
388 return FALSE;
389 }
390 }
391 }
392
393 if (bind & PIPE_BIND_DISPLAY_TARGET) {
394 if(!winsys->is_displaytarget_format_supported(winsys, bind, format))
395 return FALSE;
396 }
397
398 if (bind & PIPE_BIND_DEPTH_STENCIL) {
399 if (format_desc->layout != UTIL_FORMAT_LAYOUT_PLAIN)
400 return FALSE;
401
402 if (format_desc->colorspace != UTIL_FORMAT_COLORSPACE_ZS)
403 return FALSE;
404
405 /* TODO: Support stencil-only formats */
406 if (format_desc->swizzle[0] == UTIL_FORMAT_SWIZZLE_NONE) {
407 return FALSE;
408 }
409 }
410
411 if (format_desc->layout == UTIL_FORMAT_LAYOUT_S3TC) {
412 return util_format_s3tc_enabled;
413 }
414
415 /*
416 * Everything can be supported by u_format
417 * (those without fetch_rgba_float might be not but shouldn't hit that)
418 */
419
420 return TRUE;
421 }
422
423
424
425
426 static void
427 llvmpipe_flush_frontbuffer(struct pipe_screen *_screen,
428 struct pipe_resource *resource,
429 unsigned level, unsigned layer,
430 void *context_private,
431 struct pipe_box *sub_box)
432 {
433 struct llvmpipe_screen *screen = llvmpipe_screen(_screen);
434 struct sw_winsys *winsys = screen->winsys;
435 struct llvmpipe_resource *texture = llvmpipe_resource(resource);
436
437 assert(texture->dt);
438 if (texture->dt)
439 winsys->displaytarget_display(winsys, texture->dt, context_private, sub_box);
440 }
441
442 static void
443 llvmpipe_destroy_screen( struct pipe_screen *_screen )
444 {
445 struct llvmpipe_screen *screen = llvmpipe_screen(_screen);
446 struct sw_winsys *winsys = screen->winsys;
447
448 if (screen->rast)
449 lp_rast_destroy(screen->rast);
450
451 lp_jit_screen_cleanup(screen);
452
453 if(winsys->destroy)
454 winsys->destroy(winsys);
455
456 pipe_mutex_destroy(screen->rast_mutex);
457
458 FREE(screen);
459 }
460
461
462
463
/**
 * Update a fence reference.
 *
 * Thin adapter that casts the opaque pipe_fence_handle pointers to
 * lp_fence and hands them to lp_fence_reference(), which does the
 * actual reference counting.
 */
static void
llvmpipe_fence_reference(struct pipe_screen *screen,
                         struct pipe_fence_handle **ptr,
                         struct pipe_fence_handle *fence)
{
   lp_fence_reference((struct lp_fence **) ptr,
                      (struct lp_fence *) fence);
}
477
478
479 /**
480 * Has the fence been executed/finished?
481 */
482 static boolean
483 llvmpipe_fence_signalled(struct pipe_screen *screen,
484 struct pipe_fence_handle *fence)
485 {
486 struct lp_fence *f = (struct lp_fence *) fence;
487 return lp_fence_signalled(f);
488 }
489
490
491 /**
492 * Wait for the fence to finish.
493 */
494 static boolean
495 llvmpipe_fence_finish(struct pipe_screen *screen,
496 struct pipe_fence_handle *fence_handle,
497 uint64_t timeout)
498 {
499 struct lp_fence *f = (struct lp_fence *) fence_handle;
500
501 lp_fence_wait(f);
502 return TRUE;
503 }
504
/**
 * Return the current timestamp as reported by os_time_get_nano().
 * The screen argument is not consulted.
 */
static uint64_t
llvmpipe_get_timestamp(struct pipe_screen *_screen)
{
   const uint64_t now = os_time_get_nano();

   return now;
}
510
511 /**
512 * Create a new pipe_screen object
513 * Note: we're not presently subclassing pipe_screen (no llvmpipe_screen).
514 */
515 struct pipe_screen *
516 llvmpipe_create_screen(struct sw_winsys *winsys)
517 {
518 struct llvmpipe_screen *screen;
519
520 util_cpu_detect();
521
522 #if defined(PIPE_ARCH_X86) && HAVE_LLVM < 0x0302
523 /* require SSE2 due to LLVM PR6960. */
524 if (!util_cpu_caps.has_sse2)
525 return NULL;
526 #endif
527
528 #ifdef DEBUG
529 LP_DEBUG = debug_get_flags_option("LP_DEBUG", lp_debug_flags, 0 );
530 #endif
531
532 LP_PERF = debug_get_flags_option("LP_PERF", lp_perf_flags, 0 );
533
534 screen = CALLOC_STRUCT(llvmpipe_screen);
535 if (!screen)
536 return NULL;
537
538 screen->winsys = winsys;
539
540 screen->base.destroy = llvmpipe_destroy_screen;
541
542 screen->base.get_name = llvmpipe_get_name;
543 screen->base.get_vendor = llvmpipe_get_vendor;
544 screen->base.get_param = llvmpipe_get_param;
545 screen->base.get_shader_param = llvmpipe_get_shader_param;
546 screen->base.get_paramf = llvmpipe_get_paramf;
547 screen->base.is_format_supported = llvmpipe_is_format_supported;
548
549 screen->base.context_create = llvmpipe_create_context;
550 screen->base.flush_frontbuffer = llvmpipe_flush_frontbuffer;
551 screen->base.fence_reference = llvmpipe_fence_reference;
552 screen->base.fence_signalled = llvmpipe_fence_signalled;
553 screen->base.fence_finish = llvmpipe_fence_finish;
554
555 screen->base.get_timestamp = llvmpipe_get_timestamp;
556
557 llvmpipe_init_screen_resource_funcs(&screen->base);
558
559 lp_jit_screen_init(screen);
560
561 screen->num_threads = util_cpu_caps.nr_cpus > 1 ? util_cpu_caps.nr_cpus : 0;
562 #ifdef PIPE_SUBSYSTEM_EMBEDDED
563 screen->num_threads = 0;
564 #endif
565 screen->num_threads = debug_get_num_option("LP_NUM_THREADS", screen->num_threads);
566 screen->num_threads = MIN2(screen->num_threads, LP_MAX_THREADS);
567
568 screen->rast = lp_rast_create(screen->num_threads);
569 if (!screen->rast) {
570 lp_jit_screen_cleanup(screen);
571 FREE(screen);
572 return NULL;
573 }
574 pipe_mutex_init(screen->rast_mutex);
575
576 util_format_s3tc_init();
577
578 return &screen->base;
579 }