gallium: add support for AMD_vertex_shader_layer
[mesa.git] / src / gallium / drivers / llvmpipe / lp_screen.c
1 /**************************************************************************
2 *
3 * Copyright 2008 Tungsten Graphics, Inc., Cedar Park, Texas.
4 * All Rights Reserved.
5 *
6 * Permission is hereby granted, free of charge, to any person obtaining a
7 * copy of this software and associated documentation files (the
8 * "Software"), to deal in the Software without restriction, including
9 * without limitation the rights to use, copy, modify, merge, publish,
10 * distribute, sub license, and/or sell copies of the Software, and to
11 * permit persons to whom the Software is furnished to do so, subject to
12 * the following conditions:
13 *
14 * The above copyright notice and this permission notice (including the
15 * next paragraph) shall be included in all copies or substantial portions
16 * of the Software.
17 *
18 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
19 * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
20 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT.
21 * IN NO EVENT SHALL TUNGSTEN GRAPHICS AND/OR ITS SUPPLIERS BE LIABLE FOR
22 * ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
23 * TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
24 * SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
25 *
26 **************************************************************************/
27
28
29 #include "util/u_memory.h"
30 #include "util/u_math.h"
31 #include "util/u_cpu_detect.h"
32 #include "util/u_format.h"
33 #include "util/u_string.h"
34 #include "util/u_format_s3tc.h"
35 #include "pipe/p_defines.h"
36 #include "pipe/p_screen.h"
37 #include "draw/draw_context.h"
38 #include "gallivm/lp_bld_type.h"
39
40 #include "os/os_time.h"
41 #include "lp_texture.h"
42 #include "lp_fence.h"
43 #include "lp_jit.h"
44 #include "lp_screen.h"
45 #include "lp_context.h"
46 #include "lp_debug.h"
47 #include "lp_public.h"
48 #include "lp_limits.h"
49 #include "lp_rast.h"
50
51 #include "state_tracker/sw_winsys.h"
52
#ifdef DEBUG
/* Bitmask of enabled debug categories (DEBUG builds only). */
int LP_DEBUG = 0;

/*
 * Names accepted in the LP_DEBUG option string and the DEBUG_* flag that
 * each name selects.  The table is terminated by DEBUG_NAMED_VALUE_END.
 */
static const struct debug_named_value lp_debug_flags[] = {
   { "pipe",     DEBUG_PIPE,     NULL },
   { "tgsi",     DEBUG_TGSI,     NULL },
   { "tex",      DEBUG_TEX,      NULL },
   { "setup",    DEBUG_SETUP,    NULL },
   { "rast",     DEBUG_RAST,     NULL },
   { "query",    DEBUG_QUERY,    NULL },
   { "screen",   DEBUG_SCREEN,   NULL },
   { "counters", DEBUG_COUNTERS, NULL },
   { "scene",    DEBUG_SCENE,    NULL },
   { "fence",    DEBUG_FENCE,    NULL },
   { "mem",      DEBUG_MEM,      NULL },
   { "fs",       DEBUG_FS,       NULL },
   DEBUG_NAMED_VALUE_END
};
#endif
72
73 int LP_PERF = 0;
74 static const struct debug_named_value lp_perf_flags[] = {
75 { "texmem", PERF_TEX_MEM, NULL },
76 { "no_mipmap", PERF_NO_MIPMAPS, NULL },
77 { "no_linear", PERF_NO_LINEAR, NULL },
78 { "no_mip_linear", PERF_NO_MIP_LINEAR, NULL },
79 { "no_tex", PERF_NO_TEX, NULL },
80 { "no_blend", PERF_NO_BLEND, NULL },
81 { "no_depth", PERF_NO_DEPTH, NULL },
82 { "no_alphatest", PERF_NO_ALPHATEST, NULL },
83 DEBUG_NAMED_VALUE_END
84 };
85
86
/**
 * Return the vendor string reported for this driver.
 * The screen argument is not used.
 */
static const char *
llvmpipe_get_vendor(struct pipe_screen *screen)
{
   static const char vendor[] = "VMware, Inc.";

   return vendor;
}
92
93
94 static const char *
95 llvmpipe_get_name(struct pipe_screen *screen)
96 {
97 static char buf[100];
98 util_snprintf(buf, sizeof(buf), "llvmpipe (LLVM %u.%u, %u bits)",
99 HAVE_LLVM >> 8, HAVE_LLVM & 0xff,
100 lp_native_vector_width );
101 return buf;
102 }
103
104
105 static int
106 llvmpipe_get_param(struct pipe_screen *screen, enum pipe_cap param)
107 {
108 switch (param) {
109 case PIPE_CAP_MAX_COMBINED_SAMPLERS:
110 return 2 * PIPE_MAX_SAMPLERS; /* VS + FS samplers */
111 case PIPE_CAP_NPOT_TEXTURES:
112 case PIPE_CAP_MIXED_FRAMEBUFFER_SIZES:
113 return 1;
114 case PIPE_CAP_TWO_SIDED_STENCIL:
115 return 1;
116 case PIPE_CAP_SM3:
117 return 1;
118 case PIPE_CAP_MAX_DUAL_SOURCE_RENDER_TARGETS:
119 return 1;
120 case PIPE_CAP_MAX_STREAM_OUTPUT_BUFFERS:
121 return PIPE_MAX_SO_BUFFERS;
122 case PIPE_CAP_ANISOTROPIC_FILTER:
123 return 0;
124 case PIPE_CAP_POINT_SPRITE:
125 return 1;
126 case PIPE_CAP_MAX_RENDER_TARGETS:
127 return PIPE_MAX_COLOR_BUFS;
128 case PIPE_CAP_OCCLUSION_QUERY:
129 return 1;
130 case PIPE_CAP_QUERY_TIME_ELAPSED:
131 return 0;
132 case PIPE_CAP_QUERY_TIMESTAMP:
133 return 1;
134 case PIPE_CAP_QUERY_PIPELINE_STATISTICS:
135 return 0;
136 case PIPE_CAP_TEXTURE_MIRROR_CLAMP:
137 return 1;
138 case PIPE_CAP_TEXTURE_SHADOW_MAP:
139 return 1;
140 case PIPE_CAP_TEXTURE_SWIZZLE:
141 return 1;
142 case PIPE_CAP_TEXTURE_BORDER_COLOR_QUIRK:
143 return 0;
144 case PIPE_CAP_MAX_TEXTURE_2D_LEVELS:
145 return LP_MAX_TEXTURE_2D_LEVELS;
146 case PIPE_CAP_MAX_TEXTURE_3D_LEVELS:
147 return LP_MAX_TEXTURE_3D_LEVELS;
148 case PIPE_CAP_MAX_TEXTURE_CUBE_LEVELS:
149 return LP_MAX_TEXTURE_CUBE_LEVELS;
150 case PIPE_CAP_MAX_TEXTURE_ARRAY_LAYERS:
151 return LP_MAX_TEXTURE_ARRAY_LAYERS;
152 case PIPE_CAP_BLEND_EQUATION_SEPARATE:
153 return 1;
154 case PIPE_CAP_INDEP_BLEND_ENABLE:
155 return 1;
156 case PIPE_CAP_INDEP_BLEND_FUNC:
157 return 1;
158 case PIPE_CAP_TGSI_FS_COORD_ORIGIN_UPPER_LEFT:
159 case PIPE_CAP_TGSI_FS_COORD_PIXEL_CENTER_INTEGER:
160 case PIPE_CAP_TGSI_FS_COORD_PIXEL_CENTER_HALF_INTEGER:
161 return 1;
162 case PIPE_CAP_TGSI_FS_COORD_ORIGIN_LOWER_LEFT:
163 return 0;
164 case PIPE_CAP_PRIMITIVE_RESTART:
165 return 1;
166 case PIPE_CAP_DEPTH_CLIP_DISABLE:
167 return 1;
168 case PIPE_CAP_SHADER_STENCIL_EXPORT:
169 return 0;
170 case PIPE_CAP_TGSI_INSTANCEID:
171 case PIPE_CAP_VERTEX_ELEMENT_INSTANCE_DIVISOR:
172 return 1;
173 case PIPE_CAP_FRAGMENT_COLOR_CLAMPED:
174 return 0;
175 case PIPE_CAP_MIXED_COLORBUFFER_FORMATS:
176 return 1;
177 case PIPE_CAP_SEAMLESS_CUBE_MAP:
178 case PIPE_CAP_SEAMLESS_CUBE_MAP_PER_TEXTURE:
179 return 1;
180 case PIPE_CAP_SCALED_RESOLVE:
181 return 0;
182 /* this is a lie could support arbitrary large offsets */
183 case PIPE_CAP_MIN_TEXEL_OFFSET:
184 return -8;
185 case PIPE_CAP_MAX_TEXEL_OFFSET:
186 return 7;
187 case PIPE_CAP_CONDITIONAL_RENDER:
188 return 1;
189 case PIPE_CAP_TEXTURE_BARRIER:
190 return 0;
191 case PIPE_CAP_MAX_STREAM_OUTPUT_SEPARATE_COMPONENTS:
192 case PIPE_CAP_MAX_STREAM_OUTPUT_INTERLEAVED_COMPONENTS:
193 return 16*4;
194 case PIPE_CAP_STREAM_OUTPUT_PAUSE_RESUME:
195 return 1;
196 case PIPE_CAP_TGSI_CAN_COMPACT_CONSTANTS:
197 return 0;
198 case PIPE_CAP_VERTEX_COLOR_UNCLAMPED:
199 case PIPE_CAP_VERTEX_COLOR_CLAMPED:
200 return 1;
201 case PIPE_CAP_GLSL_FEATURE_LEVEL:
202 return 140;
203 case PIPE_CAP_QUADS_FOLLOW_PROVOKING_VERTEX_CONVENTION:
204 return 0;
205 case PIPE_CAP_COMPUTE:
206 return 0;
207 case PIPE_CAP_USER_VERTEX_BUFFERS:
208 case PIPE_CAP_USER_INDEX_BUFFERS:
209 return 1;
210 case PIPE_CAP_USER_CONSTANT_BUFFERS:
211 return 0;
212 case PIPE_CAP_VERTEX_BUFFER_OFFSET_4BYTE_ALIGNED_ONLY:
213 case PIPE_CAP_VERTEX_BUFFER_STRIDE_4BYTE_ALIGNED_ONLY:
214 case PIPE_CAP_VERTEX_ELEMENT_SRC_OFFSET_4BYTE_ALIGNED_ONLY:
215 case PIPE_CAP_TGSI_TEXCOORD:
216 return 0;
217
218 case PIPE_CAP_CONSTANT_BUFFER_OFFSET_ALIGNMENT:
219 return 16;
220 case PIPE_CAP_START_INSTANCE:
221 case PIPE_CAP_TEXTURE_MULTISAMPLE:
222 case PIPE_CAP_MIN_MAP_BUFFER_ALIGNMENT:
223 case PIPE_CAP_CUBE_MAP_ARRAY:
224 return 0;
225 case PIPE_CAP_TEXTURE_BUFFER_OBJECTS:
226 return 1;
227 case PIPE_CAP_MAX_TEXTURE_BUFFER_SIZE:
228 return 65536;
229 case PIPE_CAP_TEXTURE_BUFFER_OFFSET_ALIGNMENT:
230 return 1;
231 case PIPE_CAP_PREFER_BLIT_BASED_TEXTURE_TRANSFER:
232 return 0;
233 case PIPE_CAP_MAX_VIEWPORTS:
234 return PIPE_MAX_VIEWPORTS;
235 case PIPE_CAP_ENDIANNESS:
236 return PIPE_ENDIAN_NATIVE;
237 case PIPE_CAP_TGSI_VS_LAYER:
238 return 0;
239 }
240 /* should only get here on unhandled cases */
241 debug_printf("Unexpected PIPE_CAP %d query\n", param);
242 return 0;
243 }
244
245 static int
246 llvmpipe_get_shader_param(struct pipe_screen *screen, unsigned shader, enum pipe_shader_cap param)
247 {
248 switch(shader)
249 {
250 case PIPE_SHADER_FRAGMENT:
251 switch (param) {
252 default:
253 return gallivm_get_shader_param(param);
254 }
255 case PIPE_SHADER_VERTEX:
256 case PIPE_SHADER_GEOMETRY:
257 switch (param) {
258 case PIPE_SHADER_CAP_MAX_TEXTURE_SAMPLERS:
259 /* At this time, the draw module and llvmpipe driver only
260 * support vertex shader texture lookups when LLVM is enabled in
261 * the draw module.
262 */
263 if (debug_get_bool_option("DRAW_USE_LLVM", TRUE))
264 return PIPE_MAX_SAMPLERS;
265 else
266 return 0;
267 case PIPE_SHADER_CAP_MAX_SAMPLER_VIEWS:
268 if (debug_get_bool_option("DRAW_USE_LLVM", TRUE))
269 return PIPE_MAX_SHADER_SAMPLER_VIEWS;
270 else
271 return 0;
272 default:
273 return draw_get_shader_param(shader, param);
274 }
275 default:
276 return 0;
277 }
278 }
279
280 static float
281 llvmpipe_get_paramf(struct pipe_screen *screen, enum pipe_capf param)
282 {
283 switch (param) {
284 case PIPE_CAPF_MAX_LINE_WIDTH:
285 /* fall-through */
286 case PIPE_CAPF_MAX_LINE_WIDTH_AA:
287 return 255.0; /* arbitrary */
288 case PIPE_CAPF_MAX_POINT_WIDTH:
289 /* fall-through */
290 case PIPE_CAPF_MAX_POINT_WIDTH_AA:
291 return 255.0; /* arbitrary */
292 case PIPE_CAPF_MAX_TEXTURE_ANISOTROPY:
293 return 16.0; /* not actually signficant at this time */
294 case PIPE_CAPF_MAX_TEXTURE_LOD_BIAS:
295 return 16.0; /* arbitrary */
296 case PIPE_CAPF_GUARD_BAND_LEFT:
297 case PIPE_CAPF_GUARD_BAND_TOP:
298 case PIPE_CAPF_GUARD_BAND_RIGHT:
299 case PIPE_CAPF_GUARD_BAND_BOTTOM:
300 return 0.0;
301 }
302 /* should only get here on unhandled cases */
303 debug_printf("Unexpected PIPE_CAP %d query\n", param);
304 return 0.0;
305 }
306
307
308 /**
309 * Query format support for creating a texture, drawing surface, etc.
310 * \param format the format to test
311 * \param type one of PIPE_TEXTURE, PIPE_SURFACE
312 */
313 static boolean
314 llvmpipe_is_format_supported( struct pipe_screen *_screen,
315 enum pipe_format format,
316 enum pipe_texture_target target,
317 unsigned sample_count,
318 unsigned bind)
319 {
320 struct llvmpipe_screen *screen = llvmpipe_screen(_screen);
321 struct sw_winsys *winsys = screen->winsys;
322 const struct util_format_description *format_desc;
323
324 format_desc = util_format_description(format);
325 if (!format_desc)
326 return FALSE;
327
328 assert(target == PIPE_BUFFER ||
329 target == PIPE_TEXTURE_1D ||
330 target == PIPE_TEXTURE_1D_ARRAY ||
331 target == PIPE_TEXTURE_2D ||
332 target == PIPE_TEXTURE_2D_ARRAY ||
333 target == PIPE_TEXTURE_RECT ||
334 target == PIPE_TEXTURE_3D ||
335 target == PIPE_TEXTURE_CUBE);
336
337 if (sample_count > 1)
338 return FALSE;
339
340 if (bind & PIPE_BIND_RENDER_TARGET) {
341 if (format_desc->colorspace == UTIL_FORMAT_COLORSPACE_SRGB) {
342 if (format_desc->nr_channels < 3)
343 return FALSE;
344 }
345 else if (format_desc->colorspace != UTIL_FORMAT_COLORSPACE_RGB)
346 return FALSE;
347
348 if (format_desc->layout != UTIL_FORMAT_LAYOUT_PLAIN &&
349 format != PIPE_FORMAT_R11G11B10_FLOAT)
350 return FALSE;
351
352 assert(format_desc->block.width == 1);
353 assert(format_desc->block.height == 1);
354
355 if (format_desc->is_mixed)
356 return FALSE;
357
358 if (!format_desc->is_array && !format_desc->is_bitmask &&
359 format != PIPE_FORMAT_R11G11B10_FLOAT)
360 return FALSE;
361
362 /*
363 * XXX refuse formats known to crash in generate_unswizzled_blend().
364 * These include all 3-channel 24bit RGB8 variants, plus 48bit
365 * (except those using floats) 3-channel RGB16 variants (the latter
366 * seems to be more of a llvm bug though).
367 * The mesa state tracker only seems to use these for SINT/UINT formats.
368 */
369 if (format_desc->is_array && format_desc->nr_channels == 3) {
370 if (format_desc->block.bits == 24 || (format_desc->block.bits == 48 &&
371 !util_format_is_float(format))) {
372 return FALSE;
373 }
374 }
375 }
376
377 if (bind & PIPE_BIND_DISPLAY_TARGET) {
378 if(!winsys->is_displaytarget_format_supported(winsys, bind, format))
379 return FALSE;
380 }
381
382 if (bind & PIPE_BIND_DEPTH_STENCIL) {
383 if (format_desc->layout != UTIL_FORMAT_LAYOUT_PLAIN)
384 return FALSE;
385
386 if (format_desc->colorspace != UTIL_FORMAT_COLORSPACE_ZS)
387 return FALSE;
388
389 /* TODO: Support stencil-only formats */
390 if (format_desc->swizzle[0] == UTIL_FORMAT_SWIZZLE_NONE) {
391 return FALSE;
392 }
393 }
394
395 if (format_desc->layout == UTIL_FORMAT_LAYOUT_S3TC) {
396 return util_format_s3tc_enabled;
397 }
398
399 /*
400 * Everything can be supported by u_format
401 * (those without fetch_rgba_float might be not but shouldn't hit that)
402 */
403
404 return TRUE;
405 }
406
407
408
409
410 static void
411 llvmpipe_flush_frontbuffer(struct pipe_screen *_screen,
412 struct pipe_resource *resource,
413 unsigned level, unsigned layer,
414 void *context_private)
415 {
416 struct llvmpipe_screen *screen = llvmpipe_screen(_screen);
417 struct sw_winsys *winsys = screen->winsys;
418 struct llvmpipe_resource *texture = llvmpipe_resource(resource);
419
420 assert(texture->dt);
421 if (texture->dt)
422 winsys->displaytarget_display(winsys, texture->dt, context_private);
423 }
424
425
426 static void
427 llvmpipe_destroy_screen( struct pipe_screen *_screen )
428 {
429 struct llvmpipe_screen *screen = llvmpipe_screen(_screen);
430 struct sw_winsys *winsys = screen->winsys;
431
432 if (screen->rast)
433 lp_rast_destroy(screen->rast);
434
435 lp_jit_screen_cleanup(screen);
436
437 if(winsys->destroy)
438 winsys->destroy(winsys);
439
440 pipe_mutex_destroy(screen->rast_mutex);
441
442 FREE(screen);
443 }
444
445
446
447
/**
 * Fence reference counting.
 *
 * Thin adapter that casts the generic fence handles to llvmpipe fences and
 * hands them to lp_fence_reference().  The screen argument is not used.
 */
static void
llvmpipe_fence_reference(struct pipe_screen *screen,
                         struct pipe_fence_handle **ptr,
                         struct pipe_fence_handle *fence)
{
   lp_fence_reference((struct lp_fence **) ptr,
                      (struct lp_fence *) fence);
}
461
462
463 /**
464 * Has the fence been executed/finished?
465 */
466 static boolean
467 llvmpipe_fence_signalled(struct pipe_screen *screen,
468 struct pipe_fence_handle *fence)
469 {
470 struct lp_fence *f = (struct lp_fence *) fence;
471 return lp_fence_signalled(f);
472 }
473
474
475 /**
476 * Wait for the fence to finish.
477 */
478 static boolean
479 llvmpipe_fence_finish(struct pipe_screen *screen,
480 struct pipe_fence_handle *fence_handle,
481 uint64_t timeout)
482 {
483 struct lp_fence *f = (struct lp_fence *) fence_handle;
484
485 lp_fence_wait(f);
486 return TRUE;
487 }
488
/**
 * Return the current time as reported by os_time_get_nano().
 * The screen argument is not used.
 */
static uint64_t
llvmpipe_get_timestamp(struct pipe_screen *_screen)
{
   const uint64_t now = os_time_get_nano();

   return now;
}
494
495 /**
496 * Create a new pipe_screen object
497 * Note: we're not presently subclassing pipe_screen (no llvmpipe_screen).
498 */
499 struct pipe_screen *
500 llvmpipe_create_screen(struct sw_winsys *winsys)
501 {
502 struct llvmpipe_screen *screen;
503
504 util_cpu_detect();
505
506 #if defined(PIPE_ARCH_X86) && HAVE_LLVM < 0x0302
507 /* require SSE2 due to LLVM PR6960. */
508 if (!util_cpu_caps.has_sse2)
509 return NULL;
510 #endif
511
512 #ifdef DEBUG
513 LP_DEBUG = debug_get_flags_option("LP_DEBUG", lp_debug_flags, 0 );
514 #endif
515
516 LP_PERF = debug_get_flags_option("LP_PERF", lp_perf_flags, 0 );
517
518 screen = CALLOC_STRUCT(llvmpipe_screen);
519 if (!screen)
520 return NULL;
521
522 screen->winsys = winsys;
523
524 screen->base.destroy = llvmpipe_destroy_screen;
525
526 screen->base.get_name = llvmpipe_get_name;
527 screen->base.get_vendor = llvmpipe_get_vendor;
528 screen->base.get_param = llvmpipe_get_param;
529 screen->base.get_shader_param = llvmpipe_get_shader_param;
530 screen->base.get_paramf = llvmpipe_get_paramf;
531 screen->base.is_format_supported = llvmpipe_is_format_supported;
532
533 screen->base.context_create = llvmpipe_create_context;
534 screen->base.flush_frontbuffer = llvmpipe_flush_frontbuffer;
535 screen->base.fence_reference = llvmpipe_fence_reference;
536 screen->base.fence_signalled = llvmpipe_fence_signalled;
537 screen->base.fence_finish = llvmpipe_fence_finish;
538
539 screen->base.get_timestamp = llvmpipe_get_timestamp;
540
541 llvmpipe_init_screen_resource_funcs(&screen->base);
542
543 lp_jit_screen_init(screen);
544
545 screen->num_threads = util_cpu_caps.nr_cpus > 1 ? util_cpu_caps.nr_cpus : 0;
546 #ifdef PIPE_SUBSYSTEM_EMBEDDED
547 screen->num_threads = 0;
548 #endif
549 screen->num_threads = debug_get_num_option("LP_NUM_THREADS", screen->num_threads);
550 screen->num_threads = MIN2(screen->num_threads, LP_MAX_THREADS);
551
552 screen->rast = lp_rast_create(screen->num_threads);
553 if (!screen->rast) {
554 lp_jit_screen_cleanup(screen);
555 FREE(screen);
556 return NULL;
557 }
558 pipe_mutex_init(screen->rast_mutex);
559
560 util_format_s3tc_init();
561
562 return &screen->base;
563 }