gallium: separate out floating-point CAPs into its own enum
[mesa.git] / src / gallium / drivers / svga / svga_screen.c
1 /**********************************************************
2 * Copyright 2008-2009 VMware, Inc. All rights reserved.
3 *
4 * Permission is hereby granted, free of charge, to any person
5 * obtaining a copy of this software and associated documentation
6 * files (the "Software"), to deal in the Software without
7 * restriction, including without limitation the rights to use, copy,
8 * modify, merge, publish, distribute, sublicense, and/or sell copies
9 * of the Software, and to permit persons to whom the Software is
10 * furnished to do so, subject to the following conditions:
11 *
12 * The above copyright notice and this permission notice shall be
13 * included in all copies or substantial portions of the Software.
14 *
15 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
16 * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
17 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
18 * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
19 * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
20 * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
21 * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
22 * SOFTWARE.
23 *
24 **********************************************************/
25
26 #include "util/u_memory.h"
27 #include "util/u_inlines.h"
28 #include "util/u_string.h"
29 #include "util/u_math.h"
30
31 #include "svga_winsys.h"
32 #include "svga_public.h"
33 #include "svga_context.h"
34 #include "svga_format.h"
35 #include "svga_screen.h"
36 #include "svga_resource_texture.h"
37 #include "svga_resource.h"
38 #include "svga_debug.h"
39
40 #include "svga3d_shaderdefs.h"
41
42
#ifdef DEBUG
/* Bitmask of enabled debug categories (DEBUG builds only). */
int SVGA_DEBUG = 0;

/* Option names recognised for SVGA_DEBUG, paired with their flag bits. */
static const struct debug_named_value svga_debug_flags[] = {
   { "dma",      DEBUG_DMA,      NULL },
   { "tgsi",     DEBUG_TGSI,     NULL },
   { "pipe",     DEBUG_PIPE,     NULL },
   { "state",    DEBUG_STATE,    NULL },
   { "screen",   DEBUG_SCREEN,   NULL },
   { "tex",      DEBUG_TEX,      NULL },
   { "swtnl",    DEBUG_SWTNL,    NULL },
   { "const",    DEBUG_CONSTS,   NULL },
   { "viewport", DEBUG_VIEWPORT, NULL },
   { "views",    DEBUG_VIEWS,    NULL },
   { "perf",     DEBUG_PERF,     NULL },
   { "flush",    DEBUG_FLUSH,    NULL },
   { "sync",     DEBUG_SYNC,     NULL },
   { "cache",    DEBUG_CACHE,    NULL },
   DEBUG_NAMED_VALUE_END
};
#endif
64
/**
 * Report the driver vendor string.
 *
 * \param pscreen  unused
 * \return pointer to a constant, statically allocated string
 */
static const char *
svga_get_vendor( struct pipe_screen *pscreen )
{
   static const char vendor[] = "VMware, Inc.";

   (void) pscreen;
   return vendor;
}
70
71
/**
 * Build the human-readable device name.
 *
 * The string is formatted into a function-local static buffer, so the
 * returned pointer stays valid after the call but is overwritten by the
 * next one.  Mutex and LLVM details are only included in DEBUG builds.
 *
 * \param pscreen  unused
 */
static const char *
svga_get_name( struct pipe_screen *pscreen )
{
   static char name[100];
   const char *build;
   const char *mutex = "";
   const char *llvm = "";

#ifdef DEBUG
   /* Internal details are exposed in the DEBUG version only. */
   build = "build: DEBUG;";
   mutex = "mutex: " PIPE_ATOMIC ";";
#ifdef HAVE_LLVM
   llvm = "LLVM;";
#endif
#else
   build = "build: RELEASE;";
#endif

   util_snprintf(name, sizeof(name), "SVGA3D; %s %s %s", build, mutex, llvm);
   return name;
}
92
93
94
95
96 static float
97 svga_get_paramf(struct pipe_screen *screen, enum pipe_capf param)
98 {
99 struct svga_screen *svgascreen = svga_screen(screen);
100 struct svga_winsys_screen *sws = svgascreen->sws;
101 SVGA3dDevCapResult result;
102
103 switch (param) {
104 case PIPE_CAPF_MAX_LINE_WIDTH:
105 /* fall-through */
106 case PIPE_CAPF_MAX_LINE_WIDTH_AA:
107 return 7.0;
108
109 case PIPE_CAPF_MAX_POINT_WIDTH:
110 /* fall-through */
111 case PIPE_CAPF_MAX_POINT_WIDTH_AA:
112 /* Keep this to a reasonable size to avoid failures in
113 * conform/pntaa.c:
114 */
115 return SVGA_MAX_POINTSIZE;
116
117 case PIPE_CAPF_MAX_TEXTURE_ANISOTROPY:
118 if(!sws->get_cap(sws, SVGA3D_DEVCAP_MAX_TEXTURE_ANISOTROPY, &result))
119 return 4.0;
120 return result.u;
121
122 case PIPE_CAPF_MAX_TEXTURE_LOD_BIAS:
123 return 16.0;
124
125 default:
126 return 0;
127 }
128 }
129
130
131 static int
132 svga_get_param(struct pipe_screen *screen, enum pipe_cap param)
133 {
134 struct svga_screen *svgascreen = svga_screen(screen);
135 struct svga_winsys_screen *sws = svgascreen->sws;
136 SVGA3dDevCapResult result;
137
138 switch (param) {
139 case PIPE_CAP_MAX_COMBINED_SAMPLERS:
140 return 16;
141 case PIPE_CAP_NPOT_TEXTURES:
142 return 1;
143 case PIPE_CAP_TWO_SIDED_STENCIL:
144 return 1;
145 case PIPE_CAP_ANISOTROPIC_FILTER:
146 return 1;
147 case PIPE_CAP_POINT_SPRITE:
148 return 1;
149 case PIPE_CAP_MAX_RENDER_TARGETS:
150 if(!sws->get_cap(sws, SVGA3D_DEVCAP_MAX_RENDER_TARGETS, &result))
151 return 1;
152 if(!result.u)
153 return 1;
154 return MIN2(result.u, PIPE_MAX_COLOR_BUFS);
155 case PIPE_CAP_OCCLUSION_QUERY:
156 return 1;
157 case PIPE_CAP_TIMER_QUERY:
158 return 0;
159 case PIPE_CAP_TEXTURE_SHADOW_MAP:
160 return 1;
161 case PIPE_CAP_TEXTURE_SWIZZLE:
162 return 1;
163
164 case PIPE_CAP_MAX_TEXTURE_2D_LEVELS:
165 {
166 unsigned levels = SVGA_MAX_TEXTURE_LEVELS;
167 if (sws->get_cap(sws, SVGA3D_DEVCAP_MAX_TEXTURE_WIDTH, &result))
168 levels = MIN2(util_logbase2(result.u) + 1, levels);
169 else
170 levels = 12 /* 2048x2048 */;
171 if (sws->get_cap(sws, SVGA3D_DEVCAP_MAX_TEXTURE_HEIGHT, &result))
172 levels = MIN2(util_logbase2(result.u) + 1, levels);
173 else
174 levels = 12 /* 2048x2048 */;
175 return levels;
176 }
177
178 case PIPE_CAP_MAX_TEXTURE_3D_LEVELS:
179 if (!sws->get_cap(sws, SVGA3D_DEVCAP_MAX_VOLUME_EXTENT, &result))
180 return 8; /* max 128x128x128 */
181 return MIN2(util_logbase2(result.u) + 1, SVGA_MAX_TEXTURE_LEVELS);
182
183 case PIPE_CAP_MAX_TEXTURE_CUBE_LEVELS:
184 /*
185 * No mechanism to query the host, and at least limited to 2048x2048 on
186 * certain hardware.
187 */
188 return MIN2(screen->get_paramf(screen, PIPE_CAP_MAX_TEXTURE_2D_LEVELS),
189 12.0 /* 2048x2048 */);
190
191 case PIPE_CAP_BLEND_EQUATION_SEPARATE: /* req. for GL 1.5 */
192 return 1;
193
194 case PIPE_CAP_TGSI_FS_COORD_ORIGIN_UPPER_LEFT:
195 case PIPE_CAP_TGSI_FS_COORD_PIXEL_CENTER_HALF_INTEGER:
196 return 1;
197 case PIPE_CAP_TGSI_FS_COORD_ORIGIN_LOWER_LEFT:
198 case PIPE_CAP_TGSI_FS_COORD_PIXEL_CENTER_INTEGER:
199 return 0;
200
201 case PIPE_CAP_DEPTHSTENCIL_CLEAR_SEPARATE:
202 return 1;
203 case PIPE_CAP_MIXED_COLORBUFFER_FORMATS:
204 return 0;
205
206 default:
207 return 0;
208 }
209 }
210
211 static int svga_get_shader_param(struct pipe_screen *screen, unsigned shader, enum pipe_shader_cap param)
212 {
213 struct svga_screen *svgascreen = svga_screen(screen);
214 struct svga_winsys_screen *sws = svgascreen->sws;
215 SVGA3dDevCapResult result;
216
217 switch (shader)
218 {
219 case PIPE_SHADER_FRAGMENT:
220 switch (param)
221 {
222 case PIPE_SHADER_CAP_MAX_INSTRUCTIONS:
223 case PIPE_SHADER_CAP_MAX_ALU_INSTRUCTIONS:
224 case PIPE_SHADER_CAP_MAX_TEX_INSTRUCTIONS:
225 case PIPE_SHADER_CAP_MAX_TEX_INDIRECTIONS:
226 return 512;
227 case PIPE_SHADER_CAP_MAX_CONTROL_FLOW_DEPTH:
228 return SVGA3D_MAX_NESTING_LEVEL;
229 case PIPE_SHADER_CAP_MAX_INPUTS:
230 return 10;
231 case PIPE_SHADER_CAP_MAX_CONSTS:
232 return 224;
233 case PIPE_SHADER_CAP_MAX_CONST_BUFFERS:
234 return 1;
235 case PIPE_SHADER_CAP_MAX_TEMPS:
236 if (!sws->get_cap(sws, SVGA3D_DEVCAP_MAX_FRAGMENT_SHADER_TEMPS, &result))
237 return 32;
238 return result.u;
239 case PIPE_SHADER_CAP_MAX_ADDRS:
240 case PIPE_SHADER_CAP_INDIRECT_INPUT_ADDR:
241 /*
242 * Although PS 3.0 has some addressing abilities it can only represent
243 * loops that can be statically determined and unrolled. Given we can
244 * only handle a subset of the cases that the state tracker already
245 * does it is better to defer loop unrolling to the state tracker.
246 */
247 return 0;
248 case PIPE_SHADER_CAP_MAX_PREDS:
249 return 1;
250 case PIPE_SHADER_CAP_TGSI_CONT_SUPPORTED:
251 return 1;
252 case PIPE_SHADER_CAP_INDIRECT_OUTPUT_ADDR:
253 case PIPE_SHADER_CAP_INDIRECT_TEMP_ADDR:
254 case PIPE_SHADER_CAP_INDIRECT_CONST_ADDR:
255 return 0;
256 case PIPE_SHADER_CAP_SUBROUTINES:
257 return 0;
258 case PIPE_SHADER_CAP_INTEGERS:
259 return 0;
260 case PIPE_SHADER_CAP_MAX_TEXTURE_SAMPLERS:
261 return 16;
262 }
263 break;
264 case PIPE_SHADER_VERTEX:
265 switch (param)
266 {
267 case PIPE_SHADER_CAP_MAX_INSTRUCTIONS:
268 case PIPE_SHADER_CAP_MAX_ALU_INSTRUCTIONS:
269 if (!sws->get_cap(sws, SVGA3D_DEVCAP_MAX_VERTEX_SHADER_INSTRUCTIONS, &result))
270 return 512;
271 return result.u;
272 case PIPE_SHADER_CAP_MAX_TEX_INSTRUCTIONS:
273 case PIPE_SHADER_CAP_MAX_TEX_INDIRECTIONS:
274 /* XXX: until we have vertex texture support */
275 return 0;
276 case PIPE_SHADER_CAP_MAX_CONTROL_FLOW_DEPTH:
277 return SVGA3D_MAX_NESTING_LEVEL;
278 case PIPE_SHADER_CAP_MAX_INPUTS:
279 return 16;
280 case PIPE_SHADER_CAP_MAX_CONSTS:
281 return 256;
282 case PIPE_SHADER_CAP_MAX_CONST_BUFFERS:
283 return 1;
284 case PIPE_SHADER_CAP_MAX_TEMPS:
285 if (!sws->get_cap(sws, SVGA3D_DEVCAP_MAX_VERTEX_SHADER_TEMPS, &result))
286 return 32;
287 return result.u;
288 case PIPE_SHADER_CAP_MAX_ADDRS:
289 return 1;
290 case PIPE_SHADER_CAP_MAX_PREDS:
291 return 1;
292 case PIPE_SHADER_CAP_TGSI_CONT_SUPPORTED:
293 return 1;
294 case PIPE_SHADER_CAP_INDIRECT_INPUT_ADDR:
295 case PIPE_SHADER_CAP_INDIRECT_OUTPUT_ADDR:
296 return 1;
297 case PIPE_SHADER_CAP_INDIRECT_TEMP_ADDR:
298 return 0;
299 case PIPE_SHADER_CAP_INDIRECT_CONST_ADDR:
300 return 1;
301 case PIPE_SHADER_CAP_SUBROUTINES:
302 return 0;
303 case PIPE_SHADER_CAP_INTEGERS:
304 return 0;
305 default:
306 break;
307 }
308 break;
309 default:
310 break;
311 }
312 return 0;
313 }
314
315
316 static boolean
317 svga_is_format_supported( struct pipe_screen *screen,
318 enum pipe_format format,
319 enum pipe_texture_target target,
320 unsigned sample_count,
321 unsigned tex_usage)
322 {
323 struct svga_screen *ss = svga_screen(screen);
324 SVGA3dSurfaceFormat svga_format;
325 SVGA3dSurfaceFormatCaps caps;
326 SVGA3dSurfaceFormatCaps mask;
327
328 assert(tex_usage);
329
330 if (sample_count > 1) {
331 return FALSE;
332 }
333
334 svga_format = svga_translate_format(ss, format, tex_usage);
335 if (svga_format == SVGA3D_FORMAT_INVALID) {
336 return FALSE;
337 }
338
339 /*
340 * Override host capabilities, so that we end up with the same
341 * visuals for all virtual hardware implementations.
342 */
343
344 if (tex_usage & PIPE_BIND_DISPLAY_TARGET) {
345 switch (svga_format) {
346 case SVGA3D_A8R8G8B8:
347 case SVGA3D_X8R8G8B8:
348 case SVGA3D_R5G6B5:
349 break;
350
351 /* Often unsupported/problematic. This means we end up with the same
352 * visuals for all virtual hardware implementations.
353 */
354 case PIPE_FORMAT_B4G4R4A4_UNORM:
355 case PIPE_FORMAT_B5G5R5A1_UNORM:
356 return FALSE;
357
358 default:
359 return FALSE;
360 }
361 }
362
363 /*
364 * Query the host capabilities.
365 */
366
367 svga_get_format_cap(ss, svga_format, &caps);
368
369 mask.value = 0;
370 if (tex_usage & PIPE_BIND_RENDER_TARGET) {
371 mask.offscreenRenderTarget = 1;
372 }
373 if (tex_usage & PIPE_BIND_DEPTH_STENCIL) {
374 mask.zStencil = 1;
375 }
376 if (tex_usage & PIPE_BIND_SAMPLER_VIEW) {
377 mask.texture = 1;
378 }
379
380 return (caps.value & mask.value) == mask.value;
381 }
382
383
384 static void
385 svga_fence_reference(struct pipe_screen *screen,
386 struct pipe_fence_handle **ptr,
387 struct pipe_fence_handle *fence)
388 {
389 struct svga_winsys_screen *sws = svga_screen(screen)->sws;
390 sws->fence_reference(sws, ptr, fence);
391 }
392
393
394 static boolean
395 svga_fence_signalled(struct pipe_screen *screen,
396 struct pipe_fence_handle *fence)
397 {
398 struct svga_winsys_screen *sws = svga_screen(screen)->sws;
399 return sws->fence_signalled(sws, fence, 0) == 0;
400 }
401
402
403 static boolean
404 svga_fence_finish(struct pipe_screen *screen,
405 struct pipe_fence_handle *fence,
406 uint64_t timeout)
407 {
408 struct svga_winsys_screen *sws = svga_screen(screen)->sws;
409
410 SVGA_DBG(DEBUG_DMA|DEBUG_PERF, "%s fence_ptr %p\n",
411 __FUNCTION__, fence);
412
413 return sws->fence_finish(sws, fence, 0) == 0;
414 }
415
416
417 static void
418 svga_destroy_screen( struct pipe_screen *screen )
419 {
420 struct svga_screen *svgascreen = svga_screen(screen);
421
422 svga_screen_cache_cleanup(svgascreen);
423
424 pipe_mutex_destroy(svgascreen->swc_mutex);
425 pipe_mutex_destroy(svgascreen->tex_mutex);
426
427 svgascreen->sws->destroy(svgascreen->sws);
428
429 FREE(svgascreen);
430 }
431
432
433 /**
434 * Create a new svga_screen object
435 */
436 struct pipe_screen *
437 svga_screen_create(struct svga_winsys_screen *sws)
438 {
439 struct svga_screen *svgascreen;
440 struct pipe_screen *screen;
441 SVGA3dDevCapResult result;
442 boolean use_vs30, use_ps30;
443
444 #ifdef DEBUG
445 SVGA_DEBUG = debug_get_flags_option("SVGA_DEBUG", svga_debug_flags, 0 );
446 #endif
447
448 svgascreen = CALLOC_STRUCT(svga_screen);
449 if (!svgascreen)
450 goto error1;
451
452 svgascreen->debug.force_level_surface_view =
453 debug_get_bool_option("SVGA_FORCE_LEVEL_SURFACE_VIEW", FALSE);
454 svgascreen->debug.force_surface_view =
455 debug_get_bool_option("SVGA_FORCE_SURFACE_VIEW", FALSE);
456 svgascreen->debug.force_sampler_view =
457 debug_get_bool_option("SVGA_FORCE_SAMPLER_VIEW", FALSE);
458 svgascreen->debug.no_surface_view =
459 debug_get_bool_option("SVGA_NO_SURFACE_VIEW", FALSE);
460 svgascreen->debug.no_sampler_view =
461 debug_get_bool_option("SVGA_NO_SAMPLER_VIEW", FALSE);
462
463 screen = &svgascreen->screen;
464
465 screen->destroy = svga_destroy_screen;
466 screen->get_name = svga_get_name;
467 screen->get_vendor = svga_get_vendor;
468 screen->get_param = svga_get_param;
469 screen->get_shader_param = svga_get_shader_param;
470 screen->get_paramf = svga_get_paramf;
471 screen->is_format_supported = svga_is_format_supported;
472 screen->context_create = svga_context_create;
473 screen->fence_reference = svga_fence_reference;
474 screen->fence_signalled = svga_fence_signalled;
475 screen->fence_finish = svga_fence_finish;
476 svgascreen->sws = sws;
477
478 svga_init_screen_resource_functions(svgascreen);
479
480 if (sws->get_hw_version) {
481 svgascreen->hw_version = sws->get_hw_version(sws);
482 } else {
483 svgascreen->hw_version = SVGA3D_HWVERSION_WS65_B1;
484 }
485
486 use_ps30 =
487 sws->get_cap(sws, SVGA3D_DEVCAP_FRAGMENT_SHADER_VERSION, &result) &&
488 result.u >= SVGA3DPSVERSION_30 ? TRUE : FALSE;
489
490 use_vs30 =
491 sws->get_cap(sws, SVGA3D_DEVCAP_VERTEX_SHADER_VERSION, &result) &&
492 result.u >= SVGA3DVSVERSION_30 ? TRUE : FALSE;
493
494 /* we require Shader model 3.0 or later */
495 if (!use_ps30 || !use_vs30)
496 goto error2;
497
498 /*
499 * The D16, D24X8, and D24S8 formats always do an implicit shadow compare
500 * when sampled from, where as the DF16, DF24, and D24S8_INT do not. So
501 * we prefer the later when available.
502 *
503 * This mimics hardware vendors extensions for D3D depth sampling. See also
504 * http://aras-p.info/texts/D3D9GPUHacks.html
505 */
506
507 {
508 boolean has_df16, has_df24, has_d24s8_int;
509 SVGA3dSurfaceFormatCaps caps;
510 SVGA3dSurfaceFormatCaps mask;
511 mask.value = 0;
512 mask.zStencil = 1;
513 mask.texture = 1;
514
515 svgascreen->depth.z16 = SVGA3D_Z_D16;
516 svgascreen->depth.x8z24 = SVGA3D_Z_D24X8;
517 svgascreen->depth.s8z24 = SVGA3D_Z_D24S8;
518
519 svga_get_format_cap(svgascreen, SVGA3D_Z_DF16, &caps);
520 has_df16 = (caps.value & mask.value) == mask.value;
521
522 svga_get_format_cap(svgascreen, SVGA3D_Z_DF24, &caps);
523 has_df24 = (caps.value & mask.value) == mask.value;
524
525 svga_get_format_cap(svgascreen, SVGA3D_Z_D24S8_INT, &caps);
526 has_d24s8_int = (caps.value & mask.value) == mask.value;
527
528 /* XXX: We might want some other logic here.
529 * Like if we only have d24s8_int we should
530 * emulate the other formats with that.
531 */
532 if (has_df16) {
533 svgascreen->depth.z16 = SVGA3D_Z_DF16;
534 }
535 if (has_df24) {
536 svgascreen->depth.x8z24 = SVGA3D_Z_DF24;
537 }
538 if (has_d24s8_int) {
539 svgascreen->depth.s8z24 = SVGA3D_Z_D24S8_INT;
540 }
541 }
542
543 pipe_mutex_init(svgascreen->tex_mutex);
544 pipe_mutex_init(svgascreen->swc_mutex);
545
546 svga_screen_cache_init(svgascreen);
547
548 return screen;
549 error2:
550 FREE(svgascreen);
551 error1:
552 return NULL;
553 }
554
555 struct svga_winsys_screen *
556 svga_winsys_screen(struct pipe_screen *screen)
557 {
558 return svga_screen(screen)->sws;
559 }
560
#ifdef DEBUG
/**
 * Checked cast from pipe_screen to svga_screen (DEBUG builds only).
 *
 * Asserts that the pointer is non-NULL and that its destroy hook is
 * svga_destroy_screen before casting.
 */
struct svga_screen *
svga_screen(struct pipe_screen *screen)
{
   struct svga_screen *svgascreen;

   assert(screen);
   assert(screen->destroy == svga_destroy_screen);

   svgascreen = (struct svga_screen *)screen;
   return svgascreen;
}
#endif