gallium: add FMA and DFMA opcodes (v3)
[mesa.git] / src / gallium / drivers / svga / svga_screen.c
1 /**********************************************************
2 * Copyright 2008-2009 VMware, Inc. All rights reserved.
3 *
4 * Permission is hereby granted, free of charge, to any person
5 * obtaining a copy of this software and associated documentation
6 * files (the "Software"), to deal in the Software without
7 * restriction, including without limitation the rights to use, copy,
8 * modify, merge, publish, distribute, sublicense, and/or sell copies
9 * of the Software, and to permit persons to whom the Software is
10 * furnished to do so, subject to the following conditions:
11 *
12 * The above copyright notice and this permission notice shall be
13 * included in all copies or substantial portions of the Software.
14 *
15 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
16 * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
17 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
18 * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
19 * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
20 * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
21 * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
22 * SOFTWARE.
23 *
24 **********************************************************/
25
26 #include "util/u_format.h"
27 #include "util/u_memory.h"
28 #include "util/u_inlines.h"
29 #include "util/u_string.h"
30 #include "util/u_math.h"
31
32 #include "svga_winsys.h"
33 #include "svga_public.h"
34 #include "svga_context.h"
35 #include "svga_format.h"
36 #include "svga_screen.h"
37 #include "svga_resource_texture.h"
38 #include "svga_resource.h"
39 #include "svga_debug.h"
40
41 #include "svga3d_shaderdefs.h"
42
43
#ifdef DEBUG
/* Bitmask of enabled DEBUG_x categories.  It is assigned in
 * svga_screen_create() from the "SVGA_DEBUG" option.
 */
int SVGA_DEBUG = 0;

/* Option-name -> DEBUG_x flag table passed to debug_get_flags_option(). */
static const struct debug_named_value svga_debug_flags[] = {
   { "dma",      DEBUG_DMA,      NULL },
   { "tgsi",     DEBUG_TGSI,     NULL },
   { "pipe",     DEBUG_PIPE,     NULL },
   { "state",    DEBUG_STATE,    NULL },
   { "screen",   DEBUG_SCREEN,   NULL },
   { "tex",      DEBUG_TEX,      NULL },
   { "swtnl",    DEBUG_SWTNL,    NULL },
   { "const",    DEBUG_CONSTS,   NULL },
   { "viewport", DEBUG_VIEWPORT, NULL },
   { "views",    DEBUG_VIEWS,    NULL },
   { "perf",     DEBUG_PERF,     NULL },
   { "flush",    DEBUG_FLUSH,    NULL },
   { "sync",     DEBUG_SYNC,     NULL },
   { "cache",    DEBUG_CACHE,    NULL },
   DEBUG_NAMED_VALUE_END
};
#endif
65
/**
 * Implement pipe_screen::get_vendor().
 *
 * \param pscreen  unused
 * \return a constant vendor string
 */
static const char *
svga_get_vendor( struct pipe_screen *pscreen )
{
   static const char vendor[] = "VMware, Inc.";

   (void) pscreen;
   return vendor;
}
71
72
/**
 * Implement pipe_screen::get_name().
 *
 * The result is "SVGA3D; " followed by three space-separated fields: a
 * build tag, a mutex tag and an LLVM tag.  The mutex and LLVM fields are
 * only filled in for DEBUG builds (LLVM additionally requires HAVE_LLVM);
 * otherwise they are empty strings.
 *
 * \param pscreen  unused
 * \return pointer to a static buffer that is rewritten on every call
 */
static const char *
svga_get_name( struct pipe_screen *pscreen )
{
   static char name[100];
#ifdef DEBUG
   /* Only return internal details in the DEBUG version: */
   const char *build = "build: DEBUG;";
   const char *mutex = "mutex: " PIPE_ATOMIC ";";
#ifdef HAVE_LLVM
   const char *llvm = "LLVM;";
#else
   const char *llvm = "";
#endif
#else
   const char *build = "build: RELEASE;";
   const char *mutex = "";
   const char *llvm = "";
#endif

   util_snprintf(name, sizeof(name), "SVGA3D; %s %s %s", build, mutex, llvm);
   return name;
}
93
94
95
96
97 static float
98 svga_get_paramf(struct pipe_screen *screen, enum pipe_capf param)
99 {
100 struct svga_screen *svgascreen = svga_screen(screen);
101 struct svga_winsys_screen *sws = svgascreen->sws;
102 SVGA3dDevCapResult result;
103
104 switch (param) {
105 case PIPE_CAPF_MAX_LINE_WIDTH:
106 return svgascreen->maxLineWidth;
107 case PIPE_CAPF_MAX_LINE_WIDTH_AA:
108 return svgascreen->maxLineWidthAA;
109
110 case PIPE_CAPF_MAX_POINT_WIDTH:
111 /* fall-through */
112 case PIPE_CAPF_MAX_POINT_WIDTH_AA:
113 return svgascreen->maxPointSize;
114
115 case PIPE_CAPF_MAX_TEXTURE_ANISOTROPY:
116 if(!sws->get_cap(sws, SVGA3D_DEVCAP_MAX_TEXTURE_ANISOTROPY, &result))
117 return 4.0f;
118 return (float) result.u;
119
120 case PIPE_CAPF_MAX_TEXTURE_LOD_BIAS:
121 return 15.0;
122 case PIPE_CAPF_GUARD_BAND_LEFT:
123 case PIPE_CAPF_GUARD_BAND_TOP:
124 case PIPE_CAPF_GUARD_BAND_RIGHT:
125 case PIPE_CAPF_GUARD_BAND_BOTTOM:
126 return 0.0;
127 }
128
129 debug_printf("Unexpected PIPE_CAPF_ query %u\n", param);
130 return 0;
131 }
132
133
134 static int
135 svga_get_param(struct pipe_screen *screen, enum pipe_cap param)
136 {
137 struct svga_screen *svgascreen = svga_screen(screen);
138 struct svga_winsys_screen *sws = svgascreen->sws;
139 SVGA3dDevCapResult result;
140
141 switch (param) {
142 case PIPE_CAP_NPOT_TEXTURES:
143 case PIPE_CAP_MIXED_FRAMEBUFFER_SIZES:
144 return 1;
145 case PIPE_CAP_TWO_SIDED_STENCIL:
146 return 1;
147 case PIPE_CAP_MAX_DUAL_SOURCE_RENDER_TARGETS:
148 return 0;
149 case PIPE_CAP_ANISOTROPIC_FILTER:
150 return 1;
151 case PIPE_CAP_POINT_SPRITE:
152 return 1;
153 case PIPE_CAP_TGSI_TEXCOORD:
154 return 0;
155 case PIPE_CAP_MAX_RENDER_TARGETS:
156 return svgascreen->max_color_buffers;
157 case PIPE_CAP_OCCLUSION_QUERY:
158 return 1;
159 case PIPE_CAP_QUERY_TIME_ELAPSED:
160 return 0;
161 case PIPE_CAP_TEXTURE_SHADOW_MAP:
162 return 1;
163 case PIPE_CAP_TEXTURE_SWIZZLE:
164 return 1;
165 case PIPE_CAP_TEXTURE_BORDER_COLOR_QUIRK:
166 return 0;
167 case PIPE_CAP_USER_VERTEX_BUFFERS:
168 case PIPE_CAP_USER_INDEX_BUFFERS:
169 return 0;
170 case PIPE_CAP_USER_CONSTANT_BUFFERS:
171 return 1;
172 case PIPE_CAP_CONSTANT_BUFFER_OFFSET_ALIGNMENT:
173 return 16;
174
175 case PIPE_CAP_MAX_TEXTURE_2D_LEVELS:
176 {
177 unsigned levels = SVGA_MAX_TEXTURE_LEVELS;
178 if (sws->get_cap(sws, SVGA3D_DEVCAP_MAX_TEXTURE_WIDTH, &result))
179 levels = MIN2(util_logbase2(result.u) + 1, levels);
180 else
181 levels = 12 /* 2048x2048 */;
182 if (sws->get_cap(sws, SVGA3D_DEVCAP_MAX_TEXTURE_HEIGHT, &result))
183 levels = MIN2(util_logbase2(result.u) + 1, levels);
184 else
185 levels = 12 /* 2048x2048 */;
186 return levels;
187 }
188
189 case PIPE_CAP_MAX_TEXTURE_3D_LEVELS:
190 if (!sws->get_cap(sws, SVGA3D_DEVCAP_MAX_VOLUME_EXTENT, &result))
191 return 8; /* max 128x128x128 */
192 return MIN2(util_logbase2(result.u) + 1, SVGA_MAX_TEXTURE_LEVELS);
193
194 case PIPE_CAP_MAX_TEXTURE_CUBE_LEVELS:
195 /*
196 * No mechanism to query the host, and at least limited to 2048x2048 on
197 * certain hardware.
198 */
199 return MIN2(screen->get_param(screen, PIPE_CAP_MAX_TEXTURE_2D_LEVELS),
200 12 /* 2048x2048 */);
201
202 case PIPE_CAP_BLEND_EQUATION_SEPARATE: /* req. for GL 1.5 */
203 return 1;
204
205 case PIPE_CAP_TGSI_FS_COORD_ORIGIN_UPPER_LEFT:
206 return 1;
207 case PIPE_CAP_TGSI_FS_COORD_PIXEL_CENTER_HALF_INTEGER:
208 return 0;
209 case PIPE_CAP_TGSI_FS_COORD_ORIGIN_LOWER_LEFT:
210 return 0;
211 case PIPE_CAP_TGSI_FS_COORD_PIXEL_CENTER_INTEGER:
212 return 1;
213
214 case PIPE_CAP_VERTEX_COLOR_UNCLAMPED:
215 return 1; /* The color outputs of vertex shaders are not clamped */
216 case PIPE_CAP_VERTEX_COLOR_CLAMPED:
217 return 0; /* The driver can't clamp vertex colors */
218 case PIPE_CAP_FRAGMENT_COLOR_CLAMPED:
219 return 0; /* The driver can't clamp fragment colors */
220
221 case PIPE_CAP_MIXED_COLORBUFFER_FORMATS:
222 return 1; /* expected for GL_ARB_framebuffer_object */
223
224 case PIPE_CAP_GLSL_FEATURE_LEVEL:
225 return 120;
226
227 case PIPE_CAP_PREFER_BLIT_BASED_TEXTURE_TRANSFER:
228 return 0;
229
230 case PIPE_CAP_SM3:
231 return 1;
232
233 /* Unsupported features */
234 case PIPE_CAP_QUADS_FOLLOW_PROVOKING_VERTEX_CONVENTION:
235 case PIPE_CAP_TEXTURE_MIRROR_CLAMP:
236 case PIPE_CAP_SHADER_STENCIL_EXPORT:
237 case PIPE_CAP_DEPTH_CLIP_DISABLE:
238 case PIPE_CAP_SEAMLESS_CUBE_MAP:
239 case PIPE_CAP_SEAMLESS_CUBE_MAP_PER_TEXTURE:
240 case PIPE_CAP_INDEP_BLEND_ENABLE:
241 case PIPE_CAP_INDEP_BLEND_FUNC:
242 case PIPE_CAP_MAX_STREAM_OUTPUT_BUFFERS:
243 case PIPE_CAP_PRIMITIVE_RESTART:
244 case PIPE_CAP_TGSI_INSTANCEID:
245 case PIPE_CAP_VERTEX_ELEMENT_INSTANCE_DIVISOR:
246 case PIPE_CAP_MAX_TEXTURE_ARRAY_LAYERS:
247 case PIPE_CAP_MIN_TEXEL_OFFSET:
248 case PIPE_CAP_MAX_TEXEL_OFFSET:
249 case PIPE_CAP_MIN_TEXTURE_GATHER_OFFSET:
250 case PIPE_CAP_MAX_TEXTURE_GATHER_OFFSET:
251 case PIPE_CAP_CONDITIONAL_RENDER:
252 case PIPE_CAP_TEXTURE_BARRIER:
253 case PIPE_CAP_MAX_STREAM_OUTPUT_SEPARATE_COMPONENTS:
254 case PIPE_CAP_MAX_STREAM_OUTPUT_INTERLEAVED_COMPONENTS:
255 case PIPE_CAP_STREAM_OUTPUT_PAUSE_RESUME:
256 case PIPE_CAP_MAX_GEOMETRY_OUTPUT_VERTICES:
257 case PIPE_CAP_MAX_GEOMETRY_TOTAL_OUTPUT_COMPONENTS:
258 case PIPE_CAP_MAX_VERTEX_STREAMS:
259 case PIPE_CAP_TGSI_CAN_COMPACT_CONSTANTS:
260 case PIPE_CAP_VERTEX_BUFFER_OFFSET_4BYTE_ALIGNED_ONLY:
261 case PIPE_CAP_VERTEX_BUFFER_STRIDE_4BYTE_ALIGNED_ONLY:
262 case PIPE_CAP_COMPUTE:
263 case PIPE_CAP_START_INSTANCE:
264 case PIPE_CAP_QUERY_TIMESTAMP:
265 case PIPE_CAP_TEXTURE_MULTISAMPLE:
266 case PIPE_CAP_CUBE_MAP_ARRAY:
267 case PIPE_CAP_TEXTURE_BUFFER_OBJECTS:
268 case PIPE_CAP_TEXTURE_BUFFER_OFFSET_ALIGNMENT:
269 case PIPE_CAP_QUERY_PIPELINE_STATISTICS:
270 case PIPE_CAP_MAX_TEXTURE_BUFFER_SIZE:
271 case PIPE_CAP_TGSI_VS_LAYER_VIEWPORT:
272 case PIPE_CAP_MAX_TEXTURE_GATHER_COMPONENTS:
273 case PIPE_CAP_TEXTURE_GATHER_SM5:
274 case PIPE_CAP_BUFFER_MAP_PERSISTENT_COHERENT:
275 case PIPE_CAP_FAKE_SW_MSAA:
276 case PIPE_CAP_TEXTURE_QUERY_LOD:
277 case PIPE_CAP_SAMPLE_SHADING:
278 case PIPE_CAP_TEXTURE_GATHER_OFFSETS:
279 case PIPE_CAP_TGSI_VS_WINDOW_SPACE_POSITION:
280 case PIPE_CAP_DRAW_INDIRECT:
281 case PIPE_CAP_TGSI_FS_FINE_DERIVATIVE:
282 case PIPE_CAP_CONDITIONAL_RENDER_INVERTED:
283 case PIPE_CAP_SAMPLER_VIEW_TARGET:
284 case PIPE_CAP_CLIP_HALFZ:
285 case PIPE_CAP_VERTEXID_NOBASE:
286 case PIPE_CAP_POLYGON_OFFSET_CLAMP:
287 case PIPE_CAP_MULTISAMPLE_Z_RESOLVE:
288 return 0;
289 case PIPE_CAP_MIN_MAP_BUFFER_ALIGNMENT:
290 return 64;
291 case PIPE_CAP_VERTEX_ELEMENT_SRC_OFFSET_4BYTE_ALIGNED_ONLY:
292 return 1;
293 case PIPE_CAP_MAX_VERTEX_ATTRIB_STRIDE:
294 return 2048;
295 case PIPE_CAP_MAX_VIEWPORTS:
296 return 1;
297 case PIPE_CAP_ENDIANNESS:
298 return PIPE_ENDIAN_LITTLE;
299
300 case PIPE_CAP_VENDOR_ID:
301 return 0x15ad; /* VMware Inc. */
302 case PIPE_CAP_DEVICE_ID:
303 return 0x0405; /* assume SVGA II */
304 case PIPE_CAP_ACCELERATED:
305 return 0; /* XXX: */
306 case PIPE_CAP_VIDEO_MEMORY:
307 /* XXX: Query the host ? */
308 return 1;
309 case PIPE_CAP_UMA:
310 case PIPE_CAP_RESOURCE_FROM_USER_MEMORY:
311 return 0;
312 }
313
314 debug_printf("Unexpected PIPE_CAP_ query %u\n", param);
315 return 0;
316 }
317
318 static int svga_get_shader_param(struct pipe_screen *screen, unsigned shader, enum pipe_shader_cap param)
319 {
320 struct svga_screen *svgascreen = svga_screen(screen);
321 struct svga_winsys_screen *sws = svgascreen->sws;
322 SVGA3dDevCapResult result;
323
324 switch (shader)
325 {
326 case PIPE_SHADER_FRAGMENT:
327 switch (param)
328 {
329 case PIPE_SHADER_CAP_MAX_INSTRUCTIONS:
330 case PIPE_SHADER_CAP_MAX_ALU_INSTRUCTIONS:
331 case PIPE_SHADER_CAP_MAX_TEX_INSTRUCTIONS:
332 case PIPE_SHADER_CAP_MAX_TEX_INDIRECTIONS:
333 return 512;
334 case PIPE_SHADER_CAP_MAX_CONTROL_FLOW_DEPTH:
335 return SVGA3D_MAX_NESTING_LEVEL;
336 case PIPE_SHADER_CAP_MAX_INPUTS:
337 return 10;
338 case PIPE_SHADER_CAP_MAX_OUTPUTS:
339 return svgascreen->max_color_buffers;
340 case PIPE_SHADER_CAP_MAX_CONST_BUFFER_SIZE:
341 return 224 * sizeof(float[4]);
342 case PIPE_SHADER_CAP_MAX_CONST_BUFFERS:
343 return 1;
344 case PIPE_SHADER_CAP_MAX_TEMPS:
345 if (!sws->get_cap(sws, SVGA3D_DEVCAP_MAX_FRAGMENT_SHADER_TEMPS, &result))
346 return 32;
347 return MIN2(result.u, SVGA3D_TEMPREG_MAX);
348 case PIPE_SHADER_CAP_INDIRECT_INPUT_ADDR:
349 /*
350 * Although PS 3.0 has some addressing abilities it can only represent
351 * loops that can be statically determined and unrolled. Given we can
352 * only handle a subset of the cases that the state tracker already
353 * does it is better to defer loop unrolling to the state tracker.
354 */
355 return 0;
356 case PIPE_SHADER_CAP_MAX_PREDS:
357 return 1;
358 case PIPE_SHADER_CAP_TGSI_CONT_SUPPORTED:
359 return 0;
360 case PIPE_SHADER_CAP_TGSI_SQRT_SUPPORTED:
361 return 0;
362 case PIPE_SHADER_CAP_INDIRECT_OUTPUT_ADDR:
363 case PIPE_SHADER_CAP_INDIRECT_TEMP_ADDR:
364 case PIPE_SHADER_CAP_INDIRECT_CONST_ADDR:
365 return 0;
366 case PIPE_SHADER_CAP_SUBROUTINES:
367 return 0;
368 case PIPE_SHADER_CAP_INTEGERS:
369 return 0;
370 case PIPE_SHADER_CAP_MAX_TEXTURE_SAMPLERS:
371 case PIPE_SHADER_CAP_MAX_SAMPLER_VIEWS:
372 return 16;
373 case PIPE_SHADER_CAP_PREFERRED_IR:
374 return PIPE_SHADER_IR_TGSI;
375 case PIPE_SHADER_CAP_DOUBLES:
376 case PIPE_SHADER_CAP_TGSI_DROUND_SUPPORTED:
377 case PIPE_SHADER_CAP_TGSI_DFRACEXP_DLDEXP_SUPPORTED:
378 case PIPE_SHADER_CAP_TGSI_FMA_SUPPORTED:
379 return 0;
380 }
381 /* If we get here, we failed to handle a cap above */
382 debug_printf("Unexpected fragment shader query %u\n", param);
383 return 0;
384 case PIPE_SHADER_VERTEX:
385 switch (param)
386 {
387 case PIPE_SHADER_CAP_MAX_INSTRUCTIONS:
388 case PIPE_SHADER_CAP_MAX_ALU_INSTRUCTIONS:
389 if (!sws->get_cap(sws, SVGA3D_DEVCAP_MAX_VERTEX_SHADER_INSTRUCTIONS, &result))
390 return 512;
391 return result.u;
392 case PIPE_SHADER_CAP_MAX_TEX_INSTRUCTIONS:
393 case PIPE_SHADER_CAP_MAX_TEX_INDIRECTIONS:
394 /* XXX: until we have vertex texture support */
395 return 0;
396 case PIPE_SHADER_CAP_MAX_CONTROL_FLOW_DEPTH:
397 return SVGA3D_MAX_NESTING_LEVEL;
398 case PIPE_SHADER_CAP_MAX_INPUTS:
399 return 16;
400 case PIPE_SHADER_CAP_MAX_OUTPUTS:
401 return 10;
402 case PIPE_SHADER_CAP_MAX_CONST_BUFFER_SIZE:
403 return 256 * sizeof(float[4]);
404 case PIPE_SHADER_CAP_MAX_CONST_BUFFERS:
405 return 1;
406 case PIPE_SHADER_CAP_MAX_TEMPS:
407 if (!sws->get_cap(sws, SVGA3D_DEVCAP_MAX_VERTEX_SHADER_TEMPS, &result))
408 return 32;
409 return MIN2(result.u, SVGA3D_TEMPREG_MAX);
410 case PIPE_SHADER_CAP_MAX_PREDS:
411 return 1;
412 case PIPE_SHADER_CAP_TGSI_CONT_SUPPORTED:
413 return 0;
414 case PIPE_SHADER_CAP_TGSI_SQRT_SUPPORTED:
415 return 0;
416 case PIPE_SHADER_CAP_INDIRECT_INPUT_ADDR:
417 case PIPE_SHADER_CAP_INDIRECT_OUTPUT_ADDR:
418 return 1;
419 case PIPE_SHADER_CAP_INDIRECT_TEMP_ADDR:
420 return 0;
421 case PIPE_SHADER_CAP_INDIRECT_CONST_ADDR:
422 return 1;
423 case PIPE_SHADER_CAP_SUBROUTINES:
424 return 0;
425 case PIPE_SHADER_CAP_INTEGERS:
426 return 0;
427 case PIPE_SHADER_CAP_MAX_TEXTURE_SAMPLERS:
428 case PIPE_SHADER_CAP_MAX_SAMPLER_VIEWS:
429 return 0;
430 case PIPE_SHADER_CAP_PREFERRED_IR:
431 return PIPE_SHADER_IR_TGSI;
432 case PIPE_SHADER_CAP_DOUBLES:
433 case PIPE_SHADER_CAP_TGSI_DROUND_SUPPORTED:
434 case PIPE_SHADER_CAP_TGSI_DFRACEXP_DLDEXP_SUPPORTED:
435 case PIPE_SHADER_CAP_TGSI_FMA_SUPPORTED:
436 return 0;
437 }
438 /* If we get here, we failed to handle a cap above */
439 debug_printf("Unexpected vertex shader query %u\n", param);
440 return 0;
441 case PIPE_SHADER_GEOMETRY:
442 case PIPE_SHADER_COMPUTE:
443 /* no support for geometry or compute shaders at this time */
444 return 0;
445 default:
446 debug_printf("Unexpected shader type (%u) query\n", shader);
447 return 0;
448 }
449 return 0;
450 }
451
452
453 /**
454 * Implemnt pipe_screen::is_format_supported().
455 * \param bindings bitmask of PIPE_BIND_x flags
456 */
457 static boolean
458 svga_is_format_supported( struct pipe_screen *screen,
459 enum pipe_format format,
460 enum pipe_texture_target target,
461 unsigned sample_count,
462 unsigned bindings)
463 {
464 struct svga_screen *ss = svga_screen(screen);
465 SVGA3dSurfaceFormat svga_format;
466 SVGA3dSurfaceFormatCaps caps;
467 SVGA3dSurfaceFormatCaps mask;
468
469 assert(bindings);
470
471 if (sample_count > 1) {
472 return FALSE;
473 }
474
475 svga_format = svga_translate_format(ss, format, bindings);
476 if (svga_format == SVGA3D_FORMAT_INVALID) {
477 return FALSE;
478 }
479
480 /*
481 * Override host capabilities, so that we end up with the same
482 * visuals for all virtual hardware implementations.
483 */
484
485 if (bindings & PIPE_BIND_DISPLAY_TARGET) {
486 switch (svga_format) {
487 case SVGA3D_A8R8G8B8:
488 case SVGA3D_X8R8G8B8:
489 case SVGA3D_R5G6B5:
490 break;
491
492 /* Often unsupported/problematic. This means we end up with the same
493 * visuals for all virtual hardware implementations.
494 */
495 case SVGA3D_A4R4G4B4:
496 case SVGA3D_A1R5G5B5:
497 return FALSE;
498
499 default:
500 return FALSE;
501 }
502 }
503
504 /*
505 * Query the host capabilities.
506 */
507
508 svga_get_format_cap(ss, svga_format, &caps);
509
510 mask.value = 0;
511 if (bindings & PIPE_BIND_RENDER_TARGET) {
512 mask.offscreenRenderTarget = 1;
513 }
514 if (bindings & PIPE_BIND_DEPTH_STENCIL) {
515 mask.zStencil = 1;
516 }
517 if (bindings & PIPE_BIND_SAMPLER_VIEW) {
518 mask.texture = 1;
519 }
520
521 if (target == PIPE_TEXTURE_CUBE) {
522 mask.cubeTexture = 1;
523 }
524 if (target == PIPE_TEXTURE_3D) {
525 mask.volumeTexture = 1;
526 }
527
528 return (caps.value & mask.value) == mask.value;
529 }
530
531
532 static void
533 svga_fence_reference(struct pipe_screen *screen,
534 struct pipe_fence_handle **ptr,
535 struct pipe_fence_handle *fence)
536 {
537 struct svga_winsys_screen *sws = svga_screen(screen)->sws;
538 sws->fence_reference(sws, ptr, fence);
539 }
540
541
542 static boolean
543 svga_fence_signalled(struct pipe_screen *screen,
544 struct pipe_fence_handle *fence)
545 {
546 struct svga_winsys_screen *sws = svga_screen(screen)->sws;
547 return sws->fence_signalled(sws, fence, 0) == 0;
548 }
549
550
551 static boolean
552 svga_fence_finish(struct pipe_screen *screen,
553 struct pipe_fence_handle *fence,
554 uint64_t timeout)
555 {
556 struct svga_winsys_screen *sws = svga_screen(screen)->sws;
557
558 SVGA_DBG(DEBUG_DMA|DEBUG_PERF, "%s fence_ptr %p\n",
559 __FUNCTION__, fence);
560
561 return sws->fence_finish(sws, fence, 0) == 0;
562 }
563
564
565 static int
566 svga_get_driver_query_info(struct pipe_screen *screen,
567 unsigned index,
568 struct pipe_driver_query_info *info)
569 {
570 static const struct pipe_driver_query_info queries[] = {
571 {"draw-calls", SVGA_QUERY_DRAW_CALLS, 0, FALSE},
572 {"fallbacks", SVGA_QUERY_FALLBACKS, 0, FALSE},
573 {"memory-used", SVGA_QUERY_MEMORY_USED, 0, TRUE}
574 };
575
576 if (!info)
577 return Elements(queries);
578
579 if (index >= Elements(queries))
580 return 0;
581
582 *info = queries[index];
583 return 1;
584 }
585
586
587 static void
588 svga_destroy_screen( struct pipe_screen *screen )
589 {
590 struct svga_screen *svgascreen = svga_screen(screen);
591
592 svga_screen_cache_cleanup(svgascreen);
593
594 pipe_mutex_destroy(svgascreen->swc_mutex);
595 pipe_mutex_destroy(svgascreen->tex_mutex);
596
597 svgascreen->sws->destroy(svgascreen->sws);
598
599 FREE(svgascreen);
600 }
601
602
603 /**
604 * Create a new svga_screen object
605 */
606 struct pipe_screen *
607 svga_screen_create(struct svga_winsys_screen *sws)
608 {
609 struct svga_screen *svgascreen;
610 struct pipe_screen *screen;
611 SVGA3dDevCapResult result;
612 boolean use_vs30, use_ps30;
613
614 #ifdef DEBUG
615 SVGA_DEBUG = debug_get_flags_option("SVGA_DEBUG", svga_debug_flags, 0 );
616 #endif
617
618 svgascreen = CALLOC_STRUCT(svga_screen);
619 if (!svgascreen)
620 goto error1;
621
622 svgascreen->debug.force_level_surface_view =
623 debug_get_bool_option("SVGA_FORCE_LEVEL_SURFACE_VIEW", FALSE);
624 svgascreen->debug.force_surface_view =
625 debug_get_bool_option("SVGA_FORCE_SURFACE_VIEW", FALSE);
626 svgascreen->debug.force_sampler_view =
627 debug_get_bool_option("SVGA_FORCE_SAMPLER_VIEW", FALSE);
628 svgascreen->debug.no_surface_view =
629 debug_get_bool_option("SVGA_NO_SURFACE_VIEW", FALSE);
630 svgascreen->debug.no_sampler_view =
631 debug_get_bool_option("SVGA_NO_SAMPLER_VIEW", FALSE);
632
633 screen = &svgascreen->screen;
634
635 screen->destroy = svga_destroy_screen;
636 screen->get_name = svga_get_name;
637 screen->get_vendor = svga_get_vendor;
638 screen->get_param = svga_get_param;
639 screen->get_shader_param = svga_get_shader_param;
640 screen->get_paramf = svga_get_paramf;
641 screen->is_format_supported = svga_is_format_supported;
642 screen->context_create = svga_context_create;
643 screen->fence_reference = svga_fence_reference;
644 screen->fence_signalled = svga_fence_signalled;
645 screen->fence_finish = svga_fence_finish;
646 screen->get_driver_query_info = svga_get_driver_query_info;
647 svgascreen->sws = sws;
648
649 svga_init_screen_resource_functions(svgascreen);
650
651 if (sws->get_hw_version) {
652 svgascreen->hw_version = sws->get_hw_version(sws);
653 } else {
654 svgascreen->hw_version = SVGA3D_HWVERSION_WS65_B1;
655 }
656
657 use_ps30 =
658 sws->get_cap(sws, SVGA3D_DEVCAP_FRAGMENT_SHADER_VERSION, &result) &&
659 result.u >= SVGA3DPSVERSION_30 ? TRUE : FALSE;
660
661 use_vs30 =
662 sws->get_cap(sws, SVGA3D_DEVCAP_VERTEX_SHADER_VERSION, &result) &&
663 result.u >= SVGA3DVSVERSION_30 ? TRUE : FALSE;
664
665 /* we require Shader model 3.0 or later */
666 if (!use_ps30 || !use_vs30)
667 goto error2;
668
669 /*
670 * The D16, D24X8, and D24S8 formats always do an implicit shadow compare
671 * when sampled from, where as the DF16, DF24, and D24S8_INT do not. So
672 * we prefer the later when available.
673 *
674 * This mimics hardware vendors extensions for D3D depth sampling. See also
675 * http://aras-p.info/texts/D3D9GPUHacks.html
676 */
677
678 {
679 boolean has_df16, has_df24, has_d24s8_int;
680 SVGA3dSurfaceFormatCaps caps;
681 SVGA3dSurfaceFormatCaps mask;
682 mask.value = 0;
683 mask.zStencil = 1;
684 mask.texture = 1;
685
686 svgascreen->depth.z16 = SVGA3D_Z_D16;
687 svgascreen->depth.x8z24 = SVGA3D_Z_D24X8;
688 svgascreen->depth.s8z24 = SVGA3D_Z_D24S8;
689
690 svga_get_format_cap(svgascreen, SVGA3D_Z_DF16, &caps);
691 has_df16 = (caps.value & mask.value) == mask.value;
692
693 svga_get_format_cap(svgascreen, SVGA3D_Z_DF24, &caps);
694 has_df24 = (caps.value & mask.value) == mask.value;
695
696 svga_get_format_cap(svgascreen, SVGA3D_Z_D24S8_INT, &caps);
697 has_d24s8_int = (caps.value & mask.value) == mask.value;
698
699 /* XXX: We might want some other logic here.
700 * Like if we only have d24s8_int we should
701 * emulate the other formats with that.
702 */
703 if (has_df16) {
704 svgascreen->depth.z16 = SVGA3D_Z_DF16;
705 }
706 if (has_df24) {
707 svgascreen->depth.x8z24 = SVGA3D_Z_DF24;
708 }
709 if (has_d24s8_int) {
710 svgascreen->depth.s8z24 = SVGA3D_Z_D24S8_INT;
711 }
712 }
713
714 /* Query device caps
715 */
716 if (!sws->get_cap(sws, SVGA3D_DEVCAP_LINE_STIPPLE, &result))
717 svgascreen->haveLineStipple = FALSE;
718 else
719 svgascreen->haveLineStipple = result.u;
720
721 if (!sws->get_cap(sws, SVGA3D_DEVCAP_LINE_AA, &result))
722 svgascreen->haveLineSmooth = FALSE;
723 else
724 svgascreen->haveLineSmooth = result.u;
725
726 if (!sws->get_cap(sws, SVGA3D_DEVCAP_MAX_LINE_WIDTH, &result))
727 svgascreen->maxLineWidth = 1.0F;
728 else
729 svgascreen->maxLineWidth = result.f;
730
731 if (!sws->get_cap(sws, SVGA3D_DEVCAP_MAX_AA_LINE_WIDTH, &result))
732 svgascreen->maxLineWidthAA = 1.0F;
733 else
734 svgascreen->maxLineWidthAA = result.f;
735
736 if (0)
737 debug_printf("svga: haveLineStip %u "
738 "haveLineSmooth %u maxLineWidth %f\n",
739 svgascreen->haveLineStipple, svgascreen->haveLineSmooth,
740 svgascreen->maxLineWidth);
741
742 if (!sws->get_cap(sws, SVGA3D_DEVCAP_MAX_POINT_SIZE, &result)) {
743 svgascreen->maxPointSize = 1.0F;
744 } else {
745 /* Keep this to a reasonable size to avoid failures in
746 * conform/pntaa.c:
747 */
748 svgascreen->maxPointSize = MIN2(result.f, 80.0f);
749 }
750
751 /* The SVGA3D device always supports 4 targets at this time, regardless
752 * of what querying SVGA3D_DEVCAP_MAX_RENDER_TARGETS might return.
753 */
754 svgascreen->max_color_buffers = 4;
755
756 pipe_mutex_init(svgascreen->tex_mutex);
757 pipe_mutex_init(svgascreen->swc_mutex);
758
759 svga_screen_cache_init(svgascreen);
760
761 return screen;
762 error2:
763 FREE(svgascreen);
764 error1:
765 return NULL;
766 }
767
768 struct svga_winsys_screen *
769 svga_winsys_screen(struct pipe_screen *screen)
770 {
771 return svga_screen(screen)->sws;
772 }
773
#ifdef DEBUG
/**
 * Checked cast from pipe_screen to svga_screen; this definition is only
 * compiled when DEBUG is defined.
 *
 * Asserts that the pointer is non-NULL and that its destroy callback is
 * svga_destroy_screen before handing the pointer back as a svga_screen.
 */
struct svga_screen *
svga_screen(struct pipe_screen *screen)
{
   struct svga_screen *svgascreen = (struct svga_screen *)screen;

   assert(screen);
   assert(screen->destroy == svga_destroy_screen);

   return svgascreen;
}
#endif