1 /**********************************************************
2 * Copyright 2008-2009 VMware, Inc. All rights reserved.
4 * Permission is hereby granted, free of charge, to any person
5 * obtaining a copy of this software and associated documentation
6 * files (the "Software"), to deal in the Software without
7 * restriction, including without limitation the rights to use, copy,
8 * modify, merge, publish, distribute, sublicense, and/or sell copies
9 * of the Software, and to permit persons to whom the Software is
10 * furnished to do so, subject to the following conditions:
12 * The above copyright notice and this permission notice shall be
13 * included in all copies or substantial portions of the Software.
15 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
16 * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
17 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
18 * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
19 * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
20 * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
21 * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
24 **********************************************************/
26 #include "util/u_format.h"
27 #include "util/u_memory.h"
28 #include "util/u_inlines.h"
29 #include "util/u_string.h"
30 #include "util/u_math.h"
32 #include "svga_winsys.h"
33 #include "svga_public.h"
34 #include "svga_context.h"
35 #include "svga_format.h"
36 #include "svga_screen.h"
37 #include "svga_tgsi.h"
38 #include "svga_resource_texture.h"
39 #include "svga_resource.h"
40 #include "svga_debug.h"
42 #include "svga3d_shaderdefs.h"
43 #include "VGPU10ShaderTokens.h"
45 /* NOTE: this constant may get moved into a svga3d*.h header file */
46 #define SVGA3D_DX_MAX_RESOURCE_SIZE (128 * 1024 * 1024)
51 static const struct debug_named_value svga_debug_flags
[] = {
52 { "dma", DEBUG_DMA
, NULL
},
53 { "tgsi", DEBUG_TGSI
, NULL
},
54 { "pipe", DEBUG_PIPE
, NULL
},
55 { "state", DEBUG_STATE
, NULL
},
56 { "screen", DEBUG_SCREEN
, NULL
},
57 { "tex", DEBUG_TEX
, NULL
},
58 { "swtnl", DEBUG_SWTNL
, NULL
},
59 { "const", DEBUG_CONSTS
, NULL
},
60 { "viewport", DEBUG_VIEWPORT
, NULL
},
61 { "views", DEBUG_VIEWS
, NULL
},
62 { "perf", DEBUG_PERF
, NULL
},
63 { "flush", DEBUG_FLUSH
, NULL
},
64 { "sync", DEBUG_SYNC
, NULL
},
65 { "cache", DEBUG_CACHE
, NULL
},
66 { "streamout", DEBUG_STREAMOUT
, NULL
},
67 { "query", DEBUG_QUERY
, NULL
},
73 svga_get_vendor( struct pipe_screen
*pscreen
)
75 return "VMware, Inc.";
80 svga_get_name( struct pipe_screen
*pscreen
)
82 const char *build
= "", *llvm
= "", *mutex
= "";
83 static char name
[100];
85 /* Only return internal details in the DEBUG version:
87 build
= "build: DEBUG;";
88 mutex
= "mutex: " PIPE_ATOMIC
";";
90 build
= "build: RELEASE;";
96 util_snprintf(name
, sizeof(name
), "SVGA3D; %s %s %s", build
, mutex
, llvm
);
101 /** Helper for querying float-valued device cap */
103 get_float_cap(struct svga_winsys_screen
*sws
, unsigned cap
, float defaultVal
)
105 SVGA3dDevCapResult result
;
106 if (sws
->get_cap(sws
, cap
, &result
))
113 /** Helper for querying uint-valued device cap */
115 get_uint_cap(struct svga_winsys_screen
*sws
, unsigned cap
, unsigned defaultVal
)
117 SVGA3dDevCapResult result
;
118 if (sws
->get_cap(sws
, cap
, &result
))
125 /** Helper for querying boolean-valued device cap */
127 get_bool_cap(struct svga_winsys_screen
*sws
, unsigned cap
, boolean defaultVal
)
129 SVGA3dDevCapResult result
;
130 if (sws
->get_cap(sws
, cap
, &result
))
138 svga_get_paramf(struct pipe_screen
*screen
, enum pipe_capf param
)
140 struct svga_screen
*svgascreen
= svga_screen(screen
);
141 struct svga_winsys_screen
*sws
= svgascreen
->sws
;
144 case PIPE_CAPF_MAX_LINE_WIDTH
:
145 return svgascreen
->maxLineWidth
;
146 case PIPE_CAPF_MAX_LINE_WIDTH_AA
:
147 return svgascreen
->maxLineWidthAA
;
149 case PIPE_CAPF_MAX_POINT_WIDTH
:
151 case PIPE_CAPF_MAX_POINT_WIDTH_AA
:
152 return svgascreen
->maxPointSize
;
154 case PIPE_CAPF_MAX_TEXTURE_ANISOTROPY
:
155 return (float) get_uint_cap(sws
, SVGA3D_DEVCAP_MAX_TEXTURE_ANISOTROPY
, 4);
157 case PIPE_CAPF_MAX_TEXTURE_LOD_BIAS
:
160 case PIPE_CAPF_GUARD_BAND_LEFT
:
161 case PIPE_CAPF_GUARD_BAND_TOP
:
162 case PIPE_CAPF_GUARD_BAND_RIGHT
:
163 case PIPE_CAPF_GUARD_BAND_BOTTOM
:
167 debug_printf("Unexpected PIPE_CAPF_ query %u\n", param
);
173 svga_get_param(struct pipe_screen
*screen
, enum pipe_cap param
)
175 struct svga_screen
*svgascreen
= svga_screen(screen
);
176 struct svga_winsys_screen
*sws
= svgascreen
->sws
;
177 SVGA3dDevCapResult result
;
180 case PIPE_CAP_NPOT_TEXTURES
:
181 case PIPE_CAP_MIXED_FRAMEBUFFER_SIZES
:
183 case PIPE_CAP_TWO_SIDED_STENCIL
:
185 case PIPE_CAP_MAX_DUAL_SOURCE_RENDER_TARGETS
:
187 * "In virtually every OpenGL implementation and hardware,
188 * GL_MAX_DUAL_SOURCE_DRAW_BUFFERS is 1"
189 * http://www.opengl.org/wiki/Blending
191 return sws
->have_vgpu10
? 1 : 0;
192 case PIPE_CAP_ANISOTROPIC_FILTER
:
194 case PIPE_CAP_POINT_SPRITE
:
196 case PIPE_CAP_TGSI_TEXCOORD
:
198 case PIPE_CAP_MAX_RENDER_TARGETS
:
199 return svgascreen
->max_color_buffers
;
200 case PIPE_CAP_OCCLUSION_QUERY
:
202 case PIPE_CAP_QUERY_TIME_ELAPSED
:
204 case PIPE_CAP_TEXTURE_BUFFER_OBJECTS
:
205 return sws
->have_vgpu10
;
206 case PIPE_CAP_TEXTURE_SHADOW_MAP
:
208 case PIPE_CAP_TEXTURE_SWIZZLE
:
210 case PIPE_CAP_TEXTURE_BORDER_COLOR_QUIRK
:
212 case PIPE_CAP_USER_VERTEX_BUFFERS
:
213 case PIPE_CAP_USER_INDEX_BUFFERS
:
215 case PIPE_CAP_USER_CONSTANT_BUFFERS
:
217 case PIPE_CAP_CONSTANT_BUFFER_OFFSET_ALIGNMENT
:
220 case PIPE_CAP_MAX_TEXTURE_2D_LEVELS
:
222 unsigned levels
= SVGA_MAX_TEXTURE_LEVELS
;
223 if (sws
->get_cap(sws
, SVGA3D_DEVCAP_MAX_TEXTURE_WIDTH
, &result
))
224 levels
= MIN2(util_logbase2(result
.u
) + 1, levels
);
226 levels
= 12 /* 2048x2048 */;
227 if (sws
->get_cap(sws
, SVGA3D_DEVCAP_MAX_TEXTURE_HEIGHT
, &result
))
228 levels
= MIN2(util_logbase2(result
.u
) + 1, levels
);
230 levels
= 12 /* 2048x2048 */;
234 case PIPE_CAP_MAX_TEXTURE_3D_LEVELS
:
235 if (!sws
->get_cap(sws
, SVGA3D_DEVCAP_MAX_VOLUME_EXTENT
, &result
))
236 return 8; /* max 128x128x128 */
237 return MIN2(util_logbase2(result
.u
) + 1, SVGA_MAX_TEXTURE_LEVELS
);
239 case PIPE_CAP_MAX_TEXTURE_CUBE_LEVELS
:
241 * No mechanism to query the host, and at least limited to 2048x2048 on
244 return MIN2(screen
->get_param(screen
, PIPE_CAP_MAX_TEXTURE_2D_LEVELS
),
247 case PIPE_CAP_MAX_TEXTURE_ARRAY_LAYERS
:
248 return sws
->have_vgpu10
? SVGA3D_MAX_SURFACE_ARRAYSIZE
: 0;
250 case PIPE_CAP_BLEND_EQUATION_SEPARATE
: /* req. for GL 1.5 */
253 case PIPE_CAP_TGSI_FS_COORD_ORIGIN_UPPER_LEFT
:
255 case PIPE_CAP_TGSI_FS_COORD_PIXEL_CENTER_HALF_INTEGER
:
256 return sws
->have_vgpu10
;
257 case PIPE_CAP_TGSI_FS_COORD_ORIGIN_LOWER_LEFT
:
259 case PIPE_CAP_TGSI_FS_COORD_PIXEL_CENTER_INTEGER
:
260 return !sws
->have_vgpu10
;
262 case PIPE_CAP_VERTEX_COLOR_UNCLAMPED
:
263 return 1; /* The color outputs of vertex shaders are not clamped */
264 case PIPE_CAP_VERTEX_COLOR_CLAMPED
:
265 return 0; /* The driver can't clamp vertex colors */
266 case PIPE_CAP_FRAGMENT_COLOR_CLAMPED
:
267 return 0; /* The driver can't clamp fragment colors */
269 case PIPE_CAP_MIXED_COLORBUFFER_FORMATS
:
270 return 1; /* expected for GL_ARB_framebuffer_object */
272 case PIPE_CAP_GLSL_FEATURE_LEVEL
:
273 return sws
->have_vgpu10
? 330 : 120;
275 case PIPE_CAP_PREFER_BLIT_BASED_TEXTURE_TRANSFER
:
281 case PIPE_CAP_DEPTH_CLIP_DISABLE
:
282 case PIPE_CAP_INDEP_BLEND_ENABLE
:
283 case PIPE_CAP_CONDITIONAL_RENDER
:
284 case PIPE_CAP_QUERY_TIMESTAMP
:
285 case PIPE_CAP_TGSI_INSTANCEID
:
286 case PIPE_CAP_VERTEX_ELEMENT_INSTANCE_DIVISOR
:
287 case PIPE_CAP_SEAMLESS_CUBE_MAP
:
288 case PIPE_CAP_FAKE_SW_MSAA
:
289 return sws
->have_vgpu10
;
291 case PIPE_CAP_MAX_STREAM_OUTPUT_BUFFERS
:
292 return sws
->have_vgpu10
? SVGA3D_DX_MAX_SOTARGETS
: 0;
293 case PIPE_CAP_MAX_STREAM_OUTPUT_SEPARATE_COMPONENTS
:
294 return sws
->have_vgpu10
? 4 : 0;
295 case PIPE_CAP_MAX_STREAM_OUTPUT_INTERLEAVED_COMPONENTS
:
296 return sws
->have_vgpu10
? SVGA3D_MAX_STREAMOUT_DECLS
: 0;
297 case PIPE_CAP_STREAM_OUTPUT_PAUSE_RESUME
:
299 case PIPE_CAP_TEXTURE_MULTISAMPLE
:
300 return svgascreen
->ms_samples
? 1 : 0;
302 case PIPE_CAP_MAX_TEXTURE_BUFFER_SIZE
:
303 return SVGA3D_DX_MAX_RESOURCE_SIZE
;
305 case PIPE_CAP_MIN_TEXEL_OFFSET
:
306 return sws
->have_vgpu10
? VGPU10_MIN_TEXEL_FETCH_OFFSET
: 0;
307 case PIPE_CAP_MAX_TEXEL_OFFSET
:
308 return sws
->have_vgpu10
? VGPU10_MAX_TEXEL_FETCH_OFFSET
: 0;
310 case PIPE_CAP_MIN_TEXTURE_GATHER_OFFSET
:
311 case PIPE_CAP_MAX_TEXTURE_GATHER_OFFSET
:
314 case PIPE_CAP_MAX_GEOMETRY_OUTPUT_VERTICES
:
315 return sws
->have_vgpu10
? 256 : 0;
316 case PIPE_CAP_MAX_GEOMETRY_TOTAL_OUTPUT_COMPONENTS
:
317 return sws
->have_vgpu10
? 1024 : 0;
319 case PIPE_CAP_PRIMITIVE_RESTART
:
320 return 1; /* may be a sw fallback, depending on restart index */
322 case PIPE_CAP_GENERATE_MIPMAP
:
323 return sws
->have_vgpu10
;
325 /* Unsupported features */
326 case PIPE_CAP_QUADS_FOLLOW_PROVOKING_VERTEX_CONVENTION
:
327 case PIPE_CAP_TEXTURE_MIRROR_CLAMP
:
328 case PIPE_CAP_SHADER_STENCIL_EXPORT
:
329 case PIPE_CAP_SEAMLESS_CUBE_MAP_PER_TEXTURE
:
330 case PIPE_CAP_INDEP_BLEND_FUNC
:
331 case PIPE_CAP_TEXTURE_BARRIER
:
332 case PIPE_CAP_MAX_VERTEX_STREAMS
:
333 case PIPE_CAP_TGSI_CAN_COMPACT_CONSTANTS
:
334 case PIPE_CAP_COMPUTE
:
335 case PIPE_CAP_START_INSTANCE
:
336 case PIPE_CAP_CUBE_MAP_ARRAY
:
337 case PIPE_CAP_TEXTURE_BUFFER_OFFSET_ALIGNMENT
:
338 case PIPE_CAP_QUERY_PIPELINE_STATISTICS
:
339 case PIPE_CAP_TGSI_VS_LAYER_VIEWPORT
:
340 case PIPE_CAP_MAX_TEXTURE_GATHER_COMPONENTS
:
341 case PIPE_CAP_TEXTURE_GATHER_SM5
:
342 case PIPE_CAP_BUFFER_MAP_PERSISTENT_COHERENT
:
343 case PIPE_CAP_TEXTURE_QUERY_LOD
:
344 case PIPE_CAP_SAMPLE_SHADING
:
345 case PIPE_CAP_TEXTURE_GATHER_OFFSETS
:
346 case PIPE_CAP_TGSI_VS_WINDOW_SPACE_POSITION
:
347 case PIPE_CAP_DRAW_INDIRECT
:
348 case PIPE_CAP_MULTI_DRAW_INDIRECT
:
349 case PIPE_CAP_MULTI_DRAW_INDIRECT_PARAMS
:
350 case PIPE_CAP_TGSI_FS_FINE_DERIVATIVE
:
351 case PIPE_CAP_CONDITIONAL_RENDER_INVERTED
:
352 case PIPE_CAP_SAMPLER_VIEW_TARGET
:
353 case PIPE_CAP_CLIP_HALFZ
:
354 case PIPE_CAP_VERTEXID_NOBASE
:
355 case PIPE_CAP_POLYGON_OFFSET_CLAMP
:
356 case PIPE_CAP_MULTISAMPLE_Z_RESOLVE
:
357 case PIPE_CAP_TGSI_PACK_HALF_FLOAT
:
358 case PIPE_CAP_SHADER_BUFFER_OFFSET_ALIGNMENT
:
359 case PIPE_CAP_INVALIDATE_BUFFER
:
360 case PIPE_CAP_STRING_MARKER
:
361 case PIPE_CAP_SURFACE_REINTERPRET_BLOCKS
:
362 case PIPE_CAP_QUERY_MEMORY_INFO
:
363 case PIPE_CAP_PCI_GROUP
:
364 case PIPE_CAP_PCI_BUS
:
365 case PIPE_CAP_PCI_DEVICE
:
366 case PIPE_CAP_PCI_FUNCTION
:
367 case PIPE_CAP_ROBUST_BUFFER_ACCESS_BEHAVIOR
:
369 case PIPE_CAP_MIN_MAP_BUFFER_ALIGNMENT
:
371 case PIPE_CAP_VERTEX_BUFFER_STRIDE_4BYTE_ALIGNED_ONLY
:
372 case PIPE_CAP_VERTEX_BUFFER_OFFSET_4BYTE_ALIGNED_ONLY
:
373 case PIPE_CAP_VERTEX_ELEMENT_SRC_OFFSET_4BYTE_ALIGNED_ONLY
:
374 return 1; /* need 4-byte alignment for all offsets and strides */
375 case PIPE_CAP_MAX_VERTEX_ATTRIB_STRIDE
:
377 case PIPE_CAP_MAX_VIEWPORTS
:
379 case PIPE_CAP_ENDIANNESS
:
380 return PIPE_ENDIAN_LITTLE
;
382 case PIPE_CAP_VENDOR_ID
:
383 return 0x15ad; /* VMware Inc. */
384 case PIPE_CAP_DEVICE_ID
:
385 return 0x0405; /* assume SVGA II */
386 case PIPE_CAP_ACCELERATED
:
388 case PIPE_CAP_VIDEO_MEMORY
:
389 /* XXX: Query the host ? */
392 case PIPE_CAP_RESOURCE_FROM_USER_MEMORY
:
393 case PIPE_CAP_DEVICE_RESET_STATUS_QUERY
:
394 case PIPE_CAP_MAX_SHADER_PATCH_VARYINGS
:
395 case PIPE_CAP_TEXTURE_FLOAT_LINEAR
:
396 case PIPE_CAP_TEXTURE_HALF_FLOAT_LINEAR
:
397 case PIPE_CAP_DEPTH_BOUNDS_TEST
:
398 case PIPE_CAP_TGSI_TXQS
:
399 case PIPE_CAP_FORCE_PERSAMPLE_INTERP
:
400 case PIPE_CAP_SHAREABLE_SHADERS
:
401 case PIPE_CAP_COPY_BETWEEN_COMPRESSED_AND_PLAIN_FORMATS
:
402 case PIPE_CAP_CLEAR_TEXTURE
:
403 case PIPE_CAP_DRAW_PARAMETERS
:
404 case PIPE_CAP_TGSI_FS_POSITION_IS_SYSVAL
:
405 case PIPE_CAP_TGSI_FS_FACE_IS_INTEGER_SYSVAL
:
406 case PIPE_CAP_BUFFER_SAMPLER_VIEW_RGBA_ONLY
:
407 case PIPE_CAP_QUERY_BUFFER_OBJECT
:
408 case PIPE_CAP_FRAMEBUFFER_NO_ATTACHMENT
:
412 debug_printf("Unexpected PIPE_CAP_ query %u\n", param
);
418 vgpu9_get_shader_param(struct pipe_screen
*screen
, unsigned shader
,
419 enum pipe_shader_cap param
)
421 struct svga_screen
*svgascreen
= svga_screen(screen
);
422 struct svga_winsys_screen
*sws
= svgascreen
->sws
;
425 assert(!sws
->have_vgpu10
);
429 case PIPE_SHADER_FRAGMENT
:
432 case PIPE_SHADER_CAP_MAX_INSTRUCTIONS
:
433 case PIPE_SHADER_CAP_MAX_ALU_INSTRUCTIONS
:
434 return get_uint_cap(sws
,
435 SVGA3D_DEVCAP_MAX_FRAGMENT_SHADER_INSTRUCTIONS
,
437 case PIPE_SHADER_CAP_MAX_TEX_INSTRUCTIONS
:
438 case PIPE_SHADER_CAP_MAX_TEX_INDIRECTIONS
:
440 case PIPE_SHADER_CAP_MAX_CONTROL_FLOW_DEPTH
:
441 return SVGA3D_MAX_NESTING_LEVEL
;
442 case PIPE_SHADER_CAP_MAX_INPUTS
:
444 case PIPE_SHADER_CAP_MAX_OUTPUTS
:
445 return svgascreen
->max_color_buffers
;
446 case PIPE_SHADER_CAP_MAX_CONST_BUFFER_SIZE
:
447 return 224 * sizeof(float[4]);
448 case PIPE_SHADER_CAP_MAX_CONST_BUFFERS
:
450 case PIPE_SHADER_CAP_MAX_TEMPS
:
451 val
= get_uint_cap(sws
, SVGA3D_DEVCAP_MAX_FRAGMENT_SHADER_TEMPS
, 32);
452 return MIN2(val
, SVGA3D_TEMPREG_MAX
);
453 case PIPE_SHADER_CAP_INDIRECT_INPUT_ADDR
:
455 * Although PS 3.0 has some addressing abilities it can only represent
456 * loops that can be statically determined and unrolled. Given we can
457 * only handle a subset of the cases that the state tracker already
458 * does it is better to defer loop unrolling to the state tracker.
461 case PIPE_SHADER_CAP_MAX_PREDS
:
463 case PIPE_SHADER_CAP_TGSI_CONT_SUPPORTED
:
465 case PIPE_SHADER_CAP_TGSI_SQRT_SUPPORTED
:
467 case PIPE_SHADER_CAP_INDIRECT_OUTPUT_ADDR
:
468 case PIPE_SHADER_CAP_INDIRECT_TEMP_ADDR
:
469 case PIPE_SHADER_CAP_INDIRECT_CONST_ADDR
:
471 case PIPE_SHADER_CAP_SUBROUTINES
:
473 case PIPE_SHADER_CAP_INTEGERS
:
475 case PIPE_SHADER_CAP_MAX_TEXTURE_SAMPLERS
:
476 case PIPE_SHADER_CAP_MAX_SAMPLER_VIEWS
:
478 case PIPE_SHADER_CAP_PREFERRED_IR
:
479 return PIPE_SHADER_IR_TGSI
;
480 case PIPE_SHADER_CAP_SUPPORTED_IRS
:
482 case PIPE_SHADER_CAP_DOUBLES
:
483 case PIPE_SHADER_CAP_TGSI_DROUND_SUPPORTED
:
484 case PIPE_SHADER_CAP_TGSI_DFRACEXP_DLDEXP_SUPPORTED
:
485 case PIPE_SHADER_CAP_TGSI_FMA_SUPPORTED
:
486 case PIPE_SHADER_CAP_TGSI_ANY_INOUT_DECL_RANGE
:
487 case PIPE_SHADER_CAP_MAX_SHADER_BUFFERS
:
488 case PIPE_SHADER_CAP_MAX_SHADER_IMAGES
:
490 case PIPE_SHADER_CAP_MAX_UNROLL_ITERATIONS_HINT
:
493 /* If we get here, we failed to handle a cap above */
494 debug_printf("Unexpected fragment shader query %u\n", param
);
496 case PIPE_SHADER_VERTEX
:
499 case PIPE_SHADER_CAP_MAX_INSTRUCTIONS
:
500 case PIPE_SHADER_CAP_MAX_ALU_INSTRUCTIONS
:
501 return get_uint_cap(sws
, SVGA3D_DEVCAP_MAX_VERTEX_SHADER_INSTRUCTIONS
,
503 case PIPE_SHADER_CAP_MAX_TEX_INSTRUCTIONS
:
504 case PIPE_SHADER_CAP_MAX_TEX_INDIRECTIONS
:
505 /* XXX: until we have vertex texture support */
507 case PIPE_SHADER_CAP_MAX_CONTROL_FLOW_DEPTH
:
508 return SVGA3D_MAX_NESTING_LEVEL
;
509 case PIPE_SHADER_CAP_MAX_INPUTS
:
511 case PIPE_SHADER_CAP_MAX_OUTPUTS
:
513 case PIPE_SHADER_CAP_MAX_CONST_BUFFER_SIZE
:
514 return 256 * sizeof(float[4]);
515 case PIPE_SHADER_CAP_MAX_CONST_BUFFERS
:
517 case PIPE_SHADER_CAP_MAX_TEMPS
:
518 val
= get_uint_cap(sws
, SVGA3D_DEVCAP_MAX_VERTEX_SHADER_TEMPS
, 32);
519 return MIN2(val
, SVGA3D_TEMPREG_MAX
);
520 case PIPE_SHADER_CAP_MAX_PREDS
:
522 case PIPE_SHADER_CAP_TGSI_CONT_SUPPORTED
:
524 case PIPE_SHADER_CAP_TGSI_SQRT_SUPPORTED
:
526 case PIPE_SHADER_CAP_INDIRECT_INPUT_ADDR
:
527 case PIPE_SHADER_CAP_INDIRECT_OUTPUT_ADDR
:
529 case PIPE_SHADER_CAP_INDIRECT_TEMP_ADDR
:
531 case PIPE_SHADER_CAP_INDIRECT_CONST_ADDR
:
533 case PIPE_SHADER_CAP_SUBROUTINES
:
535 case PIPE_SHADER_CAP_INTEGERS
:
537 case PIPE_SHADER_CAP_MAX_TEXTURE_SAMPLERS
:
538 case PIPE_SHADER_CAP_MAX_SAMPLER_VIEWS
:
540 case PIPE_SHADER_CAP_PREFERRED_IR
:
541 return PIPE_SHADER_IR_TGSI
;
542 case PIPE_SHADER_CAP_SUPPORTED_IRS
:
544 case PIPE_SHADER_CAP_DOUBLES
:
545 case PIPE_SHADER_CAP_TGSI_DROUND_SUPPORTED
:
546 case PIPE_SHADER_CAP_TGSI_DFRACEXP_DLDEXP_SUPPORTED
:
547 case PIPE_SHADER_CAP_TGSI_FMA_SUPPORTED
:
548 case PIPE_SHADER_CAP_TGSI_ANY_INOUT_DECL_RANGE
:
549 case PIPE_SHADER_CAP_MAX_SHADER_BUFFERS
:
550 case PIPE_SHADER_CAP_MAX_SHADER_IMAGES
:
552 case PIPE_SHADER_CAP_MAX_UNROLL_ITERATIONS_HINT
:
555 /* If we get here, we failed to handle a cap above */
556 debug_printf("Unexpected vertex shader query %u\n", param
);
558 case PIPE_SHADER_GEOMETRY
:
559 case PIPE_SHADER_COMPUTE
:
560 case PIPE_SHADER_TESS_CTRL
:
561 case PIPE_SHADER_TESS_EVAL
:
562 /* no support for geometry, tess or compute shaders at this time */
565 debug_printf("Unexpected shader type (%u) query\n", shader
);
573 vgpu10_get_shader_param(struct pipe_screen
*screen
, unsigned shader
,
574 enum pipe_shader_cap param
)
576 struct svga_screen
*svgascreen
= svga_screen(screen
);
577 struct svga_winsys_screen
*sws
= svgascreen
->sws
;
579 assert(sws
->have_vgpu10
);
580 (void) sws
; /* silence unused var warnings in non-debug builds */
582 /* Only VS, GS, FS supported */
583 if (shader
!= PIPE_SHADER_VERTEX
&&
584 shader
!= PIPE_SHADER_GEOMETRY
&&
585 shader
!= PIPE_SHADER_FRAGMENT
) {
589 /* NOTE: we do not query the device for any caps/limits at this time */
591 /* Generally the same limits for vertex, geometry and fragment shaders */
593 case PIPE_SHADER_CAP_MAX_INSTRUCTIONS
:
594 case PIPE_SHADER_CAP_MAX_ALU_INSTRUCTIONS
:
595 case PIPE_SHADER_CAP_MAX_TEX_INSTRUCTIONS
:
596 case PIPE_SHADER_CAP_MAX_TEX_INDIRECTIONS
:
598 case PIPE_SHADER_CAP_MAX_CONTROL_FLOW_DEPTH
:
600 case PIPE_SHADER_CAP_MAX_INPUTS
:
601 if (shader
== PIPE_SHADER_FRAGMENT
)
602 return VGPU10_MAX_FS_INPUTS
;
603 else if (shader
== PIPE_SHADER_GEOMETRY
)
604 return VGPU10_MAX_GS_INPUTS
;
606 return VGPU10_MAX_VS_INPUTS
;
607 case PIPE_SHADER_CAP_MAX_OUTPUTS
:
608 if (shader
== PIPE_SHADER_FRAGMENT
)
609 return VGPU10_MAX_FS_OUTPUTS
;
610 else if (shader
== PIPE_SHADER_GEOMETRY
)
611 return VGPU10_MAX_GS_OUTPUTS
;
613 return VGPU10_MAX_VS_OUTPUTS
;
614 case PIPE_SHADER_CAP_MAX_CONST_BUFFER_SIZE
:
615 return VGPU10_MAX_CONSTANT_BUFFER_ELEMENT_COUNT
* sizeof(float[4]);
616 case PIPE_SHADER_CAP_MAX_CONST_BUFFERS
:
617 return svgascreen
->max_const_buffers
;
618 case PIPE_SHADER_CAP_MAX_TEMPS
:
619 return VGPU10_MAX_TEMPS
;
620 case PIPE_SHADER_CAP_INDIRECT_INPUT_ADDR
:
621 case PIPE_SHADER_CAP_INDIRECT_OUTPUT_ADDR
:
622 case PIPE_SHADER_CAP_INDIRECT_TEMP_ADDR
:
623 case PIPE_SHADER_CAP_INDIRECT_CONST_ADDR
:
624 return TRUE
; /* XXX verify */
625 case PIPE_SHADER_CAP_MAX_PREDS
:
627 case PIPE_SHADER_CAP_TGSI_CONT_SUPPORTED
:
628 case PIPE_SHADER_CAP_TGSI_SQRT_SUPPORTED
:
629 case PIPE_SHADER_CAP_SUBROUTINES
:
630 case PIPE_SHADER_CAP_INTEGERS
:
632 case PIPE_SHADER_CAP_MAX_TEXTURE_SAMPLERS
:
633 case PIPE_SHADER_CAP_MAX_SAMPLER_VIEWS
:
634 return SVGA3D_DX_MAX_SAMPLERS
;
635 case PIPE_SHADER_CAP_PREFERRED_IR
:
636 return PIPE_SHADER_IR_TGSI
;
637 case PIPE_SHADER_CAP_SUPPORTED_IRS
:
639 case PIPE_SHADER_CAP_DOUBLES
:
640 case PIPE_SHADER_CAP_TGSI_DROUND_SUPPORTED
:
641 case PIPE_SHADER_CAP_TGSI_DFRACEXP_DLDEXP_SUPPORTED
:
642 case PIPE_SHADER_CAP_TGSI_FMA_SUPPORTED
:
643 case PIPE_SHADER_CAP_TGSI_ANY_INOUT_DECL_RANGE
:
644 case PIPE_SHADER_CAP_MAX_SHADER_BUFFERS
:
645 case PIPE_SHADER_CAP_MAX_SHADER_IMAGES
:
647 case PIPE_SHADER_CAP_MAX_UNROLL_ITERATIONS_HINT
:
650 debug_printf("Unexpected vgpu10 shader query %u\n", param
);
658 svga_get_shader_param(struct pipe_screen
*screen
, unsigned shader
,
659 enum pipe_shader_cap param
)
661 struct svga_screen
*svgascreen
= svga_screen(screen
);
662 struct svga_winsys_screen
*sws
= svgascreen
->sws
;
663 if (sws
->have_vgpu10
) {
664 return vgpu10_get_shader_param(screen
, shader
, param
);
667 return vgpu9_get_shader_param(screen
, shader
, param
);
673 * Implement pipe_screen::is_format_supported().
674 * \param bindings bitmask of PIPE_BIND_x flags
677 svga_is_format_supported( struct pipe_screen
*screen
,
678 enum pipe_format format
,
679 enum pipe_texture_target target
,
680 unsigned sample_count
,
683 struct svga_screen
*ss
= svga_screen(screen
);
684 SVGA3dSurfaceFormat svga_format
;
685 SVGA3dSurfaceFormatCaps caps
;
686 SVGA3dSurfaceFormatCaps mask
;
690 if (sample_count
> 1) {
691 /* In ms_samples, if bit N is set it means that we support
692 * multisample with N+1 samples per pixel.
694 if ((ss
->ms_samples
& (1 << (sample_count
- 1))) == 0) {
699 svga_format
= svga_translate_format(ss
, format
, bindings
);
700 if (svga_format
== SVGA3D_FORMAT_INVALID
) {
704 /* we don't support sRGB rendering into display targets */
705 if (util_format_is_srgb(format
) && (bindings
& PIPE_BIND_DISPLAY_TARGET
)) {
710 * For VGPU10 vertex formats, skip querying host capabilities
713 if (ss
->sws
->have_vgpu10
&& (bindings
& PIPE_BIND_VERTEX_BUFFER
)) {
714 SVGA3dSurfaceFormat svga_format
;
716 svga_translate_vertex_format_vgpu10(format
, &svga_format
, &flags
);
717 return svga_format
!= SVGA3D_FORMAT_INVALID
;
721 * Override host capabilities, so that we end up with the same
722 * visuals for all virtual hardware implementations.
725 if (bindings
& PIPE_BIND_DISPLAY_TARGET
) {
726 switch (svga_format
) {
727 case SVGA3D_A8R8G8B8
:
728 case SVGA3D_X8R8G8B8
:
733 case SVGA3D_B8G8R8A8_UNORM
:
734 case SVGA3D_B8G8R8X8_UNORM
:
735 case SVGA3D_B5G6R5_UNORM
:
738 /* Often unsupported/problematic. This means we end up with the same
739 * visuals for all virtual hardware implementations.
741 case SVGA3D_A4R4G4B4
:
742 case SVGA3D_A1R5G5B5
:
751 * Query the host capabilities.
754 svga_get_format_cap(ss
, svga_format
, &caps
);
756 if (bindings
& PIPE_BIND_RENDER_TARGET
) {
757 /* Check that the color surface is blendable, unless it's an
760 if (!svga_format_is_integer(svga_format
) &&
761 (caps
.value
& SVGA3DFORMAT_OP_NOALPHABLEND
)) {
767 if (bindings
& PIPE_BIND_RENDER_TARGET
) {
768 mask
.value
|= SVGA3DFORMAT_OP_OFFSCREEN_RENDERTARGET
;
770 if (bindings
& PIPE_BIND_DEPTH_STENCIL
) {
771 mask
.value
|= SVGA3DFORMAT_OP_ZSTENCIL
;
773 if (bindings
& PIPE_BIND_SAMPLER_VIEW
) {
774 mask
.value
|= SVGA3DFORMAT_OP_TEXTURE
;
777 if (target
== PIPE_TEXTURE_CUBE
) {
778 mask
.value
|= SVGA3DFORMAT_OP_CUBETEXTURE
;
780 else if (target
== PIPE_TEXTURE_3D
) {
781 mask
.value
|= SVGA3DFORMAT_OP_VOLUMETEXTURE
;
784 return (caps
.value
& mask
.value
) == mask
.value
;
789 svga_fence_reference(struct pipe_screen
*screen
,
790 struct pipe_fence_handle
**ptr
,
791 struct pipe_fence_handle
*fence
)
793 struct svga_winsys_screen
*sws
= svga_screen(screen
)->sws
;
794 sws
->fence_reference(sws
, ptr
, fence
);
799 svga_fence_finish(struct pipe_screen
*screen
,
800 struct pipe_fence_handle
*fence
,
803 struct svga_winsys_screen
*sws
= svga_screen(screen
)->sws
;
806 return sws
->fence_signalled(sws
, fence
, 0) == 0;
808 SVGA_DBG(DEBUG_DMA
|DEBUG_PERF
, "%s fence_ptr %p\n",
809 __FUNCTION__
, fence
);
811 return sws
->fence_finish(sws
, fence
, 0) == 0;
816 svga_get_driver_query_info(struct pipe_screen
*screen
,
818 struct pipe_driver_query_info
*info
)
820 #define QUERY(NAME, ENUM, UNITS) \
821 {NAME, ENUM, {0}, UNITS, PIPE_DRIVER_QUERY_RESULT_TYPE_AVERAGE, 0, 0x0}
823 static const struct pipe_driver_query_info queries
[] = {
824 /* per-frame counters */
825 QUERY("num-draw-calls", SVGA_QUERY_NUM_DRAW_CALLS
,
826 PIPE_DRIVER_QUERY_TYPE_UINT64
),
827 QUERY("num-fallbacks", SVGA_QUERY_NUM_FALLBACKS
,
828 PIPE_DRIVER_QUERY_TYPE_UINT64
),
829 QUERY("num-flushes", SVGA_QUERY_NUM_FLUSHES
,
830 PIPE_DRIVER_QUERY_TYPE_UINT64
),
831 QUERY("num-validations", SVGA_QUERY_NUM_VALIDATIONS
,
832 PIPE_DRIVER_QUERY_TYPE_UINT64
),
833 QUERY("map-buffer-time", SVGA_QUERY_MAP_BUFFER_TIME
,
834 PIPE_DRIVER_QUERY_TYPE_MICROSECONDS
),
835 QUERY("num-resources-mapped", SVGA_QUERY_NUM_RESOURCES_MAPPED
,
836 PIPE_DRIVER_QUERY_TYPE_UINT64
),
837 QUERY("num-bytes-uploaded", SVGA_QUERY_NUM_BYTES_UPLOADED
,
838 PIPE_DRIVER_QUERY_TYPE_BYTES
),
839 QUERY("command-buffer-size", SVGA_QUERY_COMMAND_BUFFER_SIZE
,
840 PIPE_DRIVER_QUERY_TYPE_BYTES
),
841 QUERY("flush-time", SVGA_QUERY_FLUSH_TIME
,
842 PIPE_DRIVER_QUERY_TYPE_MICROSECONDS
),
843 QUERY("surface-write-flushes", SVGA_QUERY_SURFACE_WRITE_FLUSHES
,
844 PIPE_DRIVER_QUERY_TYPE_UINT64
),
845 QUERY("num-readbacks", SVGA_QUERY_NUM_READBACKS
,
846 PIPE_DRIVER_QUERY_TYPE_UINT64
),
847 QUERY("num-resource-updates", SVGA_QUERY_NUM_RESOURCE_UPDATES
,
848 PIPE_DRIVER_QUERY_TYPE_UINT64
),
849 QUERY("num-buffer-uploads", SVGA_QUERY_NUM_BUFFER_UPLOADS
,
850 PIPE_DRIVER_QUERY_TYPE_UINT64
),
851 QUERY("num-const-buf-updates", SVGA_QUERY_NUM_CONST_BUF_UPDATES
,
852 PIPE_DRIVER_QUERY_TYPE_UINT64
),
853 QUERY("num-const-updates", SVGA_QUERY_NUM_CONST_UPDATES
,
854 PIPE_DRIVER_QUERY_TYPE_UINT64
),
856 /* running total counters */
857 QUERY("memory-used", SVGA_QUERY_MEMORY_USED
,
858 PIPE_DRIVER_QUERY_TYPE_BYTES
),
859 QUERY("num-shaders", SVGA_QUERY_NUM_SHADERS
,
860 PIPE_DRIVER_QUERY_TYPE_UINT64
),
861 QUERY("num-resources", SVGA_QUERY_NUM_RESOURCES
,
862 PIPE_DRIVER_QUERY_TYPE_UINT64
),
863 QUERY("num-state-objects", SVGA_QUERY_NUM_STATE_OBJECTS
,
864 PIPE_DRIVER_QUERY_TYPE_UINT64
),
865 QUERY("num-surface-views", SVGA_QUERY_NUM_SURFACE_VIEWS
,
866 PIPE_DRIVER_QUERY_TYPE_UINT64
),
867 QUERY("num-generate-mipmap", SVGA_QUERY_NUM_GENERATE_MIPMAP
,
868 PIPE_DRIVER_QUERY_TYPE_UINT64
),
873 return ARRAY_SIZE(queries
);
875 if (index
>= ARRAY_SIZE(queries
))
878 *info
= queries
[index
];
884 svga_destroy_screen( struct pipe_screen
*screen
)
886 struct svga_screen
*svgascreen
= svga_screen(screen
);
888 svga_screen_cache_cleanup(svgascreen
);
890 pipe_mutex_destroy(svgascreen
->swc_mutex
);
891 pipe_mutex_destroy(svgascreen
->tex_mutex
);
893 svgascreen
->sws
->destroy(svgascreen
->sws
);
900 * Create a new svga_screen object
903 svga_screen_create(struct svga_winsys_screen
*sws
)
905 struct svga_screen
*svgascreen
;
906 struct pipe_screen
*screen
;
909 SVGA_DEBUG
= debug_get_flags_option("SVGA_DEBUG", svga_debug_flags
, 0 );
912 svgascreen
= CALLOC_STRUCT(svga_screen
);
916 svgascreen
->debug
.force_level_surface_view
=
917 debug_get_bool_option("SVGA_FORCE_LEVEL_SURFACE_VIEW", FALSE
);
918 svgascreen
->debug
.force_surface_view
=
919 debug_get_bool_option("SVGA_FORCE_SURFACE_VIEW", FALSE
);
920 svgascreen
->debug
.force_sampler_view
=
921 debug_get_bool_option("SVGA_FORCE_SAMPLER_VIEW", FALSE
);
922 svgascreen
->debug
.no_surface_view
=
923 debug_get_bool_option("SVGA_NO_SURFACE_VIEW", FALSE
);
924 svgascreen
->debug
.no_sampler_view
=
925 debug_get_bool_option("SVGA_NO_SAMPLER_VIEW", FALSE
);
927 screen
= &svgascreen
->screen
;
929 screen
->destroy
= svga_destroy_screen
;
930 screen
->get_name
= svga_get_name
;
931 screen
->get_vendor
= svga_get_vendor
;
932 screen
->get_device_vendor
= svga_get_vendor
; // TODO actual device vendor
933 screen
->get_param
= svga_get_param
;
934 screen
->get_shader_param
= svga_get_shader_param
;
935 screen
->get_paramf
= svga_get_paramf
;
936 screen
->get_timestamp
= NULL
;
937 screen
->is_format_supported
= svga_is_format_supported
;
938 screen
->context_create
= svga_context_create
;
939 screen
->fence_reference
= svga_fence_reference
;
940 screen
->fence_finish
= svga_fence_finish
;
941 screen
->get_driver_query_info
= svga_get_driver_query_info
;
942 svgascreen
->sws
= sws
;
944 svga_init_screen_resource_functions(svgascreen
);
946 if (sws
->get_hw_version
) {
947 svgascreen
->hw_version
= sws
->get_hw_version(sws
);
949 svgascreen
->hw_version
= SVGA3D_HWVERSION_WS65_B1
;
953 * The D16, D24X8, and D24S8 formats always do an implicit shadow compare
954 * when sampled from, where as the DF16, DF24, and D24S8_INT do not. So
955 * we prefer the later when available.
957 * This mimics hardware vendors extensions for D3D depth sampling. See also
958 * http://aras-p.info/texts/D3D9GPUHacks.html
962 boolean has_df16
, has_df24
, has_d24s8_int
;
963 SVGA3dSurfaceFormatCaps caps
;
964 SVGA3dSurfaceFormatCaps mask
;
969 svgascreen
->depth
.z16
= SVGA3D_Z_D16
;
970 svgascreen
->depth
.x8z24
= SVGA3D_Z_D24X8
;
971 svgascreen
->depth
.s8z24
= SVGA3D_Z_D24S8
;
973 svga_get_format_cap(svgascreen
, SVGA3D_Z_DF16
, &caps
);
974 has_df16
= (caps
.value
& mask
.value
) == mask
.value
;
976 svga_get_format_cap(svgascreen
, SVGA3D_Z_DF24
, &caps
);
977 has_df24
= (caps
.value
& mask
.value
) == mask
.value
;
979 svga_get_format_cap(svgascreen
, SVGA3D_Z_D24S8_INT
, &caps
);
980 has_d24s8_int
= (caps
.value
& mask
.value
) == mask
.value
;
982 /* XXX: We might want some other logic here.
983 * Like if we only have d24s8_int we should
984 * emulate the other formats with that.
987 svgascreen
->depth
.z16
= SVGA3D_Z_DF16
;
990 svgascreen
->depth
.x8z24
= SVGA3D_Z_DF24
;
993 svgascreen
->depth
.s8z24
= SVGA3D_Z_D24S8_INT
;
999 if (sws
->have_vgpu10
) {
1000 svgascreen
->haveProvokingVertex
1001 = get_bool_cap(sws
, SVGA3D_DEVCAP_DX_PROVOKING_VERTEX
, FALSE
);
1002 svgascreen
->haveLineSmooth
= TRUE
;
1003 svgascreen
->maxPointSize
= 80.0F
;
1004 svgascreen
->max_color_buffers
= SVGA3D_DX_MAX_RENDER_TARGETS
;
1006 /* Multisample samples per pixel */
1007 if (debug_get_bool_option("SVGA_MSAA", TRUE
)) {
1008 svgascreen
->ms_samples
=
1009 get_uint_cap(sws
, SVGA3D_DEVCAP_MULTISAMPLE_MASKABLESAMPLES
, 0);
1012 /* Maximum number of constant buffers */
1013 svgascreen
->max_const_buffers
=
1014 get_uint_cap(sws
, SVGA3D_DEVCAP_DX_MAX_CONSTANT_BUFFERS
, 1);
1015 assert(svgascreen
->max_const_buffers
<= SVGA_MAX_CONST_BUFS
);
1019 unsigned vs_ver
= get_uint_cap(sws
, SVGA3D_DEVCAP_VERTEX_SHADER_VERSION
,
1020 SVGA3DVSVERSION_NONE
);
1021 unsigned fs_ver
= get_uint_cap(sws
, SVGA3D_DEVCAP_FRAGMENT_SHADER_VERSION
,
1022 SVGA3DPSVERSION_NONE
);
1024 /* we require Shader model 3.0 or later */
1025 if (fs_ver
< SVGA3DPSVERSION_30
|| vs_ver
< SVGA3DVSVERSION_30
) {
1029 svgascreen
->haveProvokingVertex
= FALSE
;
1031 svgascreen
->haveLineSmooth
=
1032 get_bool_cap(sws
, SVGA3D_DEVCAP_LINE_AA
, FALSE
);
1034 svgascreen
->maxPointSize
=
1035 get_float_cap(sws
, SVGA3D_DEVCAP_MAX_POINT_SIZE
, 1.0f
);
1036 /* Keep this to a reasonable size to avoid failures in conform/pntaa.c */
1037 svgascreen
->maxPointSize
= MIN2(svgascreen
->maxPointSize
, 80.0f
);
1039 /* The SVGA3D device always supports 4 targets at this time, regardless
1040 * of what querying SVGA3D_DEVCAP_MAX_RENDER_TARGETS might return.
1042 svgascreen
->max_color_buffers
= 4;
1044 /* Only support one constant buffer
1046 svgascreen
->max_const_buffers
= 1;
1048 /* No multisampling */
1049 svgascreen
->ms_samples
= 0;
1052 /* common VGPU9 / VGPU10 caps */
1053 svgascreen
->haveLineStipple
=
1054 get_bool_cap(sws
, SVGA3D_DEVCAP_LINE_STIPPLE
, FALSE
);
1056 svgascreen
->maxLineWidth
=
1057 get_float_cap(sws
, SVGA3D_DEVCAP_MAX_LINE_WIDTH
, 1.0f
);
1059 svgascreen
->maxLineWidthAA
=
1060 get_float_cap(sws
, SVGA3D_DEVCAP_MAX_AA_LINE_WIDTH
, 1.0f
);
1063 debug_printf("svga: haveProvokingVertex %u\n",
1064 svgascreen
->haveProvokingVertex
);
1065 debug_printf("svga: haveLineStip %u "
1066 "haveLineSmooth %u maxLineWidth %f\n",
1067 svgascreen
->haveLineStipple
, svgascreen
->haveLineSmooth
,
1068 svgascreen
->maxLineWidth
);
1069 debug_printf("svga: maxPointSize %g\n", svgascreen
->maxPointSize
);
1072 pipe_mutex_init(svgascreen
->tex_mutex
);
1073 pipe_mutex_init(svgascreen
->swc_mutex
);
1075 svga_screen_cache_init(svgascreen
);
1084 struct svga_winsys_screen
*
1085 svga_winsys_screen(struct pipe_screen
*screen
)
1087 return svga_screen(screen
)->sws
;
1091 struct svga_screen
*
1092 svga_screen(struct pipe_screen
*screen
)
1095 assert(screen
->destroy
== svga_destroy_screen
);
1096 return (struct svga_screen
*)screen
;