1 /**********************************************************
2 * Copyright 2008-2009 VMware, Inc. All rights reserved.
4 * Permission is hereby granted, free of charge, to any person
5 * obtaining a copy of this software and associated documentation
6 * files (the "Software"), to deal in the Software without
7 * restriction, including without limitation the rights to use, copy,
8 * modify, merge, publish, distribute, sublicense, and/or sell copies
9 * of the Software, and to permit persons to whom the Software is
10 * furnished to do so, subject to the following conditions:
12 * The above copyright notice and this permission notice shall be
13 * included in all copies or substantial portions of the Software.
15 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
16 * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
17 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
18 * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
19 * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
20 * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
21 * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
24 **********************************************************/
26 #include "util/u_memory.h"
27 #include "util/u_inlines.h"
28 #include "util/u_string.h"
29 #include "util/u_math.h"
31 #include "svga_winsys.h"
32 #include "svga_public.h"
33 #include "svga_context.h"
34 #include "svga_format.h"
35 #include "svga_screen.h"
36 #include "svga_resource_texture.h"
37 #include "svga_resource.h"
38 #include "svga_debug.h"
40 #include "svga3d_shaderdefs.h"
/*
 * Name-to-flag table for the SVGA_DEBUG option.  Each entry pairs an option
 * string ("dma", "tgsi", ...) with the DEBUG_* bit it selects; the third
 * field is NULL for every entry.  svga_screen_create() passes this table to
 * debug_get_flags_option("SVGA_DEBUG", ...).
 * NOTE(review): the terminating entry and the closing brace of the array are
 * not visible here -- confirm the table is properly terminated.
 */
46 static const struct debug_named_value svga_debug_flags
[] = {
47 { "dma", DEBUG_DMA
, NULL
},
48 { "tgsi", DEBUG_TGSI
, NULL
},
49 { "pipe", DEBUG_PIPE
, NULL
},
50 { "state", DEBUG_STATE
, NULL
},
51 { "screen", DEBUG_SCREEN
, NULL
},
52 { "tex", DEBUG_TEX
, NULL
},
53 { "swtnl", DEBUG_SWTNL
, NULL
},
54 { "const", DEBUG_CONSTS
, NULL
},
55 { "viewport", DEBUG_VIEWPORT
, NULL
},
56 { "views", DEBUG_VIEWS
, NULL
},
57 { "perf", DEBUG_PERF
, NULL
},
58 { "flush", DEBUG_FLUSH
, NULL
},
59 { "sync", DEBUG_SYNC
, NULL
},
60 { "cache", DEBUG_CACHE
, NULL
},
/*
 * pipe_screen::get_vendor hook (installed in svga_screen_create()).
 * Returns the constant string "VMware, Inc."; pscreen is not used by the
 * visible code.
 */
66 svga_get_vendor( struct pipe_screen
*pscreen
)
68 return "VMware, Inc.";
/*
 * pipe_screen::get_name hook (installed in svga_screen_create()).
 * Formats "SVGA3D; <build> <mutex> <llvm>" with util_snprintf() into a
 * function-local static 100-byte buffer, so the same storage is reused on
 * every call.  'build' is set to either "build: DEBUG;" or "build: RELEASE;",
 * 'mutex' to "mutex: " PIPE_ATOMIC ";", and 'llvm' keeps its initial empty
 * string in the visible code.
 * NOTE(review): the condition choosing between the DEBUG and RELEASE strings
 * and the return statement are not visible here -- presumably a DEBUG
 * preprocessor check and "return name"; confirm.
 */
73 svga_get_name( struct pipe_screen
*pscreen
)
75 const char *build
= "", *llvm
= "", *mutex
= "";
76 static char name
[100];
78 /* Only return internal details in the DEBUG version:
80 build
= "build: DEBUG;";
81 mutex
= "mutex: " PIPE_ATOMIC
";";
86 build
= "build: RELEASE;";
89 util_snprintf(name
, sizeof(name
), "SVGA3D; %s %s %s", build
, mutex
, llvm
);
/*
 * pipe_screen::get_paramf hook (installed in svga_screen_create()): answers
 * floating-point capability queries identified by 'param'.
 *
 * Visible behaviour:
 *  - PIPE_CAPF_MAX_POINT_WIDTH / PIPE_CAPF_MAX_POINT_WIDTH_AA return the
 *    maxPointSize value cached on the svga_screen by svga_screen_create().
 *  - PIPE_CAPF_MAX_TEXTURE_ANISOTROPY asks the winsys via
 *    sws->get_cap(SVGA3D_DEVCAP_MAX_TEXTURE_ANISOTROPY).
 *  - A query that is not handled is reported with debug_printf().
 * NOTE(review): the values returned for the line-width, anisotropy and
 * LOD-bias cases, and the final fallback return, are not visible here --
 * confirm against the full source.
 */
97 svga_get_paramf(struct pipe_screen
*screen
, enum pipe_capf param
)
99 struct svga_screen
*svgascreen
= svga_screen(screen
);
100 struct svga_winsys_screen
*sws
= svgascreen
->sws
;
101 SVGA3dDevCapResult result
;
104 case PIPE_CAPF_MAX_LINE_WIDTH
:
106 case PIPE_CAPF_MAX_LINE_WIDTH_AA
:
109 case PIPE_CAPF_MAX_POINT_WIDTH
:
111 case PIPE_CAPF_MAX_POINT_WIDTH_AA
:
112 return svgascreen
->maxPointSize
;
114 case PIPE_CAPF_MAX_TEXTURE_ANISOTROPY
:
115 if(!sws
->get_cap(sws
, SVGA3D_DEVCAP_MAX_TEXTURE_ANISOTROPY
, &result
))
119 case PIPE_CAPF_MAX_TEXTURE_LOD_BIAS
:
123 debug_printf("Unexpected PIPE_CAPF_ query %u\n", param
);
/*
 * pipe_screen::get_param hook (installed in svga_screen_create()): answers
 * integer/boolean capability queries identified by 'param'.
 *
 * Visible behaviour:
 *  - PIPE_CAP_MAX_RENDER_TARGETS queries SVGA3D_DEVCAP_MAX_RENDER_TARGETS
 *    and returns the host value clamped to PIPE_MAX_COLOR_BUFS.
 *  - PIPE_CAP_MAX_TEXTURE_2D_LEVELS starts from SVGA_MAX_TEXTURE_LEVELS and
 *    lowers it to util_logbase2(size) + 1 for the host's maximum texture
 *    width and height when those caps can be queried.  The value 12
 *    (2048x2048) also appears, presumably as the fallback when a query
 *    fails -- confirm.
 *  - PIPE_CAP_MAX_TEXTURE_3D_LEVELS returns 8 (128x128x128) when the volume
 *    extent cap cannot be queried, otherwise util_logbase2(extent) + 1
 *    clamped to SVGA_MAX_TEXTURE_LEVELS.
 *  - PIPE_CAP_MAX_TEXTURE_CUBE_LEVELS is derived from this screen's own
 *    PIPE_CAP_MAX_TEXTURE_2D_LEVELS answer via MIN2(); the second MIN2
 *    operand is not visible here.
 *  - PIPE_CAP_VERTEX_COLOR_UNCLAMPED returns 1; PIPE_CAP_VERTEX_COLOR_CLAMPED
 *    and PIPE_CAP_FRAGMENT_COLOR_CLAMPED return 0.
 *  - The caps listed under "Unsupported features" share one result,
 *    presumably 0 -- confirm.
 *  - A query that is not handled is reported with debug_printf().
 * NOTE(review): the return statements of most other cases are not visible
 * here; do not infer their values from the case labels alone.
 */
130 svga_get_param(struct pipe_screen
*screen
, enum pipe_cap param
)
132 struct svga_screen
*svgascreen
= svga_screen(screen
);
133 struct svga_winsys_screen
*sws
= svgascreen
->sws
;
134 SVGA3dDevCapResult result
;
137 case PIPE_CAP_MAX_COMBINED_SAMPLERS
:
139 case PIPE_CAP_NPOT_TEXTURES
:
141 case PIPE_CAP_TWO_SIDED_STENCIL
:
143 case PIPE_CAP_MAX_DUAL_SOURCE_RENDER_TARGETS
:
145 case PIPE_CAP_ANISOTROPIC_FILTER
:
147 case PIPE_CAP_POINT_SPRITE
:
149 case PIPE_CAP_MAX_RENDER_TARGETS
:
150 if(!sws
->get_cap(sws
, SVGA3D_DEVCAP_MAX_RENDER_TARGETS
, &result
))
154 return MIN2(result
.u
, PIPE_MAX_COLOR_BUFS
);
155 case PIPE_CAP_OCCLUSION_QUERY
:
157 case PIPE_CAP_TIMER_QUERY
:
159 case PIPE_CAP_TEXTURE_SHADOW_MAP
:
161 case PIPE_CAP_TEXTURE_SWIZZLE
:
163 case PIPE_CAP_USER_VERTEX_BUFFERS
:
164 case PIPE_CAP_USER_INDEX_BUFFERS
:
165 case PIPE_CAP_USER_CONSTANT_BUFFERS
:
168 case PIPE_CAP_MAX_TEXTURE_2D_LEVELS
:
170 unsigned levels
= SVGA_MAX_TEXTURE_LEVELS
;
171 if (sws
->get_cap(sws
, SVGA3D_DEVCAP_MAX_TEXTURE_WIDTH
, &result
))
172 levels
= MIN2(util_logbase2(result
.u
) + 1, levels
);
174 levels
= 12 /* 2048x2048 */;
175 if (sws
->get_cap(sws
, SVGA3D_DEVCAP_MAX_TEXTURE_HEIGHT
, &result
))
176 levels
= MIN2(util_logbase2(result
.u
) + 1, levels
);
178 levels
= 12 /* 2048x2048 */;
182 case PIPE_CAP_MAX_TEXTURE_3D_LEVELS
:
183 if (!sws
->get_cap(sws
, SVGA3D_DEVCAP_MAX_VOLUME_EXTENT
, &result
))
184 return 8; /* max 128x128x128 */
185 return MIN2(util_logbase2(result
.u
) + 1, SVGA_MAX_TEXTURE_LEVELS
);
187 case PIPE_CAP_MAX_TEXTURE_CUBE_LEVELS
:
189 * No mechanism to query the host, and at least limited to 2048x2048 on
192 return MIN2(screen
->get_param(screen
, PIPE_CAP_MAX_TEXTURE_2D_LEVELS
),
195 case PIPE_CAP_BLEND_EQUATION_SEPARATE
: /* req. for GL 1.5 */
198 case PIPE_CAP_TGSI_FS_COORD_ORIGIN_UPPER_LEFT
:
199 case PIPE_CAP_TGSI_FS_COORD_PIXEL_CENTER_HALF_INTEGER
:
201 case PIPE_CAP_TGSI_FS_COORD_ORIGIN_LOWER_LEFT
:
202 case PIPE_CAP_TGSI_FS_COORD_PIXEL_CENTER_INTEGER
:
205 case PIPE_CAP_DEPTHSTENCIL_CLEAR_SEPARATE
:
208 case PIPE_CAP_VERTEX_COLOR_UNCLAMPED
:
209 return 1; /* The color outputs of vertex shaders are not clamped */
210 case PIPE_CAP_VERTEX_COLOR_CLAMPED
:
211 return 0; /* The driver can't clamp vertex colors */
212 case PIPE_CAP_FRAGMENT_COLOR_CLAMPED
:
213 return 0; /* The driver can't clamp fragment colors */
215 /* Unsupported features */
216 case PIPE_CAP_MIXED_COLORBUFFER_FORMATS
:
217 case PIPE_CAP_QUADS_FOLLOW_PROVOKING_VERTEX_CONVENTION
:
218 case PIPE_CAP_TEXTURE_MIRROR_CLAMP
:
220 case PIPE_CAP_SHADER_STENCIL_EXPORT
:
221 case PIPE_CAP_DEPTH_CLIP_DISABLE
:
222 case PIPE_CAP_SEAMLESS_CUBE_MAP
:
223 case PIPE_CAP_SEAMLESS_CUBE_MAP_PER_TEXTURE
:
224 case PIPE_CAP_INDEP_BLEND_ENABLE
:
225 case PIPE_CAP_INDEP_BLEND_FUNC
:
226 case PIPE_CAP_MAX_STREAM_OUTPUT_BUFFERS
:
227 case PIPE_CAP_PRIMITIVE_RESTART
:
228 case PIPE_CAP_TGSI_INSTANCEID
:
229 case PIPE_CAP_VERTEX_ELEMENT_INSTANCE_DIVISOR
:
230 case PIPE_CAP_MAX_TEXTURE_ARRAY_LAYERS
:
231 case PIPE_CAP_MIN_TEXEL_OFFSET
:
232 case PIPE_CAP_MAX_TEXEL_OFFSET
:
233 case PIPE_CAP_CONDITIONAL_RENDER
:
234 case PIPE_CAP_TEXTURE_BARRIER
:
235 case PIPE_CAP_MAX_STREAM_OUTPUT_SEPARATE_COMPONENTS
:
236 case PIPE_CAP_MAX_STREAM_OUTPUT_INTERLEAVED_COMPONENTS
:
237 case PIPE_CAP_STREAM_OUTPUT_PAUSE_RESUME
:
238 case PIPE_CAP_TGSI_CAN_COMPACT_VARYINGS
:
239 case PIPE_CAP_TGSI_CAN_COMPACT_CONSTANTS
:
240 case PIPE_CAP_GLSL_FEATURE_LEVEL
:
244 debug_printf("Unexpected PIPE_CAP_ query %u\n", param
);
/*
 * pipe_screen::get_shader_param hook (installed in svga_screen_create()):
 * answers per-shader-stage capability queries.  'shader' selects the stage
 * (PIPE_SHADER_FRAGMENT, PIPE_SHADER_VERTEX, PIPE_SHADER_GEOMETRY) and
 * 'param' the capability.
 *
 * Visible behaviour:
 *  - PIPE_SHADER_CAP_MAX_CONTROL_FLOW_DEPTH returns SVGA3D_MAX_NESTING_LEVEL
 *    for both the fragment and the vertex stage.
 *  - PIPE_SHADER_CAP_MAX_TEMPS queries the host
 *    (SVGA3D_DEVCAP_MAX_FRAGMENT_SHADER_TEMPS or
 *    SVGA3D_DEVCAP_MAX_VERTEX_SHADER_TEMPS) and returns the result clamped
 *    to SVGA3D_TEMPREG_MAX.
 *  - Vertex PIPE_SHADER_CAP_MAX_INSTRUCTIONS / MAX_ALU_INSTRUCTIONS query
 *    SVGA3D_DEVCAP_MAX_VERTEX_SHADER_INSTRUCTIONS.
 *  - Geometry shaders are not supported, per the comment on that case.
 * NOTE(review): the enclosing switch statements and most return statements
 * are not visible here, so the values of the remaining caps cannot be
 * confirmed from this view.
 * NOTE(review): the message "Unexpected vertex shader query" is printed at
 * three places, including after the PIPE_SHADER_FRAGMENT cases and after the
 * PIPE_SHADER_GEOMETRY case.  That looks like a copy-paste; consider making
 * the fragment/default messages stage-specific.
 */
249 static int svga_get_shader_param(struct pipe_screen
*screen
, unsigned shader
, enum pipe_shader_cap param
)
251 struct svga_screen
*svgascreen
= svga_screen(screen
);
252 struct svga_winsys_screen
*sws
= svgascreen
->sws
;
253 SVGA3dDevCapResult result
;
257 case PIPE_SHADER_FRAGMENT
:
260 case PIPE_SHADER_CAP_MAX_INSTRUCTIONS
:
261 case PIPE_SHADER_CAP_MAX_ALU_INSTRUCTIONS
:
262 case PIPE_SHADER_CAP_MAX_TEX_INSTRUCTIONS
:
263 case PIPE_SHADER_CAP_MAX_TEX_INDIRECTIONS
:
265 case PIPE_SHADER_CAP_MAX_CONTROL_FLOW_DEPTH
:
266 return SVGA3D_MAX_NESTING_LEVEL
;
267 case PIPE_SHADER_CAP_MAX_INPUTS
:
269 case PIPE_SHADER_CAP_MAX_CONSTS
:
271 case PIPE_SHADER_CAP_MAX_CONST_BUFFERS
:
273 case PIPE_SHADER_CAP_MAX_TEMPS
:
274 if (!sws
->get_cap(sws
, SVGA3D_DEVCAP_MAX_FRAGMENT_SHADER_TEMPS
, &result
))
276 return MIN2(result
.u
, SVGA3D_TEMPREG_MAX
);
277 case PIPE_SHADER_CAP_MAX_ADDRS
:
278 case PIPE_SHADER_CAP_INDIRECT_INPUT_ADDR
:
280 * Although PS 3.0 has some addressing abilities it can only represent
281 * loops that can be statically determined and unrolled. Given we can
282 * only handle a subset of the cases that the state tracker already
283 * does it is better to defer loop unrolling to the state tracker.
286 case PIPE_SHADER_CAP_MAX_PREDS
:
288 case PIPE_SHADER_CAP_TGSI_CONT_SUPPORTED
:
290 case PIPE_SHADER_CAP_INDIRECT_OUTPUT_ADDR
:
291 case PIPE_SHADER_CAP_INDIRECT_TEMP_ADDR
:
292 case PIPE_SHADER_CAP_INDIRECT_CONST_ADDR
:
294 case PIPE_SHADER_CAP_SUBROUTINES
:
296 case PIPE_SHADER_CAP_INTEGERS
:
298 case PIPE_SHADER_CAP_MAX_TEXTURE_SAMPLERS
:
301 debug_printf("Unexpected vertex shader query %u\n", param
);
305 case PIPE_SHADER_VERTEX
:
308 case PIPE_SHADER_CAP_MAX_INSTRUCTIONS
:
309 case PIPE_SHADER_CAP_MAX_ALU_INSTRUCTIONS
:
310 if (!sws
->get_cap(sws
, SVGA3D_DEVCAP_MAX_VERTEX_SHADER_INSTRUCTIONS
, &result
))
313 case PIPE_SHADER_CAP_MAX_TEX_INSTRUCTIONS
:
314 case PIPE_SHADER_CAP_MAX_TEX_INDIRECTIONS
:
315 /* XXX: until we have vertex texture support */
317 case PIPE_SHADER_CAP_MAX_CONTROL_FLOW_DEPTH
:
318 return SVGA3D_MAX_NESTING_LEVEL
;
319 case PIPE_SHADER_CAP_MAX_INPUTS
:
321 case PIPE_SHADER_CAP_MAX_CONSTS
:
323 case PIPE_SHADER_CAP_MAX_CONST_BUFFERS
:
325 case PIPE_SHADER_CAP_MAX_TEMPS
:
326 if (!sws
->get_cap(sws
, SVGA3D_DEVCAP_MAX_VERTEX_SHADER_TEMPS
, &result
))
328 return MIN2(result
.u
, SVGA3D_TEMPREG_MAX
);
329 case PIPE_SHADER_CAP_MAX_ADDRS
:
331 case PIPE_SHADER_CAP_MAX_PREDS
:
333 case PIPE_SHADER_CAP_TGSI_CONT_SUPPORTED
:
335 case PIPE_SHADER_CAP_INDIRECT_INPUT_ADDR
:
336 case PIPE_SHADER_CAP_INDIRECT_OUTPUT_ADDR
:
338 case PIPE_SHADER_CAP_INDIRECT_TEMP_ADDR
:
340 case PIPE_SHADER_CAP_INDIRECT_CONST_ADDR
:
342 case PIPE_SHADER_CAP_SUBROUTINES
:
344 case PIPE_SHADER_CAP_INTEGERS
:
346 case PIPE_SHADER_CAP_MAX_TEXTURE_SAMPLERS
:
349 debug_printf("Unexpected vertex shader query %u\n", param
);
353 case PIPE_SHADER_GEOMETRY
:
354 /* no support for geometry shaders at this time */
357 debug_printf("Unexpected vertex shader query %u\n", param
);
/*
 * pipe_screen::is_format_supported hook (installed in svga_screen_create()).
 *
 * Visible flow:
 *  1. sample_count > 1 is special-cased first (presumably rejected, i.e. no
 *     multisampling -- confirm; the branch body is not visible).
 *  2. The pipe format is translated with svga_translate_format(); a result
 *     of SVGA3D_FORMAT_INVALID is special-cased (presumably "unsupported").
 *  3. For PIPE_BIND_DISPLAY_TARGET the answer is decided per SVGA format
 *     (A8R8G8B8/X8R8G8B8 versus A4R4G4B4/A1R5G5B5) without consulting the
 *     host, so visuals are the same on every virtual hardware version.
 *  4. Otherwise the host caps are fetched with svga_get_format_cap() and a
 *     mask is built from the bind flags (offscreenRenderTarget for
 *     PIPE_BIND_RENDER_TARGET; the bits set for PIPE_BIND_DEPTH_STENCIL and
 *     PIPE_BIND_SAMPLER_VIEW are not visible).  The format is supported when
 *     every mask bit is present in the caps.
 * NOTE(review): 'tex_usage' is used below but its parameter declaration is
 * not visible here; 'target' is not referenced by the visible code.
 */
365 svga_is_format_supported( struct pipe_screen
*screen
,
366 enum pipe_format format
,
367 enum pipe_texture_target target
,
368 unsigned sample_count
,
371 struct svga_screen
*ss
= svga_screen(screen
);
372 SVGA3dSurfaceFormat svga_format
;
373 SVGA3dSurfaceFormatCaps caps
;
374 SVGA3dSurfaceFormatCaps mask
;
378 if (sample_count
> 1) {
382 svga_format
= svga_translate_format(ss
, format
, tex_usage
);
383 if (svga_format
== SVGA3D_FORMAT_INVALID
) {
388 * Override host capabilities, so that we end up with the same
389 * visuals for all virtual hardware implementations.
392 if (tex_usage
& PIPE_BIND_DISPLAY_TARGET
) {
393 switch (svga_format
) {
394 case SVGA3D_A8R8G8B8
:
395 case SVGA3D_X8R8G8B8
:
399 /* Often unsupported/problematic. This means we end up with the same
400 * visuals for all virtual hardware implementations.
402 case SVGA3D_A4R4G4B4
:
403 case SVGA3D_A1R5G5B5
:
412 * Query the host capabilities.
415 svga_get_format_cap(ss
, svga_format
, &caps
);
418 if (tex_usage
& PIPE_BIND_RENDER_TARGET
) {
419 mask
.offscreenRenderTarget
= 1;
421 if (tex_usage
& PIPE_BIND_DEPTH_STENCIL
) {
424 if (tex_usage
& PIPE_BIND_SAMPLER_VIEW
) {
428 return (caps
.value
& mask
.value
) == mask
.value
;
/*
 * pipe_screen::fence_reference hook (installed in svga_screen_create()).
 * Forwards 'ptr' and 'fence' unchanged to the winsys fence_reference()
 * callback of the screen's svga_winsys_screen; no other work is done here.
 */
433 svga_fence_reference(struct pipe_screen
*screen
,
434 struct pipe_fence_handle
**ptr
,
435 struct pipe_fence_handle
*fence
)
437 struct svga_winsys_screen
*sws
= svga_screen(screen
)->sws
;
438 sws
->fence_reference(sws
, ptr
, fence
);
/*
 * pipe_screen::fence_signalled hook (installed in svga_screen_create()).
 * Calls the winsys fence_signalled() callback with a flag argument of 0 and
 * returns non-zero exactly when that callback returns 0.
 */
443 svga_fence_signalled(struct pipe_screen
*screen
,
444 struct pipe_fence_handle
*fence
)
446 struct svga_winsys_screen
*sws
= svga_screen(screen
)->sws
;
447 return sws
->fence_signalled(sws
, fence
, 0) == 0;
/*
 * pipe_screen::fence_finish hook (installed in svga_screen_create()).
 * Emits a debug trace (DEBUG_DMA | DEBUG_PERF) with the fence pointer, then
 * calls the winsys fence_finish() callback with a flag argument of 0 and
 * returns non-zero exactly when that callback returns 0.
 * NOTE(review): the parameter list continues past 'fence' but the remaining
 * parameter is not visible here; the visible code does not forward it to
 * the winsys -- confirm that is intended.
 */
452 svga_fence_finish(struct pipe_screen
*screen
,
453 struct pipe_fence_handle
*fence
,
456 struct svga_winsys_screen
*sws
= svga_screen(screen
)->sws
;
458 SVGA_DBG(DEBUG_DMA
|DEBUG_PERF
, "%s fence_ptr %p\n",
459 __FUNCTION__
, fence
);
461 return sws
->fence_finish(sws
, fence
, 0) == 0;
/*
 * pipe_screen::destroy hook (installed in svga_screen_create()).
 * Tears down in this order: the screen cache, the swc and tex mutexes, and
 * finally the winsys screen via its own destroy() callback.
 * NOTE(review): releasing the svga_screen allocation itself is not visible
 * here -- confirm it is freed after the winsys is destroyed.
 */
466 svga_destroy_screen( struct pipe_screen
*screen
)
468 struct svga_screen
*svgascreen
= svga_screen(screen
);
470 svga_screen_cache_cleanup(svgascreen
);
472 pipe_mutex_destroy(svgascreen
->swc_mutex
);
473 pipe_mutex_destroy(svgascreen
->tex_mutex
);
475 svgascreen
->sws
->destroy(svgascreen
->sws
);
482 * Create a new svga_screen object
/*
 * Build an svga_screen on top of the given winsys screen 'sws'.
 *
 * Visible steps, in order:
 *  - Read the SVGA_DEBUG flag set (via svga_debug_flags) into SVGA_DEBUG.
 *  - Allocate the svga_screen with CALLOC_STRUCT and read the
 *    SVGA_FORCE_* / SVGA_NO_* boolean debug options (all default FALSE).
 *  - Install the pipe_screen callbacks (destroy, get_name, get_vendor,
 *    get_param, get_shader_param, get_paramf, is_format_supported,
 *    context_create, fence_*), store 'sws', and set up the resource
 *    functions.
 *  - Take hw_version from sws->get_hw_version() when the winsys provides
 *    that hook; SVGA3D_HWVERSION_WS65_B1 is the other value assigned,
 *    presumably as the fallback.
 *  - Check that both the fragment and vertex shader version caps are at
 *    least 3.0; Shader Model 3.0 is required.
 *  - Pick depth formats: D16 / D24X8 / D24S8 by default, with DF16 / DF24 /
 *    D24S8_INT as the alternatives, based on has_df16 / has_df24 /
 *    has_d24s8_int computed from the host format caps.
 *  - Cache maxPointSize: 1.0 if the cap cannot be queried, otherwise the
 *    host value clamped to 80.0.
 *  - Initialise the tex and swc mutexes and the screen cache.
 * NOTE(review): the allocation-failure and "no SM3.0" error paths, the
 * conditions guarding the DF16/DF24/D24S8_INT assignments, the setup of
 * 'mask', and the return statement are not visible here -- confirm against
 * the full source.
 */
485 svga_screen_create(struct svga_winsys_screen
*sws
)
487 struct svga_screen
*svgascreen
;
488 struct pipe_screen
*screen
;
489 SVGA3dDevCapResult result
;
490 boolean use_vs30
, use_ps30
;
493 SVGA_DEBUG
= debug_get_flags_option("SVGA_DEBUG", svga_debug_flags
, 0 );
496 svgascreen
= CALLOC_STRUCT(svga_screen
);
500 svgascreen
->debug
.force_level_surface_view
=
501 debug_get_bool_option("SVGA_FORCE_LEVEL_SURFACE_VIEW", FALSE
);
502 svgascreen
->debug
.force_surface_view
=
503 debug_get_bool_option("SVGA_FORCE_SURFACE_VIEW", FALSE
);
504 svgascreen
->debug
.force_sampler_view
=
505 debug_get_bool_option("SVGA_FORCE_SAMPLER_VIEW", FALSE
);
506 svgascreen
->debug
.no_surface_view
=
507 debug_get_bool_option("SVGA_NO_SURFACE_VIEW", FALSE
);
508 svgascreen
->debug
.no_sampler_view
=
509 debug_get_bool_option("SVGA_NO_SAMPLER_VIEW", FALSE
);
511 screen
= &svgascreen
->screen
;
513 screen
->destroy
= svga_destroy_screen
;
514 screen
->get_name
= svga_get_name
;
515 screen
->get_vendor
= svga_get_vendor
;
516 screen
->get_param
= svga_get_param
;
517 screen
->get_shader_param
= svga_get_shader_param
;
518 screen
->get_paramf
= svga_get_paramf
;
519 screen
->is_format_supported
= svga_is_format_supported
;
520 screen
->context_create
= svga_context_create
;
521 screen
->fence_reference
= svga_fence_reference
;
522 screen
->fence_signalled
= svga_fence_signalled
;
523 screen
->fence_finish
= svga_fence_finish
;
524 svgascreen
->sws
= sws
;
526 svga_init_screen_resource_functions(svgascreen
);
528 if (sws
->get_hw_version
) {
529 svgascreen
->hw_version
= sws
->get_hw_version(sws
);
531 svgascreen
->hw_version
= SVGA3D_HWVERSION_WS65_B1
;
535 sws
->get_cap(sws
, SVGA3D_DEVCAP_FRAGMENT_SHADER_VERSION
, &result
) &&
536 result
.u
>= SVGA3DPSVERSION_30
? TRUE
: FALSE
;
539 sws
->get_cap(sws
, SVGA3D_DEVCAP_VERTEX_SHADER_VERSION
, &result
) &&
540 result
.u
>= SVGA3DVSVERSION_30
? TRUE
: FALSE
;
542 /* we require Shader model 3.0 or later */
543 if (!use_ps30
|| !use_vs30
)
547 * The D16, D24X8, and D24S8 formats always do an implicit shadow compare
548 * when sampled from, where as the DF16, DF24, and D24S8_INT do not. So
549 * we prefer the later when available.
551 * This mimics hardware vendors extensions for D3D depth sampling. See also
552 * http://aras-p.info/texts/D3D9GPUHacks.html
556 boolean has_df16
, has_df24
, has_d24s8_int
;
557 SVGA3dSurfaceFormatCaps caps
;
558 SVGA3dSurfaceFormatCaps mask
;
563 svgascreen
->depth
.z16
= SVGA3D_Z_D16
;
564 svgascreen
->depth
.x8z24
= SVGA3D_Z_D24X8
;
565 svgascreen
->depth
.s8z24
= SVGA3D_Z_D24S8
;
567 svga_get_format_cap(svgascreen
, SVGA3D_Z_DF16
, &caps
);
568 has_df16
= (caps
.value
& mask
.value
) == mask
.value
;
570 svga_get_format_cap(svgascreen
, SVGA3D_Z_DF24
, &caps
);
571 has_df24
= (caps
.value
& mask
.value
) == mask
.value
;
573 svga_get_format_cap(svgascreen
, SVGA3D_Z_D24S8_INT
, &caps
);
574 has_d24s8_int
= (caps
.value
& mask
.value
) == mask
.value
;
576 /* XXX: We might want some other logic here.
577 * Like if we only have d24s8_int we should
578 * emulate the other formats with that.
581 svgascreen
->depth
.z16
= SVGA3D_Z_DF16
;
584 svgascreen
->depth
.x8z24
= SVGA3D_Z_DF24
;
587 svgascreen
->depth
.s8z24
= SVGA3D_Z_D24S8_INT
;
591 if (!sws
->get_cap(sws
, SVGA3D_DEVCAP_MAX_POINT_SIZE
, &result
)) {
592 svgascreen
->maxPointSize
= 1.0F
;
594 /* Keep this to a reasonable size to avoid failures in
597 svgascreen
->maxPointSize
= MIN2(result
.f
, 80.0f
);
600 pipe_mutex_init(svgascreen
->tex_mutex
);
601 pipe_mutex_init(svgascreen
->swc_mutex
);
603 svga_screen_cache_init(svgascreen
);
/*
 * Return the svga_winsys_screen that backs the given pipe_screen, i.e. the
 * 'sws' pointer stored on the svga_screen by svga_screen_create().
 */
612 struct svga_winsys_screen
*
613 svga_winsys_screen(struct pipe_screen
*screen
)
615 return svga_screen(screen
)->sws
;
/*
 * Downcast a pipe_screen to the svga_screen that contains it.
 * The assert checks that the screen's destroy hook is svga_destroy_screen,
 * which is what svga_screen_create() installs, before the pointer is cast.
 * NOTE(review): the cast relies on the pipe_screen being at the start of
 * struct svga_screen; the struct layout is not visible here -- confirm.
 */
620 svga_screen(struct pipe_screen
*screen
)
623 assert(screen
->destroy
== svga_destroy_screen
);
624 return (struct svga_screen
*)screen
;