1 /**********************************************************
2 * Copyright 2008-2009 VMware, Inc. All rights reserved.
4 * Permission is hereby granted, free of charge, to any person
5 * obtaining a copy of this software and associated documentation
6 * files (the "Software"), to deal in the Software without
7 * restriction, including without limitation the rights to use, copy,
8 * modify, merge, publish, distribute, sublicense, and/or sell copies
9 * of the Software, and to permit persons to whom the Software is
10 * furnished to do so, subject to the following conditions:
12 * The above copyright notice and this permission notice shall be
13 * included in all copies or substantial portions of the Software.
15 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
16 * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
17 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
18 * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
19 * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
20 * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
21 * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
22 * SOFTWARE.
24 **********************************************************/
26 #include "util/u_memory.h"
27 #include "util/u_inlines.h"
28 #include "util/u_string.h"
29 #include "util/u_math.h"
31 #include "svga_winsys.h"
32 #include "svga_public.h"
33 #include "svga_context.h"
34 #include "svga_format.h"
35 #include "svga_screen.h"
36 #include "svga_resource_texture.h"
37 #include "svga_resource.h"
38 #include "svga_debug.h"
40 #include "svga3d_shaderdefs.h"
// Table pairing option names ("dma", "tgsi", "pipe", ...) with their DEBUG_*
// flag values; the third field of every visible entry is NULL.
// svga_screen_create hands this table to
// debug_get_flags_option("SVGA_DEBUG", ...) to compute SVGA_DEBUG.
// NOTE(review): this text is a lossy extraction -- each line starts with a
// stray number, tokens are split across lines, and the end of the array
// (closing brace and any terminating entry) is not visible here.  Restore it
// from the pristine file before building.
46 static const struct debug_named_value svga_debug_flags
[] = {
47 { "dma", DEBUG_DMA
, NULL
},
48 { "tgsi", DEBUG_TGSI
, NULL
},
49 { "pipe", DEBUG_PIPE
, NULL
},
50 { "state", DEBUG_STATE
, NULL
},
51 { "screen", DEBUG_SCREEN
, NULL
},
52 { "tex", DEBUG_TEX
, NULL
},
53 { "swtnl", DEBUG_SWTNL
, NULL
},
54 { "const", DEBUG_CONSTS
, NULL
},
55 { "viewport", DEBUG_VIEWPORT
, NULL
},
56 { "views", DEBUG_VIEWS
, NULL
},
57 { "perf", DEBUG_PERF
, NULL
},
58 { "flush", DEBUG_FLUSH
, NULL
},
59 { "sync", DEBUG_SYNC
, NULL
},
60 { "cache", DEBUG_CACHE
, NULL
},
/**
 * Return the vendor string reported for this screen.
 *
 * \param pscreen  the screen being queried; not used by this function
 * \return a constant string literal, which the caller must neither modify
 *         nor free
 */
static const char *
svga_get_vendor(struct pipe_screen *pscreen)
{
   return "VMware, Inc.";
}
// Formats the screen's name into the function-local static buffer `name`
// (100 bytes) with util_snprintf, as "SVGA3D; <build> <mutex> <llvm>".
// build, mutex and llvm all start out as "".  The visible assignments set
// build to "build: DEBUG;" or "build: RELEASE;" and mutex to
// "mutex: " PIPE_ATOMIC ";".
// Because the buffer is static, every call writes to the same storage.
// NOTE(review): the lines that choose between the two `build` assignments,
// any assignment to llvm, the braces and the return statement are not
// visible in this extraction -- presumably preprocessor-guarded; confirm
// against the pristine file.
73 svga_get_name( struct pipe_screen
*pscreen
)
75 const char *build
= "", *llvm
= "", *mutex
= "";
76 static char name
[100];
78 /* Only return internal details in the DEBUG version:
80 build
= "build: DEBUG;";
81 mutex
= "mutex: " PIPE_ATOMIC
";";
86 build
= "build: RELEASE;";
89 util_snprintf(name
, sizeof(name
), "SVGA3D; %s %s %s", build
, mutex
, llvm
);
// Answers floating-point capability queries (enum pipe_capf) for the screen.
// What the visible lines establish:
//  - PIPE_CAPF_MAX_POINT_WIDTH_AA returns svgascreen->maxPointSize;
//    PIPE_CAPF_MAX_POINT_WIDTH is the case label directly before it
//    (presumably a fall-through to the same return).
//  - PIPE_CAPF_MAX_TEXTURE_ANISOTROPY asks the winsys through
//    sws->get_cap(sws, SVGA3D_DEVCAP_MAX_TEXTURE_ANISOTROPY, &result).
//  - Case labels also exist for MAX_LINE_WIDTH, MAX_LINE_WIDTH_AA and
//    MAX_TEXTURE_LOD_BIAS.
//  - A debug_printf reports "Unexpected PIPE_CAPF_ query" with the param
//    value (presumably from the default branch).
// NOTE(review): the switch header, the braces and most return statements are
// missing from this extraction, so the values returned for the other cases
// cannot be read from here.
97 svga_get_paramf(struct pipe_screen
*screen
, enum pipe_capf param
)
99 struct svga_screen
*svgascreen
= svga_screen(screen
);
100 struct svga_winsys_screen
*sws
= svgascreen
->sws
;
101 SVGA3dDevCapResult result
;
104 case PIPE_CAPF_MAX_LINE_WIDTH
:
106 case PIPE_CAPF_MAX_LINE_WIDTH_AA
:
109 case PIPE_CAPF_MAX_POINT_WIDTH
:
111 case PIPE_CAPF_MAX_POINT_WIDTH_AA
:
112 return svgascreen
->maxPointSize
;
114 case PIPE_CAPF_MAX_TEXTURE_ANISOTROPY
:
115 if(!sws
->get_cap(sws
, SVGA3D_DEVCAP_MAX_TEXTURE_ANISOTROPY
, &result
))
119 case PIPE_CAPF_MAX_TEXTURE_LOD_BIAS
:
123 debug_printf("Unexpected PIPE_CAPF_ query %u\n", param
);
// Answers integer capability queries (enum pipe_cap) for the screen.
// What the visible lines establish:
//  - PIPE_CAP_MAX_RENDER_TARGETS queries SVGA3D_DEVCAP_MAX_RENDER_TARGETS
//    through sws->get_cap and returns MIN2(result.u, PIPE_MAX_COLOR_BUFS);
//    the value returned when the query fails is not visible.
//  - PIPE_CAP_MAX_TEXTURE_2D_LEVELS starts from SVGA_MAX_TEXTURE_LEVELS and
//    lowers it to util_logbase2(extent) + 1 for the host's maximum texture
//    width and then height; `levels = 12` (2048x2048) also appears twice,
//    presumably as the fallback when a query fails.
//  - PIPE_CAP_MAX_TEXTURE_3D_LEVELS returns 8 (128x128x128) when the
//    SVGA3D_DEVCAP_MAX_VOLUME_EXTENT query fails, otherwise
//    MIN2(util_logbase2(result.u) + 1, SVGA_MAX_TEXTURE_LEVELS).
//  - PIPE_CAP_MAX_TEXTURE_CUBE_LEVELS takes a MIN2 involving the screen's own
//    answer for PIPE_CAP_MAX_TEXTURE_2D_LEVELS; the second operand is not
//    visible.
//  - PIPE_CAP_VERTEX_COLOR_UNCLAMPED returns 1; PIPE_CAP_VERTEX_COLOR_CLAMPED
//    and PIPE_CAP_FRAGMENT_COLOR_CLAMPED return 0.
//  - The labels after the "Unsupported features" comment are grouped
//    together; their shared return statement is not visible.
//  - A debug_printf reports "Unexpected PIPE_CAP_ query" with the param value
//    (presumably from the default branch).
// NOTE(review): this is a lossy extraction -- the switch header, braces and
// most return statements are missing, so the remaining cases' values cannot
// be read from here.
130 svga_get_param(struct pipe_screen
*screen
, enum pipe_cap param
)
132 struct svga_screen
*svgascreen
= svga_screen(screen
);
133 struct svga_winsys_screen
*sws
= svgascreen
->sws
;
134 SVGA3dDevCapResult result
;
137 case PIPE_CAP_MAX_COMBINED_SAMPLERS
:
139 case PIPE_CAP_NPOT_TEXTURES
:
141 case PIPE_CAP_TWO_SIDED_STENCIL
:
143 case PIPE_CAP_MAX_DUAL_SOURCE_RENDER_TARGETS
:
145 case PIPE_CAP_ANISOTROPIC_FILTER
:
147 case PIPE_CAP_POINT_SPRITE
:
149 case PIPE_CAP_MAX_RENDER_TARGETS
:
150 if(!sws
->get_cap(sws
, SVGA3D_DEVCAP_MAX_RENDER_TARGETS
, &result
))
154 return MIN2(result
.u
, PIPE_MAX_COLOR_BUFS
);
155 case PIPE_CAP_OCCLUSION_QUERY
:
157 case PIPE_CAP_TIMER_QUERY
:
159 case PIPE_CAP_TEXTURE_SHADOW_MAP
:
161 case PIPE_CAP_TEXTURE_SWIZZLE
:
163 case PIPE_CAP_USER_VERTEX_BUFFERS
:
166 case PIPE_CAP_MAX_TEXTURE_2D_LEVELS
:
168 unsigned levels
= SVGA_MAX_TEXTURE_LEVELS
;
169 if (sws
->get_cap(sws
, SVGA3D_DEVCAP_MAX_TEXTURE_WIDTH
, &result
))
170 levels
= MIN2(util_logbase2(result
.u
) + 1, levels
);
172 levels
= 12 /* 2048x2048 */;
173 if (sws
->get_cap(sws
, SVGA3D_DEVCAP_MAX_TEXTURE_HEIGHT
, &result
))
174 levels
= MIN2(util_logbase2(result
.u
) + 1, levels
);
176 levels
= 12 /* 2048x2048 */;
180 case PIPE_CAP_MAX_TEXTURE_3D_LEVELS
:
181 if (!sws
->get_cap(sws
, SVGA3D_DEVCAP_MAX_VOLUME_EXTENT
, &result
))
182 return 8; /* max 128x128x128 */
183 return MIN2(util_logbase2(result
.u
) + 1, SVGA_MAX_TEXTURE_LEVELS
);
185 case PIPE_CAP_MAX_TEXTURE_CUBE_LEVELS
:
187 * No mechanism to query the host, and at least limited to 2048x2048 on
190 return MIN2(screen
->get_param(screen
, PIPE_CAP_MAX_TEXTURE_2D_LEVELS
),
193 case PIPE_CAP_BLEND_EQUATION_SEPARATE
: /* req. for GL 1.5 */
196 case PIPE_CAP_TGSI_FS_COORD_ORIGIN_UPPER_LEFT
:
197 case PIPE_CAP_TGSI_FS_COORD_PIXEL_CENTER_HALF_INTEGER
:
199 case PIPE_CAP_TGSI_FS_COORD_ORIGIN_LOWER_LEFT
:
200 case PIPE_CAP_TGSI_FS_COORD_PIXEL_CENTER_INTEGER
:
203 case PIPE_CAP_DEPTHSTENCIL_CLEAR_SEPARATE
:
206 case PIPE_CAP_VERTEX_COLOR_UNCLAMPED
:
207 return 1; /* The color outputs of vertex shaders are not clamped */
208 case PIPE_CAP_VERTEX_COLOR_CLAMPED
:
209 return 0; /* The driver can't clamp vertex colors */
210 case PIPE_CAP_FRAGMENT_COLOR_CLAMPED
:
211 return 0; /* The driver can't clamp fragment colors */
213 /* Unsupported features */
214 case PIPE_CAP_MIXED_COLORBUFFER_FORMATS
:
215 case PIPE_CAP_QUADS_FOLLOW_PROVOKING_VERTEX_CONVENTION
:
216 case PIPE_CAP_TEXTURE_MIRROR_CLAMP
:
218 case PIPE_CAP_SHADER_STENCIL_EXPORT
:
219 case PIPE_CAP_DEPTH_CLIP_DISABLE
:
220 case PIPE_CAP_SEAMLESS_CUBE_MAP
:
221 case PIPE_CAP_SEAMLESS_CUBE_MAP_PER_TEXTURE
:
222 case PIPE_CAP_INDEP_BLEND_ENABLE
:
223 case PIPE_CAP_INDEP_BLEND_FUNC
:
224 case PIPE_CAP_MAX_STREAM_OUTPUT_BUFFERS
:
225 case PIPE_CAP_PRIMITIVE_RESTART
:
226 case PIPE_CAP_TGSI_INSTANCEID
:
227 case PIPE_CAP_VERTEX_ELEMENT_INSTANCE_DIVISOR
:
228 case PIPE_CAP_MAX_TEXTURE_ARRAY_LAYERS
:
229 case PIPE_CAP_MIN_TEXEL_OFFSET
:
230 case PIPE_CAP_MAX_TEXEL_OFFSET
:
231 case PIPE_CAP_CONDITIONAL_RENDER
:
232 case PIPE_CAP_TEXTURE_BARRIER
:
233 case PIPE_CAP_MAX_STREAM_OUTPUT_SEPARATE_COMPONENTS
:
234 case PIPE_CAP_MAX_STREAM_OUTPUT_INTERLEAVED_COMPONENTS
:
235 case PIPE_CAP_STREAM_OUTPUT_PAUSE_RESUME
:
236 case PIPE_CAP_TGSI_CAN_COMPACT_VARYINGS
:
237 case PIPE_CAP_TGSI_CAN_COMPACT_CONSTANTS
:
238 case PIPE_CAP_GLSL_FEATURE_LEVEL
:
239 case PIPE_CAP_VERTEX_BUFFER_OFFSET_4BYTE_ALIGNED_ONLY
:
240 case PIPE_CAP_VERTEX_BUFFER_STRIDE_4BYTE_ALIGNED_ONLY
:
242 case PIPE_CAP_VERTEX_ELEMENT_SRC_OFFSET_4BYTE_ALIGNED_ONLY
:
246 debug_printf("Unexpected PIPE_CAP_ query %u\n", param
);
// Answers per-shader-stage capability queries; returns int.  `shader`
// selects the stage (cases are visible for PIPE_SHADER_FRAGMENT,
// PIPE_SHADER_VERTEX and PIPE_SHADER_GEOMETRY) and `param` the capability.
// What the visible lines establish:
//  - MAX_CONTROL_FLOW_DEPTH returns SVGA3D_MAX_NESTING_LEVEL for both the
//    fragment and the vertex stage.
//  - MAX_TEMPS queries SVGA3D_DEVCAP_MAX_FRAGMENT_SHADER_TEMPS or
//    SVGA3D_DEVCAP_MAX_VERTEX_SHADER_TEMPS respectively and returns
//    MIN2(result.u, SVGA3D_TEMPREG_MAX); the value used when the query fails
//    is not visible.
//  - Vertex MAX_INSTRUCTIONS / MAX_ALU_INSTRUCTIONS query
//    SVGA3D_DEVCAP_MAX_VERTEX_SHADER_INSTRUCTIONS.
//  - Per the in-code comments: loop unrolling for fragment shaders is left to
//    the state tracker, vertex texturing is not supported yet, and geometry
//    shaders are not supported.
// NOTE(review): all three debug_printf calls print "Unexpected vertex shader
// query", including the ones that follow the fragment and geometry cases --
// looks like a copy-paste slip in the message text; confirm and correct in
// the pristine file.
// NOTE(review): this is a lossy extraction -- switch headers, braces and most
// return statements are missing.
251 static int svga_get_shader_param(struct pipe_screen
*screen
, unsigned shader
, enum pipe_shader_cap param
)
253 struct svga_screen
*svgascreen
= svga_screen(screen
);
254 struct svga_winsys_screen
*sws
= svgascreen
->sws
;
255 SVGA3dDevCapResult result
;
259 case PIPE_SHADER_FRAGMENT
:
262 case PIPE_SHADER_CAP_MAX_INSTRUCTIONS
:
263 case PIPE_SHADER_CAP_MAX_ALU_INSTRUCTIONS
:
264 case PIPE_SHADER_CAP_MAX_TEX_INSTRUCTIONS
:
265 case PIPE_SHADER_CAP_MAX_TEX_INDIRECTIONS
:
267 case PIPE_SHADER_CAP_MAX_CONTROL_FLOW_DEPTH
:
268 return SVGA3D_MAX_NESTING_LEVEL
;
269 case PIPE_SHADER_CAP_MAX_INPUTS
:
271 case PIPE_SHADER_CAP_MAX_CONSTS
:
273 case PIPE_SHADER_CAP_MAX_CONST_BUFFERS
:
275 case PIPE_SHADER_CAP_MAX_TEMPS
:
276 if (!sws
->get_cap(sws
, SVGA3D_DEVCAP_MAX_FRAGMENT_SHADER_TEMPS
, &result
))
278 return MIN2(result
.u
, SVGA3D_TEMPREG_MAX
);
279 case PIPE_SHADER_CAP_MAX_ADDRS
:
280 case PIPE_SHADER_CAP_INDIRECT_INPUT_ADDR
:
282 * Although PS 3.0 has some addressing abilities it can only represent
283 * loops that can be statically determined and unrolled. Given we can
284 * only handle a subset of the cases that the state tracker already
285 * does it is better to defer loop unrolling to the state tracker.
288 case PIPE_SHADER_CAP_MAX_PREDS
:
290 case PIPE_SHADER_CAP_TGSI_CONT_SUPPORTED
:
292 case PIPE_SHADER_CAP_INDIRECT_OUTPUT_ADDR
:
293 case PIPE_SHADER_CAP_INDIRECT_TEMP_ADDR
:
294 case PIPE_SHADER_CAP_INDIRECT_CONST_ADDR
:
296 case PIPE_SHADER_CAP_SUBROUTINES
:
298 case PIPE_SHADER_CAP_INTEGERS
:
300 case PIPE_SHADER_CAP_MAX_TEXTURE_SAMPLERS
:
303 debug_printf("Unexpected vertex shader query %u\n", param
);
307 case PIPE_SHADER_VERTEX
:
310 case PIPE_SHADER_CAP_MAX_INSTRUCTIONS
:
311 case PIPE_SHADER_CAP_MAX_ALU_INSTRUCTIONS
:
312 if (!sws
->get_cap(sws
, SVGA3D_DEVCAP_MAX_VERTEX_SHADER_INSTRUCTIONS
, &result
))
315 case PIPE_SHADER_CAP_MAX_TEX_INSTRUCTIONS
:
316 case PIPE_SHADER_CAP_MAX_TEX_INDIRECTIONS
:
317 /* XXX: until we have vertex texture support */
319 case PIPE_SHADER_CAP_MAX_CONTROL_FLOW_DEPTH
:
320 return SVGA3D_MAX_NESTING_LEVEL
;
321 case PIPE_SHADER_CAP_MAX_INPUTS
:
323 case PIPE_SHADER_CAP_MAX_CONSTS
:
325 case PIPE_SHADER_CAP_MAX_CONST_BUFFERS
:
327 case PIPE_SHADER_CAP_MAX_TEMPS
:
328 if (!sws
->get_cap(sws
, SVGA3D_DEVCAP_MAX_VERTEX_SHADER_TEMPS
, &result
))
330 return MIN2(result
.u
, SVGA3D_TEMPREG_MAX
);
331 case PIPE_SHADER_CAP_MAX_ADDRS
:
333 case PIPE_SHADER_CAP_MAX_PREDS
:
335 case PIPE_SHADER_CAP_TGSI_CONT_SUPPORTED
:
337 case PIPE_SHADER_CAP_INDIRECT_INPUT_ADDR
:
338 case PIPE_SHADER_CAP_INDIRECT_OUTPUT_ADDR
:
340 case PIPE_SHADER_CAP_INDIRECT_TEMP_ADDR
:
342 case PIPE_SHADER_CAP_INDIRECT_CONST_ADDR
:
344 case PIPE_SHADER_CAP_SUBROUTINES
:
346 case PIPE_SHADER_CAP_INTEGERS
:
348 case PIPE_SHADER_CAP_MAX_TEXTURE_SAMPLERS
:
351 debug_printf("Unexpected vertex shader query %u\n", param
);
355 case PIPE_SHADER_GEOMETRY
:
356 /* no support for geometry shaders at this time */
359 debug_printf("Unexpected vertex shader query %u\n", param
);
// Reports whether `format` is usable for the requested bindings.
// Visible steps:
//  - tests sample_count > 1 (the action taken is not visible);
//  - translates the format with svga_translate_format(ss, format, tex_usage)
//    and tests the result against SVGA3D_FORMAT_INVALID;
//  - when PIPE_BIND_DISPLAY_TARGET is requested, switches on the translated
//    format, singling out A8R8G8B8 / X8R8G8B8 and A4R4G4B4 / A1R5G5B5, so
//    that (per the in-code comments) every virtual hardware implementation
//    ends up with the same visuals;
//  - otherwise reads the host capabilities with svga_get_format_cap, builds
//    `mask` from the PIPE_BIND_RENDER_TARGET / PIPE_BIND_DEPTH_STENCIL /
//    PIPE_BIND_SAMPLER_VIEW bits (only mask.offscreenRenderTarget = 1 is
//    visible) and returns (caps.value & mask.value) == mask.value.
// NOTE(review): this is a lossy extraction -- tex_usage is used but the line
// declaring it is missing, as are the return type, the initialisation of
// mask, the other mask assignments and the early returns.
367 svga_is_format_supported( struct pipe_screen
*screen
,
368 enum pipe_format format
,
369 enum pipe_texture_target target
,
370 unsigned sample_count
,
373 struct svga_screen
*ss
= svga_screen(screen
);
374 SVGA3dSurfaceFormat svga_format
;
375 SVGA3dSurfaceFormatCaps caps
;
376 SVGA3dSurfaceFormatCaps mask
;
380 if (sample_count
> 1) {
384 svga_format
= svga_translate_format(ss
, format
, tex_usage
);
385 if (svga_format
== SVGA3D_FORMAT_INVALID
) {
390 * Override host capabilities, so that we end up with the same
391 * visuals for all virtual hardware implementations.
394 if (tex_usage
& PIPE_BIND_DISPLAY_TARGET
) {
395 switch (svga_format
) {
396 case SVGA3D_A8R8G8B8
:
397 case SVGA3D_X8R8G8B8
:
401 /* Often unsupported/problematic. This means we end up with the same
402 * visuals for all virtual hardware implementations.
404 case SVGA3D_A4R4G4B4
:
405 case SVGA3D_A1R5G5B5
:
414 * Query the host capabilities.
417 svga_get_format_cap(ss
, svga_format
, &caps
);
420 if (tex_usage
& PIPE_BIND_RENDER_TARGET
) {
421 mask
.offscreenRenderTarget
= 1;
423 if (tex_usage
& PIPE_BIND_DEPTH_STENCIL
) {
426 if (tex_usage
& PIPE_BIND_SAMPLER_VIEW
) {
430 return (caps
.value
& mask
.value
) == mask
.value
;
435 svga_fence_reference(struct pipe_screen
*screen
,
436 struct pipe_fence_handle
**ptr
,
437 struct pipe_fence_handle
*fence
)
439 struct svga_winsys_screen
*sws
= svga_screen(screen
)->sws
;
440 sws
->fence_reference(sws
, ptr
, fence
);
// pipe_screen fence_signalled hook: calls the winsys screen's
// fence_signalled(sws, fence, 0) and returns whether that call yielded 0.
// NOTE(review): this is a lossy extraction -- the return-type line and the
// braces are missing, and each line starts with a stray number.
445 svga_fence_signalled(struct pipe_screen
*screen
,
446 struct pipe_fence_handle
*fence
)
448 struct svga_winsys_screen
*sws
= svga_screen(screen
)->sws
;
449 return sws
->fence_signalled(sws
, fence
, 0) == 0;
// pipe_screen fence_finish hook: logs the fence pointer through SVGA_DBG
// (DEBUG_DMA | DEBUG_PERF), then calls the winsys screen's
// fence_finish(sws, fence, 0) and returns whether that call yielded 0.
// NOTE(review): this is a lossy extraction -- the parameter list ends with a
// comma, so at least one further parameter line is missing, along with the
// return-type line and the braces.  No parameter other than screen and fence
// is referenced by the visible body.
454 svga_fence_finish(struct pipe_screen
*screen
,
455 struct pipe_fence_handle
*fence
,
458 struct svga_winsys_screen
*sws
= svga_screen(screen
)->sws
;
460 SVGA_DBG(DEBUG_DMA
|DEBUG_PERF
, "%s fence_ptr %p\n",
461 __FUNCTION__
, fence
);
463 return sws
->fence_finish(sws
, fence
, 0) == 0;
// pipe_screen destroy hook.  Visible teardown order: clean up the screen
// cache (svga_screen_cache_cleanup), destroy swc_mutex and tex_mutex, then
// call the winsys screen's own destroy function.
// NOTE(review): this is a lossy extraction -- the return-type line and braces
// are missing, and lines after the last visible call are missing too, so
// whether the svga_screen structure itself is released cannot be confirmed
// from here.
468 svga_destroy_screen( struct pipe_screen
*screen
)
470 struct svga_screen
*svgascreen
= svga_screen(screen
);
472 svga_screen_cache_cleanup(svgascreen
);
474 pipe_mutex_destroy(svgascreen
->swc_mutex
);
475 pipe_mutex_destroy(svgascreen
->tex_mutex
);
477 svgascreen
->sws
->destroy(svgascreen
->sws
);
484 * Create a new svga_screen object
// Creates and initialises an svga_screen on top of the given winsys screen.
// Visible steps, in order:
//  - compute SVGA_DEBUG from the "SVGA_DEBUG" option and svga_debug_flags;
//  - allocate the screen with CALLOC_STRUCT(svga_screen);
//  - read the boolean options SVGA_FORCE_LEVEL_SURFACE_VIEW,
//    SVGA_FORCE_SURFACE_VIEW, SVGA_FORCE_SAMPLER_VIEW, SVGA_NO_SURFACE_VIEW
//    and SVGA_NO_SAMPLER_VIEW (default FALSE) into svgascreen->debug;
//  - install the pipe_screen hooks (destroy, get_name, get_vendor, get_param,
//    get_shader_param, get_paramf, is_format_supported, context_create and
//    the three fence hooks) and store sws;
//  - call svga_init_screen_resource_functions;
//  - take hw_version from sws->get_hw_version when that hook is set;
//    SVGA3D_HWVERSION_WS65_B1 is also assigned, presumably as the fallback;
//  - query the fragment and vertex shader versions and compare them with
//    SVGA3DPSVERSION_30 / SVGA3DVSVERSION_30; per the in-code comment shader
//    model 3.0 or later is required;
//  - depth formats default to D16 / D24X8 / D24S8; DF16, DF24 and D24S8_INT
//    are probed with svga_get_format_cap and are also assigned, presumably
//    when the probe succeeds (the in-code comment says they are preferred
//    because they do no implicit shadow compare when sampled);
//  - maxPointSize is 1.0F when the SVGA3D_DEVCAP_MAX_POINT_SIZE query fails;
//    MIN2(result.f, 80.0f) is also assigned, presumably on success;
//  - initialise tex_mutex and swc_mutex, then svga_screen_cache_init.
// NOTE(review): this is a lossy extraction -- the return type, braces, the
// allocation-failure check, the use_ps30 / use_vs30 assignment targets, the
// initialisation of mask, the conditions guarding the depth-format overrides,
// the error path and the final return are all missing.
487 svga_screen_create(struct svga_winsys_screen
*sws
)
489 struct svga_screen
*svgascreen
;
490 struct pipe_screen
*screen
;
491 SVGA3dDevCapResult result
;
492 boolean use_vs30
, use_ps30
;
495 SVGA_DEBUG
= debug_get_flags_option("SVGA_DEBUG", svga_debug_flags
, 0 );
498 svgascreen
= CALLOC_STRUCT(svga_screen
);
502 svgascreen
->debug
.force_level_surface_view
=
503 debug_get_bool_option("SVGA_FORCE_LEVEL_SURFACE_VIEW", FALSE
);
504 svgascreen
->debug
.force_surface_view
=
505 debug_get_bool_option("SVGA_FORCE_SURFACE_VIEW", FALSE
);
506 svgascreen
->debug
.force_sampler_view
=
507 debug_get_bool_option("SVGA_FORCE_SAMPLER_VIEW", FALSE
);
508 svgascreen
->debug
.no_surface_view
=
509 debug_get_bool_option("SVGA_NO_SURFACE_VIEW", FALSE
);
510 svgascreen
->debug
.no_sampler_view
=
511 debug_get_bool_option("SVGA_NO_SAMPLER_VIEW", FALSE
);
513 screen
= &svgascreen
->screen
;
515 screen
->destroy
= svga_destroy_screen
;
516 screen
->get_name
= svga_get_name
;
517 screen
->get_vendor
= svga_get_vendor
;
518 screen
->get_param
= svga_get_param
;
519 screen
->get_shader_param
= svga_get_shader_param
;
520 screen
->get_paramf
= svga_get_paramf
;
521 screen
->is_format_supported
= svga_is_format_supported
;
522 screen
->context_create
= svga_context_create
;
523 screen
->fence_reference
= svga_fence_reference
;
524 screen
->fence_signalled
= svga_fence_signalled
;
525 screen
->fence_finish
= svga_fence_finish
;
526 svgascreen
->sws
= sws
;
528 svga_init_screen_resource_functions(svgascreen
);
530 if (sws
->get_hw_version
) {
531 svgascreen
->hw_version
= sws
->get_hw_version(sws
);
533 svgascreen
->hw_version
= SVGA3D_HWVERSION_WS65_B1
;
537 sws
->get_cap(sws
, SVGA3D_DEVCAP_FRAGMENT_SHADER_VERSION
, &result
) &&
538 result
.u
>= SVGA3DPSVERSION_30
? TRUE
: FALSE
;
541 sws
->get_cap(sws
, SVGA3D_DEVCAP_VERTEX_SHADER_VERSION
, &result
) &&
542 result
.u
>= SVGA3DVSVERSION_30
? TRUE
: FALSE
;
544 /* we require Shader model 3.0 or later */
545 if (!use_ps30
|| !use_vs30
)
549 * The D16, D24X8, and D24S8 formats always do an implicit shadow compare
550 * when sampled from, where as the DF16, DF24, and D24S8_INT do not. So
551 * we prefer the later when available.
553 * This mimics hardware vendors extensions for D3D depth sampling. See also
554 * http://aras-p.info/texts/D3D9GPUHacks.html
558 boolean has_df16
, has_df24
, has_d24s8_int
;
559 SVGA3dSurfaceFormatCaps caps
;
560 SVGA3dSurfaceFormatCaps mask
;
565 svgascreen
->depth
.z16
= SVGA3D_Z_D16
;
566 svgascreen
->depth
.x8z24
= SVGA3D_Z_D24X8
;
567 svgascreen
->depth
.s8z24
= SVGA3D_Z_D24S8
;
569 svga_get_format_cap(svgascreen
, SVGA3D_Z_DF16
, &caps
);
570 has_df16
= (caps
.value
& mask
.value
) == mask
.value
;
572 svga_get_format_cap(svgascreen
, SVGA3D_Z_DF24
, &caps
);
573 has_df24
= (caps
.value
& mask
.value
) == mask
.value
;
575 svga_get_format_cap(svgascreen
, SVGA3D_Z_D24S8_INT
, &caps
);
576 has_d24s8_int
= (caps
.value
& mask
.value
) == mask
.value
;
578 /* XXX: We might want some other logic here.
579 * Like if we only have d24s8_int we should
580 * emulate the other formats with that.
583 svgascreen
->depth
.z16
= SVGA3D_Z_DF16
;
586 svgascreen
->depth
.x8z24
= SVGA3D_Z_DF24
;
589 svgascreen
->depth
.s8z24
= SVGA3D_Z_D24S8_INT
;
593 if (!sws
->get_cap(sws
, SVGA3D_DEVCAP_MAX_POINT_SIZE
, &result
)) {
594 svgascreen
->maxPointSize
= 1.0F
;
596 /* Keep this to a reasonable size to avoid failures in
599 svgascreen
->maxPointSize
= MIN2(result
.f
, 80.0f
);
602 pipe_mutex_init(svgascreen
->tex_mutex
);
603 pipe_mutex_init(svgascreen
->swc_mutex
);
605 svga_screen_cache_init(svgascreen
);
614 struct svga_winsys_screen
*
615 svga_winsys_screen(struct pipe_screen
*screen
)
617 return svga_screen(screen
)->sws
;
// Converts a pipe_screen pointer to the svga_screen it belongs to by casting
// it.  Before the cast it asserts that screen->destroy is svga_destroy_screen.
// NOTE(review): this is a lossy extraction -- the return-type line and braces
// are missing, and one line before the visible assert is not shown.  Any
// preprocessor guard around this definition is not visible either.
622 svga_screen(struct pipe_screen
*screen
)
625 assert(screen
->destroy
== svga_destroy_screen
);
626 return (struct svga_screen
*)screen
;