gallium: introduce PIPE_CAP_LOAD_CONSTBUF
[mesa.git] / src / gallium / drivers / svga / svga_screen.c
1 /**********************************************************
2 * Copyright 2008-2009 VMware, Inc. All rights reserved.
3 *
4 * Permission is hereby granted, free of charge, to any person
5 * obtaining a copy of this software and associated documentation
6 * files (the "Software"), to deal in the Software without
7 * restriction, including without limitation the rights to use, copy,
8 * modify, merge, publish, distribute, sublicense, and/or sell copies
9 * of the Software, and to permit persons to whom the Software is
10 * furnished to do so, subject to the following conditions:
11 *
12 * The above copyright notice and this permission notice shall be
13 * included in all copies or substantial portions of the Software.
14 *
15 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
16 * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
17 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
18 * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
19 * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
20 * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
21 * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
22 * SOFTWARE.
23 *
24 **********************************************************/
25
26 #include "git_sha1.h" /* For MESA_GIT_SHA1 */
27 #include "util/u_format.h"
28 #include "util/u_memory.h"
29 #include "util/u_inlines.h"
30 #include "util/u_string.h"
31 #include "util/u_math.h"
32
33 #include "os/os_process.h"
34
35 #include "svga_winsys.h"
36 #include "svga_public.h"
37 #include "svga_context.h"
38 #include "svga_format.h"
39 #include "svga_msg.h"
40 #include "svga_screen.h"
41 #include "svga_tgsi.h"
42 #include "svga_resource_texture.h"
43 #include "svga_resource.h"
44 #include "svga_debug.h"
45
46 #include "svga3d_shaderdefs.h"
47 #include "VGPU10ShaderTokens.h"
48
49 /* NOTE: this constant may get moved into a svga3d*.h header file */
50 #define SVGA3D_DX_MAX_RESOURCE_SIZE (128 * 1024 * 1024)
51
52 #ifndef MESA_GIT_SHA1
53 #define MESA_GIT_SHA1 "(unknown git revision)"
54 #endif
55
#ifdef DEBUG
/* Bitmask of enabled DEBUG_x categories (debug builds only). */
int SVGA_DEBUG = 0;

/* Table pairing each option keyword with the DEBUG_x bit it selects. */
static const struct debug_named_value svga_debug_flags[] = {
   { "dma",       DEBUG_DMA,       NULL },
   { "tgsi",      DEBUG_TGSI,      NULL },
   { "pipe",      DEBUG_PIPE,      NULL },
   { "state",     DEBUG_STATE,     NULL },
   { "screen",    DEBUG_SCREEN,    NULL },
   { "tex",       DEBUG_TEX,       NULL },
   { "swtnl",     DEBUG_SWTNL,     NULL },
   { "const",     DEBUG_CONSTS,    NULL },
   { "viewport",  DEBUG_VIEWPORT,  NULL },
   { "views",     DEBUG_VIEWS,     NULL },
   { "perf",      DEBUG_PERF,      NULL },
   { "flush",     DEBUG_FLUSH,     NULL },
   { "sync",      DEBUG_SYNC,      NULL },
   { "cache",     DEBUG_CACHE,     NULL },
   { "streamout", DEBUG_STREAMOUT, NULL },
   { "query",     DEBUG_QUERY,     NULL },
   { "samplers",  DEBUG_SAMPLERS,  NULL },
   DEBUG_NAMED_VALUE_END
};
#endif
80
/**
 * Return the vendor string for this driver.
 *
 * The screen argument is not consulted; the same constant string is
 * returned for every screen.
 */
static const char *
svga_get_vendor( struct pipe_screen *pscreen )
{
   static const char vendor[] = "VMware, Inc.";

   (void) pscreen;
   return vendor;
}
86
87
/**
 * Build and return the renderer name string.
 *
 * The string has the form "SVGA3D; <build> <mutex> <llvm>", where each
 * component is selected at compile time and may be empty.  It is
 * formatted into a function-local static buffer, so the returned pointer
 * refers to storage that is rewritten on every call.
 */
static const char *
svga_get_name( struct pipe_screen *pscreen )
{
   static char name[100];

#ifdef DEBUG
   /* Only return internal details in the DEBUG version */
   const char *build_tag = "build: DEBUG;";
   const char *mutex_tag = "mutex: " PIPE_ATOMIC ";";
#elif defined(VMX86_STATS)
   const char *build_tag = "build: OPT;";
   const char *mutex_tag = "";
#else
   const char *build_tag = "build: RELEASE;";
   const char *mutex_tag = "";
#endif

#ifdef HAVE_LLVM
   const char *llvm_tag = "LLVM;";
#else
   const char *llvm_tag = "";
#endif

   util_snprintf(name, sizeof(name), "SVGA3D; %s %s %s",
                 build_tag, mutex_tag, llvm_tag);
   return name;
}
110
111
112 /** Helper for querying float-valued device cap */
113 static float
114 get_float_cap(struct svga_winsys_screen *sws, unsigned cap, float defaultVal)
115 {
116 SVGA3dDevCapResult result;
117 if (sws->get_cap(sws, cap, &result))
118 return result.f;
119 else
120 return defaultVal;
121 }
122
123
124 /** Helper for querying uint-valued device cap */
125 static unsigned
126 get_uint_cap(struct svga_winsys_screen *sws, unsigned cap, unsigned defaultVal)
127 {
128 SVGA3dDevCapResult result;
129 if (sws->get_cap(sws, cap, &result))
130 return result.u;
131 else
132 return defaultVal;
133 }
134
135
136 /** Helper for querying boolean-valued device cap */
137 static boolean
138 get_bool_cap(struct svga_winsys_screen *sws, unsigned cap, boolean defaultVal)
139 {
140 SVGA3dDevCapResult result;
141 if (sws->get_cap(sws, cap, &result))
142 return result.b;
143 else
144 return defaultVal;
145 }
146
147
148 static float
149 svga_get_paramf(struct pipe_screen *screen, enum pipe_capf param)
150 {
151 struct svga_screen *svgascreen = svga_screen(screen);
152 struct svga_winsys_screen *sws = svgascreen->sws;
153
154 switch (param) {
155 case PIPE_CAPF_MAX_LINE_WIDTH:
156 return svgascreen->maxLineWidth;
157 case PIPE_CAPF_MAX_LINE_WIDTH_AA:
158 return svgascreen->maxLineWidthAA;
159
160 case PIPE_CAPF_MAX_POINT_WIDTH:
161 /* fall-through */
162 case PIPE_CAPF_MAX_POINT_WIDTH_AA:
163 return svgascreen->maxPointSize;
164
165 case PIPE_CAPF_MAX_TEXTURE_ANISOTROPY:
166 return (float) get_uint_cap(sws, SVGA3D_DEVCAP_MAX_TEXTURE_ANISOTROPY, 4);
167
168 case PIPE_CAPF_MAX_TEXTURE_LOD_BIAS:
169 return 15.0;
170
171 case PIPE_CAPF_GUARD_BAND_LEFT:
172 case PIPE_CAPF_GUARD_BAND_TOP:
173 case PIPE_CAPF_GUARD_BAND_RIGHT:
174 case PIPE_CAPF_GUARD_BAND_BOTTOM:
175 return 0.0;
176 }
177
178 debug_printf("Unexpected PIPE_CAPF_ query %u\n", param);
179 return 0;
180 }
181
182
183 static int
184 svga_get_param(struct pipe_screen *screen, enum pipe_cap param)
185 {
186 struct svga_screen *svgascreen = svga_screen(screen);
187 struct svga_winsys_screen *sws = svgascreen->sws;
188 SVGA3dDevCapResult result;
189
190 switch (param) {
191 case PIPE_CAP_NPOT_TEXTURES:
192 case PIPE_CAP_MIXED_FRAMEBUFFER_SIZES:
193 case PIPE_CAP_MIXED_COLOR_DEPTH_BITS:
194 return 1;
195 case PIPE_CAP_TWO_SIDED_STENCIL:
196 return 1;
197 case PIPE_CAP_MAX_DUAL_SOURCE_RENDER_TARGETS:
198 /*
199 * "In virtually every OpenGL implementation and hardware,
200 * GL_MAX_DUAL_SOURCE_DRAW_BUFFERS is 1"
201 * http://www.opengl.org/wiki/Blending
202 */
203 return sws->have_vgpu10 ? 1 : 0;
204 case PIPE_CAP_ANISOTROPIC_FILTER:
205 return 1;
206 case PIPE_CAP_POINT_SPRITE:
207 return 1;
208 case PIPE_CAP_TGSI_TEXCOORD:
209 return 0;
210 case PIPE_CAP_MAX_RENDER_TARGETS:
211 return svgascreen->max_color_buffers;
212 case PIPE_CAP_OCCLUSION_QUERY:
213 return 1;
214 case PIPE_CAP_QUERY_TIME_ELAPSED:
215 return 0;
216 case PIPE_CAP_TEXTURE_BUFFER_OBJECTS:
217 return sws->have_vgpu10;
218 case PIPE_CAP_TEXTURE_SHADOW_MAP:
219 return 1;
220 case PIPE_CAP_TEXTURE_SWIZZLE:
221 return 1;
222 case PIPE_CAP_TEXTURE_BORDER_COLOR_QUIRK:
223 return 0;
224 case PIPE_CAP_USER_VERTEX_BUFFERS:
225 return 0;
226 case PIPE_CAP_USER_CONSTANT_BUFFERS:
227 return 1;
228 case PIPE_CAP_CONSTANT_BUFFER_OFFSET_ALIGNMENT:
229 return 256;
230
231 case PIPE_CAP_MAX_TEXTURE_2D_LEVELS:
232 {
233 unsigned levels = SVGA_MAX_TEXTURE_LEVELS;
234 if (sws->get_cap(sws, SVGA3D_DEVCAP_MAX_TEXTURE_WIDTH, &result))
235 levels = MIN2(util_logbase2(result.u) + 1, levels);
236 else
237 levels = 12 /* 2048x2048 */;
238 if (sws->get_cap(sws, SVGA3D_DEVCAP_MAX_TEXTURE_HEIGHT, &result))
239 levels = MIN2(util_logbase2(result.u) + 1, levels);
240 else
241 levels = 12 /* 2048x2048 */;
242 return levels;
243 }
244
245 case PIPE_CAP_MAX_TEXTURE_3D_LEVELS:
246 if (!sws->get_cap(sws, SVGA3D_DEVCAP_MAX_VOLUME_EXTENT, &result))
247 return 8; /* max 128x128x128 */
248 return MIN2(util_logbase2(result.u) + 1, SVGA_MAX_TEXTURE_LEVELS);
249
250 case PIPE_CAP_MAX_TEXTURE_CUBE_LEVELS:
251 /*
252 * No mechanism to query the host, and at least limited to 2048x2048 on
253 * certain hardware.
254 */
255 return MIN2(screen->get_param(screen, PIPE_CAP_MAX_TEXTURE_2D_LEVELS),
256 12 /* 2048x2048 */);
257
258 case PIPE_CAP_MAX_TEXTURE_ARRAY_LAYERS:
259 return sws->have_vgpu10 ? SVGA3D_MAX_SURFACE_ARRAYSIZE : 0;
260
261 case PIPE_CAP_BLEND_EQUATION_SEPARATE: /* req. for GL 1.5 */
262 return 1;
263
264 case PIPE_CAP_TGSI_FS_COORD_ORIGIN_UPPER_LEFT:
265 return 1;
266 case PIPE_CAP_TGSI_FS_COORD_PIXEL_CENTER_HALF_INTEGER:
267 return sws->have_vgpu10;
268 case PIPE_CAP_TGSI_FS_COORD_ORIGIN_LOWER_LEFT:
269 return 0;
270 case PIPE_CAP_TGSI_FS_COORD_PIXEL_CENTER_INTEGER:
271 return !sws->have_vgpu10;
272
273 case PIPE_CAP_VERTEX_COLOR_UNCLAMPED:
274 return 1; /* The color outputs of vertex shaders are not clamped */
275 case PIPE_CAP_VERTEX_COLOR_CLAMPED:
276 return 0; /* The driver can't clamp vertex colors */
277 case PIPE_CAP_FRAGMENT_COLOR_CLAMPED:
278 return 0; /* The driver can't clamp fragment colors */
279
280 case PIPE_CAP_MIXED_COLORBUFFER_FORMATS:
281 return 1; /* expected for GL_ARB_framebuffer_object */
282
283 case PIPE_CAP_GLSL_FEATURE_LEVEL:
284 return sws->have_vgpu10 ? 330 : 120;
285
286 case PIPE_CAP_PREFER_BLIT_BASED_TEXTURE_TRANSFER:
287 return 0;
288
289 case PIPE_CAP_SM3:
290 return 1;
291
292 case PIPE_CAP_DEPTH_CLIP_DISABLE:
293 case PIPE_CAP_INDEP_BLEND_ENABLE:
294 case PIPE_CAP_CONDITIONAL_RENDER:
295 case PIPE_CAP_QUERY_TIMESTAMP:
296 case PIPE_CAP_TGSI_INSTANCEID:
297 case PIPE_CAP_VERTEX_ELEMENT_INSTANCE_DIVISOR:
298 case PIPE_CAP_SEAMLESS_CUBE_MAP:
299 case PIPE_CAP_FAKE_SW_MSAA:
300 return sws->have_vgpu10;
301
302 case PIPE_CAP_MAX_STREAM_OUTPUT_BUFFERS:
303 return sws->have_vgpu10 ? SVGA3D_DX_MAX_SOTARGETS : 0;
304 case PIPE_CAP_MAX_STREAM_OUTPUT_SEPARATE_COMPONENTS:
305 return sws->have_vgpu10 ? 4 : 0;
306 case PIPE_CAP_MAX_STREAM_OUTPUT_INTERLEAVED_COMPONENTS:
307 return sws->have_vgpu10 ? SVGA3D_MAX_STREAMOUT_DECLS : 0;
308 case PIPE_CAP_STREAM_OUTPUT_PAUSE_RESUME:
309 case PIPE_CAP_STREAM_OUTPUT_INTERLEAVE_BUFFERS:
310 return 0;
311 case PIPE_CAP_TEXTURE_MULTISAMPLE:
312 return svgascreen->ms_samples ? 1 : 0;
313
314 case PIPE_CAP_MAX_TEXTURE_BUFFER_SIZE:
315 /* convert bytes to texels for the case of the largest texel
316 * size: float[4].
317 */
318 return SVGA3D_DX_MAX_RESOURCE_SIZE / (4 * sizeof(float));
319
320 case PIPE_CAP_MIN_TEXEL_OFFSET:
321 return sws->have_vgpu10 ? VGPU10_MIN_TEXEL_FETCH_OFFSET : 0;
322 case PIPE_CAP_MAX_TEXEL_OFFSET:
323 return sws->have_vgpu10 ? VGPU10_MAX_TEXEL_FETCH_OFFSET : 0;
324
325 case PIPE_CAP_MIN_TEXTURE_GATHER_OFFSET:
326 case PIPE_CAP_MAX_TEXTURE_GATHER_OFFSET:
327 return 0;
328
329 case PIPE_CAP_MAX_GEOMETRY_OUTPUT_VERTICES:
330 return sws->have_vgpu10 ? 256 : 0;
331 case PIPE_CAP_MAX_GEOMETRY_TOTAL_OUTPUT_COMPONENTS:
332 return sws->have_vgpu10 ? 1024 : 0;
333
334 case PIPE_CAP_PRIMITIVE_RESTART:
335 return 1; /* may be a sw fallback, depending on restart index */
336
337 case PIPE_CAP_GENERATE_MIPMAP:
338 return sws->have_generate_mipmap_cmd;
339
340 case PIPE_CAP_NATIVE_FENCE_FD:
341 return sws->have_fence_fd;
342
343 /* Unsupported features */
344 case PIPE_CAP_QUADS_FOLLOW_PROVOKING_VERTEX_CONVENTION:
345 case PIPE_CAP_TEXTURE_MIRROR_CLAMP:
346 case PIPE_CAP_SHADER_STENCIL_EXPORT:
347 case PIPE_CAP_SEAMLESS_CUBE_MAP_PER_TEXTURE:
348 case PIPE_CAP_INDEP_BLEND_FUNC:
349 case PIPE_CAP_TEXTURE_BARRIER:
350 case PIPE_CAP_MAX_VERTEX_STREAMS:
351 case PIPE_CAP_TGSI_CAN_COMPACT_CONSTANTS:
352 case PIPE_CAP_COMPUTE:
353 case PIPE_CAP_START_INSTANCE:
354 case PIPE_CAP_CUBE_MAP_ARRAY:
355 case PIPE_CAP_TEXTURE_BUFFER_OFFSET_ALIGNMENT:
356 case PIPE_CAP_QUERY_PIPELINE_STATISTICS:
357 case PIPE_CAP_TGSI_VS_LAYER_VIEWPORT:
358 case PIPE_CAP_MAX_TEXTURE_GATHER_COMPONENTS:
359 case PIPE_CAP_TEXTURE_GATHER_SM5:
360 case PIPE_CAP_BUFFER_MAP_PERSISTENT_COHERENT:
361 case PIPE_CAP_TEXTURE_QUERY_LOD:
362 case PIPE_CAP_SAMPLE_SHADING:
363 case PIPE_CAP_TEXTURE_GATHER_OFFSETS:
364 case PIPE_CAP_TGSI_VS_WINDOW_SPACE_POSITION:
365 case PIPE_CAP_DRAW_INDIRECT:
366 case PIPE_CAP_MULTI_DRAW_INDIRECT:
367 case PIPE_CAP_MULTI_DRAW_INDIRECT_PARAMS:
368 case PIPE_CAP_TGSI_FS_FINE_DERIVATIVE:
369 case PIPE_CAP_CONDITIONAL_RENDER_INVERTED:
370 case PIPE_CAP_SAMPLER_VIEW_TARGET:
371 case PIPE_CAP_CLIP_HALFZ:
372 case PIPE_CAP_VERTEXID_NOBASE:
373 case PIPE_CAP_POLYGON_OFFSET_CLAMP:
374 case PIPE_CAP_MULTISAMPLE_Z_RESOLVE:
375 case PIPE_CAP_TGSI_PACK_HALF_FLOAT:
376 case PIPE_CAP_SHADER_BUFFER_OFFSET_ALIGNMENT:
377 case PIPE_CAP_INVALIDATE_BUFFER:
378 case PIPE_CAP_STRING_MARKER:
379 case PIPE_CAP_SURFACE_REINTERPRET_BLOCKS:
380 case PIPE_CAP_QUERY_MEMORY_INFO:
381 case PIPE_CAP_PCI_GROUP:
382 case PIPE_CAP_PCI_BUS:
383 case PIPE_CAP_PCI_DEVICE:
384 case PIPE_CAP_PCI_FUNCTION:
385 case PIPE_CAP_ROBUST_BUFFER_ACCESS_BEHAVIOR:
386 return 0;
387 case PIPE_CAP_MIN_MAP_BUFFER_ALIGNMENT:
388 return 64;
389 case PIPE_CAP_VERTEX_BUFFER_STRIDE_4BYTE_ALIGNED_ONLY:
390 case PIPE_CAP_VERTEX_BUFFER_OFFSET_4BYTE_ALIGNED_ONLY:
391 case PIPE_CAP_VERTEX_ELEMENT_SRC_OFFSET_4BYTE_ALIGNED_ONLY:
392 return 1; /* need 4-byte alignment for all offsets and strides */
393 case PIPE_CAP_MAX_VERTEX_ATTRIB_STRIDE:
394 return 2048;
395 case PIPE_CAP_MAX_VIEWPORTS:
396 return 1;
397 case PIPE_CAP_ENDIANNESS:
398 return PIPE_ENDIAN_LITTLE;
399
400 case PIPE_CAP_VENDOR_ID:
401 return 0x15ad; /* VMware Inc. */
402 case PIPE_CAP_DEVICE_ID:
403 return 0x0405; /* assume SVGA II */
404 case PIPE_CAP_ACCELERATED:
405 return 0; /* XXX: */
406 case PIPE_CAP_VIDEO_MEMORY:
407 /* XXX: Query the host ? */
408 return 1;
409 case PIPE_CAP_COPY_BETWEEN_COMPRESSED_AND_PLAIN_FORMATS:
410 return sws->have_vgpu10;
411 case PIPE_CAP_CLEAR_TEXTURE:
412 return sws->have_vgpu10;
413 case PIPE_CAP_UMA:
414 case PIPE_CAP_RESOURCE_FROM_USER_MEMORY:
415 case PIPE_CAP_DEVICE_RESET_STATUS_QUERY:
416 case PIPE_CAP_MAX_SHADER_PATCH_VARYINGS:
417 case PIPE_CAP_TEXTURE_FLOAT_LINEAR:
418 case PIPE_CAP_TEXTURE_HALF_FLOAT_LINEAR:
419 case PIPE_CAP_DEPTH_BOUNDS_TEST:
420 case PIPE_CAP_TGSI_TXQS:
421 case PIPE_CAP_FORCE_PERSAMPLE_INTERP:
422 case PIPE_CAP_SHAREABLE_SHADERS:
423 case PIPE_CAP_DRAW_PARAMETERS:
424 case PIPE_CAP_TGSI_FS_POSITION_IS_SYSVAL:
425 case PIPE_CAP_TGSI_FS_FACE_IS_INTEGER_SYSVAL:
426 case PIPE_CAP_BUFFER_SAMPLER_VIEW_RGBA_ONLY:
427 case PIPE_CAP_QUERY_BUFFER_OBJECT:
428 case PIPE_CAP_FRAMEBUFFER_NO_ATTACHMENT:
429 case PIPE_CAP_CULL_DISTANCE:
430 case PIPE_CAP_PRIMITIVE_RESTART_FOR_PATCHES:
431 case PIPE_CAP_TGSI_VOTE:
432 case PIPE_CAP_MAX_WINDOW_RECTANGLES:
433 case PIPE_CAP_POLYGON_OFFSET_UNITS_UNSCALED:
434 case PIPE_CAP_VIEWPORT_SUBPIXEL_BITS:
435 case PIPE_CAP_TGSI_ARRAY_COMPONENTS:
436 case PIPE_CAP_TGSI_CAN_READ_OUTPUTS:
437 case PIPE_CAP_GLSL_OPTIMIZE_CONSERVATIVELY:
438 case PIPE_CAP_TGSI_FS_FBFETCH:
439 case PIPE_CAP_TGSI_MUL_ZERO_WINS:
440 case PIPE_CAP_DOUBLES:
441 case PIPE_CAP_INT64:
442 case PIPE_CAP_INT64_DIVMOD:
443 case PIPE_CAP_TGSI_TEX_TXF_LZ:
444 case PIPE_CAP_TGSI_CLOCK:
445 case PIPE_CAP_POLYGON_MODE_FILL_RECTANGLE:
446 case PIPE_CAP_SPARSE_BUFFER_PAGE_SIZE:
447 case PIPE_CAP_TGSI_BALLOT:
448 case PIPE_CAP_TGSI_TES_LAYER_VIEWPORT:
449 case PIPE_CAP_CAN_BIND_CONST_BUFFER_AS_VERTEX:
450 case PIPE_CAP_ALLOW_MAPPED_BUFFERS_DURING_EXECUTION:
451 case PIPE_CAP_POST_DEPTH_COVERAGE:
452 case PIPE_CAP_BINDLESS_TEXTURE:
453 case PIPE_CAP_NIR_SAMPLERS_AS_DEREF:
454 case PIPE_CAP_QUERY_SO_OVERFLOW:
455 case PIPE_CAP_MEMOBJ:
456 case PIPE_CAP_LOAD_CONSTBUF:
457 return 0;
458 }
459
460 debug_printf("Unexpected PIPE_CAP_ query %u\n", param);
461 return 0;
462 }
463
464
465 static int
466 vgpu9_get_shader_param(struct pipe_screen *screen,
467 enum pipe_shader_type shader,
468 enum pipe_shader_cap param)
469 {
470 struct svga_screen *svgascreen = svga_screen(screen);
471 struct svga_winsys_screen *sws = svgascreen->sws;
472 unsigned val;
473
474 assert(!sws->have_vgpu10);
475
476 switch (shader)
477 {
478 case PIPE_SHADER_FRAGMENT:
479 switch (param)
480 {
481 case PIPE_SHADER_CAP_MAX_INSTRUCTIONS:
482 case PIPE_SHADER_CAP_MAX_ALU_INSTRUCTIONS:
483 return get_uint_cap(sws,
484 SVGA3D_DEVCAP_MAX_FRAGMENT_SHADER_INSTRUCTIONS,
485 512);
486 case PIPE_SHADER_CAP_MAX_TEX_INSTRUCTIONS:
487 case PIPE_SHADER_CAP_MAX_TEX_INDIRECTIONS:
488 return 512;
489 case PIPE_SHADER_CAP_MAX_CONTROL_FLOW_DEPTH:
490 return SVGA3D_MAX_NESTING_LEVEL;
491 case PIPE_SHADER_CAP_MAX_INPUTS:
492 return 10;
493 case PIPE_SHADER_CAP_MAX_OUTPUTS:
494 return svgascreen->max_color_buffers;
495 case PIPE_SHADER_CAP_MAX_CONST_BUFFER_SIZE:
496 return 224 * sizeof(float[4]);
497 case PIPE_SHADER_CAP_MAX_CONST_BUFFERS:
498 return 1;
499 case PIPE_SHADER_CAP_MAX_TEMPS:
500 val = get_uint_cap(sws, SVGA3D_DEVCAP_MAX_FRAGMENT_SHADER_TEMPS, 32);
501 return MIN2(val, SVGA3D_TEMPREG_MAX);
502 case PIPE_SHADER_CAP_INDIRECT_INPUT_ADDR:
503 /*
504 * Although PS 3.0 has some addressing abilities it can only represent
505 * loops that can be statically determined and unrolled. Given we can
506 * only handle a subset of the cases that the state tracker already
507 * does it is better to defer loop unrolling to the state tracker.
508 */
509 return 0;
510 case PIPE_SHADER_CAP_TGSI_CONT_SUPPORTED:
511 return 0;
512 case PIPE_SHADER_CAP_TGSI_SQRT_SUPPORTED:
513 return 0;
514 case PIPE_SHADER_CAP_INDIRECT_OUTPUT_ADDR:
515 case PIPE_SHADER_CAP_INDIRECT_TEMP_ADDR:
516 case PIPE_SHADER_CAP_INDIRECT_CONST_ADDR:
517 return 0;
518 case PIPE_SHADER_CAP_SUBROUTINES:
519 return 0;
520 case PIPE_SHADER_CAP_INTEGERS:
521 return 0;
522 case PIPE_SHADER_CAP_MAX_TEXTURE_SAMPLERS:
523 case PIPE_SHADER_CAP_MAX_SAMPLER_VIEWS:
524 return 16;
525 case PIPE_SHADER_CAP_PREFERRED_IR:
526 return PIPE_SHADER_IR_TGSI;
527 case PIPE_SHADER_CAP_SUPPORTED_IRS:
528 return 0;
529 case PIPE_SHADER_CAP_TGSI_DROUND_SUPPORTED:
530 case PIPE_SHADER_CAP_TGSI_DFRACEXP_DLDEXP_SUPPORTED:
531 case PIPE_SHADER_CAP_TGSI_FMA_SUPPORTED:
532 case PIPE_SHADER_CAP_TGSI_ANY_INOUT_DECL_RANGE:
533 case PIPE_SHADER_CAP_MAX_SHADER_BUFFERS:
534 case PIPE_SHADER_CAP_MAX_SHADER_IMAGES:
535 case PIPE_SHADER_CAP_LOWER_IF_THRESHOLD:
536 case PIPE_SHADER_CAP_TGSI_SKIP_MERGE_REGISTERS:
537 return 0;
538 case PIPE_SHADER_CAP_MAX_UNROLL_ITERATIONS_HINT:
539 return 32;
540 }
541 /* If we get here, we failed to handle a cap above */
542 debug_printf("Unexpected fragment shader query %u\n", param);
543 return 0;
544 case PIPE_SHADER_VERTEX:
545 switch (param)
546 {
547 case PIPE_SHADER_CAP_MAX_INSTRUCTIONS:
548 case PIPE_SHADER_CAP_MAX_ALU_INSTRUCTIONS:
549 return get_uint_cap(sws, SVGA3D_DEVCAP_MAX_VERTEX_SHADER_INSTRUCTIONS,
550 512);
551 case PIPE_SHADER_CAP_MAX_TEX_INSTRUCTIONS:
552 case PIPE_SHADER_CAP_MAX_TEX_INDIRECTIONS:
553 /* XXX: until we have vertex texture support */
554 return 0;
555 case PIPE_SHADER_CAP_MAX_CONTROL_FLOW_DEPTH:
556 return SVGA3D_MAX_NESTING_LEVEL;
557 case PIPE_SHADER_CAP_MAX_INPUTS:
558 return 16;
559 case PIPE_SHADER_CAP_MAX_OUTPUTS:
560 return 10;
561 case PIPE_SHADER_CAP_MAX_CONST_BUFFER_SIZE:
562 return 256 * sizeof(float[4]);
563 case PIPE_SHADER_CAP_MAX_CONST_BUFFERS:
564 return 1;
565 case PIPE_SHADER_CAP_MAX_TEMPS:
566 val = get_uint_cap(sws, SVGA3D_DEVCAP_MAX_VERTEX_SHADER_TEMPS, 32);
567 return MIN2(val, SVGA3D_TEMPREG_MAX);
568 case PIPE_SHADER_CAP_TGSI_CONT_SUPPORTED:
569 return 0;
570 case PIPE_SHADER_CAP_TGSI_SQRT_SUPPORTED:
571 return 0;
572 case PIPE_SHADER_CAP_INDIRECT_INPUT_ADDR:
573 case PIPE_SHADER_CAP_INDIRECT_OUTPUT_ADDR:
574 return 1;
575 case PIPE_SHADER_CAP_INDIRECT_TEMP_ADDR:
576 return 0;
577 case PIPE_SHADER_CAP_INDIRECT_CONST_ADDR:
578 return 1;
579 case PIPE_SHADER_CAP_SUBROUTINES:
580 return 0;
581 case PIPE_SHADER_CAP_INTEGERS:
582 return 0;
583 case PIPE_SHADER_CAP_MAX_TEXTURE_SAMPLERS:
584 case PIPE_SHADER_CAP_MAX_SAMPLER_VIEWS:
585 return 0;
586 case PIPE_SHADER_CAP_PREFERRED_IR:
587 return PIPE_SHADER_IR_TGSI;
588 case PIPE_SHADER_CAP_SUPPORTED_IRS:
589 return 0;
590 case PIPE_SHADER_CAP_TGSI_DROUND_SUPPORTED:
591 case PIPE_SHADER_CAP_TGSI_DFRACEXP_DLDEXP_SUPPORTED:
592 case PIPE_SHADER_CAP_TGSI_FMA_SUPPORTED:
593 case PIPE_SHADER_CAP_TGSI_ANY_INOUT_DECL_RANGE:
594 case PIPE_SHADER_CAP_MAX_SHADER_BUFFERS:
595 case PIPE_SHADER_CAP_MAX_SHADER_IMAGES:
596 case PIPE_SHADER_CAP_LOWER_IF_THRESHOLD:
597 case PIPE_SHADER_CAP_TGSI_SKIP_MERGE_REGISTERS:
598 return 0;
599 case PIPE_SHADER_CAP_MAX_UNROLL_ITERATIONS_HINT:
600 return 32;
601 }
602 /* If we get here, we failed to handle a cap above */
603 debug_printf("Unexpected vertex shader query %u\n", param);
604 return 0;
605 case PIPE_SHADER_GEOMETRY:
606 case PIPE_SHADER_COMPUTE:
607 case PIPE_SHADER_TESS_CTRL:
608 case PIPE_SHADER_TESS_EVAL:
609 /* no support for geometry, tess or compute shaders at this time */
610 return 0;
611 default:
612 debug_printf("Unexpected shader type (%u) query\n", shader);
613 return 0;
614 }
615 return 0;
616 }
617
618
619 static int
620 vgpu10_get_shader_param(struct pipe_screen *screen,
621 enum pipe_shader_type shader,
622 enum pipe_shader_cap param)
623 {
624 struct svga_screen *svgascreen = svga_screen(screen);
625 struct svga_winsys_screen *sws = svgascreen->sws;
626
627 assert(sws->have_vgpu10);
628 (void) sws; /* silence unused var warnings in non-debug builds */
629
630 /* Only VS, GS, FS supported */
631 if (shader != PIPE_SHADER_VERTEX &&
632 shader != PIPE_SHADER_GEOMETRY &&
633 shader != PIPE_SHADER_FRAGMENT) {
634 return 0;
635 }
636
637 /* NOTE: we do not query the device for any caps/limits at this time */
638
639 /* Generally the same limits for vertex, geometry and fragment shaders */
640 switch (param) {
641 case PIPE_SHADER_CAP_MAX_INSTRUCTIONS:
642 case PIPE_SHADER_CAP_MAX_ALU_INSTRUCTIONS:
643 case PIPE_SHADER_CAP_MAX_TEX_INSTRUCTIONS:
644 case PIPE_SHADER_CAP_MAX_TEX_INDIRECTIONS:
645 return 64 * 1024;
646 case PIPE_SHADER_CAP_MAX_CONTROL_FLOW_DEPTH:
647 return 64;
648 case PIPE_SHADER_CAP_MAX_INPUTS:
649 if (shader == PIPE_SHADER_FRAGMENT)
650 return VGPU10_MAX_FS_INPUTS;
651 else if (shader == PIPE_SHADER_GEOMETRY)
652 return VGPU10_MAX_GS_INPUTS;
653 else
654 return VGPU10_MAX_VS_INPUTS;
655 case PIPE_SHADER_CAP_MAX_OUTPUTS:
656 if (shader == PIPE_SHADER_FRAGMENT)
657 return VGPU10_MAX_FS_OUTPUTS;
658 else if (shader == PIPE_SHADER_GEOMETRY)
659 return VGPU10_MAX_GS_OUTPUTS;
660 else
661 return VGPU10_MAX_VS_OUTPUTS;
662 case PIPE_SHADER_CAP_MAX_CONST_BUFFER_SIZE:
663 return VGPU10_MAX_CONSTANT_BUFFER_ELEMENT_COUNT * sizeof(float[4]);
664 case PIPE_SHADER_CAP_MAX_CONST_BUFFERS:
665 return svgascreen->max_const_buffers;
666 case PIPE_SHADER_CAP_MAX_TEMPS:
667 return VGPU10_MAX_TEMPS;
668 case PIPE_SHADER_CAP_INDIRECT_INPUT_ADDR:
669 case PIPE_SHADER_CAP_INDIRECT_OUTPUT_ADDR:
670 case PIPE_SHADER_CAP_INDIRECT_TEMP_ADDR:
671 case PIPE_SHADER_CAP_INDIRECT_CONST_ADDR:
672 return TRUE; /* XXX verify */
673 case PIPE_SHADER_CAP_TGSI_CONT_SUPPORTED:
674 case PIPE_SHADER_CAP_TGSI_SQRT_SUPPORTED:
675 case PIPE_SHADER_CAP_SUBROUTINES:
676 case PIPE_SHADER_CAP_INTEGERS:
677 return TRUE;
678 case PIPE_SHADER_CAP_MAX_TEXTURE_SAMPLERS:
679 case PIPE_SHADER_CAP_MAX_SAMPLER_VIEWS:
680 return SVGA3D_DX_MAX_SAMPLERS;
681 case PIPE_SHADER_CAP_PREFERRED_IR:
682 return PIPE_SHADER_IR_TGSI;
683 case PIPE_SHADER_CAP_SUPPORTED_IRS:
684 return 0;
685 case PIPE_SHADER_CAP_TGSI_DROUND_SUPPORTED:
686 case PIPE_SHADER_CAP_TGSI_DFRACEXP_DLDEXP_SUPPORTED:
687 case PIPE_SHADER_CAP_TGSI_FMA_SUPPORTED:
688 case PIPE_SHADER_CAP_TGSI_ANY_INOUT_DECL_RANGE:
689 case PIPE_SHADER_CAP_MAX_SHADER_BUFFERS:
690 case PIPE_SHADER_CAP_MAX_SHADER_IMAGES:
691 case PIPE_SHADER_CAP_LOWER_IF_THRESHOLD:
692 case PIPE_SHADER_CAP_TGSI_SKIP_MERGE_REGISTERS:
693 return 0;
694 case PIPE_SHADER_CAP_MAX_UNROLL_ITERATIONS_HINT:
695 return 32;
696 default:
697 debug_printf("Unexpected vgpu10 shader query %u\n", param);
698 return 0;
699 }
700 return 0;
701 }
702
703
704 static int
705 svga_get_shader_param(struct pipe_screen *screen, enum pipe_shader_type shader,
706 enum pipe_shader_cap param)
707 {
708 struct svga_screen *svgascreen = svga_screen(screen);
709 struct svga_winsys_screen *sws = svgascreen->sws;
710 if (sws->have_vgpu10) {
711 return vgpu10_get_shader_param(screen, shader, param);
712 }
713 else {
714 return vgpu9_get_shader_param(screen, shader, param);
715 }
716 }
717
718
719 /**
720 * Implement pipe_screen::is_format_supported().
721 * \param bindings bitmask of PIPE_BIND_x flags
722 */
723 static boolean
724 svga_is_format_supported( struct pipe_screen *screen,
725 enum pipe_format format,
726 enum pipe_texture_target target,
727 unsigned sample_count,
728 unsigned bindings)
729 {
730 struct svga_screen *ss = svga_screen(screen);
731 SVGA3dSurfaceFormat svga_format;
732 SVGA3dSurfaceFormatCaps caps;
733 SVGA3dSurfaceFormatCaps mask;
734
735 assert(bindings);
736
737 if (sample_count > 1) {
738 /* In ms_samples, if bit N is set it means that we support
739 * multisample with N+1 samples per pixel.
740 */
741 if ((ss->ms_samples & (1 << (sample_count - 1))) == 0) {
742 return FALSE;
743 }
744 }
745
746 svga_format = svga_translate_format(ss, format, bindings);
747 if (svga_format == SVGA3D_FORMAT_INVALID) {
748 return FALSE;
749 }
750
751 /* we don't support sRGB rendering into display targets */
752 if (util_format_is_srgb(format) && (bindings & PIPE_BIND_DISPLAY_TARGET)) {
753 return FALSE;
754 }
755
756 /*
757 * For VGPU10 vertex formats, skip querying host capabilities
758 */
759
760 if (ss->sws->have_vgpu10 && (bindings & PIPE_BIND_VERTEX_BUFFER)) {
761 SVGA3dSurfaceFormat svga_format;
762 unsigned flags;
763 svga_translate_vertex_format_vgpu10(format, &svga_format, &flags);
764 return svga_format != SVGA3D_FORMAT_INVALID;
765 }
766
767 /*
768 * Override host capabilities, so that we end up with the same
769 * visuals for all virtual hardware implementations.
770 */
771
772 if (bindings & PIPE_BIND_DISPLAY_TARGET) {
773 switch (svga_format) {
774 case SVGA3D_A8R8G8B8:
775 case SVGA3D_X8R8G8B8:
776 case SVGA3D_R5G6B5:
777 break;
778
779 /* VGPU10 formats */
780 case SVGA3D_B8G8R8A8_UNORM:
781 case SVGA3D_B8G8R8X8_UNORM:
782 case SVGA3D_B5G6R5_UNORM:
783 break;
784
785 /* Often unsupported/problematic. This means we end up with the same
786 * visuals for all virtual hardware implementations.
787 */
788 case SVGA3D_A4R4G4B4:
789 case SVGA3D_A1R5G5B5:
790 return FALSE;
791
792 default:
793 return FALSE;
794 }
795 }
796
797 /*
798 * Query the host capabilities.
799 */
800
801 svga_get_format_cap(ss, svga_format, &caps);
802
803 if (bindings & PIPE_BIND_RENDER_TARGET) {
804 /* Check that the color surface is blendable, unless it's an
805 * integer format.
806 */
807 if (!svga_format_is_integer(svga_format) &&
808 (caps.value & SVGA3DFORMAT_OP_NOALPHABLEND)) {
809 return FALSE;
810 }
811 }
812
813 mask.value = 0;
814 if (bindings & PIPE_BIND_RENDER_TARGET) {
815 mask.value |= SVGA3DFORMAT_OP_OFFSCREEN_RENDERTARGET;
816 }
817 if (bindings & PIPE_BIND_DEPTH_STENCIL) {
818 mask.value |= SVGA3DFORMAT_OP_ZSTENCIL;
819 }
820 if (bindings & PIPE_BIND_SAMPLER_VIEW) {
821 mask.value |= SVGA3DFORMAT_OP_TEXTURE;
822 }
823
824 if (target == PIPE_TEXTURE_CUBE) {
825 mask.value |= SVGA3DFORMAT_OP_CUBETEXTURE;
826 }
827 else if (target == PIPE_TEXTURE_3D) {
828 mask.value |= SVGA3DFORMAT_OP_VOLUMETEXTURE;
829 }
830
831 return (caps.value & mask.value) == mask.value;
832 }
833
834
835 static void
836 svga_fence_reference(struct pipe_screen *screen,
837 struct pipe_fence_handle **ptr,
838 struct pipe_fence_handle *fence)
839 {
840 struct svga_winsys_screen *sws = svga_screen(screen)->sws;
841 sws->fence_reference(sws, ptr, fence);
842 }
843
844
845 static boolean
846 svga_fence_finish(struct pipe_screen *screen,
847 struct pipe_context *ctx,
848 struct pipe_fence_handle *fence,
849 uint64_t timeout)
850 {
851 struct svga_winsys_screen *sws = svga_screen(screen)->sws;
852 boolean retVal;
853
854 SVGA_STATS_TIME_PUSH(sws, SVGA_STATS_TIME_FENCEFINISH);
855
856 if (!timeout) {
857 retVal = sws->fence_signalled(sws, fence, 0) == 0;
858 }
859 else {
860 SVGA_DBG(DEBUG_DMA|DEBUG_PERF, "%s fence_ptr %p\n",
861 __FUNCTION__, fence);
862
863 retVal = sws->fence_finish(sws, fence, timeout, 0) == 0;
864 }
865
866 SVGA_STATS_TIME_POP(sws);
867
868 return retVal;
869 }
870
871
872 static int
873 svga_fence_get_fd(struct pipe_screen *screen,
874 struct pipe_fence_handle *fence)
875 {
876 struct svga_winsys_screen *sws = svga_screen(screen)->sws;
877
878 return sws->fence_get_fd(sws, fence, TRUE);
879 }
880
881
882 static int
883 svga_get_driver_query_info(struct pipe_screen *screen,
884 unsigned index,
885 struct pipe_driver_query_info *info)
886 {
887 #define QUERY(NAME, ENUM, UNITS) \
888 {NAME, ENUM, {0}, UNITS, PIPE_DRIVER_QUERY_RESULT_TYPE_AVERAGE, 0, 0x0}
889
890 static const struct pipe_driver_query_info queries[] = {
891 /* per-frame counters */
892 QUERY("num-draw-calls", SVGA_QUERY_NUM_DRAW_CALLS,
893 PIPE_DRIVER_QUERY_TYPE_UINT64),
894 QUERY("num-fallbacks", SVGA_QUERY_NUM_FALLBACKS,
895 PIPE_DRIVER_QUERY_TYPE_UINT64),
896 QUERY("num-flushes", SVGA_QUERY_NUM_FLUSHES,
897 PIPE_DRIVER_QUERY_TYPE_UINT64),
898 QUERY("num-validations", SVGA_QUERY_NUM_VALIDATIONS,
899 PIPE_DRIVER_QUERY_TYPE_UINT64),
900 QUERY("map-buffer-time", SVGA_QUERY_MAP_BUFFER_TIME,
901 PIPE_DRIVER_QUERY_TYPE_MICROSECONDS),
902 QUERY("num-buffers-mapped", SVGA_QUERY_NUM_BUFFERS_MAPPED,
903 PIPE_DRIVER_QUERY_TYPE_UINT64),
904 QUERY("num-textures-mapped", SVGA_QUERY_NUM_TEXTURES_MAPPED,
905 PIPE_DRIVER_QUERY_TYPE_UINT64),
906 QUERY("num-bytes-uploaded", SVGA_QUERY_NUM_BYTES_UPLOADED,
907 PIPE_DRIVER_QUERY_TYPE_BYTES),
908 QUERY("command-buffer-size", SVGA_QUERY_COMMAND_BUFFER_SIZE,
909 PIPE_DRIVER_QUERY_TYPE_BYTES),
910 QUERY("flush-time", SVGA_QUERY_FLUSH_TIME,
911 PIPE_DRIVER_QUERY_TYPE_MICROSECONDS),
912 QUERY("surface-write-flushes", SVGA_QUERY_SURFACE_WRITE_FLUSHES,
913 PIPE_DRIVER_QUERY_TYPE_UINT64),
914 QUERY("num-readbacks", SVGA_QUERY_NUM_READBACKS,
915 PIPE_DRIVER_QUERY_TYPE_UINT64),
916 QUERY("num-resource-updates", SVGA_QUERY_NUM_RESOURCE_UPDATES,
917 PIPE_DRIVER_QUERY_TYPE_UINT64),
918 QUERY("num-buffer-uploads", SVGA_QUERY_NUM_BUFFER_UPLOADS,
919 PIPE_DRIVER_QUERY_TYPE_UINT64),
920 QUERY("num-const-buf-updates", SVGA_QUERY_NUM_CONST_BUF_UPDATES,
921 PIPE_DRIVER_QUERY_TYPE_UINT64),
922 QUERY("num-const-updates", SVGA_QUERY_NUM_CONST_UPDATES,
923 PIPE_DRIVER_QUERY_TYPE_UINT64),
924
925 /* running total counters */
926 QUERY("memory-used", SVGA_QUERY_MEMORY_USED,
927 PIPE_DRIVER_QUERY_TYPE_BYTES),
928 QUERY("num-shaders", SVGA_QUERY_NUM_SHADERS,
929 PIPE_DRIVER_QUERY_TYPE_UINT64),
930 QUERY("num-resources", SVGA_QUERY_NUM_RESOURCES,
931 PIPE_DRIVER_QUERY_TYPE_UINT64),
932 QUERY("num-state-objects", SVGA_QUERY_NUM_STATE_OBJECTS,
933 PIPE_DRIVER_QUERY_TYPE_UINT64),
934 QUERY("num-surface-views", SVGA_QUERY_NUM_SURFACE_VIEWS,
935 PIPE_DRIVER_QUERY_TYPE_UINT64),
936 QUERY("num-generate-mipmap", SVGA_QUERY_NUM_GENERATE_MIPMAP,
937 PIPE_DRIVER_QUERY_TYPE_UINT64),
938 QUERY("num-failed-allocations", SVGA_QUERY_NUM_FAILED_ALLOCATIONS,
939 PIPE_DRIVER_QUERY_TYPE_UINT64),
940 };
941 #undef QUERY
942
943 if (!info)
944 return ARRAY_SIZE(queries);
945
946 if (index >= ARRAY_SIZE(queries))
947 return 0;
948
949 *info = queries[index];
950 return 1;
951 }
952
953
954 static void
955 init_logging(struct pipe_screen *screen)
956 {
957 static const char *log_prefix = "Mesa: ";
958 char host_log[1000];
959
960 /* Log Version to Host */
961 util_snprintf(host_log, sizeof(host_log) - strlen(log_prefix),
962 "%s%s", log_prefix, svga_get_name(screen));
963 svga_host_log(host_log);
964
965 util_snprintf(host_log, sizeof(host_log) - strlen(log_prefix),
966 "%s%s (%s)", log_prefix, PACKAGE_VERSION, MESA_GIT_SHA1);
967 svga_host_log(host_log);
968
969 /* If the SVGA_EXTRA_LOGGING env var is set, log the process's command
970 * line (program name and arguments).
971 */
972 if (debug_get_bool_option("SVGA_EXTRA_LOGGING", FALSE)) {
973 char cmdline[1000];
974 if (os_get_command_line(cmdline, sizeof(cmdline))) {
975 util_snprintf(host_log, sizeof(host_log) - strlen(log_prefix),
976 "%s%s", log_prefix, cmdline);
977 svga_host_log(host_log);
978 }
979 }
980 }
981
982
983 static void
984 svga_destroy_screen( struct pipe_screen *screen )
985 {
986 struct svga_screen *svgascreen = svga_screen(screen);
987
988 svga_screen_cache_cleanup(svgascreen);
989
990 mtx_destroy(&svgascreen->swc_mutex);
991 mtx_destroy(&svgascreen->tex_mutex);
992
993 svgascreen->sws->destroy(svgascreen->sws);
994
995 FREE(svgascreen);
996 }
997
998
999 /**
1000 * Create a new svga_screen object
1001 */
1002 struct pipe_screen *
1003 svga_screen_create(struct svga_winsys_screen *sws)
1004 {
1005 struct svga_screen *svgascreen;
1006 struct pipe_screen *screen;
1007
1008 #ifdef DEBUG
1009 SVGA_DEBUG = debug_get_flags_option("SVGA_DEBUG", svga_debug_flags, 0 );
1010 #endif
1011
1012 svgascreen = CALLOC_STRUCT(svga_screen);
1013 if (!svgascreen)
1014 goto error1;
1015
1016 svgascreen->debug.force_level_surface_view =
1017 debug_get_bool_option("SVGA_FORCE_LEVEL_SURFACE_VIEW", FALSE);
1018 svgascreen->debug.force_surface_view =
1019 debug_get_bool_option("SVGA_FORCE_SURFACE_VIEW", FALSE);
1020 svgascreen->debug.force_sampler_view =
1021 debug_get_bool_option("SVGA_FORCE_SAMPLER_VIEW", FALSE);
1022 svgascreen->debug.no_surface_view =
1023 debug_get_bool_option("SVGA_NO_SURFACE_VIEW", FALSE);
1024 svgascreen->debug.no_sampler_view =
1025 debug_get_bool_option("SVGA_NO_SAMPLER_VIEW", FALSE);
1026 svgascreen->debug.no_cache_index_buffers =
1027 debug_get_bool_option("SVGA_NO_CACHE_INDEX_BUFFERS", FALSE);
1028
1029 screen = &svgascreen->screen;
1030
1031 screen->destroy = svga_destroy_screen;
1032 screen->get_name = svga_get_name;
1033 screen->get_vendor = svga_get_vendor;
1034 screen->get_device_vendor = svga_get_vendor; // TODO actual device vendor
1035 screen->get_param = svga_get_param;
1036 screen->get_shader_param = svga_get_shader_param;
1037 screen->get_paramf = svga_get_paramf;
1038 screen->get_timestamp = NULL;
1039 screen->is_format_supported = svga_is_format_supported;
1040 screen->context_create = svga_context_create;
1041 screen->fence_reference = svga_fence_reference;
1042 screen->fence_finish = svga_fence_finish;
1043 screen->fence_get_fd = svga_fence_get_fd;
1044
1045 screen->get_driver_query_info = svga_get_driver_query_info;
1046 svgascreen->sws = sws;
1047
1048 svga_init_screen_resource_functions(svgascreen);
1049
1050 if (sws->get_hw_version) {
1051 svgascreen->hw_version = sws->get_hw_version(sws);
1052 } else {
1053 svgascreen->hw_version = SVGA3D_HWVERSION_WS65_B1;
1054 }
1055
1056 if (svgascreen->hw_version < SVGA3D_HWVERSION_WS8_B1) {
1057 /* too old for 3D acceleration */
1058 debug_printf("Hardware version 0x%x is too old for accerated 3D\n",
1059 svgascreen->hw_version);
1060 goto error2;
1061 }
1062
1063 /*
1064 * The D16, D24X8, and D24S8 formats always do an implicit shadow compare
1065 * when sampled from, where as the DF16, DF24, and D24S8_INT do not. So
1066 * we prefer the later when available.
1067 *
1068 * This mimics hardware vendors extensions for D3D depth sampling. See also
1069 * http://aras-p.info/texts/D3D9GPUHacks.html
1070 */
1071
1072 {
1073 boolean has_df16, has_df24, has_d24s8_int;
1074 SVGA3dSurfaceFormatCaps caps;
1075 SVGA3dSurfaceFormatCaps mask;
1076 mask.value = 0;
1077 mask.zStencil = 1;
1078 mask.texture = 1;
1079
1080 svgascreen->depth.z16 = SVGA3D_Z_D16;
1081 svgascreen->depth.x8z24 = SVGA3D_Z_D24X8;
1082 svgascreen->depth.s8z24 = SVGA3D_Z_D24S8;
1083
1084 svga_get_format_cap(svgascreen, SVGA3D_Z_DF16, &caps);
1085 has_df16 = (caps.value & mask.value) == mask.value;
1086
1087 svga_get_format_cap(svgascreen, SVGA3D_Z_DF24, &caps);
1088 has_df24 = (caps.value & mask.value) == mask.value;
1089
1090 svga_get_format_cap(svgascreen, SVGA3D_Z_D24S8_INT, &caps);
1091 has_d24s8_int = (caps.value & mask.value) == mask.value;
1092
1093 /* XXX: We might want some other logic here.
1094 * Like if we only have d24s8_int we should
1095 * emulate the other formats with that.
1096 */
1097 if (has_df16) {
1098 svgascreen->depth.z16 = SVGA3D_Z_DF16;
1099 }
1100 if (has_df24) {
1101 svgascreen->depth.x8z24 = SVGA3D_Z_DF24;
1102 }
1103 if (has_d24s8_int) {
1104 svgascreen->depth.s8z24 = SVGA3D_Z_D24S8_INT;
1105 }
1106 }
1107
1108 /* Query device caps
1109 */
1110 if (sws->have_vgpu10) {
1111 svgascreen->haveProvokingVertex
1112 = get_bool_cap(sws, SVGA3D_DEVCAP_DX_PROVOKING_VERTEX, FALSE);
1113 svgascreen->haveLineSmooth = TRUE;
1114 svgascreen->maxPointSize = 80.0F;
1115 svgascreen->max_color_buffers = SVGA3D_DX_MAX_RENDER_TARGETS;
1116
1117 /* Multisample samples per pixel */
1118 if (debug_get_bool_option("SVGA_MSAA", TRUE)) {
1119 svgascreen->ms_samples =
1120 get_uint_cap(sws, SVGA3D_DEVCAP_MULTISAMPLE_MASKABLESAMPLES, 0);
1121 }
1122
1123 /* We only support 4x, 8x, 16x MSAA */
1124 svgascreen->ms_samples &= ((1 << (4-1)) |
1125 (1 << (8-1)) |
1126 (1 << (16-1)));
1127
1128 /* Maximum number of constant buffers */
1129 svgascreen->max_const_buffers =
1130 get_uint_cap(sws, SVGA3D_DEVCAP_DX_MAX_CONSTANT_BUFFERS, 1);
1131 assert(svgascreen->max_const_buffers <= SVGA_MAX_CONST_BUFS);
1132 }
1133 else {
1134 /* VGPU9 */
1135 unsigned vs_ver = get_uint_cap(sws, SVGA3D_DEVCAP_VERTEX_SHADER_VERSION,
1136 SVGA3DVSVERSION_NONE);
1137 unsigned fs_ver = get_uint_cap(sws, SVGA3D_DEVCAP_FRAGMENT_SHADER_VERSION,
1138 SVGA3DPSVERSION_NONE);
1139
1140 /* we require Shader model 3.0 or later */
1141 if (fs_ver < SVGA3DPSVERSION_30 || vs_ver < SVGA3DVSVERSION_30) {
1142 goto error2;
1143 }
1144
1145 svgascreen->haveProvokingVertex = FALSE;
1146
1147 svgascreen->haveLineSmooth =
1148 get_bool_cap(sws, SVGA3D_DEVCAP_LINE_AA, FALSE);
1149
1150 svgascreen->maxPointSize =
1151 get_float_cap(sws, SVGA3D_DEVCAP_MAX_POINT_SIZE, 1.0f);
1152 /* Keep this to a reasonable size to avoid failures in conform/pntaa.c */
1153 svgascreen->maxPointSize = MIN2(svgascreen->maxPointSize, 80.0f);
1154
1155 /* The SVGA3D device always supports 4 targets at this time, regardless
1156 * of what querying SVGA3D_DEVCAP_MAX_RENDER_TARGETS might return.
1157 */
1158 svgascreen->max_color_buffers = 4;
1159
1160 /* Only support one constant buffer
1161 */
1162 svgascreen->max_const_buffers = 1;
1163
1164 /* No multisampling */
1165 svgascreen->ms_samples = 0;
1166 }
1167
1168 /* common VGPU9 / VGPU10 caps */
1169 svgascreen->haveLineStipple =
1170 get_bool_cap(sws, SVGA3D_DEVCAP_LINE_STIPPLE, FALSE);
1171
1172 svgascreen->maxLineWidth =
1173 MAX2(1.0, get_float_cap(sws, SVGA3D_DEVCAP_MAX_LINE_WIDTH, 1.0f));
1174
1175 svgascreen->maxLineWidthAA =
1176 MAX2(1.0, get_float_cap(sws, SVGA3D_DEVCAP_MAX_AA_LINE_WIDTH, 1.0f));
1177
1178 if (0) {
1179 debug_printf("svga: haveProvokingVertex %u\n",
1180 svgascreen->haveProvokingVertex);
1181 debug_printf("svga: haveLineStip %u "
1182 "haveLineSmooth %u maxLineWidth %.2f maxLineWidthAA %.2f\n",
1183 svgascreen->haveLineStipple, svgascreen->haveLineSmooth,
1184 svgascreen->maxLineWidth, svgascreen->maxLineWidthAA);
1185 debug_printf("svga: maxPointSize %g\n", svgascreen->maxPointSize);
1186 debug_printf("svga: msaa samples mask: 0x%x\n", svgascreen->ms_samples);
1187 }
1188
1189 (void) mtx_init(&svgascreen->tex_mutex, mtx_plain);
1190 (void) mtx_init(&svgascreen->swc_mutex, mtx_recursive);
1191
1192 svga_screen_cache_init(svgascreen);
1193
1194 init_logging(screen);
1195
1196 return screen;
1197 error2:
1198 FREE(svgascreen);
1199 error1:
1200 return NULL;
1201 }
1202
1203 struct svga_winsys_screen *
1204 svga_winsys_screen(struct pipe_screen *screen)
1205 {
1206 return svga_screen(screen)->sws;
1207 }
1208
#ifdef DEBUG
/**
 * Debug-build cast from a pipe_screen to the svga_screen.
 *
 * Asserts that the pointer is non-NULL and that its destroy hook is
 * svga_destroy_screen before casting.
 */
struct svga_screen *
svga_screen(struct pipe_screen *screen)
{
   struct svga_screen *svgascreen;

   assert(screen);
   assert(screen->destroy == svga_destroy_screen);

   svgascreen = (struct svga_screen *)screen;
   return svgascreen;
}
#endif