gallium: add shader caps INT16 and FP16_DERIVATIVES
[mesa.git] / src / gallium / drivers / svga / svga_screen.c
1 /**********************************************************
2 * Copyright 2008-2009 VMware, Inc. All rights reserved.
3 *
4 * Permission is hereby granted, free of charge, to any person
5 * obtaining a copy of this software and associated documentation
6 * files (the "Software"), to deal in the Software without
7 * restriction, including without limitation the rights to use, copy,
8 * modify, merge, publish, distribute, sublicense, and/or sell copies
9 * of the Software, and to permit persons to whom the Software is
10 * furnished to do so, subject to the following conditions:
11 *
12 * The above copyright notice and this permission notice shall be
13 * included in all copies or substantial portions of the Software.
14 *
15 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
16 * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
17 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
18 * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
19 * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
20 * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
21 * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
22 * SOFTWARE.
23 *
24 **********************************************************/
25
26 #include "git_sha1.h" /* For MESA_GIT_SHA1 */
27 #include "util/format/u_format.h"
28 #include "util/u_memory.h"
29 #include "util/u_inlines.h"
30 #include "util/u_screen.h"
31 #include "util/u_string.h"
32 #include "util/u_math.h"
33
34 #include "os/os_process.h"
35
36 #include "svga_winsys.h"
37 #include "svga_public.h"
38 #include "svga_context.h"
39 #include "svga_format.h"
40 #include "svga_screen.h"
41 #include "svga_tgsi.h"
42 #include "svga_resource_texture.h"
43 #include "svga_resource.h"
44 #include "svga_debug.h"
45
46 #include "svga3d_shaderdefs.h"
47 #include "VGPU10ShaderTokens.h"
48
49 /* NOTE: this constant may get moved into a svga3d*.h header file */
50 #define SVGA3D_DX_MAX_RESOURCE_SIZE (128 * 1024 * 1024)
51
52 #ifdef DEBUG
53 int SVGA_DEBUG = 0;
54
55 static const struct debug_named_value svga_debug_flags[] = {
56 { "dma", DEBUG_DMA, NULL },
57 { "tgsi", DEBUG_TGSI, NULL },
58 { "pipe", DEBUG_PIPE, NULL },
59 { "state", DEBUG_STATE, NULL },
60 { "screen", DEBUG_SCREEN, NULL },
61 { "tex", DEBUG_TEX, NULL },
62 { "swtnl", DEBUG_SWTNL, NULL },
63 { "const", DEBUG_CONSTS, NULL },
64 { "viewport", DEBUG_VIEWPORT, NULL },
65 { "views", DEBUG_VIEWS, NULL },
66 { "perf", DEBUG_PERF, NULL },
67 { "flush", DEBUG_FLUSH, NULL },
68 { "sync", DEBUG_SYNC, NULL },
69 { "cache", DEBUG_CACHE, NULL },
70 { "streamout", DEBUG_STREAMOUT, NULL },
71 { "query", DEBUG_QUERY, NULL },
72 { "samplers", DEBUG_SAMPLERS, NULL },
73 DEBUG_NAMED_VALUE_END
74 };
75 #endif
76
77 static const char *
78 svga_get_vendor( struct pipe_screen *pscreen )
79 {
80 return "VMware, Inc.";
81 }
82
83
84 static const char *
85 svga_get_name( struct pipe_screen *pscreen )
86 {
87 const char *build = "", *llvm = "", *mutex = "";
88 static char name[100];
89 #ifdef DEBUG
90 /* Only return internal details in the DEBUG version:
91 */
92 build = "build: DEBUG;";
93 mutex = "mutex: " PIPE_ATOMIC ";";
94 #else
95 build = "build: RELEASE;";
96 #endif
97 #ifdef LLVM_AVAILABLE
98 llvm = "LLVM;";
99 #endif
100
101 snprintf(name, sizeof(name), "SVGA3D; %s %s %s", build, mutex, llvm);
102 return name;
103 }
104
105
106 /** Helper for querying float-valued device cap */
107 static float
108 get_float_cap(struct svga_winsys_screen *sws, SVGA3dDevCapIndex cap,
109 float defaultVal)
110 {
111 SVGA3dDevCapResult result;
112 if (sws->get_cap(sws, cap, &result))
113 return result.f;
114 else
115 return defaultVal;
116 }
117
118
119 /** Helper for querying uint-valued device cap */
120 static unsigned
121 get_uint_cap(struct svga_winsys_screen *sws, SVGA3dDevCapIndex cap,
122 unsigned defaultVal)
123 {
124 SVGA3dDevCapResult result;
125 if (sws->get_cap(sws, cap, &result))
126 return result.u;
127 else
128 return defaultVal;
129 }
130
131
132 /** Helper for querying boolean-valued device cap */
133 static boolean
134 get_bool_cap(struct svga_winsys_screen *sws, SVGA3dDevCapIndex cap,
135 boolean defaultVal)
136 {
137 SVGA3dDevCapResult result;
138 if (sws->get_cap(sws, cap, &result))
139 return result.b;
140 else
141 return defaultVal;
142 }
143
144
145 static float
146 svga_get_paramf(struct pipe_screen *screen, enum pipe_capf param)
147 {
148 struct svga_screen *svgascreen = svga_screen(screen);
149 struct svga_winsys_screen *sws = svgascreen->sws;
150
151 switch (param) {
152 case PIPE_CAPF_MAX_LINE_WIDTH:
153 return svgascreen->maxLineWidth;
154 case PIPE_CAPF_MAX_LINE_WIDTH_AA:
155 return svgascreen->maxLineWidthAA;
156
157 case PIPE_CAPF_MAX_POINT_WIDTH:
158 /* fall-through */
159 case PIPE_CAPF_MAX_POINT_WIDTH_AA:
160 return svgascreen->maxPointSize;
161
162 case PIPE_CAPF_MAX_TEXTURE_ANISOTROPY:
163 return (float) get_uint_cap(sws, SVGA3D_DEVCAP_MAX_TEXTURE_ANISOTROPY, 4);
164
165 case PIPE_CAPF_MAX_TEXTURE_LOD_BIAS:
166 return 15.0;
167
168 case PIPE_CAPF_MIN_CONSERVATIVE_RASTER_DILATE:
169 /* fall-through */
170 case PIPE_CAPF_MAX_CONSERVATIVE_RASTER_DILATE:
171 /* fall-through */
172 case PIPE_CAPF_CONSERVATIVE_RASTER_DILATE_GRANULARITY:
173 return 0.0f;
174
175 }
176
177 debug_printf("Unexpected PIPE_CAPF_ query %u\n", param);
178 return 0;
179 }
180
181
182 static int
183 svga_get_param(struct pipe_screen *screen, enum pipe_cap param)
184 {
185 struct svga_screen *svgascreen = svga_screen(screen);
186 struct svga_winsys_screen *sws = svgascreen->sws;
187 SVGA3dDevCapResult result;
188
189 switch (param) {
190 case PIPE_CAP_NPOT_TEXTURES:
191 case PIPE_CAP_MIXED_FRAMEBUFFER_SIZES:
192 case PIPE_CAP_MIXED_COLOR_DEPTH_BITS:
193 return 1;
194 case PIPE_CAP_MAX_DUAL_SOURCE_RENDER_TARGETS:
195 /*
196 * "In virtually every OpenGL implementation and hardware,
197 * GL_MAX_DUAL_SOURCE_DRAW_BUFFERS is 1"
198 * http://www.opengl.org/wiki/Blending
199 */
200 return sws->have_vgpu10 ? 1 : 0;
201 case PIPE_CAP_ANISOTROPIC_FILTER:
202 return 1;
203 case PIPE_CAP_POINT_SPRITE:
204 return 1;
205 case PIPE_CAP_TGSI_TEXCOORD:
206 return 0;
207 case PIPE_CAP_MAX_RENDER_TARGETS:
208 return svgascreen->max_color_buffers;
209 case PIPE_CAP_OCCLUSION_QUERY:
210 return 1;
211 case PIPE_CAP_QUERY_TIME_ELAPSED:
212 return 0;
213 case PIPE_CAP_TEXTURE_BUFFER_OBJECTS:
214 return sws->have_vgpu10;
215 case PIPE_CAP_TEXTURE_SWIZZLE:
216 return 1;
217 case PIPE_CAP_TEXTURE_BORDER_COLOR_QUIRK:
218 return 0;
219 case PIPE_CAP_USER_VERTEX_BUFFERS:
220 return 0;
221 case PIPE_CAP_CONSTANT_BUFFER_OFFSET_ALIGNMENT:
222 return 256;
223
224 case PIPE_CAP_MAX_TEXTURE_2D_SIZE:
225 {
226 unsigned size = 1 << (SVGA_MAX_TEXTURE_LEVELS - 1);
227 if (sws->get_cap(sws, SVGA3D_DEVCAP_MAX_TEXTURE_WIDTH, &result))
228 size = MIN2(result.u, size);
229 else
230 size = 2048;
231 if (sws->get_cap(sws, SVGA3D_DEVCAP_MAX_TEXTURE_HEIGHT, &result))
232 size = MIN2(result.u, size);
233 else
234 size = 2048;
235 return size;
236 }
237
238 case PIPE_CAP_MAX_TEXTURE_3D_LEVELS:
239 if (!sws->get_cap(sws, SVGA3D_DEVCAP_MAX_VOLUME_EXTENT, &result))
240 return 8; /* max 128x128x128 */
241 return MIN2(util_logbase2(result.u) + 1, SVGA_MAX_TEXTURE_LEVELS);
242
243 case PIPE_CAP_MAX_TEXTURE_CUBE_LEVELS:
244 /*
245 * No mechanism to query the host, and at least limited to 2048x2048 on
246 * certain hardware.
247 */
248 return MIN2(util_last_bit(screen->get_param(screen, PIPE_CAP_MAX_TEXTURE_2D_SIZE)),
249 12 /* 2048x2048 */);
250
251 case PIPE_CAP_MAX_TEXTURE_ARRAY_LAYERS:
252 return sws->have_vgpu10 ? SVGA3D_MAX_SURFACE_ARRAYSIZE : 0;
253
254 case PIPE_CAP_BLEND_EQUATION_SEPARATE: /* req. for GL 1.5 */
255 return 1;
256
257 case PIPE_CAP_TGSI_FS_COORD_ORIGIN_UPPER_LEFT:
258 return 1;
259 case PIPE_CAP_TGSI_FS_COORD_PIXEL_CENTER_HALF_INTEGER:
260 return sws->have_vgpu10;
261 case PIPE_CAP_TGSI_FS_COORD_ORIGIN_LOWER_LEFT:
262 return 0;
263 case PIPE_CAP_TGSI_FS_COORD_PIXEL_CENTER_INTEGER:
264 return !sws->have_vgpu10;
265
266 case PIPE_CAP_VERTEX_COLOR_UNCLAMPED:
267 return 1; /* The color outputs of vertex shaders are not clamped */
268 case PIPE_CAP_VERTEX_COLOR_CLAMPED:
269 return 0; /* The driver can't clamp vertex colors */
270 case PIPE_CAP_FRAGMENT_COLOR_CLAMPED:
271 return 0; /* The driver can't clamp fragment colors */
272
273 case PIPE_CAP_MIXED_COLORBUFFER_FORMATS:
274 return 1; /* expected for GL_ARB_framebuffer_object */
275
276 case PIPE_CAP_GLSL_FEATURE_LEVEL:
277 return sws->have_vgpu10 ? 330 : 120;
278
279 case PIPE_CAP_GLSL_FEATURE_LEVEL_COMPATIBILITY:
280 return sws->have_vgpu10 ? 330 : 120;
281
282 case PIPE_CAP_PREFER_BLIT_BASED_TEXTURE_TRANSFER:
283 case PIPE_CAP_DEPTH_CLIP_DISABLE_SEPARATE:
284 return 0;
285
286 case PIPE_CAP_FRAGMENT_SHADER_TEXTURE_LOD:
287 case PIPE_CAP_FRAGMENT_SHADER_DERIVATIVES:
288 case PIPE_CAP_VERTEX_SHADER_SATURATE:
289 return 1;
290
291 case PIPE_CAP_DEPTH_CLIP_DISABLE:
292 case PIPE_CAP_INDEP_BLEND_ENABLE:
293 case PIPE_CAP_CONDITIONAL_RENDER:
294 case PIPE_CAP_QUERY_TIMESTAMP:
295 case PIPE_CAP_TGSI_INSTANCEID:
296 case PIPE_CAP_VERTEX_ELEMENT_INSTANCE_DIVISOR:
297 case PIPE_CAP_SEAMLESS_CUBE_MAP:
298 case PIPE_CAP_FAKE_SW_MSAA:
299 return sws->have_vgpu10;
300
301 case PIPE_CAP_MAX_STREAM_OUTPUT_BUFFERS:
302 return sws->have_vgpu10 ? SVGA3D_DX_MAX_SOTARGETS : 0;
303 case PIPE_CAP_MAX_STREAM_OUTPUT_SEPARATE_COMPONENTS:
304 return sws->have_vgpu10 ? 4 : 0;
305 case PIPE_CAP_MAX_STREAM_OUTPUT_INTERLEAVED_COMPONENTS:
306 return sws->have_vgpu10 ? SVGA3D_MAX_STREAMOUT_DECLS : 0;
307 case PIPE_CAP_STREAM_OUTPUT_PAUSE_RESUME:
308 case PIPE_CAP_STREAM_OUTPUT_INTERLEAVE_BUFFERS:
309 return 0;
310 case PIPE_CAP_TEXTURE_MULTISAMPLE:
311 return svgascreen->ms_samples ? 1 : 0;
312
313 case PIPE_CAP_MAX_TEXTURE_BUFFER_SIZE:
314 /* convert bytes to texels for the case of the largest texel
315 * size: float[4].
316 */
317 return SVGA3D_DX_MAX_RESOURCE_SIZE / (4 * sizeof(float));
318
319 case PIPE_CAP_MIN_TEXEL_OFFSET:
320 return sws->have_vgpu10 ? VGPU10_MIN_TEXEL_FETCH_OFFSET : 0;
321 case PIPE_CAP_MAX_TEXEL_OFFSET:
322 return sws->have_vgpu10 ? VGPU10_MAX_TEXEL_FETCH_OFFSET : 0;
323
324 case PIPE_CAP_MIN_TEXTURE_GATHER_OFFSET:
325 case PIPE_CAP_MAX_TEXTURE_GATHER_OFFSET:
326 return 0;
327
328 case PIPE_CAP_MAX_GEOMETRY_OUTPUT_VERTICES:
329 return sws->have_vgpu10 ? 256 : 0;
330 case PIPE_CAP_MAX_GEOMETRY_TOTAL_OUTPUT_COMPONENTS:
331 return sws->have_vgpu10 ? 1024 : 0;
332
333 case PIPE_CAP_PRIMITIVE_RESTART:
334 return 1; /* may be a sw fallback, depending on restart index */
335
336 case PIPE_CAP_GENERATE_MIPMAP:
337 return sws->have_generate_mipmap_cmd;
338
339 case PIPE_CAP_NATIVE_FENCE_FD:
340 return sws->have_fence_fd;
341
342 case PIPE_CAP_QUADS_FOLLOW_PROVOKING_VERTEX_CONVENTION:
343 return 1;
344
345 case PIPE_CAP_CUBE_MAP_ARRAY:
346 case PIPE_CAP_INDEP_BLEND_FUNC:
347 case PIPE_CAP_SAMPLE_SHADING:
348 case PIPE_CAP_FORCE_PERSAMPLE_INTERP:
349 case PIPE_CAP_TEXTURE_QUERY_LOD:
350 return sws->have_sm4_1;
351
352 case PIPE_CAP_MAX_TEXTURE_GATHER_COMPONENTS:
353 return sws->have_sm4_1 ? 1 : 0; /* only single-channel textures */
354 case PIPE_CAP_MAX_VARYINGS:
355 return sws->have_vgpu10 ? VGPU10_MAX_FS_INPUTS : 10;
356 case PIPE_CAP_BUFFER_MAP_PERSISTENT_COHERENT:
357 return sws->have_coherent;
358
359 /* Unsupported features */
360 case PIPE_CAP_TEXTURE_MIRROR_CLAMP:
361 case PIPE_CAP_TEXTURE_MIRROR_CLAMP_TO_EDGE:
362 case PIPE_CAP_SHADER_STENCIL_EXPORT:
363 case PIPE_CAP_SEAMLESS_CUBE_MAP_PER_TEXTURE:
364 case PIPE_CAP_TEXTURE_BARRIER:
365 case PIPE_CAP_MAX_VERTEX_STREAMS:
366 case PIPE_CAP_TGSI_CAN_COMPACT_CONSTANTS:
367 case PIPE_CAP_COMPUTE:
368 case PIPE_CAP_START_INSTANCE:
369 case PIPE_CAP_TEXTURE_BUFFER_OFFSET_ALIGNMENT:
370 case PIPE_CAP_QUERY_PIPELINE_STATISTICS:
371 case PIPE_CAP_TGSI_VS_LAYER_VIEWPORT:
372 case PIPE_CAP_TEXTURE_GATHER_SM5:
373 case PIPE_CAP_TEXTURE_GATHER_OFFSETS:
374 case PIPE_CAP_TGSI_VS_WINDOW_SPACE_POSITION:
375 case PIPE_CAP_DRAW_INDIRECT:
376 case PIPE_CAP_MULTI_DRAW_INDIRECT:
377 case PIPE_CAP_MULTI_DRAW_INDIRECT_PARAMS:
378 case PIPE_CAP_TGSI_FS_FINE_DERIVATIVE:
379 case PIPE_CAP_CONDITIONAL_RENDER_INVERTED:
380 case PIPE_CAP_SAMPLER_VIEW_TARGET:
381 case PIPE_CAP_CLIP_HALFZ:
382 case PIPE_CAP_VERTEXID_NOBASE:
383 case PIPE_CAP_POLYGON_OFFSET_CLAMP:
384 case PIPE_CAP_MULTISAMPLE_Z_RESOLVE:
385 case PIPE_CAP_TGSI_PACK_HALF_FLOAT:
386 case PIPE_CAP_SHADER_BUFFER_OFFSET_ALIGNMENT:
387 case PIPE_CAP_INVALIDATE_BUFFER:
388 case PIPE_CAP_STRING_MARKER:
389 case PIPE_CAP_SURFACE_REINTERPRET_BLOCKS:
390 case PIPE_CAP_QUERY_MEMORY_INFO:
391 case PIPE_CAP_PCI_GROUP:
392 case PIPE_CAP_PCI_BUS:
393 case PIPE_CAP_PCI_DEVICE:
394 case PIPE_CAP_PCI_FUNCTION:
395 case PIPE_CAP_ROBUST_BUFFER_ACCESS_BEHAVIOR:
396 case PIPE_CAP_CONSERVATIVE_RASTER_POST_SNAP_TRIANGLES:
397 case PIPE_CAP_CONSERVATIVE_RASTER_POST_SNAP_POINTS_LINES:
398 case PIPE_CAP_CONSERVATIVE_RASTER_PRE_SNAP_TRIANGLES:
399 case PIPE_CAP_CONSERVATIVE_RASTER_PRE_SNAP_POINTS_LINES:
400 case PIPE_CAP_CONSERVATIVE_RASTER_POST_DEPTH_COVERAGE:
401 case PIPE_CAP_MAX_CONSERVATIVE_RASTER_SUBPIXEL_PRECISION_BIAS:
402 case PIPE_CAP_MAX_TEXTURE_UPLOAD_MEMORY_BUDGET:
403 return 0;
404 case PIPE_CAP_MIN_MAP_BUFFER_ALIGNMENT:
405 return 64;
406 case PIPE_CAP_VERTEX_BUFFER_STRIDE_4BYTE_ALIGNED_ONLY:
407 case PIPE_CAP_VERTEX_BUFFER_OFFSET_4BYTE_ALIGNED_ONLY:
408 case PIPE_CAP_VERTEX_ELEMENT_SRC_OFFSET_4BYTE_ALIGNED_ONLY:
409 return 1; /* need 4-byte alignment for all offsets and strides */
410 case PIPE_CAP_MAX_VERTEX_ATTRIB_STRIDE:
411 return 2048;
412 case PIPE_CAP_MAX_VIEWPORTS:
413 return 1;
414 case PIPE_CAP_ENDIANNESS:
415 return PIPE_ENDIAN_LITTLE;
416
417 case PIPE_CAP_VENDOR_ID:
418 return 0x15ad; /* VMware Inc. */
419 case PIPE_CAP_DEVICE_ID:
420 return 0x0405; /* assume SVGA II */
421 case PIPE_CAP_ACCELERATED:
422 return 0; /* XXX: */
423 case PIPE_CAP_VIDEO_MEMORY:
424 /* XXX: Query the host ? */
425 return 1;
426 case PIPE_CAP_COPY_BETWEEN_COMPRESSED_AND_PLAIN_FORMATS:
427 return sws->have_vgpu10;
428 case PIPE_CAP_CLEAR_TEXTURE:
429 return sws->have_vgpu10;
430 case PIPE_CAP_UMA:
431 case PIPE_CAP_RESOURCE_FROM_USER_MEMORY:
432 case PIPE_CAP_DEVICE_RESET_STATUS_QUERY:
433 case PIPE_CAP_MAX_SHADER_PATCH_VARYINGS:
434 case PIPE_CAP_TEXTURE_FLOAT_LINEAR:
435 case PIPE_CAP_TEXTURE_HALF_FLOAT_LINEAR:
436 case PIPE_CAP_DEPTH_BOUNDS_TEST:
437 case PIPE_CAP_TGSI_TXQS:
438 case PIPE_CAP_SHAREABLE_SHADERS:
439 case PIPE_CAP_DRAW_PARAMETERS:
440 case PIPE_CAP_TGSI_FS_POSITION_IS_SYSVAL:
441 case PIPE_CAP_TGSI_FS_FACE_IS_INTEGER_SYSVAL:
442 case PIPE_CAP_BUFFER_SAMPLER_VIEW_RGBA_ONLY:
443 case PIPE_CAP_QUERY_BUFFER_OBJECT:
444 case PIPE_CAP_FRAMEBUFFER_NO_ATTACHMENT:
445 case PIPE_CAP_CULL_DISTANCE:
446 case PIPE_CAP_PRIMITIVE_RESTART_FOR_PATCHES:
447 case PIPE_CAP_TGSI_VOTE:
448 case PIPE_CAP_MAX_WINDOW_RECTANGLES:
449 case PIPE_CAP_POLYGON_OFFSET_UNITS_UNSCALED:
450 case PIPE_CAP_VIEWPORT_SUBPIXEL_BITS:
451 case PIPE_CAP_TGSI_ARRAY_COMPONENTS:
452 case PIPE_CAP_TGSI_CAN_READ_OUTPUTS:
453 case PIPE_CAP_GLSL_OPTIMIZE_CONSERVATIVELY:
454 case PIPE_CAP_FBFETCH:
455 case PIPE_CAP_TGSI_MUL_ZERO_WINS:
456 case PIPE_CAP_DOUBLES:
457 case PIPE_CAP_INT64:
458 case PIPE_CAP_INT64_DIVMOD:
459 case PIPE_CAP_TGSI_TEX_TXF_LZ:
460 case PIPE_CAP_TGSI_CLOCK:
461 case PIPE_CAP_POLYGON_MODE_FILL_RECTANGLE:
462 case PIPE_CAP_SPARSE_BUFFER_PAGE_SIZE:
463 case PIPE_CAP_TGSI_BALLOT:
464 case PIPE_CAP_TGSI_TES_LAYER_VIEWPORT:
465 case PIPE_CAP_CAN_BIND_CONST_BUFFER_AS_VERTEX:
466 case PIPE_CAP_ALLOW_MAPPED_BUFFERS_DURING_EXECUTION:
467 case PIPE_CAP_POST_DEPTH_COVERAGE:
468 case PIPE_CAP_BINDLESS_TEXTURE:
469 case PIPE_CAP_NIR_SAMPLERS_AS_DEREF:
470 case PIPE_CAP_QUERY_SO_OVERFLOW:
471 case PIPE_CAP_MEMOBJ:
472 case PIPE_CAP_LOAD_CONSTBUF:
473 case PIPE_CAP_TGSI_ANY_REG_AS_ADDRESS:
474 case PIPE_CAP_TILE_RASTER_ORDER:
475 case PIPE_CAP_MAX_COMBINED_SHADER_OUTPUT_RESOURCES:
476 case PIPE_CAP_FRAMEBUFFER_MSAA_CONSTRAINTS:
477 case PIPE_CAP_SIGNED_VERTEX_BUFFER_OFFSET:
478 case PIPE_CAP_CONTEXT_PRIORITY_MASK:
479 case PIPE_CAP_FENCE_SIGNAL:
480 case PIPE_CAP_CONSTBUF0_FLAGS:
481 case PIPE_CAP_PACKED_UNIFORMS:
482 case PIPE_CAP_PROGRAMMABLE_SAMPLE_LOCATIONS:
483 return 0;
484 case PIPE_CAP_TGSI_DIV:
485 return 1;
486 case PIPE_CAP_MAX_GS_INVOCATIONS:
487 return 32;
488 case PIPE_CAP_MAX_SHADER_BUFFER_SIZE:
489 return 1 << 27;
490 default:
491 return u_pipe_screen_get_param_defaults(screen, param);
492 }
493 }
494
495
496 static int
497 vgpu9_get_shader_param(struct pipe_screen *screen,
498 enum pipe_shader_type shader,
499 enum pipe_shader_cap param)
500 {
501 struct svga_screen *svgascreen = svga_screen(screen);
502 struct svga_winsys_screen *sws = svgascreen->sws;
503 unsigned val;
504
505 assert(!sws->have_vgpu10);
506
507 switch (shader)
508 {
509 case PIPE_SHADER_FRAGMENT:
510 switch (param)
511 {
512 case PIPE_SHADER_CAP_MAX_INSTRUCTIONS:
513 case PIPE_SHADER_CAP_MAX_ALU_INSTRUCTIONS:
514 return get_uint_cap(sws,
515 SVGA3D_DEVCAP_MAX_FRAGMENT_SHADER_INSTRUCTIONS,
516 512);
517 case PIPE_SHADER_CAP_MAX_TEX_INSTRUCTIONS:
518 case PIPE_SHADER_CAP_MAX_TEX_INDIRECTIONS:
519 return 512;
520 case PIPE_SHADER_CAP_MAX_CONTROL_FLOW_DEPTH:
521 return SVGA3D_MAX_NESTING_LEVEL;
522 case PIPE_SHADER_CAP_MAX_INPUTS:
523 return 10;
524 case PIPE_SHADER_CAP_MAX_OUTPUTS:
525 return svgascreen->max_color_buffers;
526 case PIPE_SHADER_CAP_MAX_CONST_BUFFER_SIZE:
527 return 224 * sizeof(float[4]);
528 case PIPE_SHADER_CAP_MAX_CONST_BUFFERS:
529 return 1;
530 case PIPE_SHADER_CAP_MAX_TEMPS:
531 val = get_uint_cap(sws, SVGA3D_DEVCAP_MAX_FRAGMENT_SHADER_TEMPS, 32);
532 return MIN2(val, SVGA3D_TEMPREG_MAX);
533 case PIPE_SHADER_CAP_INDIRECT_INPUT_ADDR:
534 /*
535 * Although PS 3.0 has some addressing abilities it can only represent
536 * loops that can be statically determined and unrolled. Given we can
537 * only handle a subset of the cases that the gallium frontend already
538 * does it is better to defer loop unrolling to the gallium frontend.
539 */
540 return 0;
541 case PIPE_SHADER_CAP_TGSI_CONT_SUPPORTED:
542 return 0;
543 case PIPE_SHADER_CAP_TGSI_SQRT_SUPPORTED:
544 return 0;
545 case PIPE_SHADER_CAP_INDIRECT_OUTPUT_ADDR:
546 case PIPE_SHADER_CAP_INDIRECT_TEMP_ADDR:
547 case PIPE_SHADER_CAP_INDIRECT_CONST_ADDR:
548 return 0;
549 case PIPE_SHADER_CAP_SUBROUTINES:
550 return 0;
551 case PIPE_SHADER_CAP_INT64_ATOMICS:
552 case PIPE_SHADER_CAP_INTEGERS:
553 return 0;
554 case PIPE_SHADER_CAP_FP16:
555 case PIPE_SHADER_CAP_FP16_DERIVATIVES:
556 case PIPE_SHADER_CAP_INT16:
557 return 0;
558 case PIPE_SHADER_CAP_MAX_TEXTURE_SAMPLERS:
559 case PIPE_SHADER_CAP_MAX_SAMPLER_VIEWS:
560 return 16;
561 case PIPE_SHADER_CAP_PREFERRED_IR:
562 return PIPE_SHADER_IR_TGSI;
563 case PIPE_SHADER_CAP_SUPPORTED_IRS:
564 return 0;
565 case PIPE_SHADER_CAP_TGSI_DROUND_SUPPORTED:
566 case PIPE_SHADER_CAP_TGSI_DFRACEXP_DLDEXP_SUPPORTED:
567 case PIPE_SHADER_CAP_TGSI_LDEXP_SUPPORTED:
568 case PIPE_SHADER_CAP_TGSI_FMA_SUPPORTED:
569 case PIPE_SHADER_CAP_TGSI_ANY_INOUT_DECL_RANGE:
570 case PIPE_SHADER_CAP_MAX_SHADER_BUFFERS:
571 case PIPE_SHADER_CAP_MAX_SHADER_IMAGES:
572 case PIPE_SHADER_CAP_LOWER_IF_THRESHOLD:
573 case PIPE_SHADER_CAP_TGSI_SKIP_MERGE_REGISTERS:
574 case PIPE_SHADER_CAP_MAX_HW_ATOMIC_COUNTERS:
575 case PIPE_SHADER_CAP_MAX_HW_ATOMIC_COUNTER_BUFFERS:
576 return 0;
577 case PIPE_SHADER_CAP_MAX_UNROLL_ITERATIONS_HINT:
578 return 32;
579 }
580 /* If we get here, we failed to handle a cap above */
581 debug_printf("Unexpected fragment shader query %u\n", param);
582 return 0;
583 case PIPE_SHADER_VERTEX:
584 switch (param)
585 {
586 case PIPE_SHADER_CAP_MAX_INSTRUCTIONS:
587 case PIPE_SHADER_CAP_MAX_ALU_INSTRUCTIONS:
588 return get_uint_cap(sws, SVGA3D_DEVCAP_MAX_VERTEX_SHADER_INSTRUCTIONS,
589 512);
590 case PIPE_SHADER_CAP_MAX_TEX_INSTRUCTIONS:
591 case PIPE_SHADER_CAP_MAX_TEX_INDIRECTIONS:
592 /* XXX: until we have vertex texture support */
593 return 0;
594 case PIPE_SHADER_CAP_MAX_CONTROL_FLOW_DEPTH:
595 return SVGA3D_MAX_NESTING_LEVEL;
596 case PIPE_SHADER_CAP_MAX_INPUTS:
597 return 16;
598 case PIPE_SHADER_CAP_MAX_OUTPUTS:
599 return 10;
600 case PIPE_SHADER_CAP_MAX_CONST_BUFFER_SIZE:
601 return 256 * sizeof(float[4]);
602 case PIPE_SHADER_CAP_MAX_CONST_BUFFERS:
603 return 1;
604 case PIPE_SHADER_CAP_MAX_TEMPS:
605 val = get_uint_cap(sws, SVGA3D_DEVCAP_MAX_VERTEX_SHADER_TEMPS, 32);
606 return MIN2(val, SVGA3D_TEMPREG_MAX);
607 case PIPE_SHADER_CAP_TGSI_CONT_SUPPORTED:
608 return 0;
609 case PIPE_SHADER_CAP_TGSI_SQRT_SUPPORTED:
610 return 0;
611 case PIPE_SHADER_CAP_INDIRECT_INPUT_ADDR:
612 case PIPE_SHADER_CAP_INDIRECT_OUTPUT_ADDR:
613 return 1;
614 case PIPE_SHADER_CAP_INDIRECT_TEMP_ADDR:
615 return 0;
616 case PIPE_SHADER_CAP_INDIRECT_CONST_ADDR:
617 return 1;
618 case PIPE_SHADER_CAP_SUBROUTINES:
619 return 0;
620 case PIPE_SHADER_CAP_INT64_ATOMICS:
621 case PIPE_SHADER_CAP_INTEGERS:
622 return 0;
623 case PIPE_SHADER_CAP_FP16:
624 case PIPE_SHADER_CAP_FP16_DERIVATIVES:
625 case PIPE_SHADER_CAP_INT16:
626 return 0;
627 case PIPE_SHADER_CAP_MAX_TEXTURE_SAMPLERS:
628 case PIPE_SHADER_CAP_MAX_SAMPLER_VIEWS:
629 return 0;
630 case PIPE_SHADER_CAP_PREFERRED_IR:
631 return PIPE_SHADER_IR_TGSI;
632 case PIPE_SHADER_CAP_SUPPORTED_IRS:
633 return 0;
634 case PIPE_SHADER_CAP_TGSI_DROUND_SUPPORTED:
635 case PIPE_SHADER_CAP_TGSI_DFRACEXP_DLDEXP_SUPPORTED:
636 case PIPE_SHADER_CAP_TGSI_LDEXP_SUPPORTED:
637 case PIPE_SHADER_CAP_TGSI_FMA_SUPPORTED:
638 case PIPE_SHADER_CAP_TGSI_ANY_INOUT_DECL_RANGE:
639 case PIPE_SHADER_CAP_MAX_SHADER_BUFFERS:
640 case PIPE_SHADER_CAP_MAX_SHADER_IMAGES:
641 case PIPE_SHADER_CAP_LOWER_IF_THRESHOLD:
642 case PIPE_SHADER_CAP_TGSI_SKIP_MERGE_REGISTERS:
643 case PIPE_SHADER_CAP_MAX_HW_ATOMIC_COUNTERS:
644 case PIPE_SHADER_CAP_MAX_HW_ATOMIC_COUNTER_BUFFERS:
645 return 0;
646 case PIPE_SHADER_CAP_MAX_UNROLL_ITERATIONS_HINT:
647 return 32;
648 }
649 /* If we get here, we failed to handle a cap above */
650 debug_printf("Unexpected vertex shader query %u\n", param);
651 return 0;
652 case PIPE_SHADER_GEOMETRY:
653 case PIPE_SHADER_COMPUTE:
654 case PIPE_SHADER_TESS_CTRL:
655 case PIPE_SHADER_TESS_EVAL:
656 /* no support for geometry, tess or compute shaders at this time */
657 return 0;
658 default:
659 debug_printf("Unexpected shader type (%u) query\n", shader);
660 return 0;
661 }
662 return 0;
663 }
664
665
666 static int
667 vgpu10_get_shader_param(struct pipe_screen *screen,
668 enum pipe_shader_type shader,
669 enum pipe_shader_cap param)
670 {
671 struct svga_screen *svgascreen = svga_screen(screen);
672 struct svga_winsys_screen *sws = svgascreen->sws;
673
674 assert(sws->have_vgpu10);
675 (void) sws; /* silence unused var warnings in non-debug builds */
676
677 /* Only VS, GS, FS supported */
678 if (shader != PIPE_SHADER_VERTEX &&
679 shader != PIPE_SHADER_GEOMETRY &&
680 shader != PIPE_SHADER_FRAGMENT) {
681 return 0;
682 }
683
684 /* NOTE: we do not query the device for any caps/limits at this time */
685
686 /* Generally the same limits for vertex, geometry and fragment shaders */
687 switch (param) {
688 case PIPE_SHADER_CAP_MAX_INSTRUCTIONS:
689 case PIPE_SHADER_CAP_MAX_ALU_INSTRUCTIONS:
690 case PIPE_SHADER_CAP_MAX_TEX_INSTRUCTIONS:
691 case PIPE_SHADER_CAP_MAX_TEX_INDIRECTIONS:
692 return 64 * 1024;
693 case PIPE_SHADER_CAP_MAX_CONTROL_FLOW_DEPTH:
694 return 64;
695 case PIPE_SHADER_CAP_MAX_INPUTS:
696 if (shader == PIPE_SHADER_FRAGMENT)
697 return VGPU10_MAX_FS_INPUTS;
698 else if (shader == PIPE_SHADER_GEOMETRY)
699 return VGPU10_MAX_GS_INPUTS;
700 else
701 return VGPU10_MAX_VS_INPUTS;
702 case PIPE_SHADER_CAP_MAX_OUTPUTS:
703 if (shader == PIPE_SHADER_FRAGMENT)
704 return VGPU10_MAX_FS_OUTPUTS;
705 else if (shader == PIPE_SHADER_GEOMETRY)
706 return VGPU10_MAX_GS_OUTPUTS;
707 else
708 return VGPU10_MAX_VS_OUTPUTS;
709 case PIPE_SHADER_CAP_MAX_CONST_BUFFER_SIZE:
710 return VGPU10_MAX_CONSTANT_BUFFER_ELEMENT_COUNT * sizeof(float[4]);
711 case PIPE_SHADER_CAP_MAX_CONST_BUFFERS:
712 return svgascreen->max_const_buffers;
713 case PIPE_SHADER_CAP_MAX_TEMPS:
714 return VGPU10_MAX_TEMPS;
715 case PIPE_SHADER_CAP_INDIRECT_INPUT_ADDR:
716 case PIPE_SHADER_CAP_INDIRECT_OUTPUT_ADDR:
717 case PIPE_SHADER_CAP_INDIRECT_TEMP_ADDR:
718 case PIPE_SHADER_CAP_INDIRECT_CONST_ADDR:
719 return TRUE; /* XXX verify */
720 case PIPE_SHADER_CAP_TGSI_CONT_SUPPORTED:
721 case PIPE_SHADER_CAP_TGSI_SQRT_SUPPORTED:
722 case PIPE_SHADER_CAP_SUBROUTINES:
723 case PIPE_SHADER_CAP_INTEGERS:
724 return TRUE;
725 case PIPE_SHADER_CAP_FP16:
726 case PIPE_SHADER_CAP_FP16_DERIVATIVES:
727 case PIPE_SHADER_CAP_INT16:
728 return FALSE;
729 case PIPE_SHADER_CAP_MAX_TEXTURE_SAMPLERS:
730 case PIPE_SHADER_CAP_MAX_SAMPLER_VIEWS:
731 return SVGA3D_DX_MAX_SAMPLERS;
732 case PIPE_SHADER_CAP_PREFERRED_IR:
733 return PIPE_SHADER_IR_TGSI;
734 case PIPE_SHADER_CAP_SUPPORTED_IRS:
735 return 0;
736 case PIPE_SHADER_CAP_TGSI_DROUND_SUPPORTED:
737 case PIPE_SHADER_CAP_TGSI_DFRACEXP_DLDEXP_SUPPORTED:
738 case PIPE_SHADER_CAP_TGSI_LDEXP_SUPPORTED:
739 case PIPE_SHADER_CAP_TGSI_FMA_SUPPORTED:
740 case PIPE_SHADER_CAP_TGSI_ANY_INOUT_DECL_RANGE:
741 case PIPE_SHADER_CAP_MAX_SHADER_BUFFERS:
742 case PIPE_SHADER_CAP_MAX_SHADER_IMAGES:
743 case PIPE_SHADER_CAP_LOWER_IF_THRESHOLD:
744 case PIPE_SHADER_CAP_TGSI_SKIP_MERGE_REGISTERS:
745 case PIPE_SHADER_CAP_INT64_ATOMICS:
746 case PIPE_SHADER_CAP_MAX_HW_ATOMIC_COUNTERS:
747 case PIPE_SHADER_CAP_MAX_HW_ATOMIC_COUNTER_BUFFERS:
748 return 0;
749 case PIPE_SHADER_CAP_MAX_UNROLL_ITERATIONS_HINT:
750 return 32;
751 default:
752 debug_printf("Unexpected vgpu10 shader query %u\n", param);
753 return 0;
754 }
755 return 0;
756 }
757
758
759 static int
760 svga_get_shader_param(struct pipe_screen *screen, enum pipe_shader_type shader,
761 enum pipe_shader_cap param)
762 {
763 struct svga_screen *svgascreen = svga_screen(screen);
764 struct svga_winsys_screen *sws = svgascreen->sws;
765 if (sws->have_vgpu10) {
766 return vgpu10_get_shader_param(screen, shader, param);
767 }
768 else {
769 return vgpu9_get_shader_param(screen, shader, param);
770 }
771 }
772
773
774 static void
775 svga_fence_reference(struct pipe_screen *screen,
776 struct pipe_fence_handle **ptr,
777 struct pipe_fence_handle *fence)
778 {
779 struct svga_winsys_screen *sws = svga_screen(screen)->sws;
780 sws->fence_reference(sws, ptr, fence);
781 }
782
783
784 static bool
785 svga_fence_finish(struct pipe_screen *screen,
786 struct pipe_context *ctx,
787 struct pipe_fence_handle *fence,
788 uint64_t timeout)
789 {
790 struct svga_winsys_screen *sws = svga_screen(screen)->sws;
791 bool retVal;
792
793 SVGA_STATS_TIME_PUSH(sws, SVGA_STATS_TIME_FENCEFINISH);
794
795 if (!timeout) {
796 retVal = sws->fence_signalled(sws, fence, 0) == 0;
797 }
798 else {
799 SVGA_DBG(DEBUG_DMA|DEBUG_PERF, "%s fence_ptr %p\n",
800 __FUNCTION__, fence);
801
802 retVal = sws->fence_finish(sws, fence, timeout, 0) == 0;
803 }
804
805 SVGA_STATS_TIME_POP(sws);
806
807 return retVal;
808 }
809
810
811 static int
812 svga_fence_get_fd(struct pipe_screen *screen,
813 struct pipe_fence_handle *fence)
814 {
815 struct svga_winsys_screen *sws = svga_screen(screen)->sws;
816
817 return sws->fence_get_fd(sws, fence, TRUE);
818 }
819
820
821 static int
822 svga_get_driver_query_info(struct pipe_screen *screen,
823 unsigned index,
824 struct pipe_driver_query_info *info)
825 {
826 #define QUERY(NAME, ENUM, UNITS) \
827 {NAME, ENUM, {0}, UNITS, PIPE_DRIVER_QUERY_RESULT_TYPE_AVERAGE, 0, 0x0}
828
829 static const struct pipe_driver_query_info queries[] = {
830 /* per-frame counters */
831 QUERY("num-draw-calls", SVGA_QUERY_NUM_DRAW_CALLS,
832 PIPE_DRIVER_QUERY_TYPE_UINT64),
833 QUERY("num-fallbacks", SVGA_QUERY_NUM_FALLBACKS,
834 PIPE_DRIVER_QUERY_TYPE_UINT64),
835 QUERY("num-flushes", SVGA_QUERY_NUM_FLUSHES,
836 PIPE_DRIVER_QUERY_TYPE_UINT64),
837 QUERY("num-validations", SVGA_QUERY_NUM_VALIDATIONS,
838 PIPE_DRIVER_QUERY_TYPE_UINT64),
839 QUERY("map-buffer-time", SVGA_QUERY_MAP_BUFFER_TIME,
840 PIPE_DRIVER_QUERY_TYPE_MICROSECONDS),
841 QUERY("num-buffers-mapped", SVGA_QUERY_NUM_BUFFERS_MAPPED,
842 PIPE_DRIVER_QUERY_TYPE_UINT64),
843 QUERY("num-textures-mapped", SVGA_QUERY_NUM_TEXTURES_MAPPED,
844 PIPE_DRIVER_QUERY_TYPE_UINT64),
845 QUERY("num-bytes-uploaded", SVGA_QUERY_NUM_BYTES_UPLOADED,
846 PIPE_DRIVER_QUERY_TYPE_BYTES),
847 QUERY("command-buffer-size", SVGA_QUERY_COMMAND_BUFFER_SIZE,
848 PIPE_DRIVER_QUERY_TYPE_BYTES),
849 QUERY("flush-time", SVGA_QUERY_FLUSH_TIME,
850 PIPE_DRIVER_QUERY_TYPE_MICROSECONDS),
851 QUERY("surface-write-flushes", SVGA_QUERY_SURFACE_WRITE_FLUSHES,
852 PIPE_DRIVER_QUERY_TYPE_UINT64),
853 QUERY("num-readbacks", SVGA_QUERY_NUM_READBACKS,
854 PIPE_DRIVER_QUERY_TYPE_UINT64),
855 QUERY("num-resource-updates", SVGA_QUERY_NUM_RESOURCE_UPDATES,
856 PIPE_DRIVER_QUERY_TYPE_UINT64),
857 QUERY("num-buffer-uploads", SVGA_QUERY_NUM_BUFFER_UPLOADS,
858 PIPE_DRIVER_QUERY_TYPE_UINT64),
859 QUERY("num-const-buf-updates", SVGA_QUERY_NUM_CONST_BUF_UPDATES,
860 PIPE_DRIVER_QUERY_TYPE_UINT64),
861 QUERY("num-const-updates", SVGA_QUERY_NUM_CONST_UPDATES,
862 PIPE_DRIVER_QUERY_TYPE_UINT64),
863
864 /* running total counters */
865 QUERY("memory-used", SVGA_QUERY_MEMORY_USED,
866 PIPE_DRIVER_QUERY_TYPE_BYTES),
867 QUERY("num-shaders", SVGA_QUERY_NUM_SHADERS,
868 PIPE_DRIVER_QUERY_TYPE_UINT64),
869 QUERY("num-resources", SVGA_QUERY_NUM_RESOURCES,
870 PIPE_DRIVER_QUERY_TYPE_UINT64),
871 QUERY("num-state-objects", SVGA_QUERY_NUM_STATE_OBJECTS,
872 PIPE_DRIVER_QUERY_TYPE_UINT64),
873 QUERY("num-surface-views", SVGA_QUERY_NUM_SURFACE_VIEWS,
874 PIPE_DRIVER_QUERY_TYPE_UINT64),
875 QUERY("num-generate-mipmap", SVGA_QUERY_NUM_GENERATE_MIPMAP,
876 PIPE_DRIVER_QUERY_TYPE_UINT64),
877 QUERY("num-failed-allocations", SVGA_QUERY_NUM_FAILED_ALLOCATIONS,
878 PIPE_DRIVER_QUERY_TYPE_UINT64),
879 QUERY("num-commands-per-draw", SVGA_QUERY_NUM_COMMANDS_PER_DRAW,
880 PIPE_DRIVER_QUERY_TYPE_FLOAT),
881 };
882 #undef QUERY
883
884 if (!info)
885 return ARRAY_SIZE(queries);
886
887 if (index >= ARRAY_SIZE(queries))
888 return 0;
889
890 *info = queries[index];
891 return 1;
892 }
893
894
895 static void
896 init_logging(struct pipe_screen *screen)
897 {
898 struct svga_screen *svgascreen = svga_screen(screen);
899 static const char *log_prefix = "Mesa: ";
900 char host_log[1000];
901
902 /* Log Version to Host */
903 snprintf(host_log, sizeof(host_log) - strlen(log_prefix),
904 "%s%s\n", log_prefix, svga_get_name(screen));
905 svgascreen->sws->host_log(svgascreen->sws, host_log);
906
907 snprintf(host_log, sizeof(host_log) - strlen(log_prefix),
908 "%s" PACKAGE_VERSION MESA_GIT_SHA1, log_prefix);
909 svgascreen->sws->host_log(svgascreen->sws, host_log);
910
911 /* If the SVGA_EXTRA_LOGGING env var is set, log the process's command
912 * line (program name and arguments).
913 */
914 if (debug_get_bool_option("SVGA_EXTRA_LOGGING", FALSE)) {
915 char cmdline[1000];
916 if (os_get_command_line(cmdline, sizeof(cmdline))) {
917 snprintf(host_log, sizeof(host_log) - strlen(log_prefix),
918 "%s%s\n", log_prefix, cmdline);
919 svgascreen->sws->host_log(svgascreen->sws, host_log);
920 }
921 }
922 }
923
924
925 /**
926 * no-op logging function to use when SVGA_NO_LOGGING is set.
927 */
928 static void
929 nop_host_log(struct svga_winsys_screen *sws, const char *message)
930 {
931 /* nothing */
932 }
933
934
935 static void
936 svga_destroy_screen( struct pipe_screen *screen )
937 {
938 struct svga_screen *svgascreen = svga_screen(screen);
939
940 svga_screen_cache_cleanup(svgascreen);
941
942 mtx_destroy(&svgascreen->swc_mutex);
943 mtx_destroy(&svgascreen->tex_mutex);
944
945 svgascreen->sws->destroy(svgascreen->sws);
946
947 FREE(svgascreen);
948 }
949
950
951 /**
952 * Create a new svga_screen object
953 */
954 struct pipe_screen *
955 svga_screen_create(struct svga_winsys_screen *sws)
956 {
957 struct svga_screen *svgascreen;
958 struct pipe_screen *screen;
959
960 #ifdef DEBUG
961 SVGA_DEBUG = debug_get_flags_option("SVGA_DEBUG", svga_debug_flags, 0 );
962 #endif
963
964 svgascreen = CALLOC_STRUCT(svga_screen);
965 if (!svgascreen)
966 goto error1;
967
968 svgascreen->debug.force_level_surface_view =
969 debug_get_bool_option("SVGA_FORCE_LEVEL_SURFACE_VIEW", FALSE);
970 svgascreen->debug.force_surface_view =
971 debug_get_bool_option("SVGA_FORCE_SURFACE_VIEW", FALSE);
972 svgascreen->debug.force_sampler_view =
973 debug_get_bool_option("SVGA_FORCE_SAMPLER_VIEW", FALSE);
974 svgascreen->debug.no_surface_view =
975 debug_get_bool_option("SVGA_NO_SURFACE_VIEW", FALSE);
976 svgascreen->debug.no_sampler_view =
977 debug_get_bool_option("SVGA_NO_SAMPLER_VIEW", FALSE);
978 svgascreen->debug.no_cache_index_buffers =
979 debug_get_bool_option("SVGA_NO_CACHE_INDEX_BUFFERS", FALSE);
980
981 screen = &svgascreen->screen;
982
983 screen->destroy = svga_destroy_screen;
984 screen->get_name = svga_get_name;
985 screen->get_vendor = svga_get_vendor;
986 screen->get_device_vendor = svga_get_vendor; // TODO actual device vendor
987 screen->get_param = svga_get_param;
988 screen->get_shader_param = svga_get_shader_param;
989 screen->get_paramf = svga_get_paramf;
990 screen->get_timestamp = NULL;
991 screen->is_format_supported = svga_is_format_supported;
992 screen->context_create = svga_context_create;
993 screen->fence_reference = svga_fence_reference;
994 screen->fence_finish = svga_fence_finish;
995 screen->fence_get_fd = svga_fence_get_fd;
996
997 screen->get_driver_query_info = svga_get_driver_query_info;
998 svgascreen->sws = sws;
999
1000 svga_init_screen_resource_functions(svgascreen);
1001
1002 if (sws->get_hw_version) {
1003 svgascreen->hw_version = sws->get_hw_version(sws);
1004 } else {
1005 svgascreen->hw_version = SVGA3D_HWVERSION_WS65_B1;
1006 }
1007
1008 if (svgascreen->hw_version < SVGA3D_HWVERSION_WS8_B1) {
1009 /* too old for 3D acceleration */
1010 debug_printf("Hardware version 0x%x is too old for accerated 3D\n",
1011 svgascreen->hw_version);
1012 goto error2;
1013 }
1014
1015 debug_printf("%s enabled = %u\n",
1016 sws->have_sm4_1 ? "SM4_1" : "VGPU10",
1017 sws->have_sm4_1 ? 1 : sws->have_vgpu10);
1018
1019 debug_printf("Mesa: %s %s (%s)\n", svga_get_name(screen),
1020 PACKAGE_VERSION, MESA_GIT_SHA1);
1021
1022 /*
1023 * The D16, D24X8, and D24S8 formats always do an implicit shadow compare
1024 * when sampled from, where as the DF16, DF24, and D24S8_INT do not. So
1025 * we prefer the later when available.
1026 *
1027 * This mimics hardware vendors extensions for D3D depth sampling. See also
1028 * http://aras-p.info/texts/D3D9GPUHacks.html
1029 */
1030
1031 {
1032 boolean has_df16, has_df24, has_d24s8_int;
1033 SVGA3dSurfaceFormatCaps caps;
1034 SVGA3dSurfaceFormatCaps mask;
1035 mask.value = 0;
1036 mask.zStencil = 1;
1037 mask.texture = 1;
1038
1039 svgascreen->depth.z16 = SVGA3D_Z_D16;
1040 svgascreen->depth.x8z24 = SVGA3D_Z_D24X8;
1041 svgascreen->depth.s8z24 = SVGA3D_Z_D24S8;
1042
1043 svga_get_format_cap(svgascreen, SVGA3D_Z_DF16, &caps);
1044 has_df16 = (caps.value & mask.value) == mask.value;
1045
1046 svga_get_format_cap(svgascreen, SVGA3D_Z_DF24, &caps);
1047 has_df24 = (caps.value & mask.value) == mask.value;
1048
1049 svga_get_format_cap(svgascreen, SVGA3D_Z_D24S8_INT, &caps);
1050 has_d24s8_int = (caps.value & mask.value) == mask.value;
1051
1052 /* XXX: We might want some other logic here.
1053 * Like if we only have d24s8_int we should
1054 * emulate the other formats with that.
1055 */
1056 if (has_df16) {
1057 svgascreen->depth.z16 = SVGA3D_Z_DF16;
1058 }
1059 if (has_df24) {
1060 svgascreen->depth.x8z24 = SVGA3D_Z_DF24;
1061 }
1062 if (has_d24s8_int) {
1063 svgascreen->depth.s8z24 = SVGA3D_Z_D24S8_INT;
1064 }
1065 }
1066
1067 /* Query device caps
1068 */
1069 if (sws->have_vgpu10) {
1070 svgascreen->haveProvokingVertex
1071 = get_bool_cap(sws, SVGA3D_DEVCAP_DX_PROVOKING_VERTEX, FALSE);
1072 svgascreen->haveLineSmooth = TRUE;
1073 svgascreen->maxPointSize = 80.0F;
1074 svgascreen->max_color_buffers = SVGA3D_DX_MAX_RENDER_TARGETS;
1075
1076 /* Multisample samples per pixel */
1077 if (sws->have_sm4_1 && debug_get_bool_option("SVGA_MSAA", TRUE)) {
1078 if (get_bool_cap(sws, SVGA3D_DEVCAP_MULTISAMPLE_2X, FALSE))
1079 svgascreen->ms_samples |= 1 << 1;
1080 if (get_bool_cap(sws, SVGA3D_DEVCAP_MULTISAMPLE_4X, FALSE))
1081 svgascreen->ms_samples |= 1 << 3;
1082 }
1083
1084 /* Maximum number of constant buffers */
1085 svgascreen->max_const_buffers =
1086 get_uint_cap(sws, SVGA3D_DEVCAP_DX_MAX_CONSTANT_BUFFERS, 1);
1087 svgascreen->max_const_buffers = MIN2(svgascreen->max_const_buffers,
1088 SVGA_MAX_CONST_BUFS);
1089
1090 screen->is_format_supported = svga_is_dx_format_supported;
1091 }
1092 else {
1093 /* VGPU9 */
1094 unsigned vs_ver = get_uint_cap(sws, SVGA3D_DEVCAP_VERTEX_SHADER_VERSION,
1095 SVGA3DVSVERSION_NONE);
1096 unsigned fs_ver = get_uint_cap(sws, SVGA3D_DEVCAP_FRAGMENT_SHADER_VERSION,
1097 SVGA3DPSVERSION_NONE);
1098
1099 /* we require Shader model 3.0 or later */
1100 if (fs_ver < SVGA3DPSVERSION_30 || vs_ver < SVGA3DVSVERSION_30) {
1101 goto error2;
1102 }
1103
1104 svgascreen->haveProvokingVertex = FALSE;
1105
1106 svgascreen->haveLineSmooth =
1107 get_bool_cap(sws, SVGA3D_DEVCAP_LINE_AA, FALSE);
1108
1109 svgascreen->maxPointSize =
1110 get_float_cap(sws, SVGA3D_DEVCAP_MAX_POINT_SIZE, 1.0f);
1111 /* Keep this to a reasonable size to avoid failures in conform/pntaa.c */
1112 svgascreen->maxPointSize = MIN2(svgascreen->maxPointSize, 80.0f);
1113
1114 /* The SVGA3D device always supports 4 targets at this time, regardless
1115 * of what querying SVGA3D_DEVCAP_MAX_RENDER_TARGETS might return.
1116 */
1117 svgascreen->max_color_buffers = 4;
1118
1119 /* Only support one constant buffer
1120 */
1121 svgascreen->max_const_buffers = 1;
1122
1123 /* No multisampling */
1124 svgascreen->ms_samples = 0;
1125 }
1126
1127 /* common VGPU9 / VGPU10 caps */
1128 svgascreen->haveLineStipple =
1129 get_bool_cap(sws, SVGA3D_DEVCAP_LINE_STIPPLE, FALSE);
1130
1131 svgascreen->maxLineWidth =
1132 MAX2(1.0, get_float_cap(sws, SVGA3D_DEVCAP_MAX_LINE_WIDTH, 1.0f));
1133
1134 svgascreen->maxLineWidthAA =
1135 MAX2(1.0, get_float_cap(sws, SVGA3D_DEVCAP_MAX_AA_LINE_WIDTH, 1.0f));
1136
1137 if (0) {
1138 debug_printf("svga: haveProvokingVertex %u\n",
1139 svgascreen->haveProvokingVertex);
1140 debug_printf("svga: haveLineStip %u "
1141 "haveLineSmooth %u maxLineWidth %.2f maxLineWidthAA %.2f\n",
1142 svgascreen->haveLineStipple, svgascreen->haveLineSmooth,
1143 svgascreen->maxLineWidth, svgascreen->maxLineWidthAA);
1144 debug_printf("svga: maxPointSize %g\n", svgascreen->maxPointSize);
1145 debug_printf("svga: msaa samples mask: 0x%x\n", svgascreen->ms_samples);
1146 }
1147
1148 (void) mtx_init(&svgascreen->tex_mutex, mtx_plain);
1149 (void) mtx_init(&svgascreen->swc_mutex, mtx_recursive);
1150
1151 svga_screen_cache_init(svgascreen);
1152
1153 if (debug_get_bool_option("SVGA_NO_LOGGING", FALSE) == TRUE) {
1154 svgascreen->sws->host_log = nop_host_log;
1155 } else {
1156 init_logging(screen);
1157 }
1158
1159 return screen;
1160 error2:
1161 FREE(svgascreen);
1162 error1:
1163 return NULL;
1164 }
1165
1166
1167 struct svga_winsys_screen *
1168 svga_winsys_screen(struct pipe_screen *screen)
1169 {
1170 return svga_screen(screen)->sws;
1171 }
1172
1173
1174 #ifdef DEBUG
1175 struct svga_screen *
1176 svga_screen(struct pipe_screen *screen)
1177 {
1178 assert(screen);
1179 assert(screen->destroy == svga_destroy_screen);
1180 return (struct svga_screen *)screen;
1181 }
1182 #endif