zink: add note about enabling PIPE_CAP_CLIP_HALFZ
[mesa.git] / src / gallium / drivers / zink / zink_screen.c
1 /*
2 * Copyright 2018 Collabora Ltd.
3 *
4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * on the rights to use, copy, modify, merge, publish, distribute, sub
8 * license, and/or sell copies of the Software, and to permit persons to whom
9 * the Software is furnished to do so, subject to the following conditions:
10 *
11 * The above copyright notice and this permission notice (including the next
12 * paragraph) shall be included in all copies or substantial portions of the
13 * Software.
14 *
15 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17 * FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. IN NO EVENT SHALL
18 * THE AUTHOR(S) AND/OR THEIR SUPPLIERS BE LIABLE FOR ANY CLAIM,
19 * DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR
20 * OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE
21 * USE OR OTHER DEALINGS IN THE SOFTWARE.
22 */
23
24 #include "zink_screen.h"
25
26 #include "zink_compiler.h"
27 #include "zink_context.h"
28 #include "zink_fence.h"
29 #include "zink_public.h"
30 #include "zink_resource.h"
31
32 #include "os/os_process.h"
33 #include "util/u_debug.h"
34 #include "util/u_format.h"
35 #include "util/u_math.h"
36 #include "util/u_memory.h"
37 #include "util/u_screen.h"
38 #include "util/u_string.h"
39
40 #include "state_tracker/sw_winsys.h"
41
42 static const struct debug_named_value
43 debug_options[] = {
44 { "nir", ZINK_DEBUG_NIR, "Dump NIR during program compile" },
45 { "spirv", ZINK_DEBUG_SPIRV, "Dump SPIR-V during program compile" },
46 { "tgsi", ZINK_DEBUG_TGSI, "Dump TGSI during program compile" },
47 DEBUG_NAMED_VALUE_END
48 };
49
50 DEBUG_GET_ONCE_FLAGS_OPTION(zink_debug, "ZINK_DEBUG", debug_options, 0)
51
52 uint32_t
53 zink_debug;
54
/*
 * pipe_screen::get_vendor hook.
 *
 * Returns a fixed, statically allocated driver-vendor string; the screen
 * argument is not consulted.
 */
static const char *
zink_get_vendor(struct pipe_screen *pscreen)
{
   static const char vendor[] = "Collabora Ltd";

   return vendor;
}
60
61 static const char *
62 zink_get_device_vendor(struct pipe_screen *pscreen)
63 {
64 struct zink_screen *screen = zink_screen(pscreen);
65 static char buf[1000];
66 snprintf(buf, sizeof(buf), "Unknown (vendor-id: 0x%04x)", screen->props.vendorID);
67 return buf;
68 }
69
70 static const char *
71 zink_get_name(struct pipe_screen *pscreen)
72 {
73 struct zink_screen *screen = zink_screen(pscreen);
74 static char buf[1000];
75 snprintf(buf, sizeof(buf), "zink (%s)", screen->props.deviceName);
76 return buf;
77 }
78
79 static int
80 get_video_mem(struct zink_screen *screen)
81 {
82 VkDeviceSize size = 0;
83 for (uint32_t i = 0; i < screen->mem_props.memoryHeapCount; ++i)
84 size += screen->mem_props.memoryHeaps[i].size;
85 return (int)(size >> 20);
86 }
87
88 static int
89 zink_get_param(struct pipe_screen *pscreen, enum pipe_cap param)
90 {
91 struct zink_screen *screen = zink_screen(pscreen);
92
93 switch (param) {
94 case PIPE_CAP_NPOT_TEXTURES:
95 return 1;
96
97 case PIPE_CAP_MAX_DUAL_SOURCE_RENDER_TARGETS:
98 return screen->props.limits.maxFragmentDualSrcAttachments;
99
100 case PIPE_CAP_POINT_SPRITE:
101 return 1;
102
103 case PIPE_CAP_MAX_RENDER_TARGETS:
104 return screen->props.limits.maxColorAttachments;
105
106 case PIPE_CAP_OCCLUSION_QUERY:
107 case PIPE_CAP_QUERY_TIME_ELAPSED:
108 return 1;
109
110 case PIPE_CAP_TEXTURE_SWIZZLE:
111 return 1;
112
113 case PIPE_CAP_MAX_TEXTURE_2D_SIZE:
114 return screen->props.limits.maxImageDimension2D;
115 case PIPE_CAP_MAX_TEXTURE_3D_LEVELS:
116 return 1 + util_logbase2(screen->props.limits.maxImageDimension3D);
117 case PIPE_CAP_MAX_TEXTURE_CUBE_LEVELS:
118 return 1 + util_logbase2(screen->props.limits.maxImageDimensionCube);
119
120 case PIPE_CAP_BLEND_EQUATION_SEPARATE:
121 return 1;
122
123 case PIPE_CAP_FRAGMENT_SHADER_TEXTURE_LOD:
124 case PIPE_CAP_FRAGMENT_SHADER_DERIVATIVES:
125 case PIPE_CAP_VERTEX_SHADER_SATURATE:
126 return 1;
127
128 case PIPE_CAP_INDEP_BLEND_ENABLE:
129 case PIPE_CAP_INDEP_BLEND_FUNC:
130 return 1;
131
132 case PIPE_CAP_MAX_TEXTURE_ARRAY_LAYERS:
133 return screen->props.limits.maxImageArrayLayers;
134
135 #if 0 /* TODO: Enable me */
136 case PIPE_CAP_DEPTH_CLIP_DISABLE:
137 return 0;
138 #endif
139
140 #if 0 /* TODO: Enable me */
141 case PIPE_CAP_MIXED_COLORBUFFER_FORMATS:
142 return 1;
143 #endif
144
145 case PIPE_CAP_SEAMLESS_CUBE_MAP:
146 return 1;
147
148 case PIPE_CAP_MIN_TEXEL_OFFSET:
149 return screen->props.limits.minTexelOffset;
150 case PIPE_CAP_MAX_TEXEL_OFFSET:
151 return screen->props.limits.maxTexelOffset;
152
153 case PIPE_CAP_VERTEX_COLOR_UNCLAMPED:
154 return 1;
155
156 case PIPE_CAP_GLSL_FEATURE_LEVEL:
157 case PIPE_CAP_GLSL_FEATURE_LEVEL_COMPATIBILITY:
158 return 120;
159
160 #if 0 /* TODO: Enable me */
161 case PIPE_CAP_COMPUTE:
162 return 1;
163 #endif
164
165 case PIPE_CAP_CONSTANT_BUFFER_OFFSET_ALIGNMENT:
166 return screen->props.limits.minUniformBufferOffsetAlignment;
167
168 case PIPE_CAP_QUERY_TIMESTAMP:
169 return 1;
170
171 case PIPE_CAP_MIN_MAP_BUFFER_ALIGNMENT:
172 return screen->props.limits.minMemoryMapAlignment;
173
174 case PIPE_CAP_CUBE_MAP_ARRAY:
175 return screen->feats.imageCubeArray;
176
177 case PIPE_CAP_PREFER_BLIT_BASED_TEXTURE_TRANSFER:
178 return 0; /* unsure */
179
180 case PIPE_CAP_MAX_TEXTURE_BUFFER_SIZE:
181 return screen->props.limits.maxTexelBufferElements;
182
183 case PIPE_CAP_ENDIANNESS:
184 return PIPE_ENDIAN_NATIVE; /* unsure */
185
186 case PIPE_CAP_MAX_VIEWPORTS:
187 return screen->props.limits.maxViewports;
188
189 case PIPE_CAP_MIXED_FRAMEBUFFER_SIZES:
190 return 1;
191
192 case PIPE_CAP_MAX_GEOMETRY_OUTPUT_VERTICES:
193 return screen->props.limits.maxGeometryOutputVertices;
194 case PIPE_CAP_MAX_GEOMETRY_TOTAL_OUTPUT_COMPONENTS:
195 return screen->props.limits.maxGeometryOutputComponents;
196
197 #if 0 /* TODO: Enable me. Enables ARB_texture_gather */
198 case PIPE_CAP_MAX_TEXTURE_GATHER_COMPONENTS:
199 return 4;
200 #endif
201
202 case PIPE_CAP_MIN_TEXTURE_GATHER_OFFSET:
203 return screen->props.limits.minTexelGatherOffset;
204 case PIPE_CAP_MAX_TEXTURE_GATHER_OFFSET:
205 return screen->props.limits.maxTexelGatherOffset;
206
207 case PIPE_CAP_VENDOR_ID:
208 return screen->props.vendorID;
209 case PIPE_CAP_DEVICE_ID:
210 return screen->props.deviceID;
211
212 case PIPE_CAP_ACCELERATED:
213 return 1;
214 case PIPE_CAP_VIDEO_MEMORY:
215 return get_video_mem(screen);
216 case PIPE_CAP_UMA:
217 return screen->props.deviceType == VK_PHYSICAL_DEVICE_TYPE_INTEGRATED_GPU;
218
219 case PIPE_CAP_MAX_VERTEX_ATTRIB_STRIDE:
220 return screen->props.limits.maxVertexInputBindingStride;
221
222 #if 0 /* TODO: Enable me */
223 case PIPE_CAP_SAMPLER_VIEW_TARGET:
224 return 1;
225 #endif
226
227 #if 0 /* TODO: Enable me */
228 case PIPE_CAP_CLIP_HALFZ:
229 return 1;
230 #endif
231
232 #if 0 /* TODO: Enable me */
233 case PIPE_CAP_TEXTURE_FLOAT_LINEAR:
234 case PIPE_CAP_TEXTURE_HALF_FLOAT_LINEAR:
235 return 1;
236 #endif
237
238 case PIPE_CAP_SHAREABLE_SHADERS:
239 return 1;
240
241 #if 0 /* TODO: Enable me. Enables GL_ARB_shader_storage_buffer_object */
242 case PIPE_CAP_SHADER_BUFFER_OFFSET_ALIGNMENT:
243 return screen->props.limits.minStorageBufferOffsetAlignment;
244 #endif
245
246 case PIPE_CAP_PCI_GROUP:
247 case PIPE_CAP_PCI_BUS:
248 case PIPE_CAP_PCI_DEVICE:
249 case PIPE_CAP_PCI_FUNCTION:
250 return 0; /* TODO: figure these out */
251
252 #if 0 /* TODO: Enable me */
253 case PIPE_CAP_CULL_DISTANCE:
254 return screen->feats.shaderCullDistance;
255 #endif
256
257 case PIPE_CAP_VIEWPORT_SUBPIXEL_BITS:
258 return screen->props.limits.viewportSubPixelBits;
259
260 case PIPE_CAP_GLSL_OPTIMIZE_CONSERVATIVELY:
261 return 0; /* not sure */
262
263 case PIPE_CAP_MAX_GS_INVOCATIONS:
264 return 0; /* not implemented */
265
266 case PIPE_CAP_MAX_COMBINED_SHADER_BUFFERS:
267 return screen->props.limits.maxDescriptorSetStorageBuffers;
268
269 case PIPE_CAP_MAX_SHADER_BUFFER_SIZE:
270 return screen->props.limits.maxStorageBufferRange; /* unsure */
271
272 case PIPE_CAP_TGSI_FS_COORD_ORIGIN_UPPER_LEFT:
273 case PIPE_CAP_TGSI_FS_COORD_PIXEL_CENTER_HALF_INTEGER:
274 return 1;
275
276 case PIPE_CAP_TGSI_FS_COORD_ORIGIN_LOWER_LEFT:
277 case PIPE_CAP_TGSI_FS_COORD_PIXEL_CENTER_INTEGER:
278 return 0;
279
280 case PIPE_CAP_BUFFER_MAP_PERSISTENT_COHERENT:
281 return 1;
282
283 case PIPE_CAP_NIR_COMPACT_ARRAYS:
284 return 1;
285
286 case PIPE_CAP_FLATSHADE:
287 case PIPE_CAP_ALPHA_TEST:
288 case PIPE_CAP_CLIP_PLANES:
289 return 0;
290
291 default:
292 return u_pipe_screen_get_param_defaults(pscreen, param);
293 }
294 }
295
296 static float
297 zink_get_paramf(struct pipe_screen *pscreen, enum pipe_capf param)
298 {
299 struct zink_screen *screen = zink_screen(pscreen);
300
301 switch (param) {
302 case PIPE_CAPF_MAX_LINE_WIDTH:
303 case PIPE_CAPF_MAX_LINE_WIDTH_AA:
304 return screen->props.limits.lineWidthRange[1];
305
306 case PIPE_CAPF_MAX_POINT_WIDTH:
307 case PIPE_CAPF_MAX_POINT_WIDTH_AA:
308 return screen->props.limits.pointSizeRange[1];
309
310 case PIPE_CAPF_MAX_TEXTURE_ANISOTROPY:
311 return screen->props.limits.maxSamplerAnisotropy;
312
313 case PIPE_CAPF_MAX_TEXTURE_LOD_BIAS:
314 return screen->props.limits.maxSamplerLodBias;
315
316 case PIPE_CAPF_MIN_CONSERVATIVE_RASTER_DILATE:
317 case PIPE_CAPF_MAX_CONSERVATIVE_RASTER_DILATE:
318 case PIPE_CAPF_CONSERVATIVE_RASTER_DILATE_GRANULARITY:
319 return 0.0f; /* not implemented */
320 }
321
322 /* should only get here on unhandled cases */
323 return 0.0;
324 }
325
326 static int
327 zink_get_shader_param(struct pipe_screen *pscreen,
328 enum pipe_shader_type shader,
329 enum pipe_shader_cap param)
330 {
331 struct zink_screen *screen = zink_screen(pscreen);
332
333 switch (param) {
334 case PIPE_SHADER_CAP_MAX_INSTRUCTIONS:
335 case PIPE_SHADER_CAP_MAX_ALU_INSTRUCTIONS:
336 case PIPE_SHADER_CAP_MAX_TEX_INSTRUCTIONS:
337 case PIPE_SHADER_CAP_MAX_TEX_INDIRECTIONS:
338 case PIPE_SHADER_CAP_MAX_CONTROL_FLOW_DEPTH:
339 if (shader == PIPE_SHADER_VERTEX ||
340 shader == PIPE_SHADER_FRAGMENT)
341 return INT_MAX;
342 return 0;
343
344 case PIPE_SHADER_CAP_MAX_INPUTS:
345 switch (shader) {
346 case PIPE_SHADER_VERTEX:
347 return MIN2(screen->props.limits.maxVertexInputAttributes,
348 PIPE_MAX_SHADER_INPUTS);
349 case PIPE_SHADER_FRAGMENT:
350 return MIN2(screen->props.limits.maxFragmentInputComponents / 4,
351 PIPE_MAX_SHADER_INPUTS);
352 default:
353 return 0; /* unsupported stage */
354 }
355
356 case PIPE_SHADER_CAP_MAX_OUTPUTS:
357 switch (shader) {
358 case PIPE_SHADER_VERTEX:
359 return MIN2(screen->props.limits.maxVertexOutputComponents / 4,
360 PIPE_MAX_SHADER_OUTPUTS);
361 case PIPE_SHADER_FRAGMENT:
362 return MIN2(screen->props.limits.maxColorAttachments,
363 PIPE_MAX_SHADER_OUTPUTS);
364 default:
365 return 0; /* unsupported stage */
366 }
367
368 case PIPE_SHADER_CAP_MAX_TEXTURE_SAMPLERS:
369 /* this might be a bit simplistic... */
370 return MIN2(screen->props.limits.maxPerStageDescriptorSamplers,
371 PIPE_MAX_SAMPLERS);
372
373 case PIPE_SHADER_CAP_MAX_CONST_BUFFER_SIZE:
374 return MIN2(screen->props.limits.maxUniformBufferRange, INT_MAX);
375
376 case PIPE_SHADER_CAP_MAX_CONST_BUFFERS:
377 return screen->props.limits.maxPerStageDescriptorUniformBuffers;
378
379 case PIPE_SHADER_CAP_MAX_TEMPS:
380 return INT_MAX;
381
382 case PIPE_SHADER_CAP_INDIRECT_INPUT_ADDR:
383 case PIPE_SHADER_CAP_INDIRECT_OUTPUT_ADDR:
384 case PIPE_SHADER_CAP_INDIRECT_TEMP_ADDR:
385 case PIPE_SHADER_CAP_INDIRECT_CONST_ADDR:
386 case PIPE_SHADER_CAP_SUBROUTINES:
387 case PIPE_SHADER_CAP_INTEGERS:
388 case PIPE_SHADER_CAP_INT64_ATOMICS:
389 case PIPE_SHADER_CAP_FP16:
390 return 0; /* not implemented */
391
392 case PIPE_SHADER_CAP_PREFERRED_IR:
393 return PIPE_SHADER_IR_NIR;
394
395 case PIPE_SHADER_CAP_TGSI_SQRT_SUPPORTED:
396 return 0; /* not implemented */
397
398 case PIPE_SHADER_CAP_MAX_SAMPLER_VIEWS:
399 return MIN2(screen->props.limits.maxPerStageDescriptorSampledImages,
400 PIPE_MAX_SHADER_SAMPLER_VIEWS);
401
402 case PIPE_SHADER_CAP_TGSI_DROUND_SUPPORTED:
403 case PIPE_SHADER_CAP_TGSI_DFRACEXP_DLDEXP_SUPPORTED:
404 case PIPE_SHADER_CAP_TGSI_FMA_SUPPORTED:
405 return 0; /* not implemented */
406
407 case PIPE_SHADER_CAP_TGSI_ANY_INOUT_DECL_RANGE:
408 return 0; /* no idea */
409
410 case PIPE_SHADER_CAP_MAX_UNROLL_ITERATIONS_HINT:
411 return 32; /* arbitrary */
412
413 case PIPE_SHADER_CAP_MAX_SHADER_BUFFERS:
414 /* TODO: this limitation is dumb, and will need some fixes in mesa */
415 return MIN2(screen->props.limits.maxPerStageDescriptorStorageBuffers, 8);
416
417 case PIPE_SHADER_CAP_SUPPORTED_IRS:
418 return (1 << PIPE_SHADER_IR_NIR) | (1 << PIPE_SHADER_IR_TGSI);
419
420 case PIPE_SHADER_CAP_MAX_SHADER_IMAGES:
421 return MIN2(screen->props.limits.maxPerStageDescriptorStorageImages,
422 PIPE_MAX_SHADER_IMAGES);
423
424 case PIPE_SHADER_CAP_LOWER_IF_THRESHOLD:
425 case PIPE_SHADER_CAP_TGSI_SKIP_MERGE_REGISTERS:
426 return 0; /* unsure */
427
428 case PIPE_SHADER_CAP_TGSI_LDEXP_SUPPORTED:
429 case PIPE_SHADER_CAP_MAX_HW_ATOMIC_COUNTERS:
430 case PIPE_SHADER_CAP_MAX_HW_ATOMIC_COUNTER_BUFFERS:
431 case PIPE_SHADER_CAP_TGSI_CONT_SUPPORTED:
432 return 0; /* not implemented */
433 }
434
435 /* should only get here on unhandled cases */
436 return 0;
437 }
438
439 static const VkFormat formats[PIPE_FORMAT_COUNT] = {
440 #define MAP_FORMAT_NORM(FMT) \
441 [PIPE_FORMAT_ ## FMT ## _UNORM] = VK_FORMAT_ ## FMT ## _UNORM, \
442 [PIPE_FORMAT_ ## FMT ## _SNORM] = VK_FORMAT_ ## FMT ## _SNORM,
443
444 #define MAP_FORMAT_SCALED(FMT) \
445 [PIPE_FORMAT_ ## FMT ## _USCALED] = VK_FORMAT_ ## FMT ## _USCALED, \
446 [PIPE_FORMAT_ ## FMT ## _SSCALED] = VK_FORMAT_ ## FMT ## _SSCALED,
447
448 #define MAP_FORMAT_INT(FMT) \
449 [PIPE_FORMAT_ ## FMT ## _UINT] = VK_FORMAT_ ## FMT ## _UINT, \
450 [PIPE_FORMAT_ ## FMT ## _SINT] = VK_FORMAT_ ## FMT ## _SINT,
451
452 #define MAP_FORMAT_SRGB(FMT) \
453 [PIPE_FORMAT_ ## FMT ## _SRGB] = VK_FORMAT_ ## FMT ## _SRGB,
454
455 #define MAP_FORMAT_FLOAT(FMT) \
456 [PIPE_FORMAT_ ## FMT ## _FLOAT] = VK_FORMAT_ ## FMT ## _SFLOAT,
457
458 // one component
459
460 // 8-bits
461 MAP_FORMAT_NORM(R8)
462 MAP_FORMAT_SCALED(R8)
463 MAP_FORMAT_INT(R8)
464 // 16-bits
465 MAP_FORMAT_NORM(R16)
466 MAP_FORMAT_SCALED(R16)
467 MAP_FORMAT_INT(R16)
468 MAP_FORMAT_FLOAT(R16)
469 // 32-bits
470 MAP_FORMAT_INT(R32)
471 MAP_FORMAT_FLOAT(R32)
472
473 // two components
474
475 // 8-bits
476 MAP_FORMAT_NORM(R8G8)
477 MAP_FORMAT_SCALED(R8G8)
478 MAP_FORMAT_INT(R8G8)
479 // 16-bits
480 MAP_FORMAT_NORM(R16G16)
481 MAP_FORMAT_SCALED(R16G16)
482 MAP_FORMAT_INT(R16G16)
483 MAP_FORMAT_FLOAT(R16G16)
484 // 32-bits
485 MAP_FORMAT_INT(R32G32)
486 MAP_FORMAT_FLOAT(R32G32)
487
488 // three components
489
490 // 8-bits
491 MAP_FORMAT_NORM(R8G8B8)
492 MAP_FORMAT_SCALED(R8G8B8)
493 MAP_FORMAT_INT(R8G8B8)
494 MAP_FORMAT_SRGB(R8G8B8)
495 // 16-bits
496 MAP_FORMAT_NORM(R16G16B16)
497 MAP_FORMAT_SCALED(R16G16B16)
498 MAP_FORMAT_INT(R16G16B16)
499 MAP_FORMAT_FLOAT(R16G16B16)
500 // 32-bits
501 MAP_FORMAT_INT(R32G32B32)
502 MAP_FORMAT_FLOAT(R32G32B32)
503
504 // four components
505
506 // 8-bits
507 MAP_FORMAT_NORM(R8G8B8A8)
508 MAP_FORMAT_SCALED(R8G8B8A8)
509 MAP_FORMAT_INT(R8G8B8A8)
510 MAP_FORMAT_SRGB(R8G8B8A8)
511 [PIPE_FORMAT_B8G8R8A8_UNORM] = VK_FORMAT_B8G8R8A8_UNORM,
512 MAP_FORMAT_SRGB(B8G8R8A8)
513 [PIPE_FORMAT_A8B8G8R8_SRGB] = VK_FORMAT_A8B8G8R8_SRGB_PACK32,
514 // 16-bits
515 MAP_FORMAT_NORM(R16G16B16A16)
516 MAP_FORMAT_SCALED(R16G16B16A16)
517 MAP_FORMAT_INT(R16G16B16A16)
518 MAP_FORMAT_FLOAT(R16G16B16A16)
519 // 32-bits
520 MAP_FORMAT_INT(R32G32B32A32)
521 MAP_FORMAT_FLOAT(R32G32B32A32)
522
523 // other color formats
524 [PIPE_FORMAT_B5G6R5_UNORM] = VK_FORMAT_R5G6B5_UNORM_PACK16,
525 [PIPE_FORMAT_B5G5R5A1_UNORM] = VK_FORMAT_B5G5R5A1_UNORM_PACK16,
526 [PIPE_FORMAT_R11G11B10_FLOAT] = VK_FORMAT_B10G11R11_UFLOAT_PACK32,
527 [PIPE_FORMAT_R9G9B9E5_FLOAT] = VK_FORMAT_E5B9G9R9_UFLOAT_PACK32,
528 [PIPE_FORMAT_R10G10B10A2_UNORM] = VK_FORMAT_A2B10G10R10_UNORM_PACK32,
529 [PIPE_FORMAT_B10G10R10A2_UNORM] = VK_FORMAT_A2R10G10B10_UNORM_PACK32,
530 [PIPE_FORMAT_R10G10B10A2_UINT] = VK_FORMAT_A2B10G10R10_UINT_PACK32,
531 [PIPE_FORMAT_B10G10R10A2_UINT] = VK_FORMAT_A2R10G10B10_UINT_PACK32,
532
533 // depth/stencil formats
534 [PIPE_FORMAT_Z32_FLOAT] = VK_FORMAT_D32_SFLOAT,
535 [PIPE_FORMAT_Z32_FLOAT_S8X24_UINT] = VK_FORMAT_D32_SFLOAT_S8_UINT,
536 [PIPE_FORMAT_Z16_UNORM] = VK_FORMAT_D16_UNORM,
537 [PIPE_FORMAT_X8Z24_UNORM] = VK_FORMAT_X8_D24_UNORM_PACK32,
538 [PIPE_FORMAT_Z24_UNORM_S8_UINT] = VK_FORMAT_D24_UNORM_S8_UINT,
539
540 // compressed formats
541 [PIPE_FORMAT_DXT1_RGB] = VK_FORMAT_BC1_RGB_UNORM_BLOCK,
542 [PIPE_FORMAT_DXT1_RGBA] = VK_FORMAT_BC1_RGBA_UNORM_BLOCK,
543 [PIPE_FORMAT_DXT3_RGBA] = VK_FORMAT_BC2_UNORM_BLOCK,
544 [PIPE_FORMAT_DXT5_RGBA] = VK_FORMAT_BC3_UNORM_BLOCK,
545 [PIPE_FORMAT_RGTC1_UNORM] = VK_FORMAT_BC4_UNORM_BLOCK,
546 [PIPE_FORMAT_RGTC1_SNORM] = VK_FORMAT_BC4_SNORM_BLOCK,
547 [PIPE_FORMAT_RGTC2_UNORM] = VK_FORMAT_BC5_UNORM_BLOCK,
548 [PIPE_FORMAT_RGTC2_SNORM] = VK_FORMAT_BC5_SNORM_BLOCK,
549 [PIPE_FORMAT_BPTC_RGBA_UNORM] = VK_FORMAT_BC7_UNORM_BLOCK,
550 [PIPE_FORMAT_BPTC_SRGBA] = VK_FORMAT_BC7_SRGB_BLOCK,
551 [PIPE_FORMAT_BPTC_RGB_FLOAT] = VK_FORMAT_BC6H_SFLOAT_BLOCK,
552 [PIPE_FORMAT_BPTC_RGB_UFLOAT] = VK_FORMAT_BC6H_UFLOAT_BLOCK,
553 };
554
555 VkFormat
556 zink_get_format(enum pipe_format format)
557 {
558 return formats[format];
559 }
560
561 static VkSampleCountFlagBits
562 vk_sample_count_flags(uint32_t sample_count)
563 {
564 switch (sample_count) {
565 case 1: return VK_SAMPLE_COUNT_1_BIT;
566 case 2: return VK_SAMPLE_COUNT_2_BIT;
567 case 4: return VK_SAMPLE_COUNT_4_BIT;
568 case 8: return VK_SAMPLE_COUNT_8_BIT;
569 case 16: return VK_SAMPLE_COUNT_16_BIT;
570 case 32: return VK_SAMPLE_COUNT_32_BIT;
571 case 64: return VK_SAMPLE_COUNT_64_BIT;
572 default:
573 return 0;
574 }
575 }
576
577 static bool
578 zink_is_format_supported(struct pipe_screen *pscreen,
579 enum pipe_format format,
580 enum pipe_texture_target target,
581 unsigned sample_count,
582 unsigned storage_sample_count,
583 unsigned bind)
584 {
585 struct zink_screen *screen = zink_screen(pscreen);
586
587 if (format == PIPE_FORMAT_NONE)
588 return screen->props.limits.framebufferNoAttachmentsSampleCounts &
589 vk_sample_count_flags(sample_count);
590
591 VkFormat vkformat = formats[format];
592 if (vkformat == VK_FORMAT_UNDEFINED)
593 return FALSE;
594
595 if (sample_count >= 1) {
596 VkSampleCountFlagBits sample_mask = vk_sample_count_flags(sample_count);
597 const struct util_format_description *desc = util_format_description(format);
598 if (util_format_is_depth_or_stencil(format)) {
599 if (util_format_has_depth(desc)) {
600 if (bind & PIPE_BIND_DEPTH_STENCIL &&
601 (screen->props.limits.framebufferDepthSampleCounts & sample_mask) != sample_mask)
602 return FALSE;
603 if (bind & PIPE_BIND_SAMPLER_VIEW &&
604 (screen->props.limits.sampledImageDepthSampleCounts & sample_mask) != sample_mask)
605 return FALSE;
606 }
607 if (util_format_has_stencil(desc)) {
608 if (bind & PIPE_BIND_DEPTH_STENCIL &&
609 (screen->props.limits.framebufferStencilSampleCounts & sample_mask) != sample_mask)
610 return FALSE;
611 if (bind & PIPE_BIND_SAMPLER_VIEW &&
612 (screen->props.limits.sampledImageStencilSampleCounts & sample_mask) != sample_mask)
613 return FALSE;
614 }
615 } else if (util_format_is_pure_integer(format)) {
616 if (bind & PIPE_BIND_RENDER_TARGET &&
617 !(screen->props.limits.framebufferColorSampleCounts & sample_mask))
618 return FALSE;
619 if (bind & PIPE_BIND_SAMPLER_VIEW &&
620 !(screen->props.limits.sampledImageIntegerSampleCounts & sample_mask))
621 return FALSE;
622 } else {
623 if (bind & PIPE_BIND_RENDER_TARGET &&
624 !(screen->props.limits.framebufferColorSampleCounts & sample_mask))
625 return FALSE;
626 if (bind & PIPE_BIND_SAMPLER_VIEW &&
627 !(screen->props.limits.sampledImageColorSampleCounts & sample_mask))
628 return FALSE;
629 }
630 }
631
632 VkFormatProperties props;
633 vkGetPhysicalDeviceFormatProperties(screen->pdev, vkformat, &props);
634
635 if (target == PIPE_BUFFER) {
636 if (bind & PIPE_BIND_VERTEX_BUFFER &&
637 !(props.bufferFeatures & VK_FORMAT_FEATURE_VERTEX_BUFFER_BIT))
638 return FALSE;
639 } else {
640 /* all other targets are texture-targets */
641 if (bind & PIPE_BIND_RENDER_TARGET &&
642 !(props.optimalTilingFeatures & VK_FORMAT_FEATURE_COLOR_ATTACHMENT_BIT))
643 return FALSE;
644
645 if (bind & PIPE_BIND_BLENDABLE &&
646 !(props.optimalTilingFeatures & VK_FORMAT_FEATURE_COLOR_ATTACHMENT_BLEND_BIT))
647 return FALSE;
648
649 if (bind & PIPE_BIND_SAMPLER_VIEW &&
650 !(props.optimalTilingFeatures & VK_FORMAT_FEATURE_SAMPLED_IMAGE_BIT))
651 return FALSE;
652
653 if (bind & PIPE_BIND_DEPTH_STENCIL &&
654 !(props.optimalTilingFeatures & VK_FORMAT_FEATURE_DEPTH_STENCIL_ATTACHMENT_BIT))
655 return FALSE;
656 }
657
658 if (util_format_is_compressed(format)) {
659 const struct util_format_description *desc = util_format_description(format);
660 if (desc->layout == UTIL_FORMAT_LAYOUT_BPTC &&
661 !screen->feats.textureCompressionBC)
662 return FALSE;
663 }
664
665 return TRUE;
666 }
667
668 static void
669 zink_destroy_screen(struct pipe_screen *pscreen)
670 {
671 struct zink_screen *screen = zink_screen(pscreen);
672 slab_destroy_parent(&screen->transfer_pool);
673 FREE(screen);
674 }
675
676 static VkInstance
677 create_instance()
678 {
679 VkApplicationInfo ai = {};
680 ai.sType = VK_STRUCTURE_TYPE_APPLICATION_INFO;
681
682 char proc_name[128];
683 if (os_get_process_name(proc_name, ARRAY_SIZE(proc_name)))
684 ai.pApplicationName = proc_name;
685 else
686 ai.pApplicationName = "unknown";
687
688 ai.pEngineName = "mesa zink";
689 ai.apiVersion = VK_API_VERSION_1_0;
690
691 const char *extensions[] = {
692 VK_KHR_GET_PHYSICAL_DEVICE_PROPERTIES_2_EXTENSION_NAME,
693 VK_KHR_EXTERNAL_MEMORY_CAPABILITIES_EXTENSION_NAME,
694 };
695
696 VkInstanceCreateInfo ici = {};
697 ici.sType = VK_STRUCTURE_TYPE_INSTANCE_CREATE_INFO;
698 ici.pApplicationInfo = &ai;
699 ici.ppEnabledExtensionNames = extensions;
700 ici.enabledExtensionCount = ARRAY_SIZE(extensions);
701
702 VkInstance instance = VK_NULL_HANDLE;
703 VkResult err = vkCreateInstance(&ici, NULL, &instance);
704 if (err != VK_SUCCESS)
705 return VK_NULL_HANDLE;
706
707 return instance;
708 }
709
710 static VkPhysicalDevice
711 choose_pdev(const VkInstance instance)
712 {
713 uint32_t i, pdev_count;
714 VkPhysicalDevice *pdevs, pdev;
715 vkEnumeratePhysicalDevices(instance, &pdev_count, NULL);
716 assert(pdev_count > 0);
717
718 pdevs = malloc(sizeof(*pdevs) * pdev_count);
719 vkEnumeratePhysicalDevices(instance, &pdev_count, pdevs);
720 assert(pdev_count > 0);
721
722 pdev = pdevs[0];
723 for (i = 0; i < pdev_count; ++i) {
724 VkPhysicalDeviceProperties props;
725 vkGetPhysicalDeviceProperties(pdevs[i], &props);
726 if (props.deviceType == VK_PHYSICAL_DEVICE_TYPE_DISCRETE_GPU) {
727 pdev = pdevs[i];
728 break;
729 }
730 }
731 free(pdevs);
732 return pdev;
733 }
734
735 static uint32_t
736 find_gfx_queue(const VkPhysicalDevice pdev)
737 {
738 uint32_t num_queues;
739 vkGetPhysicalDeviceQueueFamilyProperties(pdev, &num_queues, NULL);
740 assert(num_queues > 0);
741
742 VkQueueFamilyProperties *props = malloc(sizeof(*props) * num_queues);
743 vkGetPhysicalDeviceQueueFamilyProperties(pdev, &num_queues, props);
744
745 for (uint32_t i = 0; i < num_queues; i++) {
746 if (props[i].queueFlags & VK_QUEUE_GRAPHICS_BIT) {
747 free(props);
748 return i;
749 }
750 }
751
752 return UINT32_MAX;
753 }
754
755 static void
756 zink_flush_frontbuffer(struct pipe_screen *pscreen,
757 struct pipe_resource *pres,
758 unsigned level, unsigned layer,
759 void *winsys_drawable_handle,
760 struct pipe_box *sub_box)
761 {
762 struct zink_screen *screen = zink_screen(pscreen);
763 struct sw_winsys *winsys = screen->winsys;
764 struct zink_resource *res = zink_resource(pres);
765
766 if (!winsys)
767 return;
768 void *map = winsys->displaytarget_map(winsys, res->dt, 0);
769
770 if (map) {
771 VkImageSubresource isr = {};
772 isr.aspectMask = res->aspect;
773 isr.mipLevel = level;
774 isr.arrayLayer = layer;
775 VkSubresourceLayout layout;
776 vkGetImageSubresourceLayout(screen->dev, res->image, &isr, &layout);
777
778 void *ptr;
779 VkResult result = vkMapMemory(screen->dev, res->mem, res->offset, res->size, 0, &ptr);
780 if (result != VK_SUCCESS) {
781 debug_printf("failed to map memory for display\n");
782 return;
783 }
784 for (int i = 0; i < pres->height0; ++i) {
785 uint8_t *src = (uint8_t *)ptr + i * layout.rowPitch;
786 uint8_t *dst = (uint8_t *)map + i * res->dt_stride;
787 memcpy(dst, src, res->dt_stride);
788 }
789 vkUnmapMemory(screen->dev, res->mem);
790 }
791
792 winsys->displaytarget_unmap(winsys, res->dt);
793
794 assert(res->dt);
795 if (res->dt)
796 winsys->displaytarget_display(winsys, res->dt, winsys_drawable_handle, sub_box);
797 }
798
799 static struct pipe_screen *
800 zink_internal_create_screen(struct sw_winsys *winsys, int fd)
801 {
802 struct zink_screen *screen = CALLOC_STRUCT(zink_screen);
803 if (!screen)
804 return NULL;
805
806 zink_debug = debug_get_option_zink_debug();
807
808 screen->instance = create_instance();
809 screen->pdev = choose_pdev(screen->instance);
810 screen->gfx_queue = find_gfx_queue(screen->pdev);
811
812 vkGetPhysicalDeviceProperties(screen->pdev, &screen->props);
813 vkGetPhysicalDeviceFeatures(screen->pdev, &screen->feats);
814 vkGetPhysicalDeviceMemoryProperties(screen->pdev, &screen->mem_props);
815
816 uint32_t num_extensions = 0;
817 if (vkEnumerateDeviceExtensionProperties(screen->pdev, NULL,
818 &num_extensions, NULL) == VK_SUCCESS && num_extensions > 0) {
819 VkExtensionProperties *extensions = MALLOC(sizeof(VkExtensionProperties) *
820 num_extensions);
821 if (extensions) {
822 vkEnumerateDeviceExtensionProperties(screen->pdev, NULL,
823 &num_extensions, extensions);
824
825 for (uint32_t i = 0; i < num_extensions; ++i) {
826 if (!strcmp(extensions[i].extensionName,
827 VK_KHR_MAINTENANCE1_EXTENSION_NAME))
828 screen->have_VK_KHR_maintenance1 = true;
829 }
830 FREE(extensions);
831 }
832 }
833
834 VkDeviceQueueCreateInfo qci = {};
835 float dummy = 0.0f;
836 qci.sType = VK_STRUCTURE_TYPE_DEVICE_QUEUE_CREATE_INFO;
837 qci.queueFamilyIndex = screen->gfx_queue;
838 qci.queueCount = 1;
839 qci.pQueuePriorities = &dummy;
840
841 VkDeviceCreateInfo dci = {};
842 dci.sType = VK_STRUCTURE_TYPE_DEVICE_CREATE_INFO;
843 dci.queueCreateInfoCount = 1;
844 dci.pQueueCreateInfos = &qci;
845 dci.pEnabledFeatures = &screen->feats;
846 const char *extensions[] = {
847 VK_KHR_MAINTENANCE1_EXTENSION_NAME,
848 VK_KHR_EXTERNAL_MEMORY_EXTENSION_NAME,
849 VK_KHR_EXTERNAL_MEMORY_FD_EXTENSION_NAME,
850 };
851 dci.ppEnabledExtensionNames = extensions;
852 dci.enabledExtensionCount = ARRAY_SIZE(extensions);
853 if (vkCreateDevice(screen->pdev, &dci, NULL, &screen->dev) != VK_SUCCESS)
854 goto fail;
855
856 screen->winsys = winsys;
857
858 screen->base.get_name = zink_get_name;
859 screen->base.get_vendor = zink_get_vendor;
860 screen->base.get_device_vendor = zink_get_device_vendor;
861 screen->base.get_param = zink_get_param;
862 screen->base.get_paramf = zink_get_paramf;
863 screen->base.get_shader_param = zink_get_shader_param;
864 screen->base.get_compiler_options = zink_get_compiler_options;
865 screen->base.is_format_supported = zink_is_format_supported;
866 screen->base.context_create = zink_context_create;
867 screen->base.flush_frontbuffer = zink_flush_frontbuffer;
868 screen->base.destroy = zink_destroy_screen;
869
870 zink_screen_resource_init(&screen->base);
871 zink_screen_fence_init(&screen->base);
872
873 slab_create_parent(&screen->transfer_pool, sizeof(struct zink_transfer), 16);
874
875 return &screen->base;
876
877 fail:
878 FREE(screen);
879 return NULL;
880 }
881
/*
 * Public entry point: creates a zink screen on top of a software winsys.
 * No file descriptor is supplied (-1 is passed through).
 */
struct pipe_screen *
zink_create_screen(struct sw_winsys *winsys)
{
   const int no_fd = -1;

   return zink_internal_create_screen(winsys, no_fd);
}
887
/*
 * Public entry point: creates a zink screen for the given DRM file
 * descriptor, without a software winsys (NULL is passed through).
 */
struct pipe_screen *
zink_drm_create_screen(int fd)
{
   struct sw_winsys *no_winsys = NULL;

   return zink_internal_create_screen(no_winsys, fd);
}