e7dcebe0c8b77fdd7547c8c86833dc752a431352
[mesa.git] / src / gallium / drivers / zink / zink_screen.c
1 /*
2 * Copyright 2018 Collabora Ltd.
3 *
4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * on the rights to use, copy, modify, merge, publish, distribute, sub
8 * license, and/or sell copies of the Software, and to permit persons to whom
9 * the Software is furnished to do so, subject to the following conditions:
10 *
11 * The above copyright notice and this permission notice (including the next
12 * paragraph) shall be included in all copies or substantial portions of the
13 * Software.
14 *
15 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17 * FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. IN NO EVENT SHALL
18 * THE AUTHOR(S) AND/OR THEIR SUPPLIERS BE LIABLE FOR ANY CLAIM,
19 * DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR
20 * OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE
21 * USE OR OTHER DEALINGS IN THE SOFTWARE.
22 */
23
24 #include "zink_screen.h"
25
26 #include "zink_compiler.h"
27 #include "zink_context.h"
28 #include "zink_fence.h"
29 #include "zink_public.h"
30 #include "zink_resource.h"
31
32 #include "os/os_process.h"
33 #include "util/u_debug.h"
34 #include "util/u_format.h"
35 #include "util/u_math.h"
36 #include "util/u_memory.h"
37 #include "util/u_screen.h"
38 #include "util/u_string.h"
39
40 #include "state_tracker/sw_winsys.h"
41
42 static const struct debug_named_value
43 debug_options[] = {
44 { "nir", ZINK_DEBUG_NIR, "Dump NIR during program compile" },
45 { "spirv", ZINK_DEBUG_SPIRV, "Dump SPIR-V during program compile" },
46 { "tgsi", ZINK_DEBUG_TGSI, "Dump TGSI during program compile" },
47 DEBUG_NAMED_VALUE_END
48 };
49
50 DEBUG_GET_ONCE_FLAGS_OPTION(zink_debug, "ZINK_DEBUG", debug_options, 0)
51
52 uint32_t
53 zink_debug;
54
/* pipe_screen::get_vendor hook: returns the fixed driver vendor string.
 * The screen argument is not consulted.
 */
static const char *
zink_get_vendor(struct pipe_screen *pscreen)
{
   static const char vendor[] = "Collabora Ltd";

   return vendor;
}
60
61 static const char *
62 zink_get_device_vendor(struct pipe_screen *pscreen)
63 {
64 struct zink_screen *screen = zink_screen(pscreen);
65 static char buf[1000];
66 snprintf(buf, sizeof(buf), "Unknown (vendor-id: 0x%04x)", screen->props.vendorID);
67 return buf;
68 }
69
70 static const char *
71 zink_get_name(struct pipe_screen *pscreen)
72 {
73 struct zink_screen *screen = zink_screen(pscreen);
74 static char buf[1000];
75 snprintf(buf, sizeof(buf), "zink (%s)", screen->props.deviceName);
76 return buf;
77 }
78
79 static int
80 get_video_mem(struct zink_screen *screen)
81 {
82 VkDeviceSize size = 0;
83 for (uint32_t i = 0; i < screen->mem_props.memoryHeapCount; ++i)
84 size += screen->mem_props.memoryHeaps[i].size;
85 return (int)(size >> 20);
86 }
87
88 static int
89 zink_get_param(struct pipe_screen *pscreen, enum pipe_cap param)
90 {
91 struct zink_screen *screen = zink_screen(pscreen);
92
93 switch (param) {
94 case PIPE_CAP_NPOT_TEXTURES:
95 return 1;
96
97 case PIPE_CAP_MAX_DUAL_SOURCE_RENDER_TARGETS:
98 return screen->props.limits.maxFragmentDualSrcAttachments;
99
100 case PIPE_CAP_POINT_SPRITE:
101 return 1;
102
103 case PIPE_CAP_MAX_RENDER_TARGETS:
104 return screen->props.limits.maxColorAttachments;
105
106 case PIPE_CAP_OCCLUSION_QUERY:
107 return 1;
108
109 #if 0 /* TODO: Enable me */
110 case PIPE_CAP_QUERY_TIME_ELAPSED:
111 return 1;
112 #endif
113
114 case PIPE_CAP_TEXTURE_SWIZZLE:
115 return 1;
116
117 case PIPE_CAP_MAX_TEXTURE_2D_SIZE:
118 return screen->props.limits.maxImageDimension2D;
119 case PIPE_CAP_MAX_TEXTURE_3D_LEVELS:
120 return 1 + util_logbase2(screen->props.limits.maxImageDimension3D);
121 case PIPE_CAP_MAX_TEXTURE_CUBE_LEVELS:
122 return 1 + util_logbase2(screen->props.limits.maxImageDimensionCube);
123
124 case PIPE_CAP_BLEND_EQUATION_SEPARATE:
125 return 1;
126
127 case PIPE_CAP_FRAGMENT_SHADER_TEXTURE_LOD:
128 case PIPE_CAP_FRAGMENT_SHADER_DERIVATIVES:
129 case PIPE_CAP_VERTEX_SHADER_SATURATE:
130 return 1;
131
132 case PIPE_CAP_INDEP_BLEND_ENABLE:
133 case PIPE_CAP_INDEP_BLEND_FUNC:
134 return 1;
135
136 case PIPE_CAP_MAX_TEXTURE_ARRAY_LAYERS:
137 return screen->props.limits.maxImageArrayLayers;
138
139 #if 0 /* TODO: Enable me */
140 case PIPE_CAP_DEPTH_CLIP_DISABLE:
141 return 0;
142 #endif
143
144 #if 0 /* TODO: Enable me */
145 case PIPE_CAP_MIXED_COLORBUFFER_FORMATS:
146 return 1;
147 #endif
148
149 case PIPE_CAP_SEAMLESS_CUBE_MAP:
150 return 1;
151
152 case PIPE_CAP_MIN_TEXEL_OFFSET:
153 return screen->props.limits.minTexelOffset;
154 case PIPE_CAP_MAX_TEXEL_OFFSET:
155 return screen->props.limits.maxTexelOffset;
156
157 case PIPE_CAP_VERTEX_COLOR_UNCLAMPED:
158 return 1;
159
160 case PIPE_CAP_GLSL_FEATURE_LEVEL:
161 case PIPE_CAP_GLSL_FEATURE_LEVEL_COMPATIBILITY:
162 return 120;
163
164 #if 0 /* TODO: Enable me */
165 case PIPE_CAP_COMPUTE:
166 return 1;
167 #endif
168
169 case PIPE_CAP_CONSTANT_BUFFER_OFFSET_ALIGNMENT:
170 return screen->props.limits.minUniformBufferOffsetAlignment;
171
172 #if 0 /* TODO: Enable me */
173 case PIPE_CAP_QUERY_TIMESTAMP:
174 return 1;
175 #endif
176
177 case PIPE_CAP_MIN_MAP_BUFFER_ALIGNMENT:
178 return screen->props.limits.minMemoryMapAlignment;
179
180 case PIPE_CAP_CUBE_MAP_ARRAY:
181 return screen->feats.imageCubeArray;
182
183 case PIPE_CAP_PREFER_BLIT_BASED_TEXTURE_TRANSFER:
184 return 0; /* unsure */
185
186 case PIPE_CAP_MAX_TEXTURE_BUFFER_SIZE:
187 return screen->props.limits.maxTexelBufferElements;
188
189 case PIPE_CAP_ENDIANNESS:
190 return PIPE_ENDIAN_NATIVE; /* unsure */
191
192 case PIPE_CAP_MAX_VIEWPORTS:
193 return screen->props.limits.maxViewports;
194
195 case PIPE_CAP_MIXED_FRAMEBUFFER_SIZES:
196 return 1;
197
198 case PIPE_CAP_MAX_GEOMETRY_OUTPUT_VERTICES:
199 return screen->props.limits.maxGeometryOutputVertices;
200 case PIPE_CAP_MAX_GEOMETRY_TOTAL_OUTPUT_COMPONENTS:
201 return screen->props.limits.maxGeometryOutputComponents;
202
203 #if 0 /* TODO: Enable me. Enables ARB_texture_gather */
204 case PIPE_CAP_MAX_TEXTURE_GATHER_COMPONENTS:
205 return 4;
206 #endif
207
208 case PIPE_CAP_MIN_TEXTURE_GATHER_OFFSET:
209 return screen->props.limits.minTexelGatherOffset;
210 case PIPE_CAP_MAX_TEXTURE_GATHER_OFFSET:
211 return screen->props.limits.maxTexelGatherOffset;
212
213 case PIPE_CAP_VENDOR_ID:
214 return screen->props.vendorID;
215 case PIPE_CAP_DEVICE_ID:
216 return screen->props.deviceID;
217
218 case PIPE_CAP_ACCELERATED:
219 return 1;
220 case PIPE_CAP_VIDEO_MEMORY:
221 return get_video_mem(screen);
222 case PIPE_CAP_UMA:
223 return screen->props.deviceType == VK_PHYSICAL_DEVICE_TYPE_INTEGRATED_GPU;
224
225 case PIPE_CAP_MAX_VERTEX_ATTRIB_STRIDE:
226 return screen->props.limits.maxVertexInputBindingStride;
227
228 #if 0 /* TODO: Enable me */
229 case PIPE_CAP_SAMPLER_VIEW_TARGET:
230 return 1;
231 #endif
232
233 #if 0 /* TODO: Enable me */
234 case PIPE_CAP_CLIP_HALFZ:
235 return 1;
236 #endif
237
238 #if 0 /* TODO: Enable me */
239 case PIPE_CAP_TEXTURE_FLOAT_LINEAR:
240 case PIPE_CAP_TEXTURE_HALF_FLOAT_LINEAR:
241 return 1;
242 #endif
243
244 case PIPE_CAP_SHAREABLE_SHADERS:
245 return 1;
246
247 #if 0 /* TODO: Enable me. Enables GL_ARB_shader_storage_buffer_object */
248 case PIPE_CAP_SHADER_BUFFER_OFFSET_ALIGNMENT:
249 return screen->props.limits.minStorageBufferOffsetAlignment;
250 #endif
251
252 case PIPE_CAP_PCI_GROUP:
253 case PIPE_CAP_PCI_BUS:
254 case PIPE_CAP_PCI_DEVICE:
255 case PIPE_CAP_PCI_FUNCTION:
256 return 0; /* TODO: figure these out */
257
258 #if 0 /* TODO: Enable me */
259 case PIPE_CAP_CULL_DISTANCE:
260 return screen->feats.shaderCullDistance;
261 #endif
262
263 case PIPE_CAP_VIEWPORT_SUBPIXEL_BITS:
264 return screen->props.limits.viewportSubPixelBits;
265
266 case PIPE_CAP_GLSL_OPTIMIZE_CONSERVATIVELY:
267 return 0; /* not sure */
268
269 case PIPE_CAP_MAX_GS_INVOCATIONS:
270 return 0; /* not implemented */
271
272 case PIPE_CAP_MAX_COMBINED_SHADER_BUFFERS:
273 return screen->props.limits.maxDescriptorSetStorageBuffers;
274
275 case PIPE_CAP_MAX_SHADER_BUFFER_SIZE:
276 return screen->props.limits.maxStorageBufferRange; /* unsure */
277
278 case PIPE_CAP_TGSI_FS_COORD_ORIGIN_UPPER_LEFT:
279 case PIPE_CAP_TGSI_FS_COORD_PIXEL_CENTER_HALF_INTEGER:
280 return 1;
281
282 case PIPE_CAP_TGSI_FS_COORD_ORIGIN_LOWER_LEFT:
283 case PIPE_CAP_TGSI_FS_COORD_PIXEL_CENTER_INTEGER:
284 return 0;
285
286 case PIPE_CAP_BUFFER_MAP_PERSISTENT_COHERENT:
287 return 1;
288
289 case PIPE_CAP_NIR_COMPACT_ARRAYS:
290 return 1;
291
292 case PIPE_CAP_TGSI_FS_FACE_IS_INTEGER_SYSVAL:
293 return 1;
294
295 case PIPE_CAP_FLATSHADE:
296 case PIPE_CAP_ALPHA_TEST:
297 case PIPE_CAP_CLIP_PLANES:
298 case PIPE_CAP_POINT_SIZE_FIXED:
299 case PIPE_CAP_TWO_SIDED_COLOR:
300 return 0;
301
302 default:
303 return u_pipe_screen_get_param_defaults(pscreen, param);
304 }
305 }
306
307 static float
308 zink_get_paramf(struct pipe_screen *pscreen, enum pipe_capf param)
309 {
310 struct zink_screen *screen = zink_screen(pscreen);
311
312 switch (param) {
313 case PIPE_CAPF_MAX_LINE_WIDTH:
314 case PIPE_CAPF_MAX_LINE_WIDTH_AA:
315 return screen->props.limits.lineWidthRange[1];
316
317 case PIPE_CAPF_MAX_POINT_WIDTH:
318 case PIPE_CAPF_MAX_POINT_WIDTH_AA:
319 return screen->props.limits.pointSizeRange[1];
320
321 case PIPE_CAPF_MAX_TEXTURE_ANISOTROPY:
322 return screen->props.limits.maxSamplerAnisotropy;
323
324 case PIPE_CAPF_MAX_TEXTURE_LOD_BIAS:
325 return screen->props.limits.maxSamplerLodBias;
326
327 case PIPE_CAPF_MIN_CONSERVATIVE_RASTER_DILATE:
328 case PIPE_CAPF_MAX_CONSERVATIVE_RASTER_DILATE:
329 case PIPE_CAPF_CONSERVATIVE_RASTER_DILATE_GRANULARITY:
330 return 0.0f; /* not implemented */
331 }
332
333 /* should only get here on unhandled cases */
334 return 0.0;
335 }
336
337 static int
338 zink_get_shader_param(struct pipe_screen *pscreen,
339 enum pipe_shader_type shader,
340 enum pipe_shader_cap param)
341 {
342 struct zink_screen *screen = zink_screen(pscreen);
343
344 switch (param) {
345 case PIPE_SHADER_CAP_MAX_INSTRUCTIONS:
346 case PIPE_SHADER_CAP_MAX_ALU_INSTRUCTIONS:
347 case PIPE_SHADER_CAP_MAX_TEX_INSTRUCTIONS:
348 case PIPE_SHADER_CAP_MAX_TEX_INDIRECTIONS:
349 case PIPE_SHADER_CAP_MAX_CONTROL_FLOW_DEPTH:
350 if (shader == PIPE_SHADER_VERTEX ||
351 shader == PIPE_SHADER_FRAGMENT)
352 return INT_MAX;
353 return 0;
354
355 case PIPE_SHADER_CAP_MAX_INPUTS:
356 switch (shader) {
357 case PIPE_SHADER_VERTEX:
358 return MIN2(screen->props.limits.maxVertexInputAttributes,
359 PIPE_MAX_SHADER_INPUTS);
360 case PIPE_SHADER_FRAGMENT:
361 return MIN2(screen->props.limits.maxFragmentInputComponents / 4,
362 PIPE_MAX_SHADER_INPUTS);
363 default:
364 return 0; /* unsupported stage */
365 }
366
367 case PIPE_SHADER_CAP_MAX_OUTPUTS:
368 switch (shader) {
369 case PIPE_SHADER_VERTEX:
370 return MIN2(screen->props.limits.maxVertexOutputComponents / 4,
371 PIPE_MAX_SHADER_OUTPUTS);
372 case PIPE_SHADER_FRAGMENT:
373 return MIN2(screen->props.limits.maxColorAttachments,
374 PIPE_MAX_SHADER_OUTPUTS);
375 default:
376 return 0; /* unsupported stage */
377 }
378
379 case PIPE_SHADER_CAP_MAX_TEXTURE_SAMPLERS:
380 /* this might be a bit simplistic... */
381 return MIN2(screen->props.limits.maxPerStageDescriptorSamplers,
382 PIPE_MAX_SAMPLERS);
383
384 case PIPE_SHADER_CAP_MAX_CONST_BUFFER_SIZE:
385 return MIN2(screen->props.limits.maxUniformBufferRange, INT_MAX);
386
387 case PIPE_SHADER_CAP_MAX_CONST_BUFFERS:
388 return screen->props.limits.maxPerStageDescriptorUniformBuffers;
389
390 case PIPE_SHADER_CAP_MAX_TEMPS:
391 return INT_MAX;
392
393 case PIPE_SHADER_CAP_INDIRECT_INPUT_ADDR:
394 case PIPE_SHADER_CAP_INDIRECT_OUTPUT_ADDR:
395 case PIPE_SHADER_CAP_INDIRECT_TEMP_ADDR:
396 case PIPE_SHADER_CAP_INDIRECT_CONST_ADDR:
397 case PIPE_SHADER_CAP_SUBROUTINES:
398 case PIPE_SHADER_CAP_INTEGERS:
399 case PIPE_SHADER_CAP_INT64_ATOMICS:
400 case PIPE_SHADER_CAP_FP16:
401 return 0; /* not implemented */
402
403 case PIPE_SHADER_CAP_PREFERRED_IR:
404 return PIPE_SHADER_IR_NIR;
405
406 case PIPE_SHADER_CAP_TGSI_SQRT_SUPPORTED:
407 return 0; /* not implemented */
408
409 case PIPE_SHADER_CAP_MAX_SAMPLER_VIEWS:
410 return MIN2(screen->props.limits.maxPerStageDescriptorSampledImages,
411 PIPE_MAX_SHADER_SAMPLER_VIEWS);
412
413 case PIPE_SHADER_CAP_TGSI_DROUND_SUPPORTED:
414 case PIPE_SHADER_CAP_TGSI_DFRACEXP_DLDEXP_SUPPORTED:
415 case PIPE_SHADER_CAP_TGSI_FMA_SUPPORTED:
416 return 0; /* not implemented */
417
418 case PIPE_SHADER_CAP_TGSI_ANY_INOUT_DECL_RANGE:
419 return 0; /* no idea */
420
421 case PIPE_SHADER_CAP_MAX_UNROLL_ITERATIONS_HINT:
422 return 32; /* arbitrary */
423
424 case PIPE_SHADER_CAP_MAX_SHADER_BUFFERS:
425 /* TODO: this limitation is dumb, and will need some fixes in mesa */
426 return MIN2(screen->props.limits.maxPerStageDescriptorStorageBuffers, 8);
427
428 case PIPE_SHADER_CAP_SUPPORTED_IRS:
429 return (1 << PIPE_SHADER_IR_NIR) | (1 << PIPE_SHADER_IR_TGSI);
430
431 case PIPE_SHADER_CAP_MAX_SHADER_IMAGES:
432 return MIN2(screen->props.limits.maxPerStageDescriptorStorageImages,
433 PIPE_MAX_SHADER_IMAGES);
434
435 case PIPE_SHADER_CAP_LOWER_IF_THRESHOLD:
436 case PIPE_SHADER_CAP_TGSI_SKIP_MERGE_REGISTERS:
437 return 0; /* unsure */
438
439 case PIPE_SHADER_CAP_TGSI_LDEXP_SUPPORTED:
440 case PIPE_SHADER_CAP_MAX_HW_ATOMIC_COUNTERS:
441 case PIPE_SHADER_CAP_MAX_HW_ATOMIC_COUNTER_BUFFERS:
442 case PIPE_SHADER_CAP_TGSI_CONT_SUPPORTED:
443 return 0; /* not implemented */
444 }
445
446 /* should only get here on unhandled cases */
447 return 0;
448 }
449
450 static const VkFormat formats[PIPE_FORMAT_COUNT] = {
451 #define MAP_FORMAT_NORM(FMT) \
452 [PIPE_FORMAT_ ## FMT ## _UNORM] = VK_FORMAT_ ## FMT ## _UNORM, \
453 [PIPE_FORMAT_ ## FMT ## _SNORM] = VK_FORMAT_ ## FMT ## _SNORM,
454
455 #define MAP_FORMAT_SCALED(FMT) \
456 [PIPE_FORMAT_ ## FMT ## _USCALED] = VK_FORMAT_ ## FMT ## _USCALED, \
457 [PIPE_FORMAT_ ## FMT ## _SSCALED] = VK_FORMAT_ ## FMT ## _SSCALED,
458
459 #define MAP_FORMAT_INT(FMT) \
460 [PIPE_FORMAT_ ## FMT ## _UINT] = VK_FORMAT_ ## FMT ## _UINT, \
461 [PIPE_FORMAT_ ## FMT ## _SINT] = VK_FORMAT_ ## FMT ## _SINT,
462
463 #define MAP_FORMAT_SRGB(FMT) \
464 [PIPE_FORMAT_ ## FMT ## _SRGB] = VK_FORMAT_ ## FMT ## _SRGB,
465
466 #define MAP_FORMAT_FLOAT(FMT) \
467 [PIPE_FORMAT_ ## FMT ## _FLOAT] = VK_FORMAT_ ## FMT ## _SFLOAT,
468
469 // one component
470
471 // 8-bits
472 MAP_FORMAT_NORM(R8)
473 MAP_FORMAT_SCALED(R8)
474 MAP_FORMAT_INT(R8)
475 // 16-bits
476 MAP_FORMAT_NORM(R16)
477 MAP_FORMAT_SCALED(R16)
478 MAP_FORMAT_INT(R16)
479 MAP_FORMAT_FLOAT(R16)
480 // 32-bits
481 MAP_FORMAT_INT(R32)
482 MAP_FORMAT_FLOAT(R32)
483
484 // two components
485
486 // 8-bits
487 MAP_FORMAT_NORM(R8G8)
488 MAP_FORMAT_SCALED(R8G8)
489 MAP_FORMAT_INT(R8G8)
490 // 16-bits
491 MAP_FORMAT_NORM(R16G16)
492 MAP_FORMAT_SCALED(R16G16)
493 MAP_FORMAT_INT(R16G16)
494 MAP_FORMAT_FLOAT(R16G16)
495 // 32-bits
496 MAP_FORMAT_INT(R32G32)
497 MAP_FORMAT_FLOAT(R32G32)
498
499 // three components
500
501 // 8-bits
502 MAP_FORMAT_NORM(R8G8B8)
503 MAP_FORMAT_SCALED(R8G8B8)
504 MAP_FORMAT_INT(R8G8B8)
505 MAP_FORMAT_SRGB(R8G8B8)
506 // 16-bits
507 MAP_FORMAT_NORM(R16G16B16)
508 MAP_FORMAT_SCALED(R16G16B16)
509 MAP_FORMAT_INT(R16G16B16)
510 MAP_FORMAT_FLOAT(R16G16B16)
511 // 32-bits
512 MAP_FORMAT_INT(R32G32B32)
513 MAP_FORMAT_FLOAT(R32G32B32)
514
515 // four components
516
517 // 8-bits
518 MAP_FORMAT_NORM(R8G8B8A8)
519 MAP_FORMAT_SCALED(R8G8B8A8)
520 MAP_FORMAT_INT(R8G8B8A8)
521 MAP_FORMAT_SRGB(R8G8B8A8)
522 [PIPE_FORMAT_B8G8R8A8_UNORM] = VK_FORMAT_B8G8R8A8_UNORM,
523 MAP_FORMAT_SRGB(B8G8R8A8)
524 [PIPE_FORMAT_A8B8G8R8_SRGB] = VK_FORMAT_A8B8G8R8_SRGB_PACK32,
525 // 16-bits
526 MAP_FORMAT_NORM(R16G16B16A16)
527 MAP_FORMAT_SCALED(R16G16B16A16)
528 MAP_FORMAT_INT(R16G16B16A16)
529 MAP_FORMAT_FLOAT(R16G16B16A16)
530 // 32-bits
531 MAP_FORMAT_INT(R32G32B32A32)
532 MAP_FORMAT_FLOAT(R32G32B32A32)
533
534 // other color formats
535 [PIPE_FORMAT_B5G6R5_UNORM] = VK_FORMAT_R5G6B5_UNORM_PACK16,
536 [PIPE_FORMAT_B5G5R5A1_UNORM] = VK_FORMAT_B5G5R5A1_UNORM_PACK16,
537 [PIPE_FORMAT_R11G11B10_FLOAT] = VK_FORMAT_B10G11R11_UFLOAT_PACK32,
538 [PIPE_FORMAT_R9G9B9E5_FLOAT] = VK_FORMAT_E5B9G9R9_UFLOAT_PACK32,
539 [PIPE_FORMAT_R10G10B10A2_UNORM] = VK_FORMAT_A2B10G10R10_UNORM_PACK32,
540 [PIPE_FORMAT_B10G10R10A2_UNORM] = VK_FORMAT_A2R10G10B10_UNORM_PACK32,
541 [PIPE_FORMAT_R10G10B10A2_UINT] = VK_FORMAT_A2B10G10R10_UINT_PACK32,
542 [PIPE_FORMAT_B10G10R10A2_UINT] = VK_FORMAT_A2R10G10B10_UINT_PACK32,
543
544 // depth/stencil formats
545 [PIPE_FORMAT_Z32_FLOAT] = VK_FORMAT_D32_SFLOAT,
546 [PIPE_FORMAT_Z32_FLOAT_S8X24_UINT] = VK_FORMAT_D32_SFLOAT_S8_UINT,
547 [PIPE_FORMAT_Z16_UNORM] = VK_FORMAT_D16_UNORM,
548 [PIPE_FORMAT_X8Z24_UNORM] = VK_FORMAT_X8_D24_UNORM_PACK32,
549 [PIPE_FORMAT_Z24_UNORM_S8_UINT] = VK_FORMAT_D24_UNORM_S8_UINT,
550
551 // compressed formats
552 [PIPE_FORMAT_DXT1_RGB] = VK_FORMAT_BC1_RGB_UNORM_BLOCK,
553 [PIPE_FORMAT_DXT1_RGBA] = VK_FORMAT_BC1_RGBA_UNORM_BLOCK,
554 [PIPE_FORMAT_DXT3_RGBA] = VK_FORMAT_BC2_UNORM_BLOCK,
555 [PIPE_FORMAT_DXT5_RGBA] = VK_FORMAT_BC3_UNORM_BLOCK,
556 [PIPE_FORMAT_DXT1_SRGB] = VK_FORMAT_BC1_RGB_SRGB_BLOCK,
557 [PIPE_FORMAT_DXT1_SRGBA] = VK_FORMAT_BC1_RGBA_SRGB_BLOCK,
558 [PIPE_FORMAT_DXT3_SRGBA] = VK_FORMAT_BC2_SRGB_BLOCK,
559 [PIPE_FORMAT_DXT5_SRGBA] = VK_FORMAT_BC3_SRGB_BLOCK,
560
561 [PIPE_FORMAT_RGTC1_UNORM] = VK_FORMAT_BC4_UNORM_BLOCK,
562 [PIPE_FORMAT_RGTC1_SNORM] = VK_FORMAT_BC4_SNORM_BLOCK,
563 [PIPE_FORMAT_RGTC2_UNORM] = VK_FORMAT_BC5_UNORM_BLOCK,
564 [PIPE_FORMAT_RGTC2_SNORM] = VK_FORMAT_BC5_SNORM_BLOCK,
565 [PIPE_FORMAT_BPTC_RGBA_UNORM] = VK_FORMAT_BC7_UNORM_BLOCK,
566 [PIPE_FORMAT_BPTC_SRGBA] = VK_FORMAT_BC7_SRGB_BLOCK,
567 [PIPE_FORMAT_BPTC_RGB_FLOAT] = VK_FORMAT_BC6H_SFLOAT_BLOCK,
568 [PIPE_FORMAT_BPTC_RGB_UFLOAT] = VK_FORMAT_BC6H_UFLOAT_BLOCK,
569 };
570
571 VkFormat
572 zink_get_format(enum pipe_format format)
573 {
574 return formats[format];
575 }
576
577 static VkSampleCountFlagBits
578 vk_sample_count_flags(uint32_t sample_count)
579 {
580 switch (sample_count) {
581 case 1: return VK_SAMPLE_COUNT_1_BIT;
582 case 2: return VK_SAMPLE_COUNT_2_BIT;
583 case 4: return VK_SAMPLE_COUNT_4_BIT;
584 case 8: return VK_SAMPLE_COUNT_8_BIT;
585 case 16: return VK_SAMPLE_COUNT_16_BIT;
586 case 32: return VK_SAMPLE_COUNT_32_BIT;
587 case 64: return VK_SAMPLE_COUNT_64_BIT;
588 default:
589 return 0;
590 }
591 }
592
593 static bool
594 zink_is_format_supported(struct pipe_screen *pscreen,
595 enum pipe_format format,
596 enum pipe_texture_target target,
597 unsigned sample_count,
598 unsigned storage_sample_count,
599 unsigned bind)
600 {
601 struct zink_screen *screen = zink_screen(pscreen);
602
603 if (format == PIPE_FORMAT_NONE)
604 return screen->props.limits.framebufferNoAttachmentsSampleCounts &
605 vk_sample_count_flags(sample_count);
606
607 VkFormat vkformat = formats[format];
608 if (vkformat == VK_FORMAT_UNDEFINED)
609 return FALSE;
610
611 if (sample_count >= 1) {
612 VkSampleCountFlagBits sample_mask = vk_sample_count_flags(sample_count);
613 const struct util_format_description *desc = util_format_description(format);
614 if (util_format_is_depth_or_stencil(format)) {
615 if (util_format_has_depth(desc)) {
616 if (bind & PIPE_BIND_DEPTH_STENCIL &&
617 (screen->props.limits.framebufferDepthSampleCounts & sample_mask) != sample_mask)
618 return FALSE;
619 if (bind & PIPE_BIND_SAMPLER_VIEW &&
620 (screen->props.limits.sampledImageDepthSampleCounts & sample_mask) != sample_mask)
621 return FALSE;
622 }
623 if (util_format_has_stencil(desc)) {
624 if (bind & PIPE_BIND_DEPTH_STENCIL &&
625 (screen->props.limits.framebufferStencilSampleCounts & sample_mask) != sample_mask)
626 return FALSE;
627 if (bind & PIPE_BIND_SAMPLER_VIEW &&
628 (screen->props.limits.sampledImageStencilSampleCounts & sample_mask) != sample_mask)
629 return FALSE;
630 }
631 } else if (util_format_is_pure_integer(format)) {
632 if (bind & PIPE_BIND_RENDER_TARGET &&
633 !(screen->props.limits.framebufferColorSampleCounts & sample_mask))
634 return FALSE;
635 if (bind & PIPE_BIND_SAMPLER_VIEW &&
636 !(screen->props.limits.sampledImageIntegerSampleCounts & sample_mask))
637 return FALSE;
638 } else {
639 if (bind & PIPE_BIND_RENDER_TARGET &&
640 !(screen->props.limits.framebufferColorSampleCounts & sample_mask))
641 return FALSE;
642 if (bind & PIPE_BIND_SAMPLER_VIEW &&
643 !(screen->props.limits.sampledImageColorSampleCounts & sample_mask))
644 return FALSE;
645 }
646 }
647
648 VkFormatProperties props;
649 vkGetPhysicalDeviceFormatProperties(screen->pdev, vkformat, &props);
650
651 if (target == PIPE_BUFFER) {
652 if (bind & PIPE_BIND_VERTEX_BUFFER &&
653 !(props.bufferFeatures & VK_FORMAT_FEATURE_VERTEX_BUFFER_BIT))
654 return FALSE;
655 } else {
656 /* all other targets are texture-targets */
657 if (bind & PIPE_BIND_RENDER_TARGET &&
658 !(props.optimalTilingFeatures & VK_FORMAT_FEATURE_COLOR_ATTACHMENT_BIT))
659 return FALSE;
660
661 if (bind & PIPE_BIND_BLENDABLE &&
662 !(props.optimalTilingFeatures & VK_FORMAT_FEATURE_COLOR_ATTACHMENT_BLEND_BIT))
663 return FALSE;
664
665 if (bind & PIPE_BIND_SAMPLER_VIEW &&
666 !(props.optimalTilingFeatures & VK_FORMAT_FEATURE_SAMPLED_IMAGE_BIT))
667 return FALSE;
668
669 if (bind & PIPE_BIND_DEPTH_STENCIL &&
670 !(props.optimalTilingFeatures & VK_FORMAT_FEATURE_DEPTH_STENCIL_ATTACHMENT_BIT))
671 return FALSE;
672 }
673
674 if (util_format_is_compressed(format)) {
675 const struct util_format_description *desc = util_format_description(format);
676 if (desc->layout == UTIL_FORMAT_LAYOUT_BPTC &&
677 !screen->feats.textureCompressionBC)
678 return FALSE;
679 }
680
681 return TRUE;
682 }
683
684 static void
685 zink_destroy_screen(struct pipe_screen *pscreen)
686 {
687 struct zink_screen *screen = zink_screen(pscreen);
688 slab_destroy_parent(&screen->transfer_pool);
689 FREE(screen);
690 }
691
692 static VkInstance
693 create_instance()
694 {
695 VkApplicationInfo ai = {};
696 ai.sType = VK_STRUCTURE_TYPE_APPLICATION_INFO;
697
698 char proc_name[128];
699 if (os_get_process_name(proc_name, ARRAY_SIZE(proc_name)))
700 ai.pApplicationName = proc_name;
701 else
702 ai.pApplicationName = "unknown";
703
704 ai.pEngineName = "mesa zink";
705 ai.apiVersion = VK_API_VERSION_1_0;
706
707 const char *extensions[] = {
708 VK_KHR_GET_PHYSICAL_DEVICE_PROPERTIES_2_EXTENSION_NAME,
709 VK_KHR_EXTERNAL_MEMORY_CAPABILITIES_EXTENSION_NAME,
710 };
711
712 VkInstanceCreateInfo ici = {};
713 ici.sType = VK_STRUCTURE_TYPE_INSTANCE_CREATE_INFO;
714 ici.pApplicationInfo = &ai;
715 ici.ppEnabledExtensionNames = extensions;
716 ici.enabledExtensionCount = ARRAY_SIZE(extensions);
717
718 VkInstance instance = VK_NULL_HANDLE;
719 VkResult err = vkCreateInstance(&ici, NULL, &instance);
720 if (err != VK_SUCCESS)
721 return VK_NULL_HANDLE;
722
723 return instance;
724 }
725
726 static VkPhysicalDevice
727 choose_pdev(const VkInstance instance)
728 {
729 uint32_t i, pdev_count;
730 VkPhysicalDevice *pdevs, pdev;
731 vkEnumeratePhysicalDevices(instance, &pdev_count, NULL);
732 assert(pdev_count > 0);
733
734 pdevs = malloc(sizeof(*pdevs) * pdev_count);
735 vkEnumeratePhysicalDevices(instance, &pdev_count, pdevs);
736 assert(pdev_count > 0);
737
738 pdev = pdevs[0];
739 for (i = 0; i < pdev_count; ++i) {
740 VkPhysicalDeviceProperties props;
741 vkGetPhysicalDeviceProperties(pdevs[i], &props);
742 if (props.deviceType == VK_PHYSICAL_DEVICE_TYPE_DISCRETE_GPU) {
743 pdev = pdevs[i];
744 break;
745 }
746 }
747 free(pdevs);
748 return pdev;
749 }
750
751 static uint32_t
752 find_gfx_queue(const VkPhysicalDevice pdev)
753 {
754 uint32_t num_queues;
755 vkGetPhysicalDeviceQueueFamilyProperties(pdev, &num_queues, NULL);
756 assert(num_queues > 0);
757
758 VkQueueFamilyProperties *props = malloc(sizeof(*props) * num_queues);
759 vkGetPhysicalDeviceQueueFamilyProperties(pdev, &num_queues, props);
760
761 for (uint32_t i = 0; i < num_queues; i++) {
762 if (props[i].queueFlags & VK_QUEUE_GRAPHICS_BIT) {
763 free(props);
764 return i;
765 }
766 }
767
768 return UINT32_MAX;
769 }
770
771 static void
772 zink_flush_frontbuffer(struct pipe_screen *pscreen,
773 struct pipe_resource *pres,
774 unsigned level, unsigned layer,
775 void *winsys_drawable_handle,
776 struct pipe_box *sub_box)
777 {
778 struct zink_screen *screen = zink_screen(pscreen);
779 struct sw_winsys *winsys = screen->winsys;
780 struct zink_resource *res = zink_resource(pres);
781
782 if (!winsys)
783 return;
784 void *map = winsys->displaytarget_map(winsys, res->dt, 0);
785
786 if (map) {
787 VkImageSubresource isr = {};
788 isr.aspectMask = res->aspect;
789 isr.mipLevel = level;
790 isr.arrayLayer = layer;
791 VkSubresourceLayout layout;
792 vkGetImageSubresourceLayout(screen->dev, res->image, &isr, &layout);
793
794 void *ptr;
795 VkResult result = vkMapMemory(screen->dev, res->mem, res->offset, res->size, 0, &ptr);
796 if (result != VK_SUCCESS) {
797 debug_printf("failed to map memory for display\n");
798 return;
799 }
800 for (int i = 0; i < pres->height0; ++i) {
801 uint8_t *src = (uint8_t *)ptr + i * layout.rowPitch;
802 uint8_t *dst = (uint8_t *)map + i * res->dt_stride;
803 memcpy(dst, src, res->dt_stride);
804 }
805 vkUnmapMemory(screen->dev, res->mem);
806 }
807
808 winsys->displaytarget_unmap(winsys, res->dt);
809
810 assert(res->dt);
811 if (res->dt)
812 winsys->displaytarget_display(winsys, res->dt, winsys_drawable_handle, sub_box);
813 }
814
815 static struct pipe_screen *
816 zink_internal_create_screen(struct sw_winsys *winsys, int fd)
817 {
818 struct zink_screen *screen = CALLOC_STRUCT(zink_screen);
819 if (!screen)
820 return NULL;
821
822 zink_debug = debug_get_option_zink_debug();
823
824 screen->instance = create_instance();
825 screen->pdev = choose_pdev(screen->instance);
826 screen->gfx_queue = find_gfx_queue(screen->pdev);
827
828 vkGetPhysicalDeviceProperties(screen->pdev, &screen->props);
829 vkGetPhysicalDeviceFeatures(screen->pdev, &screen->feats);
830 vkGetPhysicalDeviceMemoryProperties(screen->pdev, &screen->mem_props);
831
832 uint32_t num_extensions = 0;
833 if (vkEnumerateDeviceExtensionProperties(screen->pdev, NULL,
834 &num_extensions, NULL) == VK_SUCCESS && num_extensions > 0) {
835 VkExtensionProperties *extensions = MALLOC(sizeof(VkExtensionProperties) *
836 num_extensions);
837 if (extensions) {
838 vkEnumerateDeviceExtensionProperties(screen->pdev, NULL,
839 &num_extensions, extensions);
840
841 for (uint32_t i = 0; i < num_extensions; ++i) {
842 if (!strcmp(extensions[i].extensionName,
843 VK_KHR_MAINTENANCE1_EXTENSION_NAME))
844 screen->have_VK_KHR_maintenance1 = true;
845 }
846 FREE(extensions);
847 }
848 }
849
850 VkDeviceQueueCreateInfo qci = {};
851 float dummy = 0.0f;
852 qci.sType = VK_STRUCTURE_TYPE_DEVICE_QUEUE_CREATE_INFO;
853 qci.queueFamilyIndex = screen->gfx_queue;
854 qci.queueCount = 1;
855 qci.pQueuePriorities = &dummy;
856
857 VkDeviceCreateInfo dci = {};
858 dci.sType = VK_STRUCTURE_TYPE_DEVICE_CREATE_INFO;
859 dci.queueCreateInfoCount = 1;
860 dci.pQueueCreateInfos = &qci;
861 dci.pEnabledFeatures = &screen->feats;
862 const char *extensions[] = {
863 VK_KHR_MAINTENANCE1_EXTENSION_NAME,
864 VK_KHR_EXTERNAL_MEMORY_EXTENSION_NAME,
865 VK_KHR_EXTERNAL_MEMORY_FD_EXTENSION_NAME,
866 };
867 dci.ppEnabledExtensionNames = extensions;
868 dci.enabledExtensionCount = ARRAY_SIZE(extensions);
869 if (vkCreateDevice(screen->pdev, &dci, NULL, &screen->dev) != VK_SUCCESS)
870 goto fail;
871
872 screen->winsys = winsys;
873
874 screen->base.get_name = zink_get_name;
875 screen->base.get_vendor = zink_get_vendor;
876 screen->base.get_device_vendor = zink_get_device_vendor;
877 screen->base.get_param = zink_get_param;
878 screen->base.get_paramf = zink_get_paramf;
879 screen->base.get_shader_param = zink_get_shader_param;
880 screen->base.get_compiler_options = zink_get_compiler_options;
881 screen->base.is_format_supported = zink_is_format_supported;
882 screen->base.context_create = zink_context_create;
883 screen->base.flush_frontbuffer = zink_flush_frontbuffer;
884 screen->base.destroy = zink_destroy_screen;
885
886 zink_screen_resource_init(&screen->base);
887 zink_screen_fence_init(&screen->base);
888
889 slab_create_parent(&screen->transfer_pool, sizeof(struct zink_transfer), 16);
890
891 return &screen->base;
892
893 fail:
894 FREE(screen);
895 return NULL;
896 }
897
/* Public entry point: creates a zink screen on top of a software winsys.
 * No file descriptor is involved, so -1 is passed for it.
 */
struct pipe_screen *
zink_create_screen(struct sw_winsys *winsys)
{
   const int no_fd = -1;

   return zink_internal_create_screen(winsys, no_fd);
}
903
/* Public entry point: creates a zink screen for the given file descriptor,
 * without a software winsys.
 */
struct pipe_screen *
zink_drm_create_screen(int fd)
{
   struct sw_winsys *const no_winsys = NULL;

   return zink_internal_create_screen(no_winsys, fd);
}