gallium: add shader caps INT16 and FP16_DERIVATIVES
[mesa.git] / src / gallium / drivers / zink / zink_screen.c
1 /*
2 * Copyright 2018 Collabora Ltd.
3 *
4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * on the rights to use, copy, modify, merge, publish, distribute, sub
8 * license, and/or sell copies of the Software, and to permit persons to whom
9 * the Software is furnished to do so, subject to the following conditions:
10 *
11 * The above copyright notice and this permission notice (including the next
12 * paragraph) shall be included in all copies or substantial portions of the
13 * Software.
14 *
15 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17 * FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. IN NO EVENT SHALL
18 * THE AUTHOR(S) AND/OR THEIR SUPPLIERS BE LIABLE FOR ANY CLAIM,
19 * DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR
20 * OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE
21 * USE OR OTHER DEALINGS IN THE SOFTWARE.
22 */
23
24 #include "zink_screen.h"
25
26 #include "zink_compiler.h"
27 #include "zink_context.h"
28 #include "zink_fence.h"
29 #include "zink_public.h"
30 #include "zink_resource.h"
31
32 #include "os/os_process.h"
33 #include "util/u_debug.h"
34 #include "util/format/u_format.h"
35 #include "util/u_math.h"
36 #include "util/u_memory.h"
37 #include "util/u_screen.h"
38 #include "util/u_string.h"
39
40 #include "frontend/sw_winsys.h"
41
42 static const struct debug_named_value
43 debug_options[] = {
44 { "nir", ZINK_DEBUG_NIR, "Dump NIR during program compile" },
45 { "spirv", ZINK_DEBUG_SPIRV, "Dump SPIR-V during program compile" },
46 { "tgsi", ZINK_DEBUG_TGSI, "Dump TGSI during program compile" },
47 DEBUG_NAMED_VALUE_END
48 };
49
50 DEBUG_GET_ONCE_FLAGS_OPTION(zink_debug, "ZINK_DEBUG", debug_options, 0)
51
52 uint32_t
53 zink_debug;
54
/**
 * pipe_screen::get_vendor hook.
 *
 * Returns a constant string naming the driver vendor; \p pscreen is unused.
 */
static const char *
zink_get_vendor(struct pipe_screen *pscreen)
{
   static const char driver_vendor[] = "Collabora Ltd";

   (void)pscreen;
   return driver_vendor;
}
60
61 static const char *
62 zink_get_device_vendor(struct pipe_screen *pscreen)
63 {
64 struct zink_screen *screen = zink_screen(pscreen);
65 static char buf[1000];
66 snprintf(buf, sizeof(buf), "Unknown (vendor-id: 0x%04x)", screen->props.vendorID);
67 return buf;
68 }
69
70 static const char *
71 zink_get_name(struct pipe_screen *pscreen)
72 {
73 struct zink_screen *screen = zink_screen(pscreen);
74 static char buf[1000];
75 snprintf(buf, sizeof(buf), "zink (%s)", screen->props.deviceName);
76 return buf;
77 }
78
79 static int
80 get_video_mem(struct zink_screen *screen)
81 {
82 VkDeviceSize size = 0;
83 for (uint32_t i = 0; i < screen->mem_props.memoryHeapCount; ++i)
84 size += screen->mem_props.memoryHeaps[i].size;
85 return (int)(size >> 20);
86 }
87
88 static int
89 zink_get_param(struct pipe_screen *pscreen, enum pipe_cap param)
90 {
91 struct zink_screen *screen = zink_screen(pscreen);
92
93 switch (param) {
94 case PIPE_CAP_NPOT_TEXTURES:
95 return 1;
96
97 case PIPE_CAP_MAX_DUAL_SOURCE_RENDER_TARGETS:
98 if (!screen->feats.dualSrcBlend)
99 return 0;
100 return screen->props.limits.maxFragmentDualSrcAttachments;
101
102 case PIPE_CAP_POINT_SPRITE:
103 return 1;
104
105 case PIPE_CAP_MAX_RENDER_TARGETS:
106 return screen->props.limits.maxColorAttachments;
107
108 case PIPE_CAP_OCCLUSION_QUERY:
109 return 1;
110
111 #if 0 /* TODO: Enable me */
112 case PIPE_CAP_QUERY_TIME_ELAPSED:
113 return 1;
114 #endif
115
116 case PIPE_CAP_TEXTURE_MULTISAMPLE:
117 return 1;
118
119 case PIPE_CAP_TEXTURE_SWIZZLE:
120 return 1;
121
122 case PIPE_CAP_MAX_TEXTURE_2D_SIZE:
123 return screen->props.limits.maxImageDimension2D;
124 case PIPE_CAP_MAX_TEXTURE_3D_LEVELS:
125 return 1 + util_logbase2(screen->props.limits.maxImageDimension3D);
126 case PIPE_CAP_MAX_TEXTURE_CUBE_LEVELS:
127 return 1 + util_logbase2(screen->props.limits.maxImageDimensionCube);
128
129 case PIPE_CAP_BLEND_EQUATION_SEPARATE:
130 case PIPE_CAP_FRAGMENT_SHADER_TEXTURE_LOD:
131 case PIPE_CAP_FRAGMENT_SHADER_DERIVATIVES:
132 case PIPE_CAP_VERTEX_SHADER_SATURATE:
133 return 1;
134
135 case PIPE_CAP_INDEP_BLEND_ENABLE:
136 case PIPE_CAP_INDEP_BLEND_FUNC:
137 return 1;
138
139 case PIPE_CAP_MAX_TEXTURE_ARRAY_LAYERS:
140 return screen->props.limits.maxImageArrayLayers;
141
142 #if 0 /* TODO: Enable me */
143 case PIPE_CAP_DEPTH_CLIP_DISABLE:
144 return 0;
145 #endif
146
147 case PIPE_CAP_TGSI_INSTANCEID:
148 case PIPE_CAP_MIXED_COLORBUFFER_FORMATS:
149 case PIPE_CAP_SEAMLESS_CUBE_MAP:
150 return 1;
151
152 case PIPE_CAP_MIN_TEXEL_OFFSET:
153 return screen->props.limits.minTexelOffset;
154 case PIPE_CAP_MAX_TEXEL_OFFSET:
155 return screen->props.limits.maxTexelOffset;
156
157 case PIPE_CAP_VERTEX_COLOR_UNCLAMPED:
158 return 1;
159
160 case PIPE_CAP_CONDITIONAL_RENDER:
161 return screen->have_EXT_conditional_rendering;
162
163 case PIPE_CAP_GLSL_FEATURE_LEVEL:
164 case PIPE_CAP_GLSL_FEATURE_LEVEL_COMPATIBILITY:
165 return 120;
166
167 #if 0 /* TODO: Enable me */
168 case PIPE_CAP_COMPUTE:
169 return 1;
170 #endif
171
172 case PIPE_CAP_CONSTANT_BUFFER_OFFSET_ALIGNMENT:
173 return screen->props.limits.minUniformBufferOffsetAlignment;
174
175 #if 0 /* TODO: Enable me */
176 case PIPE_CAP_QUERY_TIMESTAMP:
177 return 1;
178 #endif
179
180 case PIPE_CAP_MIN_MAP_BUFFER_ALIGNMENT:
181 return screen->props.limits.minMemoryMapAlignment;
182
183 case PIPE_CAP_CUBE_MAP_ARRAY:
184 return screen->feats.imageCubeArray;
185
186 case PIPE_CAP_TEXTURE_BUFFER_OBJECTS:
187 return 1;
188
189 case PIPE_CAP_TEXTURE_BUFFER_OFFSET_ALIGNMENT:
190 return screen->props.limits.minTexelBufferOffsetAlignment;
191
192 case PIPE_CAP_PREFER_BLIT_BASED_TEXTURE_TRANSFER:
193 return 0; /* unsure */
194
195 case PIPE_CAP_MAX_TEXTURE_BUFFER_SIZE:
196 return screen->props.limits.maxTexelBufferElements;
197
198 case PIPE_CAP_ENDIANNESS:
199 return PIPE_ENDIAN_NATIVE; /* unsure */
200
201 case PIPE_CAP_MAX_VIEWPORTS:
202 return 1; /* TODO: When GS is supported, use screen->props.limits.maxViewports */
203
204 case PIPE_CAP_MIXED_FRAMEBUFFER_SIZES:
205 return 1;
206
207 case PIPE_CAP_MAX_GEOMETRY_OUTPUT_VERTICES:
208 return screen->props.limits.maxGeometryOutputVertices;
209 case PIPE_CAP_MAX_GEOMETRY_TOTAL_OUTPUT_COMPONENTS:
210 return screen->props.limits.maxGeometryOutputComponents;
211
212 #if 0 /* TODO: Enable me. Enables ARB_texture_gather */
213 case PIPE_CAP_MAX_TEXTURE_GATHER_COMPONENTS:
214 return 4;
215 #endif
216
217 case PIPE_CAP_MIN_TEXTURE_GATHER_OFFSET:
218 return screen->props.limits.minTexelGatherOffset;
219 case PIPE_CAP_MAX_TEXTURE_GATHER_OFFSET:
220 return screen->props.limits.maxTexelGatherOffset;
221
222 case PIPE_CAP_TGSI_FS_FINE_DERIVATIVE:
223 return 1;
224
225 case PIPE_CAP_VENDOR_ID:
226 return screen->props.vendorID;
227 case PIPE_CAP_DEVICE_ID:
228 return screen->props.deviceID;
229
230 case PIPE_CAP_ACCELERATED:
231 return 1;
232 case PIPE_CAP_VIDEO_MEMORY:
233 return get_video_mem(screen);
234 case PIPE_CAP_UMA:
235 return screen->props.deviceType == VK_PHYSICAL_DEVICE_TYPE_INTEGRATED_GPU;
236
237 case PIPE_CAP_MAX_VERTEX_ATTRIB_STRIDE:
238 return screen->props.limits.maxVertexInputBindingStride;
239
240 #if 0 /* TODO: Enable me */
241 case PIPE_CAP_SAMPLER_VIEW_TARGET:
242 return 1;
243 #endif
244
245 #if 0 /* TODO: Enable me */
246 case PIPE_CAP_CLIP_HALFZ:
247 return 1;
248 #endif
249
250 #if 0 /* TODO: Enable me */
251 case PIPE_CAP_TEXTURE_FLOAT_LINEAR:
252 case PIPE_CAP_TEXTURE_HALF_FLOAT_LINEAR:
253 return 1;
254 #endif
255
256 case PIPE_CAP_SHAREABLE_SHADERS:
257 return 1;
258
259 #if 0 /* TODO: Enable me. Enables GL_ARB_shader_storage_buffer_object */
260 case PIPE_CAP_SHADER_BUFFER_OFFSET_ALIGNMENT:
261 return screen->props.limits.minStorageBufferOffsetAlignment;
262 #endif
263
264 case PIPE_CAP_PCI_GROUP:
265 case PIPE_CAP_PCI_BUS:
266 case PIPE_CAP_PCI_DEVICE:
267 case PIPE_CAP_PCI_FUNCTION:
268 return 0; /* TODO: figure these out */
269
270 #if 0 /* TODO: Enable me */
271 case PIPE_CAP_CULL_DISTANCE:
272 return screen->feats.shaderCullDistance;
273 #endif
274
275 case PIPE_CAP_VIEWPORT_SUBPIXEL_BITS:
276 return screen->props.limits.viewportSubPixelBits;
277
278 case PIPE_CAP_GLSL_OPTIMIZE_CONSERVATIVELY:
279 return 0; /* not sure */
280
281 case PIPE_CAP_MAX_GS_INVOCATIONS:
282 return 0; /* not implemented */
283
284 case PIPE_CAP_MAX_COMBINED_SHADER_BUFFERS:
285 return screen->props.limits.maxDescriptorSetStorageBuffers;
286
287 case PIPE_CAP_MAX_SHADER_BUFFER_SIZE:
288 return screen->props.limits.maxStorageBufferRange; /* unsure */
289
290 case PIPE_CAP_TGSI_FS_COORD_ORIGIN_UPPER_LEFT:
291 case PIPE_CAP_TGSI_FS_COORD_PIXEL_CENTER_HALF_INTEGER:
292 return 1;
293
294 case PIPE_CAP_TGSI_FS_COORD_ORIGIN_LOWER_LEFT:
295 case PIPE_CAP_TGSI_FS_COORD_PIXEL_CENTER_INTEGER:
296 return 0;
297
298 case PIPE_CAP_BUFFER_MAP_PERSISTENT_COHERENT:
299 return 0;
300
301 case PIPE_CAP_NIR_COMPACT_ARRAYS:
302 return 1;
303
304 case PIPE_CAP_TGSI_FS_FACE_IS_INTEGER_SYSVAL:
305 return 1;
306
307 case PIPE_CAP_FLATSHADE:
308 case PIPE_CAP_ALPHA_TEST:
309 case PIPE_CAP_CLIP_PLANES:
310 case PIPE_CAP_POINT_SIZE_FIXED:
311 case PIPE_CAP_TWO_SIDED_COLOR:
312 return 0;
313
314 case PIPE_CAP_DMABUF:
315 return screen->have_KHR_external_memory_fd;
316
317 default:
318 return u_pipe_screen_get_param_defaults(pscreen, param);
319 }
320 }
321
322 static float
323 zink_get_paramf(struct pipe_screen *pscreen, enum pipe_capf param)
324 {
325 struct zink_screen *screen = zink_screen(pscreen);
326
327 switch (param) {
328 case PIPE_CAPF_MAX_LINE_WIDTH:
329 case PIPE_CAPF_MAX_LINE_WIDTH_AA:
330 return screen->props.limits.lineWidthRange[1];
331
332 case PIPE_CAPF_MAX_POINT_WIDTH:
333 case PIPE_CAPF_MAX_POINT_WIDTH_AA:
334 return screen->props.limits.pointSizeRange[1];
335
336 case PIPE_CAPF_MAX_TEXTURE_ANISOTROPY:
337 return screen->props.limits.maxSamplerAnisotropy;
338
339 case PIPE_CAPF_MAX_TEXTURE_LOD_BIAS:
340 return screen->props.limits.maxSamplerLodBias;
341
342 case PIPE_CAPF_MIN_CONSERVATIVE_RASTER_DILATE:
343 case PIPE_CAPF_MAX_CONSERVATIVE_RASTER_DILATE:
344 case PIPE_CAPF_CONSERVATIVE_RASTER_DILATE_GRANULARITY:
345 return 0.0f; /* not implemented */
346 }
347
348 /* should only get here on unhandled cases */
349 return 0.0;
350 }
351
352 static int
353 zink_get_shader_param(struct pipe_screen *pscreen,
354 enum pipe_shader_type shader,
355 enum pipe_shader_cap param)
356 {
357 struct zink_screen *screen = zink_screen(pscreen);
358
359 switch (param) {
360 case PIPE_SHADER_CAP_MAX_INSTRUCTIONS:
361 case PIPE_SHADER_CAP_MAX_ALU_INSTRUCTIONS:
362 case PIPE_SHADER_CAP_MAX_TEX_INSTRUCTIONS:
363 case PIPE_SHADER_CAP_MAX_TEX_INDIRECTIONS:
364 case PIPE_SHADER_CAP_MAX_CONTROL_FLOW_DEPTH:
365 if (shader == PIPE_SHADER_VERTEX ||
366 shader == PIPE_SHADER_FRAGMENT)
367 return INT_MAX;
368 return 0;
369
370 case PIPE_SHADER_CAP_MAX_INPUTS:
371 switch (shader) {
372 case PIPE_SHADER_VERTEX:
373 return MIN2(screen->props.limits.maxVertexInputAttributes,
374 PIPE_MAX_SHADER_INPUTS);
375 case PIPE_SHADER_FRAGMENT:
376 return MIN2(screen->props.limits.maxFragmentInputComponents / 4,
377 PIPE_MAX_SHADER_INPUTS);
378 default:
379 return 0; /* unsupported stage */
380 }
381
382 case PIPE_SHADER_CAP_MAX_OUTPUTS:
383 switch (shader) {
384 case PIPE_SHADER_VERTEX:
385 return MIN2(screen->props.limits.maxVertexOutputComponents / 4,
386 PIPE_MAX_SHADER_OUTPUTS);
387 case PIPE_SHADER_FRAGMENT:
388 return MIN2(screen->props.limits.maxColorAttachments,
389 PIPE_MAX_SHADER_OUTPUTS);
390 default:
391 return 0; /* unsupported stage */
392 }
393
394 case PIPE_SHADER_CAP_MAX_TEXTURE_SAMPLERS:
395 switch (shader) {
396 case PIPE_SHADER_VERTEX:
397 case PIPE_SHADER_FRAGMENT:
398 /* this might be a bit simplistic... */
399 return MIN2(screen->props.limits.maxPerStageDescriptorSamplers,
400 PIPE_MAX_SAMPLERS);
401 default:
402 return 0; /* unsupported stage */
403 }
404
405 case PIPE_SHADER_CAP_MAX_CONST_BUFFER_SIZE:
406 return MIN2(screen->props.limits.maxUniformBufferRange, INT_MAX);
407
408 case PIPE_SHADER_CAP_MAX_CONST_BUFFERS:
409 return screen->props.limits.maxPerStageDescriptorUniformBuffers;
410
411 case PIPE_SHADER_CAP_MAX_TEMPS:
412 return INT_MAX;
413
414 case PIPE_SHADER_CAP_INTEGERS:
415 return 1;
416
417 case PIPE_SHADER_CAP_INDIRECT_INPUT_ADDR:
418 case PIPE_SHADER_CAP_INDIRECT_OUTPUT_ADDR:
419 case PIPE_SHADER_CAP_INDIRECT_TEMP_ADDR:
420 case PIPE_SHADER_CAP_INDIRECT_CONST_ADDR:
421 case PIPE_SHADER_CAP_SUBROUTINES:
422 case PIPE_SHADER_CAP_INT64_ATOMICS:
423 case PIPE_SHADER_CAP_FP16:
424 case PIPE_SHADER_CAP_FP16_DERIVATIVES:
425 case PIPE_SHADER_CAP_INT16:
426 return 0; /* not implemented */
427
428 case PIPE_SHADER_CAP_PREFERRED_IR:
429 return PIPE_SHADER_IR_NIR;
430
431 case PIPE_SHADER_CAP_TGSI_SQRT_SUPPORTED:
432 return 0; /* not implemented */
433
434 case PIPE_SHADER_CAP_MAX_SAMPLER_VIEWS:
435 return MIN2(screen->props.limits.maxPerStageDescriptorSampledImages,
436 PIPE_MAX_SHADER_SAMPLER_VIEWS);
437
438 case PIPE_SHADER_CAP_TGSI_DROUND_SUPPORTED:
439 case PIPE_SHADER_CAP_TGSI_DFRACEXP_DLDEXP_SUPPORTED:
440 case PIPE_SHADER_CAP_TGSI_FMA_SUPPORTED:
441 return 0; /* not implemented */
442
443 case PIPE_SHADER_CAP_TGSI_ANY_INOUT_DECL_RANGE:
444 return 0; /* no idea */
445
446 case PIPE_SHADER_CAP_MAX_UNROLL_ITERATIONS_HINT:
447 return 32; /* arbitrary */
448
449 case PIPE_SHADER_CAP_MAX_SHADER_BUFFERS:
450 /* TODO: this limitation is dumb, and will need some fixes in mesa */
451 return MIN2(screen->props.limits.maxPerStageDescriptorStorageBuffers, 8);
452
453 case PIPE_SHADER_CAP_SUPPORTED_IRS:
454 return (1 << PIPE_SHADER_IR_NIR) | (1 << PIPE_SHADER_IR_TGSI);
455
456 case PIPE_SHADER_CAP_MAX_SHADER_IMAGES:
457 #if 0 /* TODO: needs compiler support */
458 return MIN2(screen->props.limits.maxPerStageDescriptorStorageImages,
459 PIPE_MAX_SHADER_IMAGES);
460 #else
461 return 0;
462 #endif
463
464 case PIPE_SHADER_CAP_LOWER_IF_THRESHOLD:
465 case PIPE_SHADER_CAP_TGSI_SKIP_MERGE_REGISTERS:
466 return 0; /* unsure */
467
468 case PIPE_SHADER_CAP_TGSI_LDEXP_SUPPORTED:
469 case PIPE_SHADER_CAP_MAX_HW_ATOMIC_COUNTERS:
470 case PIPE_SHADER_CAP_MAX_HW_ATOMIC_COUNTER_BUFFERS:
471 case PIPE_SHADER_CAP_TGSI_CONT_SUPPORTED:
472 return 0; /* not implemented */
473 }
474
475 /* should only get here on unhandled cases */
476 return 0;
477 }
478
479 static VkSampleCountFlagBits
480 vk_sample_count_flags(uint32_t sample_count)
481 {
482 switch (sample_count) {
483 case 1: return VK_SAMPLE_COUNT_1_BIT;
484 case 2: return VK_SAMPLE_COUNT_2_BIT;
485 case 4: return VK_SAMPLE_COUNT_4_BIT;
486 case 8: return VK_SAMPLE_COUNT_8_BIT;
487 case 16: return VK_SAMPLE_COUNT_16_BIT;
488 case 32: return VK_SAMPLE_COUNT_32_BIT;
489 case 64: return VK_SAMPLE_COUNT_64_BIT;
490 default:
491 return 0;
492 }
493 }
494
495 static bool
496 zink_is_format_supported(struct pipe_screen *pscreen,
497 enum pipe_format format,
498 enum pipe_texture_target target,
499 unsigned sample_count,
500 unsigned storage_sample_count,
501 unsigned bind)
502 {
503 struct zink_screen *screen = zink_screen(pscreen);
504
505 if (format == PIPE_FORMAT_NONE)
506 return screen->props.limits.framebufferNoAttachmentsSampleCounts &
507 vk_sample_count_flags(sample_count);
508
509 VkFormat vkformat = zink_get_format(screen, format);
510 if (vkformat == VK_FORMAT_UNDEFINED)
511 return false;
512
513 if (sample_count >= 1) {
514 VkSampleCountFlagBits sample_mask = vk_sample_count_flags(sample_count);
515 if (!sample_mask)
516 return false;
517 const struct util_format_description *desc = util_format_description(format);
518 if (util_format_is_depth_or_stencil(format)) {
519 if (util_format_has_depth(desc)) {
520 if (bind & PIPE_BIND_DEPTH_STENCIL &&
521 (screen->props.limits.framebufferDepthSampleCounts & sample_mask) != sample_mask)
522 return false;
523 if (bind & PIPE_BIND_SAMPLER_VIEW &&
524 (screen->props.limits.sampledImageDepthSampleCounts & sample_mask) != sample_mask)
525 return false;
526 }
527 if (util_format_has_stencil(desc)) {
528 if (bind & PIPE_BIND_DEPTH_STENCIL &&
529 (screen->props.limits.framebufferStencilSampleCounts & sample_mask) != sample_mask)
530 return false;
531 if (bind & PIPE_BIND_SAMPLER_VIEW &&
532 (screen->props.limits.sampledImageStencilSampleCounts & sample_mask) != sample_mask)
533 return false;
534 }
535 } else if (util_format_is_pure_integer(format)) {
536 if (bind & PIPE_BIND_RENDER_TARGET &&
537 !(screen->props.limits.framebufferColorSampleCounts & sample_mask))
538 return false;
539 if (bind & PIPE_BIND_SAMPLER_VIEW &&
540 !(screen->props.limits.sampledImageIntegerSampleCounts & sample_mask))
541 return false;
542 } else {
543 if (bind & PIPE_BIND_RENDER_TARGET &&
544 !(screen->props.limits.framebufferColorSampleCounts & sample_mask))
545 return false;
546 if (bind & PIPE_BIND_SAMPLER_VIEW &&
547 !(screen->props.limits.sampledImageColorSampleCounts & sample_mask))
548 return false;
549 }
550 }
551
552 VkFormatProperties props;
553 vkGetPhysicalDeviceFormatProperties(screen->pdev, vkformat, &props);
554
555 if (target == PIPE_BUFFER) {
556 if (bind & PIPE_BIND_VERTEX_BUFFER &&
557 !(props.bufferFeatures & VK_FORMAT_FEATURE_VERTEX_BUFFER_BIT))
558 return false;
559 } else {
560 /* all other targets are texture-targets */
561 if (bind & PIPE_BIND_RENDER_TARGET &&
562 !(props.optimalTilingFeatures & VK_FORMAT_FEATURE_COLOR_ATTACHMENT_BIT))
563 return false;
564
565 if (bind & PIPE_BIND_BLENDABLE &&
566 !(props.optimalTilingFeatures & VK_FORMAT_FEATURE_COLOR_ATTACHMENT_BLEND_BIT))
567 return false;
568
569 if (bind & PIPE_BIND_SAMPLER_VIEW &&
570 !(props.optimalTilingFeatures & VK_FORMAT_FEATURE_SAMPLED_IMAGE_BIT))
571 return false;
572
573 if (bind & PIPE_BIND_DEPTH_STENCIL &&
574 !(props.optimalTilingFeatures & VK_FORMAT_FEATURE_DEPTH_STENCIL_ATTACHMENT_BIT))
575 return false;
576 }
577
578 if (util_format_is_compressed(format)) {
579 const struct util_format_description *desc = util_format_description(format);
580 if (desc->layout == UTIL_FORMAT_LAYOUT_BPTC &&
581 !screen->feats.textureCompressionBC)
582 return false;
583 }
584
585 return true;
586 }
587
588 static void
589 zink_destroy_screen(struct pipe_screen *pscreen)
590 {
591 struct zink_screen *screen = zink_screen(pscreen);
592 slab_destroy_parent(&screen->transfer_pool);
593 FREE(screen);
594 }
595
596 static VkInstance
597 create_instance()
598 {
599 VkApplicationInfo ai = {};
600 ai.sType = VK_STRUCTURE_TYPE_APPLICATION_INFO;
601
602 char proc_name[128];
603 if (os_get_process_name(proc_name, ARRAY_SIZE(proc_name)))
604 ai.pApplicationName = proc_name;
605 else
606 ai.pApplicationName = "unknown";
607
608 ai.pEngineName = "mesa zink";
609 ai.apiVersion = VK_API_VERSION_1_0;
610
611 const char *extensions[] = {
612 VK_KHR_GET_PHYSICAL_DEVICE_PROPERTIES_2_EXTENSION_NAME,
613 VK_KHR_EXTERNAL_MEMORY_CAPABILITIES_EXTENSION_NAME,
614 };
615
616 VkInstanceCreateInfo ici = {};
617 ici.sType = VK_STRUCTURE_TYPE_INSTANCE_CREATE_INFO;
618 ici.pApplicationInfo = &ai;
619 ici.ppEnabledExtensionNames = extensions;
620 ici.enabledExtensionCount = ARRAY_SIZE(extensions);
621
622 VkInstance instance = VK_NULL_HANDLE;
623 VkResult err = vkCreateInstance(&ici, NULL, &instance);
624 if (err != VK_SUCCESS)
625 return VK_NULL_HANDLE;
626
627 return instance;
628 }
629
630 static VkPhysicalDevice
631 choose_pdev(const VkInstance instance)
632 {
633 uint32_t i, pdev_count;
634 VkPhysicalDevice *pdevs, pdev;
635 vkEnumeratePhysicalDevices(instance, &pdev_count, NULL);
636 assert(pdev_count > 0);
637
638 pdevs = malloc(sizeof(*pdevs) * pdev_count);
639 vkEnumeratePhysicalDevices(instance, &pdev_count, pdevs);
640 assert(pdev_count > 0);
641
642 pdev = pdevs[0];
643 for (i = 0; i < pdev_count; ++i) {
644 VkPhysicalDeviceProperties props;
645 vkGetPhysicalDeviceProperties(pdevs[i], &props);
646 if (props.deviceType == VK_PHYSICAL_DEVICE_TYPE_DISCRETE_GPU) {
647 pdev = pdevs[i];
648 break;
649 }
650 }
651 free(pdevs);
652 return pdev;
653 }
654
655 static uint32_t
656 find_gfx_queue(const VkPhysicalDevice pdev)
657 {
658 uint32_t num_queues;
659 vkGetPhysicalDeviceQueueFamilyProperties(pdev, &num_queues, NULL);
660 assert(num_queues > 0);
661
662 VkQueueFamilyProperties *props = malloc(sizeof(*props) * num_queues);
663 vkGetPhysicalDeviceQueueFamilyProperties(pdev, &num_queues, props);
664
665 for (uint32_t i = 0; i < num_queues; i++) {
666 if (props[i].queueFlags & VK_QUEUE_GRAPHICS_BIT) {
667 free(props);
668 return i;
669 }
670 }
671
672 return UINT32_MAX;
673 }
674
675 static void
676 zink_flush_frontbuffer(struct pipe_screen *pscreen,
677 struct pipe_resource *pres,
678 unsigned level, unsigned layer,
679 void *winsys_drawable_handle,
680 struct pipe_box *sub_box)
681 {
682 struct zink_screen *screen = zink_screen(pscreen);
683 struct sw_winsys *winsys = screen->winsys;
684 struct zink_resource *res = zink_resource(pres);
685
686 if (!winsys)
687 return;
688 void *map = winsys->displaytarget_map(winsys, res->dt, 0);
689
690 if (map) {
691 VkImageSubresource isr = {};
692 isr.aspectMask = res->aspect;
693 isr.mipLevel = level;
694 isr.arrayLayer = layer;
695 VkSubresourceLayout layout;
696 vkGetImageSubresourceLayout(screen->dev, res->image, &isr, &layout);
697
698 void *ptr;
699 VkResult result = vkMapMemory(screen->dev, res->mem, res->offset, res->size, 0, &ptr);
700 if (result != VK_SUCCESS) {
701 debug_printf("failed to map memory for display\n");
702 return;
703 }
704 for (int i = 0; i < pres->height0; ++i) {
705 uint8_t *src = (uint8_t *)ptr + i * layout.rowPitch;
706 uint8_t *dst = (uint8_t *)map + i * res->dt_stride;
707 memcpy(dst, src, res->dt_stride);
708 }
709 vkUnmapMemory(screen->dev, res->mem);
710 }
711
712 winsys->displaytarget_unmap(winsys, res->dt);
713
714 assert(res->dt);
715 if (res->dt)
716 winsys->displaytarget_display(winsys, res->dt, winsys_drawable_handle, sub_box);
717 }
718
719 static bool
720 load_device_extensions(struct zink_screen *screen)
721 {
722 #define GET_PROC_ADDR(x) do { \
723 screen->vk_##x = (PFN_vk##x)vkGetDeviceProcAddr(screen->dev, "vk"#x); \
724 if (!screen->vk_##x) \
725 return false; \
726 } while (0)
727
728 if (screen->have_KHR_external_memory_fd)
729 GET_PROC_ADDR(GetMemoryFdKHR);
730
731 if (screen->have_EXT_conditional_rendering) {
732 GET_PROC_ADDR(CmdBeginConditionalRenderingEXT);
733 GET_PROC_ADDR(CmdEndConditionalRenderingEXT);
734 }
735
736 #undef GET_PROC_ADDR
737
738 return true;
739 }
740
741 static struct pipe_screen *
742 zink_internal_create_screen(struct sw_winsys *winsys, int fd)
743 {
744 struct zink_screen *screen = CALLOC_STRUCT(zink_screen);
745 if (!screen)
746 return NULL;
747
748 zink_debug = debug_get_option_zink_debug();
749
750 screen->instance = create_instance();
751 screen->pdev = choose_pdev(screen->instance);
752 screen->gfx_queue = find_gfx_queue(screen->pdev);
753
754 vkGetPhysicalDeviceProperties(screen->pdev, &screen->props);
755 vkGetPhysicalDeviceFeatures(screen->pdev, &screen->feats);
756 vkGetPhysicalDeviceMemoryProperties(screen->pdev, &screen->mem_props);
757
758 screen->have_X8_D24_UNORM_PACK32 = zink_is_depth_format_supported(screen,
759 VK_FORMAT_X8_D24_UNORM_PACK32);
760 screen->have_D24_UNORM_S8_UINT = zink_is_depth_format_supported(screen,
761 VK_FORMAT_D24_UNORM_S8_UINT);
762
763 uint32_t num_extensions = 0;
764 if (vkEnumerateDeviceExtensionProperties(screen->pdev, NULL,
765 &num_extensions, NULL) == VK_SUCCESS && num_extensions > 0) {
766 VkExtensionProperties *extensions = MALLOC(sizeof(VkExtensionProperties) *
767 num_extensions);
768 if (extensions) {
769 vkEnumerateDeviceExtensionProperties(screen->pdev, NULL,
770 &num_extensions, extensions);
771
772 for (uint32_t i = 0; i < num_extensions; ++i) {
773 if (!strcmp(extensions[i].extensionName,
774 VK_KHR_MAINTENANCE1_EXTENSION_NAME))
775 screen->have_KHR_maintenance1 = true;
776 if (!strcmp(extensions[i].extensionName,
777 VK_KHR_EXTERNAL_MEMORY_FD_EXTENSION_NAME))
778 screen->have_KHR_external_memory_fd = true;
779 if (!strcmp(extensions[i].extensionName,
780 VK_EXT_CONDITIONAL_RENDERING_EXTENSION_NAME))
781 screen->have_EXT_conditional_rendering = true;
782 }
783 FREE(extensions);
784 }
785 }
786
787 if (!screen->have_KHR_maintenance1) {
788 debug_printf("ZINK: VK_KHR_maintenance1 required!\n");
789 goto fail;
790 }
791
792 VkDeviceQueueCreateInfo qci = {};
793 float dummy = 0.0f;
794 qci.sType = VK_STRUCTURE_TYPE_DEVICE_QUEUE_CREATE_INFO;
795 qci.queueFamilyIndex = screen->gfx_queue;
796 qci.queueCount = 1;
797 qci.pQueuePriorities = &dummy;
798
799 VkDeviceCreateInfo dci = {};
800 dci.sType = VK_STRUCTURE_TYPE_DEVICE_CREATE_INFO;
801 dci.queueCreateInfoCount = 1;
802 dci.pQueueCreateInfos = &qci;
803 dci.pEnabledFeatures = &screen->feats;
804 const char *extensions[4] = {
805 VK_KHR_MAINTENANCE1_EXTENSION_NAME,
806 };
807 num_extensions = 1;
808
809 if (fd >= 0 && !screen->have_KHR_external_memory_fd) {
810 debug_printf("ZINK: KHR_external_memory_fd required!\n");
811 goto fail;
812 }
813
814 if (screen->have_KHR_external_memory_fd) {
815 extensions[num_extensions++] = VK_KHR_EXTERNAL_MEMORY_EXTENSION_NAME;
816 extensions[num_extensions++] = VK_KHR_EXTERNAL_MEMORY_FD_EXTENSION_NAME;
817 }
818
819 if (screen->have_EXT_conditional_rendering)
820 extensions[num_extensions++] = VK_EXT_CONDITIONAL_RENDERING_EXTENSION_NAME;
821
822 assert(num_extensions <= ARRAY_SIZE(extensions));
823
824 dci.ppEnabledExtensionNames = extensions;
825 dci.enabledExtensionCount = num_extensions;
826 if (vkCreateDevice(screen->pdev, &dci, NULL, &screen->dev) != VK_SUCCESS)
827 goto fail;
828
829 if (!load_device_extensions(screen))
830 goto fail;
831
832 screen->winsys = winsys;
833
834 screen->base.get_name = zink_get_name;
835 screen->base.get_vendor = zink_get_vendor;
836 screen->base.get_device_vendor = zink_get_device_vendor;
837 screen->base.get_param = zink_get_param;
838 screen->base.get_paramf = zink_get_paramf;
839 screen->base.get_shader_param = zink_get_shader_param;
840 screen->base.get_compiler_options = zink_get_compiler_options;
841 screen->base.is_format_supported = zink_is_format_supported;
842 screen->base.context_create = zink_context_create;
843 screen->base.flush_frontbuffer = zink_flush_frontbuffer;
844 screen->base.destroy = zink_destroy_screen;
845
846 zink_screen_resource_init(&screen->base);
847 zink_screen_fence_init(&screen->base);
848
849 slab_create_parent(&screen->transfer_pool, sizeof(struct zink_transfer), 16);
850
851 return &screen->base;
852
853 fail:
854 FREE(screen);
855 return NULL;
856 }
857
/**
 * Public entry point: create a zink screen that presents through the given
 * software winsys. No DRM file descriptor is involved, so -1 is passed.
 *
 * Returns the new screen, or NULL on failure.
 */
struct pipe_screen *
zink_create_screen(struct sw_winsys *winsys)
{
   const int no_drm_fd = -1;

   return zink_internal_create_screen(winsys, no_drm_fd);
}
863
/**
 * Public entry point: create a zink screen for a DRM file descriptor.
 * No software winsys is attached.
 *
 * Returns the new screen, or NULL on failure.
 */
struct pipe_screen *
zink_drm_create_screen(int fd)
{
   struct sw_winsys *no_winsys = NULL;

   return zink_internal_create_screen(no_winsys, fd);
}