zink: implement support for derivative-control
[mesa.git] / src / gallium / drivers / zink / zink_screen.c
1 /*
2 * Copyright 2018 Collabora Ltd.
3 *
4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * on the rights to use, copy, modify, merge, publish, distribute, sub
8 * license, and/or sell copies of the Software, and to permit persons to whom
9 * the Software is furnished to do so, subject to the following conditions:
10 *
11 * The above copyright notice and this permission notice (including the next
12 * paragraph) shall be included in all copies or substantial portions of the
13 * Software.
14 *
15 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17 * FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. IN NO EVENT SHALL
18 * THE AUTHOR(S) AND/OR THEIR SUPPLIERS BE LIABLE FOR ANY CLAIM,
19 * DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR
20 * OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE
21 * USE OR OTHER DEALINGS IN THE SOFTWARE.
22 */
23
24 #include "zink_screen.h"
25
26 #include "zink_compiler.h"
27 #include "zink_context.h"
28 #include "zink_fence.h"
29 #include "zink_public.h"
30 #include "zink_resource.h"
31
32 #include "os/os_process.h"
33 #include "util/u_debug.h"
34 #include "util/format/u_format.h"
35 #include "util/u_math.h"
36 #include "util/u_memory.h"
37 #include "util/u_screen.h"
38 #include "util/u_string.h"
39
40 #include "state_tracker/sw_winsys.h"
41
42 static const struct debug_named_value
43 debug_options[] = {
44 { "nir", ZINK_DEBUG_NIR, "Dump NIR during program compile" },
45 { "spirv", ZINK_DEBUG_SPIRV, "Dump SPIR-V during program compile" },
46 { "tgsi", ZINK_DEBUG_TGSI, "Dump TGSI during program compile" },
47 DEBUG_NAMED_VALUE_END
48 };
49
50 DEBUG_GET_ONCE_FLAGS_OPTION(zink_debug, "ZINK_DEBUG", debug_options, 0)
51
52 uint32_t
53 zink_debug;
54
/*
 * Return the vendor string of the driver.
 *
 * The string is a fixed constant; pscreen is not consulted.
 */
static const char *
zink_get_vendor(struct pipe_screen *pscreen)
{
   static const char driver_vendor[] = "Collabora Ltd";

   return driver_vendor;
}
60
61 static const char *
62 zink_get_device_vendor(struct pipe_screen *pscreen)
63 {
64 struct zink_screen *screen = zink_screen(pscreen);
65 static char buf[1000];
66 snprintf(buf, sizeof(buf), "Unknown (vendor-id: 0x%04x)", screen->props.vendorID);
67 return buf;
68 }
69
70 static const char *
71 zink_get_name(struct pipe_screen *pscreen)
72 {
73 struct zink_screen *screen = zink_screen(pscreen);
74 static char buf[1000];
75 snprintf(buf, sizeof(buf), "zink (%s)", screen->props.deviceName);
76 return buf;
77 }
78
79 static int
80 get_video_mem(struct zink_screen *screen)
81 {
82 VkDeviceSize size = 0;
83 for (uint32_t i = 0; i < screen->mem_props.memoryHeapCount; ++i)
84 size += screen->mem_props.memoryHeaps[i].size;
85 return (int)(size >> 20);
86 }
87
88 static int
89 zink_get_param(struct pipe_screen *pscreen, enum pipe_cap param)
90 {
91 struct zink_screen *screen = zink_screen(pscreen);
92
93 switch (param) {
94 case PIPE_CAP_NPOT_TEXTURES:
95 return 1;
96
97 case PIPE_CAP_MAX_DUAL_SOURCE_RENDER_TARGETS:
98 return screen->props.limits.maxFragmentDualSrcAttachments;
99
100 case PIPE_CAP_POINT_SPRITE:
101 return 1;
102
103 case PIPE_CAP_MAX_RENDER_TARGETS:
104 return screen->props.limits.maxColorAttachments;
105
106 case PIPE_CAP_OCCLUSION_QUERY:
107 return 1;
108
109 #if 0 /* TODO: Enable me */
110 case PIPE_CAP_QUERY_TIME_ELAPSED:
111 return 1;
112 #endif
113
114 case PIPE_CAP_TEXTURE_SWIZZLE:
115 return 1;
116
117 case PIPE_CAP_MAX_TEXTURE_2D_SIZE:
118 return screen->props.limits.maxImageDimension2D;
119 case PIPE_CAP_MAX_TEXTURE_3D_LEVELS:
120 return 1 + util_logbase2(screen->props.limits.maxImageDimension3D);
121 case PIPE_CAP_MAX_TEXTURE_CUBE_LEVELS:
122 return 1 + util_logbase2(screen->props.limits.maxImageDimensionCube);
123
124 case PIPE_CAP_BLEND_EQUATION_SEPARATE:
125 case PIPE_CAP_FRAGMENT_SHADER_TEXTURE_LOD:
126 case PIPE_CAP_FRAGMENT_SHADER_DERIVATIVES:
127 case PIPE_CAP_VERTEX_SHADER_SATURATE:
128 return 1;
129
130 case PIPE_CAP_INDEP_BLEND_ENABLE:
131 case PIPE_CAP_INDEP_BLEND_FUNC:
132 return 1;
133
134 case PIPE_CAP_MAX_TEXTURE_ARRAY_LAYERS:
135 return screen->props.limits.maxImageArrayLayers;
136
137 #if 0 /* TODO: Enable me */
138 case PIPE_CAP_DEPTH_CLIP_DISABLE:
139 return 0;
140 #endif
141
142 case PIPE_CAP_TGSI_INSTANCEID:
143 case PIPE_CAP_MIXED_COLORBUFFER_FORMATS:
144 case PIPE_CAP_SEAMLESS_CUBE_MAP:
145 return 1;
146
147 case PIPE_CAP_MIN_TEXEL_OFFSET:
148 return screen->props.limits.minTexelOffset;
149 case PIPE_CAP_MAX_TEXEL_OFFSET:
150 return screen->props.limits.maxTexelOffset;
151
152 case PIPE_CAP_VERTEX_COLOR_UNCLAMPED:
153 return 1;
154
155 case PIPE_CAP_GLSL_FEATURE_LEVEL:
156 case PIPE_CAP_GLSL_FEATURE_LEVEL_COMPATIBILITY:
157 return 120;
158
159 #if 0 /* TODO: Enable me */
160 case PIPE_CAP_COMPUTE:
161 return 1;
162 #endif
163
164 case PIPE_CAP_CONSTANT_BUFFER_OFFSET_ALIGNMENT:
165 return screen->props.limits.minUniformBufferOffsetAlignment;
166
167 #if 0 /* TODO: Enable me */
168 case PIPE_CAP_QUERY_TIMESTAMP:
169 return 1;
170 #endif
171
172 case PIPE_CAP_MIN_MAP_BUFFER_ALIGNMENT:
173 return screen->props.limits.minMemoryMapAlignment;
174
175 case PIPE_CAP_CUBE_MAP_ARRAY:
176 return screen->feats.imageCubeArray;
177
178 case PIPE_CAP_TEXTURE_BUFFER_OBJECTS:
179 return 1;
180
181 case PIPE_CAP_TEXTURE_BUFFER_OFFSET_ALIGNMENT:
182 return screen->props.limits.minTexelBufferOffsetAlignment;
183
184 case PIPE_CAP_PREFER_BLIT_BASED_TEXTURE_TRANSFER:
185 return 0; /* unsure */
186
187 case PIPE_CAP_MAX_TEXTURE_BUFFER_SIZE:
188 return screen->props.limits.maxTexelBufferElements;
189
190 case PIPE_CAP_ENDIANNESS:
191 return PIPE_ENDIAN_NATIVE; /* unsure */
192
193 case PIPE_CAP_MAX_VIEWPORTS:
194 return screen->props.limits.maxViewports;
195
196 case PIPE_CAP_MIXED_FRAMEBUFFER_SIZES:
197 return 1;
198
199 case PIPE_CAP_MAX_GEOMETRY_OUTPUT_VERTICES:
200 return screen->props.limits.maxGeometryOutputVertices;
201 case PIPE_CAP_MAX_GEOMETRY_TOTAL_OUTPUT_COMPONENTS:
202 return screen->props.limits.maxGeometryOutputComponents;
203
204 #if 0 /* TODO: Enable me. Enables ARB_texture_gather */
205 case PIPE_CAP_MAX_TEXTURE_GATHER_COMPONENTS:
206 return 4;
207 #endif
208
209 case PIPE_CAP_MIN_TEXTURE_GATHER_OFFSET:
210 return screen->props.limits.minTexelGatherOffset;
211 case PIPE_CAP_MAX_TEXTURE_GATHER_OFFSET:
212 return screen->props.limits.maxTexelGatherOffset;
213
214 case PIPE_CAP_TGSI_FS_FINE_DERIVATIVE:
215 return 1;
216
217 case PIPE_CAP_VENDOR_ID:
218 return screen->props.vendorID;
219 case PIPE_CAP_DEVICE_ID:
220 return screen->props.deviceID;
221
222 case PIPE_CAP_ACCELERATED:
223 return 1;
224 case PIPE_CAP_VIDEO_MEMORY:
225 return get_video_mem(screen);
226 case PIPE_CAP_UMA:
227 return screen->props.deviceType == VK_PHYSICAL_DEVICE_TYPE_INTEGRATED_GPU;
228
229 case PIPE_CAP_MAX_VERTEX_ATTRIB_STRIDE:
230 return screen->props.limits.maxVertexInputBindingStride;
231
232 #if 0 /* TODO: Enable me */
233 case PIPE_CAP_SAMPLER_VIEW_TARGET:
234 return 1;
235 #endif
236
237 #if 0 /* TODO: Enable me */
238 case PIPE_CAP_CLIP_HALFZ:
239 return 1;
240 #endif
241
242 #if 0 /* TODO: Enable me */
243 case PIPE_CAP_TEXTURE_FLOAT_LINEAR:
244 case PIPE_CAP_TEXTURE_HALF_FLOAT_LINEAR:
245 return 1;
246 #endif
247
248 case PIPE_CAP_SHAREABLE_SHADERS:
249 return 1;
250
251 #if 0 /* TODO: Enable me. Enables GL_ARB_shader_storage_buffer_object */
252 case PIPE_CAP_SHADER_BUFFER_OFFSET_ALIGNMENT:
253 return screen->props.limits.minStorageBufferOffsetAlignment;
254 #endif
255
256 case PIPE_CAP_PCI_GROUP:
257 case PIPE_CAP_PCI_BUS:
258 case PIPE_CAP_PCI_DEVICE:
259 case PIPE_CAP_PCI_FUNCTION:
260 return 0; /* TODO: figure these out */
261
262 #if 0 /* TODO: Enable me */
263 case PIPE_CAP_CULL_DISTANCE:
264 return screen->feats.shaderCullDistance;
265 #endif
266
267 case PIPE_CAP_VIEWPORT_SUBPIXEL_BITS:
268 return screen->props.limits.viewportSubPixelBits;
269
270 case PIPE_CAP_GLSL_OPTIMIZE_CONSERVATIVELY:
271 return 0; /* not sure */
272
273 case PIPE_CAP_MAX_GS_INVOCATIONS:
274 return 0; /* not implemented */
275
276 case PIPE_CAP_MAX_COMBINED_SHADER_BUFFERS:
277 return screen->props.limits.maxDescriptorSetStorageBuffers;
278
279 case PIPE_CAP_MAX_SHADER_BUFFER_SIZE:
280 return screen->props.limits.maxStorageBufferRange; /* unsure */
281
282 case PIPE_CAP_TGSI_FS_COORD_ORIGIN_UPPER_LEFT:
283 case PIPE_CAP_TGSI_FS_COORD_PIXEL_CENTER_HALF_INTEGER:
284 return 1;
285
286 case PIPE_CAP_TGSI_FS_COORD_ORIGIN_LOWER_LEFT:
287 case PIPE_CAP_TGSI_FS_COORD_PIXEL_CENTER_INTEGER:
288 return 0;
289
290 case PIPE_CAP_BUFFER_MAP_PERSISTENT_COHERENT:
291 return 0;
292
293 case PIPE_CAP_NIR_COMPACT_ARRAYS:
294 return 1;
295
296 case PIPE_CAP_TGSI_FS_FACE_IS_INTEGER_SYSVAL:
297 return 1;
298
299 case PIPE_CAP_FLATSHADE:
300 case PIPE_CAP_ALPHA_TEST:
301 case PIPE_CAP_CLIP_PLANES:
302 case PIPE_CAP_POINT_SIZE_FIXED:
303 case PIPE_CAP_TWO_SIDED_COLOR:
304 return 0;
305
306 case PIPE_CAP_DMABUF:
307 return screen->have_KHR_external_memory_fd;
308
309 default:
310 return u_pipe_screen_get_param_defaults(pscreen, param);
311 }
312 }
313
314 static float
315 zink_get_paramf(struct pipe_screen *pscreen, enum pipe_capf param)
316 {
317 struct zink_screen *screen = zink_screen(pscreen);
318
319 switch (param) {
320 case PIPE_CAPF_MAX_LINE_WIDTH:
321 case PIPE_CAPF_MAX_LINE_WIDTH_AA:
322 return screen->props.limits.lineWidthRange[1];
323
324 case PIPE_CAPF_MAX_POINT_WIDTH:
325 case PIPE_CAPF_MAX_POINT_WIDTH_AA:
326 return screen->props.limits.pointSizeRange[1];
327
328 case PIPE_CAPF_MAX_TEXTURE_ANISOTROPY:
329 return screen->props.limits.maxSamplerAnisotropy;
330
331 case PIPE_CAPF_MAX_TEXTURE_LOD_BIAS:
332 return screen->props.limits.maxSamplerLodBias;
333
334 case PIPE_CAPF_MIN_CONSERVATIVE_RASTER_DILATE:
335 case PIPE_CAPF_MAX_CONSERVATIVE_RASTER_DILATE:
336 case PIPE_CAPF_CONSERVATIVE_RASTER_DILATE_GRANULARITY:
337 return 0.0f; /* not implemented */
338 }
339
340 /* should only get here on unhandled cases */
341 return 0.0;
342 }
343
344 static int
345 zink_get_shader_param(struct pipe_screen *pscreen,
346 enum pipe_shader_type shader,
347 enum pipe_shader_cap param)
348 {
349 struct zink_screen *screen = zink_screen(pscreen);
350
351 switch (param) {
352 case PIPE_SHADER_CAP_MAX_INSTRUCTIONS:
353 case PIPE_SHADER_CAP_MAX_ALU_INSTRUCTIONS:
354 case PIPE_SHADER_CAP_MAX_TEX_INSTRUCTIONS:
355 case PIPE_SHADER_CAP_MAX_TEX_INDIRECTIONS:
356 case PIPE_SHADER_CAP_MAX_CONTROL_FLOW_DEPTH:
357 if (shader == PIPE_SHADER_VERTEX ||
358 shader == PIPE_SHADER_FRAGMENT)
359 return INT_MAX;
360 return 0;
361
362 case PIPE_SHADER_CAP_MAX_INPUTS:
363 switch (shader) {
364 case PIPE_SHADER_VERTEX:
365 return MIN2(screen->props.limits.maxVertexInputAttributes,
366 PIPE_MAX_SHADER_INPUTS);
367 case PIPE_SHADER_FRAGMENT:
368 return MIN2(screen->props.limits.maxFragmentInputComponents / 4,
369 PIPE_MAX_SHADER_INPUTS);
370 default:
371 return 0; /* unsupported stage */
372 }
373
374 case PIPE_SHADER_CAP_MAX_OUTPUTS:
375 switch (shader) {
376 case PIPE_SHADER_VERTEX:
377 return MIN2(screen->props.limits.maxVertexOutputComponents / 4,
378 PIPE_MAX_SHADER_OUTPUTS);
379 case PIPE_SHADER_FRAGMENT:
380 return MIN2(screen->props.limits.maxColorAttachments,
381 PIPE_MAX_SHADER_OUTPUTS);
382 default:
383 return 0; /* unsupported stage */
384 }
385
386 case PIPE_SHADER_CAP_MAX_TEXTURE_SAMPLERS:
387 /* this might be a bit simplistic... */
388 return MIN2(screen->props.limits.maxPerStageDescriptorSamplers,
389 PIPE_MAX_SAMPLERS);
390
391 case PIPE_SHADER_CAP_MAX_CONST_BUFFER_SIZE:
392 return MIN2(screen->props.limits.maxUniformBufferRange, INT_MAX);
393
394 case PIPE_SHADER_CAP_MAX_CONST_BUFFERS:
395 return screen->props.limits.maxPerStageDescriptorUniformBuffers;
396
397 case PIPE_SHADER_CAP_MAX_TEMPS:
398 return INT_MAX;
399
400 case PIPE_SHADER_CAP_INTEGERS:
401 return 1;
402
403 case PIPE_SHADER_CAP_INDIRECT_INPUT_ADDR:
404 case PIPE_SHADER_CAP_INDIRECT_OUTPUT_ADDR:
405 case PIPE_SHADER_CAP_INDIRECT_TEMP_ADDR:
406 case PIPE_SHADER_CAP_INDIRECT_CONST_ADDR:
407 case PIPE_SHADER_CAP_SUBROUTINES:
408 case PIPE_SHADER_CAP_INT64_ATOMICS:
409 case PIPE_SHADER_CAP_FP16:
410 return 0; /* not implemented */
411
412 case PIPE_SHADER_CAP_PREFERRED_IR:
413 return PIPE_SHADER_IR_NIR;
414
415 case PIPE_SHADER_CAP_TGSI_SQRT_SUPPORTED:
416 return 0; /* not implemented */
417
418 case PIPE_SHADER_CAP_MAX_SAMPLER_VIEWS:
419 return MIN2(screen->props.limits.maxPerStageDescriptorSampledImages,
420 PIPE_MAX_SHADER_SAMPLER_VIEWS);
421
422 case PIPE_SHADER_CAP_TGSI_DROUND_SUPPORTED:
423 case PIPE_SHADER_CAP_TGSI_DFRACEXP_DLDEXP_SUPPORTED:
424 case PIPE_SHADER_CAP_TGSI_FMA_SUPPORTED:
425 return 0; /* not implemented */
426
427 case PIPE_SHADER_CAP_TGSI_ANY_INOUT_DECL_RANGE:
428 return 0; /* no idea */
429
430 case PIPE_SHADER_CAP_MAX_UNROLL_ITERATIONS_HINT:
431 return 32; /* arbitrary */
432
433 case PIPE_SHADER_CAP_MAX_SHADER_BUFFERS:
434 /* TODO: this limitation is dumb, and will need some fixes in mesa */
435 return MIN2(screen->props.limits.maxPerStageDescriptorStorageBuffers, 8);
436
437 case PIPE_SHADER_CAP_SUPPORTED_IRS:
438 return (1 << PIPE_SHADER_IR_NIR) | (1 << PIPE_SHADER_IR_TGSI);
439
440 case PIPE_SHADER_CAP_MAX_SHADER_IMAGES:
441 return MIN2(screen->props.limits.maxPerStageDescriptorStorageImages,
442 PIPE_MAX_SHADER_IMAGES);
443
444 case PIPE_SHADER_CAP_LOWER_IF_THRESHOLD:
445 case PIPE_SHADER_CAP_TGSI_SKIP_MERGE_REGISTERS:
446 return 0; /* unsure */
447
448 case PIPE_SHADER_CAP_TGSI_LDEXP_SUPPORTED:
449 case PIPE_SHADER_CAP_MAX_HW_ATOMIC_COUNTERS:
450 case PIPE_SHADER_CAP_MAX_HW_ATOMIC_COUNTER_BUFFERS:
451 case PIPE_SHADER_CAP_TGSI_CONT_SUPPORTED:
452 return 0; /* not implemented */
453 }
454
455 /* should only get here on unhandled cases */
456 return 0;
457 }
458
459 static VkSampleCountFlagBits
460 vk_sample_count_flags(uint32_t sample_count)
461 {
462 switch (sample_count) {
463 case 1: return VK_SAMPLE_COUNT_1_BIT;
464 case 2: return VK_SAMPLE_COUNT_2_BIT;
465 case 4: return VK_SAMPLE_COUNT_4_BIT;
466 case 8: return VK_SAMPLE_COUNT_8_BIT;
467 case 16: return VK_SAMPLE_COUNT_16_BIT;
468 case 32: return VK_SAMPLE_COUNT_32_BIT;
469 case 64: return VK_SAMPLE_COUNT_64_BIT;
470 default:
471 return 0;
472 }
473 }
474
475 static bool
476 zink_is_format_supported(struct pipe_screen *pscreen,
477 enum pipe_format format,
478 enum pipe_texture_target target,
479 unsigned sample_count,
480 unsigned storage_sample_count,
481 unsigned bind)
482 {
483 struct zink_screen *screen = zink_screen(pscreen);
484
485 if (format == PIPE_FORMAT_NONE)
486 return screen->props.limits.framebufferNoAttachmentsSampleCounts &
487 vk_sample_count_flags(sample_count);
488
489 VkFormat vkformat = zink_get_format(screen, format);
490 if (vkformat == VK_FORMAT_UNDEFINED)
491 return false;
492
493 if (sample_count >= 1) {
494 VkSampleCountFlagBits sample_mask = vk_sample_count_flags(sample_count);
495 if (!sample_mask)
496 return false;
497 const struct util_format_description *desc = util_format_description(format);
498 if (util_format_is_depth_or_stencil(format)) {
499 if (util_format_has_depth(desc)) {
500 if (bind & PIPE_BIND_DEPTH_STENCIL &&
501 (screen->props.limits.framebufferDepthSampleCounts & sample_mask) != sample_mask)
502 return false;
503 if (bind & PIPE_BIND_SAMPLER_VIEW &&
504 (screen->props.limits.sampledImageDepthSampleCounts & sample_mask) != sample_mask)
505 return false;
506 }
507 if (util_format_has_stencil(desc)) {
508 if (bind & PIPE_BIND_DEPTH_STENCIL &&
509 (screen->props.limits.framebufferStencilSampleCounts & sample_mask) != sample_mask)
510 return false;
511 if (bind & PIPE_BIND_SAMPLER_VIEW &&
512 (screen->props.limits.sampledImageStencilSampleCounts & sample_mask) != sample_mask)
513 return false;
514 }
515 } else if (util_format_is_pure_integer(format)) {
516 if (bind & PIPE_BIND_RENDER_TARGET &&
517 !(screen->props.limits.framebufferColorSampleCounts & sample_mask))
518 return false;
519 if (bind & PIPE_BIND_SAMPLER_VIEW &&
520 !(screen->props.limits.sampledImageIntegerSampleCounts & sample_mask))
521 return false;
522 } else {
523 if (bind & PIPE_BIND_RENDER_TARGET &&
524 !(screen->props.limits.framebufferColorSampleCounts & sample_mask))
525 return false;
526 if (bind & PIPE_BIND_SAMPLER_VIEW &&
527 !(screen->props.limits.sampledImageColorSampleCounts & sample_mask))
528 return false;
529 }
530 }
531
532 VkFormatProperties props;
533 vkGetPhysicalDeviceFormatProperties(screen->pdev, vkformat, &props);
534
535 if (target == PIPE_BUFFER) {
536 if (bind & PIPE_BIND_VERTEX_BUFFER &&
537 !(props.bufferFeatures & VK_FORMAT_FEATURE_VERTEX_BUFFER_BIT))
538 return false;
539 } else {
540 /* all other targets are texture-targets */
541 if (bind & PIPE_BIND_RENDER_TARGET &&
542 !(props.optimalTilingFeatures & VK_FORMAT_FEATURE_COLOR_ATTACHMENT_BIT))
543 return false;
544
545 if (bind & PIPE_BIND_BLENDABLE &&
546 !(props.optimalTilingFeatures & VK_FORMAT_FEATURE_COLOR_ATTACHMENT_BLEND_BIT))
547 return false;
548
549 if (bind & PIPE_BIND_SAMPLER_VIEW &&
550 !(props.optimalTilingFeatures & VK_FORMAT_FEATURE_SAMPLED_IMAGE_BIT))
551 return false;
552
553 if (bind & PIPE_BIND_DEPTH_STENCIL &&
554 !(props.optimalTilingFeatures & VK_FORMAT_FEATURE_DEPTH_STENCIL_ATTACHMENT_BIT))
555 return false;
556 }
557
558 if (util_format_is_compressed(format)) {
559 const struct util_format_description *desc = util_format_description(format);
560 if (desc->layout == UTIL_FORMAT_LAYOUT_BPTC &&
561 !screen->feats.textureCompressionBC)
562 return false;
563 }
564
565 return true;
566 }
567
568 static void
569 zink_destroy_screen(struct pipe_screen *pscreen)
570 {
571 struct zink_screen *screen = zink_screen(pscreen);
572 slab_destroy_parent(&screen->transfer_pool);
573 FREE(screen);
574 }
575
576 static VkInstance
577 create_instance()
578 {
579 VkApplicationInfo ai = {};
580 ai.sType = VK_STRUCTURE_TYPE_APPLICATION_INFO;
581
582 char proc_name[128];
583 if (os_get_process_name(proc_name, ARRAY_SIZE(proc_name)))
584 ai.pApplicationName = proc_name;
585 else
586 ai.pApplicationName = "unknown";
587
588 ai.pEngineName = "mesa zink";
589 ai.apiVersion = VK_API_VERSION_1_0;
590
591 const char *extensions[] = {
592 VK_KHR_GET_PHYSICAL_DEVICE_PROPERTIES_2_EXTENSION_NAME,
593 VK_KHR_EXTERNAL_MEMORY_CAPABILITIES_EXTENSION_NAME,
594 };
595
596 VkInstanceCreateInfo ici = {};
597 ici.sType = VK_STRUCTURE_TYPE_INSTANCE_CREATE_INFO;
598 ici.pApplicationInfo = &ai;
599 ici.ppEnabledExtensionNames = extensions;
600 ici.enabledExtensionCount = ARRAY_SIZE(extensions);
601
602 VkInstance instance = VK_NULL_HANDLE;
603 VkResult err = vkCreateInstance(&ici, NULL, &instance);
604 if (err != VK_SUCCESS)
605 return VK_NULL_HANDLE;
606
607 return instance;
608 }
609
610 static VkPhysicalDevice
611 choose_pdev(const VkInstance instance)
612 {
613 uint32_t i, pdev_count;
614 VkPhysicalDevice *pdevs, pdev;
615 vkEnumeratePhysicalDevices(instance, &pdev_count, NULL);
616 assert(pdev_count > 0);
617
618 pdevs = malloc(sizeof(*pdevs) * pdev_count);
619 vkEnumeratePhysicalDevices(instance, &pdev_count, pdevs);
620 assert(pdev_count > 0);
621
622 pdev = pdevs[0];
623 for (i = 0; i < pdev_count; ++i) {
624 VkPhysicalDeviceProperties props;
625 vkGetPhysicalDeviceProperties(pdevs[i], &props);
626 if (props.deviceType == VK_PHYSICAL_DEVICE_TYPE_DISCRETE_GPU) {
627 pdev = pdevs[i];
628 break;
629 }
630 }
631 free(pdevs);
632 return pdev;
633 }
634
635 static uint32_t
636 find_gfx_queue(const VkPhysicalDevice pdev)
637 {
638 uint32_t num_queues;
639 vkGetPhysicalDeviceQueueFamilyProperties(pdev, &num_queues, NULL);
640 assert(num_queues > 0);
641
642 VkQueueFamilyProperties *props = malloc(sizeof(*props) * num_queues);
643 vkGetPhysicalDeviceQueueFamilyProperties(pdev, &num_queues, props);
644
645 for (uint32_t i = 0; i < num_queues; i++) {
646 if (props[i].queueFlags & VK_QUEUE_GRAPHICS_BIT) {
647 free(props);
648 return i;
649 }
650 }
651
652 return UINT32_MAX;
653 }
654
655 static void
656 zink_flush_frontbuffer(struct pipe_screen *pscreen,
657 struct pipe_resource *pres,
658 unsigned level, unsigned layer,
659 void *winsys_drawable_handle,
660 struct pipe_box *sub_box)
661 {
662 struct zink_screen *screen = zink_screen(pscreen);
663 struct sw_winsys *winsys = screen->winsys;
664 struct zink_resource *res = zink_resource(pres);
665
666 if (!winsys)
667 return;
668 void *map = winsys->displaytarget_map(winsys, res->dt, 0);
669
670 if (map) {
671 VkImageSubresource isr = {};
672 isr.aspectMask = res->aspect;
673 isr.mipLevel = level;
674 isr.arrayLayer = layer;
675 VkSubresourceLayout layout;
676 vkGetImageSubresourceLayout(screen->dev, res->image, &isr, &layout);
677
678 void *ptr;
679 VkResult result = vkMapMemory(screen->dev, res->mem, res->offset, res->size, 0, &ptr);
680 if (result != VK_SUCCESS) {
681 debug_printf("failed to map memory for display\n");
682 return;
683 }
684 for (int i = 0; i < pres->height0; ++i) {
685 uint8_t *src = (uint8_t *)ptr + i * layout.rowPitch;
686 uint8_t *dst = (uint8_t *)map + i * res->dt_stride;
687 memcpy(dst, src, res->dt_stride);
688 }
689 vkUnmapMemory(screen->dev, res->mem);
690 }
691
692 winsys->displaytarget_unmap(winsys, res->dt);
693
694 assert(res->dt);
695 if (res->dt)
696 winsys->displaytarget_display(winsys, res->dt, winsys_drawable_handle, sub_box);
697 }
698
699 static struct pipe_screen *
700 zink_internal_create_screen(struct sw_winsys *winsys, int fd)
701 {
702 struct zink_screen *screen = CALLOC_STRUCT(zink_screen);
703 if (!screen)
704 return NULL;
705
706 zink_debug = debug_get_option_zink_debug();
707
708 screen->instance = create_instance();
709 screen->pdev = choose_pdev(screen->instance);
710 screen->gfx_queue = find_gfx_queue(screen->pdev);
711
712 vkGetPhysicalDeviceProperties(screen->pdev, &screen->props);
713 vkGetPhysicalDeviceFeatures(screen->pdev, &screen->feats);
714 vkGetPhysicalDeviceMemoryProperties(screen->pdev, &screen->mem_props);
715
716 screen->have_X8_D24_UNORM_PACK32 = zink_is_depth_format_supported(screen,
717 VK_FORMAT_X8_D24_UNORM_PACK32);
718 screen->have_D24_UNORM_S8_UINT = zink_is_depth_format_supported(screen,
719 VK_FORMAT_D24_UNORM_S8_UINT);
720
721 uint32_t num_extensions = 0;
722 if (vkEnumerateDeviceExtensionProperties(screen->pdev, NULL,
723 &num_extensions, NULL) == VK_SUCCESS && num_extensions > 0) {
724 VkExtensionProperties *extensions = MALLOC(sizeof(VkExtensionProperties) *
725 num_extensions);
726 if (extensions) {
727 vkEnumerateDeviceExtensionProperties(screen->pdev, NULL,
728 &num_extensions, extensions);
729
730 for (uint32_t i = 0; i < num_extensions; ++i) {
731 if (!strcmp(extensions[i].extensionName,
732 VK_KHR_MAINTENANCE1_EXTENSION_NAME))
733 screen->have_KHR_maintenance1 = true;
734 if (!strcmp(extensions[i].extensionName,
735 VK_KHR_EXTERNAL_MEMORY_FD_EXTENSION_NAME))
736 screen->have_KHR_external_memory_fd = true;
737 }
738 FREE(extensions);
739 }
740 }
741
742 if (!screen->have_KHR_maintenance1) {
743 debug_printf("ZINK: VK_KHR_maintenance1 required!\n");
744 goto fail;
745 }
746
747 VkDeviceQueueCreateInfo qci = {};
748 float dummy = 0.0f;
749 qci.sType = VK_STRUCTURE_TYPE_DEVICE_QUEUE_CREATE_INFO;
750 qci.queueFamilyIndex = screen->gfx_queue;
751 qci.queueCount = 1;
752 qci.pQueuePriorities = &dummy;
753
754 VkDeviceCreateInfo dci = {};
755 dci.sType = VK_STRUCTURE_TYPE_DEVICE_CREATE_INFO;
756 dci.queueCreateInfoCount = 1;
757 dci.pQueueCreateInfos = &qci;
758 dci.pEnabledFeatures = &screen->feats;
759 const char *extensions[3] = {
760 VK_KHR_MAINTENANCE1_EXTENSION_NAME,
761 };
762 num_extensions = 1;
763
764 if (fd >= 0 && !screen->have_KHR_external_memory_fd) {
765 debug_printf("ZINK: KHR_external_memory_fd required!\n");
766 goto fail;
767 }
768
769 if (screen->have_KHR_external_memory_fd) {
770 extensions[num_extensions++] = VK_KHR_EXTERNAL_MEMORY_EXTENSION_NAME;
771 extensions[num_extensions++] = VK_KHR_EXTERNAL_MEMORY_FD_EXTENSION_NAME;
772 }
773 assert(num_extensions <= ARRAY_SIZE(extensions));
774
775 dci.ppEnabledExtensionNames = extensions;
776 dci.enabledExtensionCount = num_extensions;
777 if (vkCreateDevice(screen->pdev, &dci, NULL, &screen->dev) != VK_SUCCESS)
778 goto fail;
779
780 screen->winsys = winsys;
781
782 screen->base.get_name = zink_get_name;
783 screen->base.get_vendor = zink_get_vendor;
784 screen->base.get_device_vendor = zink_get_device_vendor;
785 screen->base.get_param = zink_get_param;
786 screen->base.get_paramf = zink_get_paramf;
787 screen->base.get_shader_param = zink_get_shader_param;
788 screen->base.get_compiler_options = zink_get_compiler_options;
789 screen->base.is_format_supported = zink_is_format_supported;
790 screen->base.context_create = zink_context_create;
791 screen->base.flush_frontbuffer = zink_flush_frontbuffer;
792 screen->base.destroy = zink_destroy_screen;
793
794 zink_screen_resource_init(&screen->base);
795 zink_screen_fence_init(&screen->base);
796
797 slab_create_parent(&screen->transfer_pool, sizeof(struct zink_transfer), 16);
798
799 return &screen->base;
800
801 fail:
802 FREE(screen);
803 return NULL;
804 }
805
/*
 * Create a zink screen that presents through the given software winsys.
 *
 * No file descriptor is involved, so -1 is passed to the common constructor.
 */
struct pipe_screen *
zink_create_screen(struct sw_winsys *winsys)
{
   const int no_fd = -1;

   return zink_internal_create_screen(winsys, no_fd);
}
811
/*
 * Create a zink screen for the given file descriptor.
 *
 * No software winsys is attached in this mode, so NULL is passed to the
 * common constructor.
 */
struct pipe_screen *
zink_drm_create_screen(int fd)
{
   struct sw_winsys *no_winsys = NULL;

   return zink_internal_create_screen(no_winsys, fd);
}