921581d517dd2d75ea5655058b11f924993db66f
[mesa.git] / src / gallium / drivers / zink / zink_screen.c
1 /*
2 * Copyright 2018 Collabora Ltd.
3 *
4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * on the rights to use, copy, modify, merge, publish, distribute, sub
8 * license, and/or sell copies of the Software, and to permit persons to whom
9 * the Software is furnished to do so, subject to the following conditions:
10 *
11 * The above copyright notice and this permission notice (including the next
12 * paragraph) shall be included in all copies or substantial portions of the
13 * Software.
14 *
15 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17 * FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. IN NO EVENT SHALL
18 * THE AUTHOR(S) AND/OR THEIR SUPPLIERS BE LIABLE FOR ANY CLAIM,
19 * DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR
20 * OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE
21 * USE OR OTHER DEALINGS IN THE SOFTWARE.
22 */
23
24 #include "zink_screen.h"
25
26 #include "zink_compiler.h"
27 #include "zink_context.h"
28 #include "zink_fence.h"
29 #include "zink_public.h"
30 #include "zink_resource.h"
31
32 #include "os/os_process.h"
33 #include "util/u_debug.h"
34 #include "util/format/u_format.h"
35 #include "util/u_math.h"
36 #include "util/u_memory.h"
37 #include "util/u_screen.h"
38 #include "util/u_string.h"
39
40 #include "frontend/sw_winsys.h"
41
42 static const struct debug_named_value
43 debug_options[] = {
44 { "nir", ZINK_DEBUG_NIR, "Dump NIR during program compile" },
45 { "spirv", ZINK_DEBUG_SPIRV, "Dump SPIR-V during program compile" },
46 { "tgsi", ZINK_DEBUG_TGSI, "Dump TGSI during program compile" },
47 DEBUG_NAMED_VALUE_END
48 };
49
50 DEBUG_GET_ONCE_FLAGS_OPTION(zink_debug, "ZINK_DEBUG", debug_options, 0)
51
52 uint32_t
53 zink_debug;
54
55 static const char *
56 zink_get_vendor(struct pipe_screen *pscreen)
57 {
58 return "Collabora Ltd";
59 }
60
61 static const char *
62 zink_get_device_vendor(struct pipe_screen *pscreen)
63 {
64 struct zink_screen *screen = zink_screen(pscreen);
65 static char buf[1000];
66 snprintf(buf, sizeof(buf), "Unknown (vendor-id: 0x%04x)", screen->props.vendorID);
67 return buf;
68 }
69
70 static const char *
71 zink_get_name(struct pipe_screen *pscreen)
72 {
73 struct zink_screen *screen = zink_screen(pscreen);
74 static char buf[1000];
75 snprintf(buf, sizeof(buf), "zink (%s)", screen->props.deviceName);
76 return buf;
77 }
78
79 static int
80 get_video_mem(struct zink_screen *screen)
81 {
82 VkDeviceSize size = 0;
83 for (uint32_t i = 0; i < screen->mem_props.memoryHeapCount; ++i) {
84 if (screen->mem_props.memoryHeaps[i].flags &
85 VK_MEMORY_HEAP_DEVICE_LOCAL_BIT)
86 size += screen->mem_props.memoryHeaps[i].size;
87 }
88 return (int)(size >> 20);
89 }
90
91 static int
92 zink_get_param(struct pipe_screen *pscreen, enum pipe_cap param)
93 {
94 struct zink_screen *screen = zink_screen(pscreen);
95
96 switch (param) {
97 case PIPE_CAP_NPOT_TEXTURES:
98 case PIPE_CAP_TGSI_TEXCOORD:
99 return 1;
100
101 case PIPE_CAP_MAX_DUAL_SOURCE_RENDER_TARGETS:
102 if (!screen->feats.dualSrcBlend)
103 return 0;
104 return screen->props.limits.maxFragmentDualSrcAttachments;
105
106 case PIPE_CAP_POINT_SPRITE:
107 return 1;
108
109 case PIPE_CAP_MAX_RENDER_TARGETS:
110 return screen->props.limits.maxColorAttachments;
111
112 case PIPE_CAP_OCCLUSION_QUERY:
113 return 1;
114
115 #if 0 /* TODO: Enable me */
116 case PIPE_CAP_QUERY_TIME_ELAPSED:
117 return 1;
118 #endif
119
120 case PIPE_CAP_TEXTURE_MULTISAMPLE:
121 return 1;
122
123 case PIPE_CAP_TEXTURE_SWIZZLE:
124 return 1;
125
126 case PIPE_CAP_MAX_TEXTURE_2D_SIZE:
127 return screen->props.limits.maxImageDimension2D;
128 case PIPE_CAP_MAX_TEXTURE_3D_LEVELS:
129 return 1 + util_logbase2(screen->props.limits.maxImageDimension3D);
130 case PIPE_CAP_MAX_TEXTURE_CUBE_LEVELS:
131 return 1 + util_logbase2(screen->props.limits.maxImageDimensionCube);
132
133 case PIPE_CAP_BLEND_EQUATION_SEPARATE:
134 case PIPE_CAP_FRAGMENT_SHADER_TEXTURE_LOD:
135 case PIPE_CAP_FRAGMENT_SHADER_DERIVATIVES:
136 case PIPE_CAP_VERTEX_SHADER_SATURATE:
137 return 1;
138
139 case PIPE_CAP_INDEP_BLEND_ENABLE:
140 case PIPE_CAP_INDEP_BLEND_FUNC:
141 return 1;
142
143 case PIPE_CAP_MAX_STREAM_OUTPUT_BUFFERS:
144 return screen->have_EXT_transform_feedback ? screen->tf_props.maxTransformFeedbackBuffers : 0;
145 case PIPE_CAP_STREAM_OUTPUT_PAUSE_RESUME:
146 case PIPE_CAP_STREAM_OUTPUT_INTERLEAVE_BUFFERS:
147 return 1;
148
149 case PIPE_CAP_MAX_TEXTURE_ARRAY_LAYERS:
150 return screen->props.limits.maxImageArrayLayers;
151
152 case PIPE_CAP_DEPTH_CLIP_DISABLE:
153 return screen->feats.depthClamp;
154
155 case PIPE_CAP_TGSI_INSTANCEID:
156 case PIPE_CAP_MIXED_COLORBUFFER_FORMATS:
157 case PIPE_CAP_SEAMLESS_CUBE_MAP:
158 return 1;
159
160 case PIPE_CAP_MIN_TEXEL_OFFSET:
161 return screen->props.limits.minTexelOffset;
162 case PIPE_CAP_MAX_TEXEL_OFFSET:
163 return screen->props.limits.maxTexelOffset;
164
165 case PIPE_CAP_VERTEX_COLOR_UNCLAMPED:
166 return 1;
167
168 case PIPE_CAP_CONDITIONAL_RENDER:
169 return screen->have_EXT_conditional_rendering;
170
171 case PIPE_CAP_GLSL_FEATURE_LEVEL:
172 case PIPE_CAP_GLSL_FEATURE_LEVEL_COMPATIBILITY:
173 return 130;
174
175 #if 0 /* TODO: Enable me */
176 case PIPE_CAP_COMPUTE:
177 return 1;
178 #endif
179
180 case PIPE_CAP_CONSTANT_BUFFER_OFFSET_ALIGNMENT:
181 return screen->props.limits.minUniformBufferOffsetAlignment;
182
183 #if 0 /* TODO: Enable me */
184 case PIPE_CAP_QUERY_TIMESTAMP:
185 return 1;
186 #endif
187
188 case PIPE_CAP_MIN_MAP_BUFFER_ALIGNMENT:
189 return screen->props.limits.minMemoryMapAlignment;
190
191 case PIPE_CAP_CUBE_MAP_ARRAY:
192 return screen->feats.imageCubeArray;
193
194 case PIPE_CAP_TEXTURE_BUFFER_OBJECTS:
195 return 1;
196
197 case PIPE_CAP_TEXTURE_BUFFER_OFFSET_ALIGNMENT:
198 return screen->props.limits.minTexelBufferOffsetAlignment;
199
200 case PIPE_CAP_PREFER_BLIT_BASED_TEXTURE_TRANSFER:
201 return 0; /* unsure */
202
203 case PIPE_CAP_MAX_TEXTURE_BUFFER_SIZE:
204 return screen->props.limits.maxTexelBufferElements;
205
206 case PIPE_CAP_ENDIANNESS:
207 return PIPE_ENDIAN_NATIVE; /* unsure */
208
209 case PIPE_CAP_MAX_VIEWPORTS:
210 return 1; /* TODO: When GS is supported, use screen->props.limits.maxViewports */
211
212 case PIPE_CAP_MIXED_FRAMEBUFFER_SIZES:
213 return 1;
214
215 case PIPE_CAP_MAX_GEOMETRY_OUTPUT_VERTICES:
216 return screen->props.limits.maxGeometryOutputVertices;
217 case PIPE_CAP_MAX_GEOMETRY_TOTAL_OUTPUT_COMPONENTS:
218 return screen->props.limits.maxGeometryOutputComponents;
219
220 #if 0 /* TODO: Enable me. Enables ARB_texture_gather */
221 case PIPE_CAP_MAX_TEXTURE_GATHER_COMPONENTS:
222 return 4;
223 #endif
224
225 case PIPE_CAP_MIN_TEXTURE_GATHER_OFFSET:
226 return screen->props.limits.minTexelGatherOffset;
227 case PIPE_CAP_MAX_TEXTURE_GATHER_OFFSET:
228 return screen->props.limits.maxTexelGatherOffset;
229
230 case PIPE_CAP_TGSI_FS_FINE_DERIVATIVE:
231 return 1;
232
233 case PIPE_CAP_VENDOR_ID:
234 return screen->props.vendorID;
235 case PIPE_CAP_DEVICE_ID:
236 return screen->props.deviceID;
237
238 case PIPE_CAP_ACCELERATED:
239 return 1;
240 case PIPE_CAP_VIDEO_MEMORY:
241 return get_video_mem(screen);
242 case PIPE_CAP_UMA:
243 return screen->props.deviceType == VK_PHYSICAL_DEVICE_TYPE_INTEGRATED_GPU;
244
245 case PIPE_CAP_MAX_VERTEX_ATTRIB_STRIDE:
246 return screen->props.limits.maxVertexInputBindingStride;
247
248 #if 0 /* TODO: Enable me */
249 case PIPE_CAP_SAMPLER_VIEW_TARGET:
250 return 1;
251 #endif
252
253 #if 0 /* TODO: Enable me */
254 case PIPE_CAP_CLIP_HALFZ:
255 return 1;
256 #endif
257
258 #if 0 /* TODO: Enable me */
259 case PIPE_CAP_TEXTURE_FLOAT_LINEAR:
260 case PIPE_CAP_TEXTURE_HALF_FLOAT_LINEAR:
261 return 1;
262 #endif
263
264 case PIPE_CAP_SHAREABLE_SHADERS:
265 return 1;
266
267 #if 0 /* TODO: Enable me. Enables GL_ARB_shader_storage_buffer_object */
268 case PIPE_CAP_SHADER_BUFFER_OFFSET_ALIGNMENT:
269 return screen->props.limits.minStorageBufferOffsetAlignment;
270 #endif
271
272 case PIPE_CAP_PCI_GROUP:
273 case PIPE_CAP_PCI_BUS:
274 case PIPE_CAP_PCI_DEVICE:
275 case PIPE_CAP_PCI_FUNCTION:
276 return 0; /* TODO: figure these out */
277
278 case PIPE_CAP_CULL_DISTANCE:
279 return screen->feats.shaderCullDistance;
280
281 case PIPE_CAP_VIEWPORT_SUBPIXEL_BITS:
282 return screen->props.limits.viewportSubPixelBits;
283
284 case PIPE_CAP_GLSL_OPTIMIZE_CONSERVATIVELY:
285 return 0; /* not sure */
286
287 case PIPE_CAP_MAX_GS_INVOCATIONS:
288 return 0; /* not implemented */
289
290 case PIPE_CAP_MAX_COMBINED_SHADER_BUFFERS:
291 return screen->props.limits.maxDescriptorSetStorageBuffers;
292
293 case PIPE_CAP_MAX_SHADER_BUFFER_SIZE:
294 return screen->props.limits.maxStorageBufferRange; /* unsure */
295
296 case PIPE_CAP_TGSI_FS_COORD_ORIGIN_UPPER_LEFT:
297 case PIPE_CAP_TGSI_FS_COORD_PIXEL_CENTER_HALF_INTEGER:
298 return 1;
299
300 case PIPE_CAP_TGSI_FS_COORD_ORIGIN_LOWER_LEFT:
301 case PIPE_CAP_TGSI_FS_COORD_PIXEL_CENTER_INTEGER:
302 return 0;
303
304 case PIPE_CAP_BUFFER_MAP_PERSISTENT_COHERENT:
305 return 0;
306
307 case PIPE_CAP_NIR_COMPACT_ARRAYS:
308 return 1;
309
310 case PIPE_CAP_TGSI_FS_FACE_IS_INTEGER_SYSVAL:
311 return 1;
312
313 case PIPE_CAP_VIEWPORT_TRANSFORM_LOWERED:
314 return 1;
315
316 case PIPE_CAP_FLATSHADE:
317 case PIPE_CAP_ALPHA_TEST:
318 case PIPE_CAP_CLIP_PLANES:
319 case PIPE_CAP_POINT_SIZE_FIXED:
320 case PIPE_CAP_TWO_SIDED_COLOR:
321 return 0;
322
323 case PIPE_CAP_DMABUF:
324 return screen->have_KHR_external_memory_fd;
325
326 default:
327 return u_pipe_screen_get_param_defaults(pscreen, param);
328 }
329 }
330
331 static float
332 zink_get_paramf(struct pipe_screen *pscreen, enum pipe_capf param)
333 {
334 struct zink_screen *screen = zink_screen(pscreen);
335
336 switch (param) {
337 case PIPE_CAPF_MAX_LINE_WIDTH:
338 case PIPE_CAPF_MAX_LINE_WIDTH_AA:
339 return screen->props.limits.lineWidthRange[1];
340
341 case PIPE_CAPF_MAX_POINT_WIDTH:
342 case PIPE_CAPF_MAX_POINT_WIDTH_AA:
343 return screen->props.limits.pointSizeRange[1];
344
345 case PIPE_CAPF_MAX_TEXTURE_ANISOTROPY:
346 return screen->props.limits.maxSamplerAnisotropy;
347
348 case PIPE_CAPF_MAX_TEXTURE_LOD_BIAS:
349 return screen->props.limits.maxSamplerLodBias;
350
351 case PIPE_CAPF_MIN_CONSERVATIVE_RASTER_DILATE:
352 case PIPE_CAPF_MAX_CONSERVATIVE_RASTER_DILATE:
353 case PIPE_CAPF_CONSERVATIVE_RASTER_DILATE_GRANULARITY:
354 return 0.0f; /* not implemented */
355 }
356
357 /* should only get here on unhandled cases */
358 return 0.0;
359 }
360
361 static int
362 zink_get_shader_param(struct pipe_screen *pscreen,
363 enum pipe_shader_type shader,
364 enum pipe_shader_cap param)
365 {
366 struct zink_screen *screen = zink_screen(pscreen);
367
368 switch (param) {
369 case PIPE_SHADER_CAP_MAX_INSTRUCTIONS:
370 case PIPE_SHADER_CAP_MAX_ALU_INSTRUCTIONS:
371 case PIPE_SHADER_CAP_MAX_TEX_INSTRUCTIONS:
372 case PIPE_SHADER_CAP_MAX_TEX_INDIRECTIONS:
373 case PIPE_SHADER_CAP_MAX_CONTROL_FLOW_DEPTH:
374 if (shader == PIPE_SHADER_VERTEX ||
375 shader == PIPE_SHADER_FRAGMENT)
376 return INT_MAX;
377 return 0;
378
379 case PIPE_SHADER_CAP_MAX_INPUTS:
380 switch (shader) {
381 case PIPE_SHADER_VERTEX:
382 return MIN2(screen->props.limits.maxVertexInputAttributes,
383 PIPE_MAX_SHADER_INPUTS);
384 case PIPE_SHADER_FRAGMENT:
385 return MIN2(screen->props.limits.maxFragmentInputComponents / 4,
386 PIPE_MAX_SHADER_INPUTS);
387 default:
388 return 0; /* unsupported stage */
389 }
390
391 case PIPE_SHADER_CAP_MAX_OUTPUTS:
392 switch (shader) {
393 case PIPE_SHADER_VERTEX:
394 return MIN2(screen->props.limits.maxVertexOutputComponents / 4,
395 PIPE_MAX_SHADER_OUTPUTS);
396 case PIPE_SHADER_FRAGMENT:
397 return MIN2(screen->props.limits.maxColorAttachments,
398 PIPE_MAX_SHADER_OUTPUTS);
399 default:
400 return 0; /* unsupported stage */
401 }
402
403 case PIPE_SHADER_CAP_MAX_TEXTURE_SAMPLERS:
404 switch (shader) {
405 case PIPE_SHADER_VERTEX:
406 case PIPE_SHADER_FRAGMENT:
407 /* this might be a bit simplistic... */
408 return MIN2(screen->props.limits.maxPerStageDescriptorSamplers,
409 PIPE_MAX_SAMPLERS);
410 default:
411 return 0; /* unsupported stage */
412 }
413
414 case PIPE_SHADER_CAP_MAX_CONST_BUFFER_SIZE:
415 return MIN2(screen->props.limits.maxUniformBufferRange, INT_MAX);
416
417 case PIPE_SHADER_CAP_MAX_CONST_BUFFERS:
418 return screen->props.limits.maxPerStageDescriptorUniformBuffers;
419
420 case PIPE_SHADER_CAP_MAX_TEMPS:
421 return INT_MAX;
422
423 case PIPE_SHADER_CAP_INTEGERS:
424 return 1;
425
426 case PIPE_SHADER_CAP_INDIRECT_INPUT_ADDR:
427 case PIPE_SHADER_CAP_INDIRECT_OUTPUT_ADDR:
428 case PIPE_SHADER_CAP_INDIRECT_TEMP_ADDR:
429 case PIPE_SHADER_CAP_INDIRECT_CONST_ADDR:
430 case PIPE_SHADER_CAP_SUBROUTINES:
431 case PIPE_SHADER_CAP_INT64_ATOMICS:
432 case PIPE_SHADER_CAP_FP16:
433 case PIPE_SHADER_CAP_FP16_DERIVATIVES:
434 case PIPE_SHADER_CAP_INT16:
435 case PIPE_SHADER_CAP_GLSL_16BIT_TEMPS:
436 return 0; /* not implemented */
437
438 case PIPE_SHADER_CAP_PREFERRED_IR:
439 return PIPE_SHADER_IR_NIR;
440
441 case PIPE_SHADER_CAP_TGSI_SQRT_SUPPORTED:
442 return 0; /* not implemented */
443
444 case PIPE_SHADER_CAP_MAX_SAMPLER_VIEWS:
445 return MIN2(screen->props.limits.maxPerStageDescriptorSampledImages,
446 PIPE_MAX_SHADER_SAMPLER_VIEWS);
447
448 case PIPE_SHADER_CAP_TGSI_DROUND_SUPPORTED:
449 case PIPE_SHADER_CAP_TGSI_DFRACEXP_DLDEXP_SUPPORTED:
450 case PIPE_SHADER_CAP_TGSI_FMA_SUPPORTED:
451 return 0; /* not implemented */
452
453 case PIPE_SHADER_CAP_TGSI_ANY_INOUT_DECL_RANGE:
454 return 0; /* no idea */
455
456 case PIPE_SHADER_CAP_MAX_UNROLL_ITERATIONS_HINT:
457 return 32; /* arbitrary */
458
459 case PIPE_SHADER_CAP_MAX_SHADER_BUFFERS:
460 /* TODO: this limitation is dumb, and will need some fixes in mesa */
461 return MIN2(screen->props.limits.maxPerStageDescriptorStorageBuffers, PIPE_MAX_SHADER_BUFFERS);
462
463 case PIPE_SHADER_CAP_SUPPORTED_IRS:
464 return (1 << PIPE_SHADER_IR_NIR) | (1 << PIPE_SHADER_IR_TGSI);
465
466 case PIPE_SHADER_CAP_MAX_SHADER_IMAGES:
467 #if 0 /* TODO: needs compiler support */
468 return MIN2(screen->props.limits.maxPerStageDescriptorStorageImages,
469 PIPE_MAX_SHADER_IMAGES);
470 #else
471 return 0;
472 #endif
473
474 case PIPE_SHADER_CAP_LOWER_IF_THRESHOLD:
475 case PIPE_SHADER_CAP_TGSI_SKIP_MERGE_REGISTERS:
476 return 0; /* unsure */
477
478 case PIPE_SHADER_CAP_TGSI_LDEXP_SUPPORTED:
479 case PIPE_SHADER_CAP_MAX_HW_ATOMIC_COUNTERS:
480 case PIPE_SHADER_CAP_MAX_HW_ATOMIC_COUNTER_BUFFERS:
481 case PIPE_SHADER_CAP_TGSI_CONT_SUPPORTED:
482 return 0; /* not implemented */
483 }
484
485 /* should only get here on unhandled cases */
486 return 0;
487 }
488
489 static VkSampleCountFlagBits
490 vk_sample_count_flags(uint32_t sample_count)
491 {
492 switch (sample_count) {
493 case 1: return VK_SAMPLE_COUNT_1_BIT;
494 case 2: return VK_SAMPLE_COUNT_2_BIT;
495 case 4: return VK_SAMPLE_COUNT_4_BIT;
496 case 8: return VK_SAMPLE_COUNT_8_BIT;
497 case 16: return VK_SAMPLE_COUNT_16_BIT;
498 case 32: return VK_SAMPLE_COUNT_32_BIT;
499 case 64: return VK_SAMPLE_COUNT_64_BIT;
500 default:
501 return 0;
502 }
503 }
504
505 static bool
506 zink_is_format_supported(struct pipe_screen *pscreen,
507 enum pipe_format format,
508 enum pipe_texture_target target,
509 unsigned sample_count,
510 unsigned storage_sample_count,
511 unsigned bind)
512 {
513 struct zink_screen *screen = zink_screen(pscreen);
514
515 if (format == PIPE_FORMAT_NONE)
516 return screen->props.limits.framebufferNoAttachmentsSampleCounts &
517 vk_sample_count_flags(sample_count);
518
519 VkFormat vkformat = zink_get_format(screen, format);
520 if (vkformat == VK_FORMAT_UNDEFINED)
521 return false;
522
523 if (sample_count >= 1) {
524 VkSampleCountFlagBits sample_mask = vk_sample_count_flags(sample_count);
525 if (!sample_mask)
526 return false;
527 const struct util_format_description *desc = util_format_description(format);
528 if (util_format_is_depth_or_stencil(format)) {
529 if (util_format_has_depth(desc)) {
530 if (bind & PIPE_BIND_DEPTH_STENCIL &&
531 (screen->props.limits.framebufferDepthSampleCounts & sample_mask) != sample_mask)
532 return false;
533 if (bind & PIPE_BIND_SAMPLER_VIEW &&
534 (screen->props.limits.sampledImageDepthSampleCounts & sample_mask) != sample_mask)
535 return false;
536 }
537 if (util_format_has_stencil(desc)) {
538 if (bind & PIPE_BIND_DEPTH_STENCIL &&
539 (screen->props.limits.framebufferStencilSampleCounts & sample_mask) != sample_mask)
540 return false;
541 if (bind & PIPE_BIND_SAMPLER_VIEW &&
542 (screen->props.limits.sampledImageStencilSampleCounts & sample_mask) != sample_mask)
543 return false;
544 }
545 } else if (util_format_is_pure_integer(format)) {
546 if (bind & PIPE_BIND_RENDER_TARGET &&
547 !(screen->props.limits.framebufferColorSampleCounts & sample_mask))
548 return false;
549 if (bind & PIPE_BIND_SAMPLER_VIEW &&
550 !(screen->props.limits.sampledImageIntegerSampleCounts & sample_mask))
551 return false;
552 } else {
553 if (bind & PIPE_BIND_RENDER_TARGET &&
554 !(screen->props.limits.framebufferColorSampleCounts & sample_mask))
555 return false;
556 if (bind & PIPE_BIND_SAMPLER_VIEW &&
557 !(screen->props.limits.sampledImageColorSampleCounts & sample_mask))
558 return false;
559 }
560 }
561
562 VkFormatProperties props;
563 vkGetPhysicalDeviceFormatProperties(screen->pdev, vkformat, &props);
564
565 if (target == PIPE_BUFFER) {
566 if (bind & PIPE_BIND_VERTEX_BUFFER &&
567 !(props.bufferFeatures & VK_FORMAT_FEATURE_VERTEX_BUFFER_BIT))
568 return false;
569 } else {
570 /* all other targets are texture-targets */
571 if (bind & PIPE_BIND_RENDER_TARGET &&
572 !(props.optimalTilingFeatures & VK_FORMAT_FEATURE_COLOR_ATTACHMENT_BIT))
573 return false;
574
575 if (bind & PIPE_BIND_BLENDABLE &&
576 !(props.optimalTilingFeatures & VK_FORMAT_FEATURE_COLOR_ATTACHMENT_BLEND_BIT))
577 return false;
578
579 if (bind & PIPE_BIND_SAMPLER_VIEW &&
580 !(props.optimalTilingFeatures & VK_FORMAT_FEATURE_SAMPLED_IMAGE_BIT))
581 return false;
582
583 if (bind & PIPE_BIND_DEPTH_STENCIL &&
584 !(props.optimalTilingFeatures & VK_FORMAT_FEATURE_DEPTH_STENCIL_ATTACHMENT_BIT))
585 return false;
586 }
587
588 if (util_format_is_compressed(format)) {
589 const struct util_format_description *desc = util_format_description(format);
590 if (desc->layout == UTIL_FORMAT_LAYOUT_BPTC &&
591 !screen->feats.textureCompressionBC)
592 return false;
593 }
594
595 return true;
596 }
597
598 static void
599 zink_destroy_screen(struct pipe_screen *pscreen)
600 {
601 struct zink_screen *screen = zink_screen(pscreen);
602 slab_destroy_parent(&screen->transfer_pool);
603 FREE(screen);
604 }
605
606 static VkInstance
607 create_instance()
608 {
609 VkApplicationInfo ai = {};
610 ai.sType = VK_STRUCTURE_TYPE_APPLICATION_INFO;
611
612 char proc_name[128];
613 if (os_get_process_name(proc_name, ARRAY_SIZE(proc_name)))
614 ai.pApplicationName = proc_name;
615 else
616 ai.pApplicationName = "unknown";
617
618 ai.pEngineName = "mesa zink";
619 ai.apiVersion = VK_API_VERSION_1_0;
620
621 const char *extensions[] = {
622 VK_KHR_GET_PHYSICAL_DEVICE_PROPERTIES_2_EXTENSION_NAME,
623 VK_KHR_EXTERNAL_MEMORY_CAPABILITIES_EXTENSION_NAME,
624 };
625
626 VkInstanceCreateInfo ici = {};
627 ici.sType = VK_STRUCTURE_TYPE_INSTANCE_CREATE_INFO;
628 ici.pApplicationInfo = &ai;
629 ici.ppEnabledExtensionNames = extensions;
630 ici.enabledExtensionCount = ARRAY_SIZE(extensions);
631
632 VkInstance instance = VK_NULL_HANDLE;
633 VkResult err = vkCreateInstance(&ici, NULL, &instance);
634 if (err != VK_SUCCESS)
635 return VK_NULL_HANDLE;
636
637 return instance;
638 }
639
640 static VkPhysicalDevice
641 choose_pdev(const VkInstance instance)
642 {
643 uint32_t i, pdev_count;
644 VkPhysicalDevice *pdevs, pdev;
645 vkEnumeratePhysicalDevices(instance, &pdev_count, NULL);
646 assert(pdev_count > 0);
647
648 pdevs = malloc(sizeof(*pdevs) * pdev_count);
649 vkEnumeratePhysicalDevices(instance, &pdev_count, pdevs);
650 assert(pdev_count > 0);
651
652 pdev = pdevs[0];
653 for (i = 0; i < pdev_count; ++i) {
654 VkPhysicalDeviceProperties props;
655 vkGetPhysicalDeviceProperties(pdevs[i], &props);
656 if (props.deviceType == VK_PHYSICAL_DEVICE_TYPE_DISCRETE_GPU) {
657 pdev = pdevs[i];
658 break;
659 }
660 }
661 free(pdevs);
662 return pdev;
663 }
664
665 static void
666 update_queue_props(struct zink_screen *screen)
667 {
668 uint32_t num_queues;
669 vkGetPhysicalDeviceQueueFamilyProperties(screen->pdev, &num_queues, NULL);
670 assert(num_queues > 0);
671
672 VkQueueFamilyProperties *props = malloc(sizeof(*props) * num_queues);
673 vkGetPhysicalDeviceQueueFamilyProperties(screen->pdev, &num_queues, props);
674
675 for (uint32_t i = 0; i < num_queues; i++) {
676 if (props[i].queueFlags & VK_QUEUE_GRAPHICS_BIT) {
677 screen->gfx_queue = i;
678 screen->timestamp_valid_bits = props[i].timestampValidBits;
679 assert(screen->timestamp_valid_bits);
680 break;
681 }
682 }
683 free(props);
684 }
685
686 static void
687 zink_flush_frontbuffer(struct pipe_screen *pscreen,
688 struct pipe_resource *pres,
689 unsigned level, unsigned layer,
690 void *winsys_drawable_handle,
691 struct pipe_box *sub_box)
692 {
693 struct zink_screen *screen = zink_screen(pscreen);
694 struct sw_winsys *winsys = screen->winsys;
695 struct zink_resource *res = zink_resource(pres);
696
697 if (!winsys)
698 return;
699 void *map = winsys->displaytarget_map(winsys, res->dt, 0);
700
701 if (map) {
702 VkImageSubresource isr = {};
703 isr.aspectMask = res->aspect;
704 isr.mipLevel = level;
705 isr.arrayLayer = layer;
706 VkSubresourceLayout layout;
707 vkGetImageSubresourceLayout(screen->dev, res->image, &isr, &layout);
708
709 void *ptr;
710 VkResult result = vkMapMemory(screen->dev, res->mem, res->offset, res->size, 0, &ptr);
711 if (result != VK_SUCCESS) {
712 debug_printf("failed to map memory for display\n");
713 return;
714 }
715 for (int i = 0; i < pres->height0; ++i) {
716 uint8_t *src = (uint8_t *)ptr + i * layout.rowPitch;
717 uint8_t *dst = (uint8_t *)map + i * res->dt_stride;
718 memcpy(dst, src, res->dt_stride);
719 }
720 vkUnmapMemory(screen->dev, res->mem);
721 }
722
723 winsys->displaytarget_unmap(winsys, res->dt);
724
725 assert(res->dt);
726 if (res->dt)
727 winsys->displaytarget_display(winsys, res->dt, winsys_drawable_handle, sub_box);
728 }
729
730 static bool
731 load_device_extensions(struct zink_screen *screen)
732 {
733 #define GET_PROC_ADDR(x) do { \
734 screen->vk_##x = (PFN_vk##x)vkGetDeviceProcAddr(screen->dev, "vk"#x); \
735 if (!screen->vk_##x) \
736 return false; \
737 } while (0)
738
739 #define GET_PROC_ADDR_INSTANCE(x) do { \
740 screen->vk_##x = (PFN_vk##x)vkGetInstanceProcAddr(screen->instance, "vk"#x); \
741 if (!screen->vk_##x) { \
742 debug_printf("GetInstanceProcAddr failed: vk"#x"\n"); \
743 return false; \
744 } \
745 } while (0)
746 if (screen->have_EXT_transform_feedback) {
747 GET_PROC_ADDR(CmdBindTransformFeedbackBuffersEXT);
748 GET_PROC_ADDR(CmdBeginTransformFeedbackEXT);
749 GET_PROC_ADDR(CmdEndTransformFeedbackEXT);
750 GET_PROC_ADDR(CmdBeginQueryIndexedEXT);
751 GET_PROC_ADDR(CmdEndQueryIndexedEXT);
752 GET_PROC_ADDR(CmdDrawIndirectByteCountEXT);
753 }
754 if (screen->have_KHR_external_memory_fd)
755 GET_PROC_ADDR(GetMemoryFdKHR);
756
757 if (screen->have_EXT_conditional_rendering) {
758 GET_PROC_ADDR(CmdBeginConditionalRenderingEXT);
759 GET_PROC_ADDR(CmdEndConditionalRenderingEXT);
760 }
761
762 if (screen->have_EXT_calibrated_timestamps) {
763 GET_PROC_ADDR_INSTANCE(GetPhysicalDeviceCalibrateableTimeDomainsEXT);
764 GET_PROC_ADDR(GetCalibratedTimestampsEXT);
765
766 uint32_t num_domains = 0;
767 screen->vk_GetPhysicalDeviceCalibrateableTimeDomainsEXT(screen->pdev, &num_domains, NULL);
768 assert(num_domains > 0);
769
770 VkTimeDomainEXT *domains = malloc(sizeof(VkTimeDomainEXT) * num_domains);
771 screen->vk_GetPhysicalDeviceCalibrateableTimeDomainsEXT(screen->pdev, &num_domains, domains);
772
773 /* VK_TIME_DOMAIN_DEVICE_EXT is used for the ctx->get_timestamp hook and is the only one we really need */
774 bool have_device_time = false;
775 for (unsigned i = 0; i < num_domains; i++) {
776 if (domains[i] == VK_TIME_DOMAIN_DEVICE_EXT) {
777 have_device_time = true;
778 break;
779 }
780 }
781 assert(have_device_time);
782 free(domains);
783 }
784
785 #undef GET_PROC_ADDR
786
787 return true;
788 }
789
790 static struct pipe_screen *
791 zink_internal_create_screen(struct sw_winsys *winsys, int fd)
792 {
793 struct zink_screen *screen = CALLOC_STRUCT(zink_screen);
794 bool have_tf_ext = false, have_cond_render_ext = false, have_EXT_index_type_uint8 = false,
795 have_EXT_robustness2_features = false, have_EXT_vertex_attribute_divisor = false,
796 have_EXT_calibrated_timestamps = false;
797 if (!screen)
798 return NULL;
799
800 zink_debug = debug_get_option_zink_debug();
801
802 screen->instance = create_instance();
803 screen->pdev = choose_pdev(screen->instance);
804 update_queue_props(screen);
805
806 vkGetPhysicalDeviceMemoryProperties(screen->pdev, &screen->mem_props);
807
808 screen->have_X8_D24_UNORM_PACK32 = zink_is_depth_format_supported(screen,
809 VK_FORMAT_X8_D24_UNORM_PACK32);
810 screen->have_D24_UNORM_S8_UINT = zink_is_depth_format_supported(screen,
811 VK_FORMAT_D24_UNORM_S8_UINT);
812
813 uint32_t num_extensions = 0;
814 if (vkEnumerateDeviceExtensionProperties(screen->pdev, NULL,
815 &num_extensions, NULL) == VK_SUCCESS && num_extensions > 0) {
816 VkExtensionProperties *extensions = MALLOC(sizeof(VkExtensionProperties) *
817 num_extensions);
818 if (extensions) {
819 vkEnumerateDeviceExtensionProperties(screen->pdev, NULL,
820 &num_extensions, extensions);
821
822 for (uint32_t i = 0; i < num_extensions; ++i) {
823 if (!strcmp(extensions[i].extensionName,
824 VK_KHR_MAINTENANCE1_EXTENSION_NAME))
825 screen->have_KHR_maintenance1 = true;
826 if (!strcmp(extensions[i].extensionName,
827 VK_KHR_EXTERNAL_MEMORY_FD_EXTENSION_NAME))
828 screen->have_KHR_external_memory_fd = true;
829 if (!strcmp(extensions[i].extensionName,
830 VK_EXT_CONDITIONAL_RENDERING_EXTENSION_NAME))
831 have_cond_render_ext = true;
832 if (!strcmp(extensions[i].extensionName,
833 VK_EXT_TRANSFORM_FEEDBACK_EXTENSION_NAME))
834 have_tf_ext = true;
835 if (!strcmp(extensions[i].extensionName,
836 VK_EXT_INDEX_TYPE_UINT8_EXTENSION_NAME))
837 have_EXT_index_type_uint8 = true;
838 if (!strcmp(extensions[i].extensionName,
839 VK_EXT_ROBUSTNESS_2_EXTENSION_NAME))
840 have_EXT_robustness2_features = true;
841 if (!strcmp(extensions[i].extensionName,
842 VK_EXT_VERTEX_ATTRIBUTE_DIVISOR_EXTENSION_NAME))
843 have_EXT_vertex_attribute_divisor = true;
844 if (!strcmp(extensions[i].extensionName,
845 VK_EXT_CALIBRATED_TIMESTAMPS_EXTENSION_NAME))
846 have_EXT_calibrated_timestamps = true;
847
848 }
849 FREE(extensions);
850 }
851 }
852 VkPhysicalDeviceFeatures2 feats = {};
853 VkPhysicalDeviceTransformFeedbackFeaturesEXT tf_feats = {};
854 VkPhysicalDeviceConditionalRenderingFeaturesEXT cond_render_feats = {};
855 VkPhysicalDeviceIndexTypeUint8FeaturesEXT index_uint8_feats = {};
856
857 feats.sType = VK_STRUCTURE_TYPE_PHYSICAL_DEVICE_FEATURES_2;
858 if (have_tf_ext) {
859 tf_feats.sType = VK_STRUCTURE_TYPE_PHYSICAL_DEVICE_TRANSFORM_FEEDBACK_FEATURES_EXT;
860 tf_feats.pNext = feats.pNext;
861 feats.pNext = &tf_feats;
862 }
863 if (have_cond_render_ext) {
864 cond_render_feats.sType = VK_STRUCTURE_TYPE_PHYSICAL_DEVICE_CONDITIONAL_RENDERING_FEATURES_EXT;
865 cond_render_feats.pNext = feats.pNext;
866 feats.pNext = &cond_render_feats;
867 }
868 if (have_EXT_index_type_uint8) {
869 index_uint8_feats.sType = VK_STRUCTURE_TYPE_PHYSICAL_DEVICE_INDEX_TYPE_UINT8_FEATURES_EXT;
870 index_uint8_feats.pNext = feats.pNext;
871 feats.pNext = &index_uint8_feats;
872 }
873 if (have_EXT_robustness2_features) {
874 screen->rb2_feats.sType = VK_STRUCTURE_TYPE_PHYSICAL_DEVICE_ROBUSTNESS_2_FEATURES_EXT;
875 screen->rb2_feats.pNext = feats.pNext;
876 feats.pNext = &screen->rb2_feats;
877 }
878 if (have_EXT_vertex_attribute_divisor) {
879 screen->vdiv_feats.sType = VK_STRUCTURE_TYPE_PHYSICAL_DEVICE_VERTEX_ATTRIBUTE_DIVISOR_FEATURES_EXT;
880 screen->vdiv_feats.pNext = feats.pNext;
881 feats.pNext = &screen->vdiv_feats;
882 }
883 vkGetPhysicalDeviceFeatures2(screen->pdev, &feats);
884 memcpy(&screen->feats, &feats.features, sizeof(screen->feats));
885 if (have_tf_ext && tf_feats.transformFeedback)
886 screen->have_EXT_transform_feedback = true;
887 if (have_cond_render_ext && cond_render_feats.conditionalRendering)
888 screen->have_EXT_conditional_rendering = true;
889 if (have_EXT_index_type_uint8 && index_uint8_feats.indexTypeUint8)
890 screen->have_EXT_index_type_uint8 = true;
891 screen->have_EXT_robustness2_features = have_EXT_robustness2_features;
892 if (have_EXT_vertex_attribute_divisor && screen->vdiv_feats.vertexAttributeInstanceRateDivisor)
893 screen->have_EXT_vertex_attribute_divisor = true;
894 screen->have_EXT_calibrated_timestamps = have_EXT_calibrated_timestamps;
895
896 VkPhysicalDeviceProperties2 props = {};
897 VkPhysicalDeviceVertexAttributeDivisorPropertiesEXT vdiv_props = {};
898 props.sType = VK_STRUCTURE_TYPE_PHYSICAL_DEVICE_PROPERTIES_2;
899 if (screen->have_EXT_transform_feedback) {
900 screen->tf_props.sType = VK_STRUCTURE_TYPE_PHYSICAL_DEVICE_TRANSFORM_FEEDBACK_PROPERTIES_EXT;
901 screen->tf_props.pNext = props.pNext;
902 props.pNext = &screen->tf_props;
903 }
904 if (have_EXT_robustness2_features) {
905 screen->rb2_props.sType = VK_STRUCTURE_TYPE_PHYSICAL_DEVICE_ROBUSTNESS_2_PROPERTIES_EXT;
906 screen->rb2_props.pNext = props.pNext;
907 props.pNext = &screen->rb2_props;
908 }
909 if (have_EXT_vertex_attribute_divisor) {
910 vdiv_props.sType = VK_STRUCTURE_TYPE_PHYSICAL_DEVICE_VERTEX_ATTRIBUTE_DIVISOR_PROPERTIES_EXT;
911 vdiv_props.pNext = props.pNext;
912 props.pNext = &vdiv_props;
913 }
914 vkGetPhysicalDeviceProperties2(screen->pdev, &props);
915 memcpy(&screen->props, &props.properties, sizeof(screen->props));
916 screen->max_vertex_attrib_divisor = vdiv_props.maxVertexAttribDivisor;
917
918 if (!screen->have_KHR_maintenance1) {
919 debug_printf("ZINK: VK_KHR_maintenance1 required!\n");
920 goto fail;
921 }
922
923 VkDeviceQueueCreateInfo qci = {};
924 float dummy = 0.0f;
925 qci.sType = VK_STRUCTURE_TYPE_DEVICE_QUEUE_CREATE_INFO;
926 qci.queueFamilyIndex = screen->gfx_queue;
927 qci.queueCount = 1;
928 qci.pQueuePriorities = &dummy;
929
930 VkDeviceCreateInfo dci = {};
931 dci.sType = VK_STRUCTURE_TYPE_DEVICE_CREATE_INFO;
932 dci.queueCreateInfoCount = 1;
933 dci.pQueueCreateInfos = &qci;
934 /* extensions don't have bool members in pEnabledFeatures.
935 * this requires us to pass the whole VkPhysicalDeviceFeatures2 struct
936 */
937 dci.pNext = &feats;
938 const char *extensions[9] = {
939 VK_KHR_MAINTENANCE1_EXTENSION_NAME,
940 };
941 num_extensions = 1;
942
943 if (fd >= 0 && !screen->have_KHR_external_memory_fd) {
944 debug_printf("ZINK: KHR_external_memory_fd required!\n");
945 goto fail;
946 }
947
948 if (screen->have_KHR_external_memory_fd) {
949 extensions[num_extensions++] = VK_KHR_EXTERNAL_MEMORY_EXTENSION_NAME;
950 extensions[num_extensions++] = VK_KHR_EXTERNAL_MEMORY_FD_EXTENSION_NAME;
951 }
952
953 if (screen->have_EXT_conditional_rendering)
954 extensions[num_extensions++] = VK_EXT_CONDITIONAL_RENDERING_EXTENSION_NAME;
955
956 if (screen->have_EXT_index_type_uint8)
957 extensions[num_extensions++] = VK_EXT_INDEX_TYPE_UINT8_EXTENSION_NAME;
958
959 if (screen->have_EXT_transform_feedback)
960 extensions[num_extensions++] = VK_EXT_TRANSFORM_FEEDBACK_EXTENSION_NAME;
961 if (screen->have_EXT_robustness2_features)
962 extensions[num_extensions++] = VK_EXT_ROBUSTNESS_2_EXTENSION_NAME;
963 if (screen->have_EXT_vertex_attribute_divisor)
964 extensions[num_extensions++] = VK_EXT_VERTEX_ATTRIBUTE_DIVISOR_EXTENSION_NAME;
965 if (screen->have_EXT_calibrated_timestamps)
966 extensions[num_extensions++] = VK_EXT_CALIBRATED_TIMESTAMPS_EXTENSION_NAME;
967 assert(num_extensions <= ARRAY_SIZE(extensions));
968
969 dci.ppEnabledExtensionNames = extensions;
970 dci.enabledExtensionCount = num_extensions;
971 if (vkCreateDevice(screen->pdev, &dci, NULL, &screen->dev) != VK_SUCCESS)
972 goto fail;
973
974 if (!load_device_extensions(screen))
975 goto fail;
976
977 screen->winsys = winsys;
978
979 screen->base.get_name = zink_get_name;
980 screen->base.get_vendor = zink_get_vendor;
981 screen->base.get_device_vendor = zink_get_device_vendor;
982 screen->base.get_param = zink_get_param;
983 screen->base.get_paramf = zink_get_paramf;
984 screen->base.get_shader_param = zink_get_shader_param;
985 screen->base.get_compiler_options = zink_get_compiler_options;
986 screen->base.is_format_supported = zink_is_format_supported;
987 screen->base.context_create = zink_context_create;
988 screen->base.flush_frontbuffer = zink_flush_frontbuffer;
989 screen->base.destroy = zink_destroy_screen;
990
991 zink_screen_resource_init(&screen->base);
992 zink_screen_fence_init(&screen->base);
993
994 slab_create_parent(&screen->transfer_pool, sizeof(struct zink_transfer), 16);
995
996 return &screen->base;
997
998 fail:
999 FREE(screen);
1000 return NULL;
1001 }
1002
1003 struct pipe_screen *
1004 zink_create_screen(struct sw_winsys *winsys)
1005 {
1006 return zink_internal_create_screen(winsys, -1);
1007 }
1008
1009 struct pipe_screen *
1010 zink_drm_create_screen(int fd)
1011 {
1012 return zink_internal_create_screen(NULL, fd);
1013 }