64ea00786d02aad4ae1af0011d8efaee94cc0c6e
[mesa.git] / src / gallium / drivers / zink / zink_screen.c
1 /*
2 * Copyright 2018 Collabora Ltd.
3 *
4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * on the rights to use, copy, modify, merge, publish, distribute, sub
8 * license, and/or sell copies of the Software, and to permit persons to whom
9 * the Software is furnished to do so, subject to the following conditions:
10 *
11 * The above copyright notice and this permission notice (including the next
12 * paragraph) shall be included in all copies or substantial portions of the
13 * Software.
14 *
15 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17 * FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. IN NO EVENT SHALL
18 * THE AUTHOR(S) AND/OR THEIR SUPPLIERS BE LIABLE FOR ANY CLAIM,
19 * DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR
20 * OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE
21 * USE OR OTHER DEALINGS IN THE SOFTWARE.
22 */
23
24 #include "zink_screen.h"
25
26 #include "zink_compiler.h"
27 #include "zink_context.h"
28 #include "zink_fence.h"
29 #include "zink_public.h"
30 #include "zink_resource.h"
31
32 #include "os/os_process.h"
33 #include "util/u_debug.h"
34 #include "util/format/u_format.h"
35 #include "util/u_math.h"
36 #include "util/u_memory.h"
37 #include "util/u_screen.h"
38 #include "util/u_string.h"
39
40 #include "frontend/sw_winsys.h"
41
42 static const struct debug_named_value
43 debug_options[] = {
44 { "nir", ZINK_DEBUG_NIR, "Dump NIR during program compile" },
45 { "spirv", ZINK_DEBUG_SPIRV, "Dump SPIR-V during program compile" },
46 { "tgsi", ZINK_DEBUG_TGSI, "Dump TGSI during program compile" },
47 DEBUG_NAMED_VALUE_END
48 };
49
50 DEBUG_GET_ONCE_FLAGS_OPTION(zink_debug, "ZINK_DEBUG", debug_options, 0)
51
52 uint32_t
53 zink_debug;
54
55 static const char *
56 zink_get_vendor(struct pipe_screen *pscreen)
57 {
58 return "Collabora Ltd";
59 }
60
61 static const char *
62 zink_get_device_vendor(struct pipe_screen *pscreen)
63 {
64 struct zink_screen *screen = zink_screen(pscreen);
65 static char buf[1000];
66 snprintf(buf, sizeof(buf), "Unknown (vendor-id: 0x%04x)", screen->props.vendorID);
67 return buf;
68 }
69
70 static const char *
71 zink_get_name(struct pipe_screen *pscreen)
72 {
73 struct zink_screen *screen = zink_screen(pscreen);
74 static char buf[1000];
75 snprintf(buf, sizeof(buf), "zink (%s)", screen->props.deviceName);
76 return buf;
77 }
78
79 static int
80 get_video_mem(struct zink_screen *screen)
81 {
82 VkDeviceSize size = 0;
83 for (uint32_t i = 0; i < screen->mem_props.memoryHeapCount; ++i) {
84 if (screen->mem_props.memoryHeaps[i].flags &
85 VK_MEMORY_HEAP_DEVICE_LOCAL_BIT)
86 size += screen->mem_props.memoryHeaps[i].size;
87 }
88 return (int)(size >> 20);
89 }
90
91 static int
92 zink_get_param(struct pipe_screen *pscreen, enum pipe_cap param)
93 {
94 struct zink_screen *screen = zink_screen(pscreen);
95
96 switch (param) {
97 case PIPE_CAP_NPOT_TEXTURES:
98 case PIPE_CAP_TGSI_TEXCOORD:
99 return 1;
100
101 case PIPE_CAP_MAX_DUAL_SOURCE_RENDER_TARGETS:
102 if (!screen->feats.dualSrcBlend)
103 return 0;
104 return screen->props.limits.maxFragmentDualSrcAttachments;
105
106 case PIPE_CAP_POINT_SPRITE:
107 return 1;
108
109 case PIPE_CAP_MAX_RENDER_TARGETS:
110 return screen->props.limits.maxColorAttachments;
111
112 case PIPE_CAP_OCCLUSION_QUERY:
113 return 1;
114
115 #if 0 /* TODO: Enable me */
116 case PIPE_CAP_QUERY_TIME_ELAPSED:
117 return 1;
118 #endif
119
120 case PIPE_CAP_TEXTURE_MULTISAMPLE:
121 return 1;
122
123 case PIPE_CAP_TEXTURE_SWIZZLE:
124 return 1;
125
126 case PIPE_CAP_MAX_TEXTURE_2D_SIZE:
127 return screen->props.limits.maxImageDimension2D;
128 case PIPE_CAP_MAX_TEXTURE_3D_LEVELS:
129 return 1 + util_logbase2(screen->props.limits.maxImageDimension3D);
130 case PIPE_CAP_MAX_TEXTURE_CUBE_LEVELS:
131 return 1 + util_logbase2(screen->props.limits.maxImageDimensionCube);
132
133 case PIPE_CAP_BLEND_EQUATION_SEPARATE:
134 case PIPE_CAP_FRAGMENT_SHADER_TEXTURE_LOD:
135 case PIPE_CAP_FRAGMENT_SHADER_DERIVATIVES:
136 case PIPE_CAP_VERTEX_SHADER_SATURATE:
137 return 1;
138
139 case PIPE_CAP_INDEP_BLEND_ENABLE:
140 case PIPE_CAP_INDEP_BLEND_FUNC:
141 return 1;
142
143 case PIPE_CAP_MAX_STREAM_OUTPUT_BUFFERS:
144 return screen->have_EXT_transform_feedback ? screen->tf_props.maxTransformFeedbackBuffers : 0;
145 case PIPE_CAP_STREAM_OUTPUT_PAUSE_RESUME:
146 case PIPE_CAP_STREAM_OUTPUT_INTERLEAVE_BUFFERS:
147 return 1;
148
149 case PIPE_CAP_MAX_TEXTURE_ARRAY_LAYERS:
150 return screen->props.limits.maxImageArrayLayers;
151
152 case PIPE_CAP_DEPTH_CLIP_DISABLE:
153 return screen->feats.depthClamp;
154
155 case PIPE_CAP_TGSI_INSTANCEID:
156 case PIPE_CAP_MIXED_COLORBUFFER_FORMATS:
157 case PIPE_CAP_SEAMLESS_CUBE_MAP:
158 return 1;
159
160 case PIPE_CAP_MIN_TEXEL_OFFSET:
161 return screen->props.limits.minTexelOffset;
162 case PIPE_CAP_MAX_TEXEL_OFFSET:
163 return screen->props.limits.maxTexelOffset;
164
165 case PIPE_CAP_VERTEX_COLOR_UNCLAMPED:
166 return 1;
167
168 case PIPE_CAP_CONDITIONAL_RENDER:
169 return screen->have_EXT_conditional_rendering;
170
171 case PIPE_CAP_GLSL_FEATURE_LEVEL:
172 case PIPE_CAP_GLSL_FEATURE_LEVEL_COMPATIBILITY:
173 return 130;
174
175 #if 0 /* TODO: Enable me */
176 case PIPE_CAP_COMPUTE:
177 return 1;
178 #endif
179
180 case PIPE_CAP_CONSTANT_BUFFER_OFFSET_ALIGNMENT:
181 return screen->props.limits.minUniformBufferOffsetAlignment;
182
183 #if 0 /* TODO: Enable me */
184 case PIPE_CAP_QUERY_TIMESTAMP:
185 return 1;
186 #endif
187
188 case PIPE_CAP_MIN_MAP_BUFFER_ALIGNMENT:
189 return screen->props.limits.minMemoryMapAlignment;
190
191 case PIPE_CAP_CUBE_MAP_ARRAY:
192 return screen->feats.imageCubeArray;
193
194 case PIPE_CAP_TEXTURE_BUFFER_OBJECTS:
195 return 1;
196
197 case PIPE_CAP_TEXTURE_BUFFER_OFFSET_ALIGNMENT:
198 return screen->props.limits.minTexelBufferOffsetAlignment;
199
200 case PIPE_CAP_PREFER_BLIT_BASED_TEXTURE_TRANSFER:
201 return 0; /* unsure */
202
203 case PIPE_CAP_MAX_TEXTURE_BUFFER_SIZE:
204 return screen->props.limits.maxTexelBufferElements;
205
206 case PIPE_CAP_ENDIANNESS:
207 return PIPE_ENDIAN_NATIVE; /* unsure */
208
209 case PIPE_CAP_MAX_VIEWPORTS:
210 return 1; /* TODO: When GS is supported, use screen->props.limits.maxViewports */
211
212 case PIPE_CAP_MIXED_FRAMEBUFFER_SIZES:
213 return 1;
214
215 case PIPE_CAP_MAX_GEOMETRY_OUTPUT_VERTICES:
216 return screen->props.limits.maxGeometryOutputVertices;
217 case PIPE_CAP_MAX_GEOMETRY_TOTAL_OUTPUT_COMPONENTS:
218 return screen->props.limits.maxGeometryOutputComponents;
219
220 #if 0 /* TODO: Enable me. Enables ARB_texture_gather */
221 case PIPE_CAP_MAX_TEXTURE_GATHER_COMPONENTS:
222 return 4;
223 #endif
224
225 case PIPE_CAP_MIN_TEXTURE_GATHER_OFFSET:
226 return screen->props.limits.minTexelGatherOffset;
227 case PIPE_CAP_MAX_TEXTURE_GATHER_OFFSET:
228 return screen->props.limits.maxTexelGatherOffset;
229
230 case PIPE_CAP_TGSI_FS_FINE_DERIVATIVE:
231 return 1;
232
233 case PIPE_CAP_VENDOR_ID:
234 return screen->props.vendorID;
235 case PIPE_CAP_DEVICE_ID:
236 return screen->props.deviceID;
237
238 case PIPE_CAP_ACCELERATED:
239 return 1;
240 case PIPE_CAP_VIDEO_MEMORY:
241 return get_video_mem(screen);
242 case PIPE_CAP_UMA:
243 return screen->props.deviceType == VK_PHYSICAL_DEVICE_TYPE_INTEGRATED_GPU;
244
245 case PIPE_CAP_MAX_VERTEX_ATTRIB_STRIDE:
246 return screen->props.limits.maxVertexInputBindingStride;
247
248 #if 0 /* TODO: Enable me */
249 case PIPE_CAP_SAMPLER_VIEW_TARGET:
250 return 1;
251 #endif
252
253 #if 0 /* TODO: Enable me */
254 case PIPE_CAP_CLIP_HALFZ:
255 return 1;
256 #endif
257
258 #if 0 /* TODO: Enable me */
259 case PIPE_CAP_TEXTURE_FLOAT_LINEAR:
260 case PIPE_CAP_TEXTURE_HALF_FLOAT_LINEAR:
261 return 1;
262 #endif
263
264 case PIPE_CAP_SHAREABLE_SHADERS:
265 return 1;
266
267 #if 0 /* TODO: Enable me. Enables GL_ARB_shader_storage_buffer_object */
268 case PIPE_CAP_SHADER_BUFFER_OFFSET_ALIGNMENT:
269 return screen->props.limits.minStorageBufferOffsetAlignment;
270 #endif
271
272 case PIPE_CAP_PCI_GROUP:
273 case PIPE_CAP_PCI_BUS:
274 case PIPE_CAP_PCI_DEVICE:
275 case PIPE_CAP_PCI_FUNCTION:
276 return 0; /* TODO: figure these out */
277
278 case PIPE_CAP_CULL_DISTANCE:
279 return screen->feats.shaderCullDistance;
280
281 case PIPE_CAP_VIEWPORT_SUBPIXEL_BITS:
282 return screen->props.limits.viewportSubPixelBits;
283
284 case PIPE_CAP_GLSL_OPTIMIZE_CONSERVATIVELY:
285 return 0; /* not sure */
286
287 case PIPE_CAP_MAX_GS_INVOCATIONS:
288 return 0; /* not implemented */
289
290 case PIPE_CAP_MAX_COMBINED_SHADER_BUFFERS:
291 return screen->props.limits.maxDescriptorSetStorageBuffers;
292
293 case PIPE_CAP_MAX_SHADER_BUFFER_SIZE:
294 return screen->props.limits.maxStorageBufferRange; /* unsure */
295
296 case PIPE_CAP_TGSI_FS_COORD_ORIGIN_UPPER_LEFT:
297 case PIPE_CAP_TGSI_FS_COORD_PIXEL_CENTER_HALF_INTEGER:
298 return 1;
299
300 case PIPE_CAP_TGSI_FS_COORD_ORIGIN_LOWER_LEFT:
301 case PIPE_CAP_TGSI_FS_COORD_PIXEL_CENTER_INTEGER:
302 return 0;
303
304 case PIPE_CAP_BUFFER_MAP_PERSISTENT_COHERENT:
305 return 0;
306
307 case PIPE_CAP_NIR_COMPACT_ARRAYS:
308 return 1;
309
310 case PIPE_CAP_TGSI_FS_FACE_IS_INTEGER_SYSVAL:
311 return 1;
312
313 case PIPE_CAP_VIEWPORT_TRANSFORM_LOWERED:
314 return 1;
315
316 case PIPE_CAP_FLATSHADE:
317 case PIPE_CAP_ALPHA_TEST:
318 case PIPE_CAP_CLIP_PLANES:
319 case PIPE_CAP_POINT_SIZE_FIXED:
320 case PIPE_CAP_TWO_SIDED_COLOR:
321 return 0;
322
323 case PIPE_CAP_DMABUF:
324 return screen->have_KHR_external_memory_fd;
325
326 default:
327 return u_pipe_screen_get_param_defaults(pscreen, param);
328 }
329 }
330
331 static float
332 zink_get_paramf(struct pipe_screen *pscreen, enum pipe_capf param)
333 {
334 struct zink_screen *screen = zink_screen(pscreen);
335
336 switch (param) {
337 case PIPE_CAPF_MAX_LINE_WIDTH:
338 case PIPE_CAPF_MAX_LINE_WIDTH_AA:
339 return screen->props.limits.lineWidthRange[1];
340
341 case PIPE_CAPF_MAX_POINT_WIDTH:
342 case PIPE_CAPF_MAX_POINT_WIDTH_AA:
343 return screen->props.limits.pointSizeRange[1];
344
345 case PIPE_CAPF_MAX_TEXTURE_ANISOTROPY:
346 return screen->props.limits.maxSamplerAnisotropy;
347
348 case PIPE_CAPF_MAX_TEXTURE_LOD_BIAS:
349 return screen->props.limits.maxSamplerLodBias;
350
351 case PIPE_CAPF_MIN_CONSERVATIVE_RASTER_DILATE:
352 case PIPE_CAPF_MAX_CONSERVATIVE_RASTER_DILATE:
353 case PIPE_CAPF_CONSERVATIVE_RASTER_DILATE_GRANULARITY:
354 return 0.0f; /* not implemented */
355 }
356
357 /* should only get here on unhandled cases */
358 return 0.0;
359 }
360
361 static int
362 zink_get_shader_param(struct pipe_screen *pscreen,
363 enum pipe_shader_type shader,
364 enum pipe_shader_cap param)
365 {
366 struct zink_screen *screen = zink_screen(pscreen);
367
368 switch (param) {
369 case PIPE_SHADER_CAP_MAX_INSTRUCTIONS:
370 case PIPE_SHADER_CAP_MAX_ALU_INSTRUCTIONS:
371 case PIPE_SHADER_CAP_MAX_TEX_INSTRUCTIONS:
372 case PIPE_SHADER_CAP_MAX_TEX_INDIRECTIONS:
373 case PIPE_SHADER_CAP_MAX_CONTROL_FLOW_DEPTH:
374 if (shader == PIPE_SHADER_VERTEX ||
375 shader == PIPE_SHADER_FRAGMENT)
376 return INT_MAX;
377 return 0;
378
379 case PIPE_SHADER_CAP_MAX_INPUTS:
380 switch (shader) {
381 case PIPE_SHADER_VERTEX:
382 return MIN2(screen->props.limits.maxVertexInputAttributes,
383 PIPE_MAX_SHADER_INPUTS);
384 case PIPE_SHADER_FRAGMENT:
385 return MIN2(screen->props.limits.maxFragmentInputComponents / 4,
386 PIPE_MAX_SHADER_INPUTS);
387 default:
388 return 0; /* unsupported stage */
389 }
390
391 case PIPE_SHADER_CAP_MAX_OUTPUTS:
392 switch (shader) {
393 case PIPE_SHADER_VERTEX:
394 return MIN2(screen->props.limits.maxVertexOutputComponents / 4,
395 PIPE_MAX_SHADER_OUTPUTS);
396 case PIPE_SHADER_FRAGMENT:
397 return MIN2(screen->props.limits.maxColorAttachments,
398 PIPE_MAX_SHADER_OUTPUTS);
399 default:
400 return 0; /* unsupported stage */
401 }
402
403 case PIPE_SHADER_CAP_MAX_TEXTURE_SAMPLERS:
404 switch (shader) {
405 case PIPE_SHADER_VERTEX:
406 case PIPE_SHADER_FRAGMENT:
407 /* this might be a bit simplistic... */
408 return MIN2(screen->props.limits.maxPerStageDescriptorSamplers,
409 PIPE_MAX_SAMPLERS);
410 default:
411 return 0; /* unsupported stage */
412 }
413
414 case PIPE_SHADER_CAP_MAX_CONST_BUFFER_SIZE:
415 return MIN2(screen->props.limits.maxUniformBufferRange, INT_MAX);
416
417 case PIPE_SHADER_CAP_MAX_CONST_BUFFERS:
418 return screen->props.limits.maxPerStageDescriptorUniformBuffers;
419
420 case PIPE_SHADER_CAP_MAX_TEMPS:
421 return INT_MAX;
422
423 case PIPE_SHADER_CAP_INTEGERS:
424 return 1;
425
426 case PIPE_SHADER_CAP_INDIRECT_INPUT_ADDR:
427 case PIPE_SHADER_CAP_INDIRECT_OUTPUT_ADDR:
428 case PIPE_SHADER_CAP_INDIRECT_TEMP_ADDR:
429 case PIPE_SHADER_CAP_INDIRECT_CONST_ADDR:
430 case PIPE_SHADER_CAP_SUBROUTINES:
431 case PIPE_SHADER_CAP_INT64_ATOMICS:
432 case PIPE_SHADER_CAP_FP16:
433 case PIPE_SHADER_CAP_FP16_DERIVATIVES:
434 case PIPE_SHADER_CAP_INT16:
435 case PIPE_SHADER_CAP_GLSL_16BIT_TEMPS:
436 return 0; /* not implemented */
437
438 case PIPE_SHADER_CAP_PREFERRED_IR:
439 return PIPE_SHADER_IR_NIR;
440
441 case PIPE_SHADER_CAP_TGSI_SQRT_SUPPORTED:
442 return 0; /* not implemented */
443
444 case PIPE_SHADER_CAP_MAX_SAMPLER_VIEWS:
445 return MIN2(screen->props.limits.maxPerStageDescriptorSampledImages,
446 PIPE_MAX_SHADER_SAMPLER_VIEWS);
447
448 case PIPE_SHADER_CAP_TGSI_DROUND_SUPPORTED:
449 case PIPE_SHADER_CAP_TGSI_DFRACEXP_DLDEXP_SUPPORTED:
450 case PIPE_SHADER_CAP_TGSI_FMA_SUPPORTED:
451 return 0; /* not implemented */
452
453 case PIPE_SHADER_CAP_TGSI_ANY_INOUT_DECL_RANGE:
454 return 0; /* no idea */
455
456 case PIPE_SHADER_CAP_MAX_UNROLL_ITERATIONS_HINT:
457 return 32; /* arbitrary */
458
459 case PIPE_SHADER_CAP_MAX_SHADER_BUFFERS:
460 /* TODO: this limitation is dumb, and will need some fixes in mesa */
461 return MIN2(screen->props.limits.maxPerStageDescriptorStorageBuffers, PIPE_MAX_SHADER_BUFFERS);
462
463 case PIPE_SHADER_CAP_SUPPORTED_IRS:
464 return (1 << PIPE_SHADER_IR_NIR) | (1 << PIPE_SHADER_IR_TGSI);
465
466 case PIPE_SHADER_CAP_MAX_SHADER_IMAGES:
467 #if 0 /* TODO: needs compiler support */
468 return MIN2(screen->props.limits.maxPerStageDescriptorStorageImages,
469 PIPE_MAX_SHADER_IMAGES);
470 #else
471 return 0;
472 #endif
473
474 case PIPE_SHADER_CAP_LOWER_IF_THRESHOLD:
475 case PIPE_SHADER_CAP_TGSI_SKIP_MERGE_REGISTERS:
476 return 0; /* unsure */
477
478 case PIPE_SHADER_CAP_TGSI_LDEXP_SUPPORTED:
479 case PIPE_SHADER_CAP_MAX_HW_ATOMIC_COUNTERS:
480 case PIPE_SHADER_CAP_MAX_HW_ATOMIC_COUNTER_BUFFERS:
481 case PIPE_SHADER_CAP_TGSI_CONT_SUPPORTED:
482 return 0; /* not implemented */
483 }
484
485 /* should only get here on unhandled cases */
486 return 0;
487 }
488
489 static VkSampleCountFlagBits
490 vk_sample_count_flags(uint32_t sample_count)
491 {
492 switch (sample_count) {
493 case 1: return VK_SAMPLE_COUNT_1_BIT;
494 case 2: return VK_SAMPLE_COUNT_2_BIT;
495 case 4: return VK_SAMPLE_COUNT_4_BIT;
496 case 8: return VK_SAMPLE_COUNT_8_BIT;
497 case 16: return VK_SAMPLE_COUNT_16_BIT;
498 case 32: return VK_SAMPLE_COUNT_32_BIT;
499 case 64: return VK_SAMPLE_COUNT_64_BIT;
500 default:
501 return 0;
502 }
503 }
504
505 static bool
506 zink_is_format_supported(struct pipe_screen *pscreen,
507 enum pipe_format format,
508 enum pipe_texture_target target,
509 unsigned sample_count,
510 unsigned storage_sample_count,
511 unsigned bind)
512 {
513 struct zink_screen *screen = zink_screen(pscreen);
514
515 if (format == PIPE_FORMAT_NONE)
516 return screen->props.limits.framebufferNoAttachmentsSampleCounts &
517 vk_sample_count_flags(sample_count);
518
519 VkFormat vkformat = zink_get_format(screen, format);
520 if (vkformat == VK_FORMAT_UNDEFINED)
521 return false;
522
523 if (sample_count >= 1) {
524 VkSampleCountFlagBits sample_mask = vk_sample_count_flags(sample_count);
525 if (!sample_mask)
526 return false;
527 const struct util_format_description *desc = util_format_description(format);
528 if (util_format_is_depth_or_stencil(format)) {
529 if (util_format_has_depth(desc)) {
530 if (bind & PIPE_BIND_DEPTH_STENCIL &&
531 (screen->props.limits.framebufferDepthSampleCounts & sample_mask) != sample_mask)
532 return false;
533 if (bind & PIPE_BIND_SAMPLER_VIEW &&
534 (screen->props.limits.sampledImageDepthSampleCounts & sample_mask) != sample_mask)
535 return false;
536 }
537 if (util_format_has_stencil(desc)) {
538 if (bind & PIPE_BIND_DEPTH_STENCIL &&
539 (screen->props.limits.framebufferStencilSampleCounts & sample_mask) != sample_mask)
540 return false;
541 if (bind & PIPE_BIND_SAMPLER_VIEW &&
542 (screen->props.limits.sampledImageStencilSampleCounts & sample_mask) != sample_mask)
543 return false;
544 }
545 } else if (util_format_is_pure_integer(format)) {
546 if (bind & PIPE_BIND_RENDER_TARGET &&
547 !(screen->props.limits.framebufferColorSampleCounts & sample_mask))
548 return false;
549 if (bind & PIPE_BIND_SAMPLER_VIEW &&
550 !(screen->props.limits.sampledImageIntegerSampleCounts & sample_mask))
551 return false;
552 } else {
553 if (bind & PIPE_BIND_RENDER_TARGET &&
554 !(screen->props.limits.framebufferColorSampleCounts & sample_mask))
555 return false;
556 if (bind & PIPE_BIND_SAMPLER_VIEW &&
557 !(screen->props.limits.sampledImageColorSampleCounts & sample_mask))
558 return false;
559 }
560 }
561
562 VkFormatProperties props;
563 vkGetPhysicalDeviceFormatProperties(screen->pdev, vkformat, &props);
564
565 if (target == PIPE_BUFFER) {
566 if (bind & PIPE_BIND_VERTEX_BUFFER &&
567 !(props.bufferFeatures & VK_FORMAT_FEATURE_VERTEX_BUFFER_BIT))
568 return false;
569 } else {
570 /* all other targets are texture-targets */
571 if (bind & PIPE_BIND_RENDER_TARGET &&
572 !(props.optimalTilingFeatures & VK_FORMAT_FEATURE_COLOR_ATTACHMENT_BIT))
573 return false;
574
575 if (bind & PIPE_BIND_BLENDABLE &&
576 !(props.optimalTilingFeatures & VK_FORMAT_FEATURE_COLOR_ATTACHMENT_BLEND_BIT))
577 return false;
578
579 if (bind & PIPE_BIND_SAMPLER_VIEW &&
580 !(props.optimalTilingFeatures & VK_FORMAT_FEATURE_SAMPLED_IMAGE_BIT))
581 return false;
582
583 if (bind & PIPE_BIND_DEPTH_STENCIL &&
584 !(props.optimalTilingFeatures & VK_FORMAT_FEATURE_DEPTH_STENCIL_ATTACHMENT_BIT))
585 return false;
586 }
587
588 if (util_format_is_compressed(format)) {
589 const struct util_format_description *desc = util_format_description(format);
590 if (desc->layout == UTIL_FORMAT_LAYOUT_BPTC &&
591 !screen->feats.textureCompressionBC)
592 return false;
593 }
594
595 return true;
596 }
597
598 static void
599 zink_destroy_screen(struct pipe_screen *pscreen)
600 {
601 struct zink_screen *screen = zink_screen(pscreen);
602 slab_destroy_parent(&screen->transfer_pool);
603 FREE(screen);
604 }
605
606 static VkInstance
607 create_instance()
608 {
609 VkApplicationInfo ai = {};
610 ai.sType = VK_STRUCTURE_TYPE_APPLICATION_INFO;
611
612 char proc_name[128];
613 if (os_get_process_name(proc_name, ARRAY_SIZE(proc_name)))
614 ai.pApplicationName = proc_name;
615 else
616 ai.pApplicationName = "unknown";
617
618 ai.pEngineName = "mesa zink";
619 ai.apiVersion = VK_API_VERSION_1_0;
620
621 const char *extensions[] = {
622 VK_KHR_GET_PHYSICAL_DEVICE_PROPERTIES_2_EXTENSION_NAME,
623 VK_KHR_EXTERNAL_MEMORY_CAPABILITIES_EXTENSION_NAME,
624 };
625
626 VkInstanceCreateInfo ici = {};
627 ici.sType = VK_STRUCTURE_TYPE_INSTANCE_CREATE_INFO;
628 ici.pApplicationInfo = &ai;
629 ici.ppEnabledExtensionNames = extensions;
630 ici.enabledExtensionCount = ARRAY_SIZE(extensions);
631
632 VkInstance instance = VK_NULL_HANDLE;
633 VkResult err = vkCreateInstance(&ici, NULL, &instance);
634 if (err != VK_SUCCESS)
635 return VK_NULL_HANDLE;
636
637 return instance;
638 }
639
640 static VkPhysicalDevice
641 choose_pdev(const VkInstance instance)
642 {
643 uint32_t i, pdev_count;
644 VkPhysicalDevice *pdevs, pdev;
645 vkEnumeratePhysicalDevices(instance, &pdev_count, NULL);
646 assert(pdev_count > 0);
647
648 pdevs = malloc(sizeof(*pdevs) * pdev_count);
649 vkEnumeratePhysicalDevices(instance, &pdev_count, pdevs);
650 assert(pdev_count > 0);
651
652 pdev = pdevs[0];
653 for (i = 0; i < pdev_count; ++i) {
654 VkPhysicalDeviceProperties props;
655 vkGetPhysicalDeviceProperties(pdevs[i], &props);
656 if (props.deviceType == VK_PHYSICAL_DEVICE_TYPE_DISCRETE_GPU) {
657 pdev = pdevs[i];
658 break;
659 }
660 }
661 free(pdevs);
662 return pdev;
663 }
664
665 static uint32_t
666 find_gfx_queue(const VkPhysicalDevice pdev)
667 {
668 uint32_t num_queues;
669 vkGetPhysicalDeviceQueueFamilyProperties(pdev, &num_queues, NULL);
670 assert(num_queues > 0);
671
672 VkQueueFamilyProperties *props = malloc(sizeof(*props) * num_queues);
673 vkGetPhysicalDeviceQueueFamilyProperties(pdev, &num_queues, props);
674
675 for (uint32_t i = 0; i < num_queues; i++) {
676 if (props[i].queueFlags & VK_QUEUE_GRAPHICS_BIT) {
677 free(props);
678 return i;
679 }
680 }
681
682 return UINT32_MAX;
683 }
684
685 static void
686 zink_flush_frontbuffer(struct pipe_screen *pscreen,
687 struct pipe_resource *pres,
688 unsigned level, unsigned layer,
689 void *winsys_drawable_handle,
690 struct pipe_box *sub_box)
691 {
692 struct zink_screen *screen = zink_screen(pscreen);
693 struct sw_winsys *winsys = screen->winsys;
694 struct zink_resource *res = zink_resource(pres);
695
696 if (!winsys)
697 return;
698 void *map = winsys->displaytarget_map(winsys, res->dt, 0);
699
700 if (map) {
701 VkImageSubresource isr = {};
702 isr.aspectMask = res->aspect;
703 isr.mipLevel = level;
704 isr.arrayLayer = layer;
705 VkSubresourceLayout layout;
706 vkGetImageSubresourceLayout(screen->dev, res->image, &isr, &layout);
707
708 void *ptr;
709 VkResult result = vkMapMemory(screen->dev, res->mem, res->offset, res->size, 0, &ptr);
710 if (result != VK_SUCCESS) {
711 debug_printf("failed to map memory for display\n");
712 return;
713 }
714 for (int i = 0; i < pres->height0; ++i) {
715 uint8_t *src = (uint8_t *)ptr + i * layout.rowPitch;
716 uint8_t *dst = (uint8_t *)map + i * res->dt_stride;
717 memcpy(dst, src, res->dt_stride);
718 }
719 vkUnmapMemory(screen->dev, res->mem);
720 }
721
722 winsys->displaytarget_unmap(winsys, res->dt);
723
724 assert(res->dt);
725 if (res->dt)
726 winsys->displaytarget_display(winsys, res->dt, winsys_drawable_handle, sub_box);
727 }
728
729 static bool
730 load_device_extensions(struct zink_screen *screen)
731 {
732 #define GET_PROC_ADDR(x) do { \
733 screen->vk_##x = (PFN_vk##x)vkGetDeviceProcAddr(screen->dev, "vk"#x); \
734 if (!screen->vk_##x) \
735 return false; \
736 } while (0)
737 if (screen->have_EXT_transform_feedback) {
738 GET_PROC_ADDR(CmdBindTransformFeedbackBuffersEXT);
739 GET_PROC_ADDR(CmdBeginTransformFeedbackEXT);
740 GET_PROC_ADDR(CmdEndTransformFeedbackEXT);
741 GET_PROC_ADDR(CmdBeginQueryIndexedEXT);
742 GET_PROC_ADDR(CmdEndQueryIndexedEXT);
743 GET_PROC_ADDR(CmdDrawIndirectByteCountEXT);
744 }
745 if (screen->have_KHR_external_memory_fd)
746 GET_PROC_ADDR(GetMemoryFdKHR);
747
748 if (screen->have_EXT_conditional_rendering) {
749 GET_PROC_ADDR(CmdBeginConditionalRenderingEXT);
750 GET_PROC_ADDR(CmdEndConditionalRenderingEXT);
751 }
752
753 #undef GET_PROC_ADDR
754
755 return true;
756 }
757
758 static struct pipe_screen *
759 zink_internal_create_screen(struct sw_winsys *winsys, int fd)
760 {
761 struct zink_screen *screen = CALLOC_STRUCT(zink_screen);
762 bool have_tf_ext = false, have_cond_render_ext = false, have_EXT_index_type_uint8 = false,
763 have_EXT_robustness2_features = false, have_EXT_vertex_attribute_divisor = false;
764 if (!screen)
765 return NULL;
766
767 zink_debug = debug_get_option_zink_debug();
768
769 screen->instance = create_instance();
770 screen->pdev = choose_pdev(screen->instance);
771 screen->gfx_queue = find_gfx_queue(screen->pdev);
772
773 vkGetPhysicalDeviceMemoryProperties(screen->pdev, &screen->mem_props);
774
775 screen->have_X8_D24_UNORM_PACK32 = zink_is_depth_format_supported(screen,
776 VK_FORMAT_X8_D24_UNORM_PACK32);
777 screen->have_D24_UNORM_S8_UINT = zink_is_depth_format_supported(screen,
778 VK_FORMAT_D24_UNORM_S8_UINT);
779
780 uint32_t num_extensions = 0;
781 if (vkEnumerateDeviceExtensionProperties(screen->pdev, NULL,
782 &num_extensions, NULL) == VK_SUCCESS && num_extensions > 0) {
783 VkExtensionProperties *extensions = MALLOC(sizeof(VkExtensionProperties) *
784 num_extensions);
785 if (extensions) {
786 vkEnumerateDeviceExtensionProperties(screen->pdev, NULL,
787 &num_extensions, extensions);
788
789 for (uint32_t i = 0; i < num_extensions; ++i) {
790 if (!strcmp(extensions[i].extensionName,
791 VK_KHR_MAINTENANCE1_EXTENSION_NAME))
792 screen->have_KHR_maintenance1 = true;
793 if (!strcmp(extensions[i].extensionName,
794 VK_KHR_EXTERNAL_MEMORY_FD_EXTENSION_NAME))
795 screen->have_KHR_external_memory_fd = true;
796 if (!strcmp(extensions[i].extensionName,
797 VK_EXT_CONDITIONAL_RENDERING_EXTENSION_NAME))
798 have_cond_render_ext = true;
799 if (!strcmp(extensions[i].extensionName,
800 VK_EXT_TRANSFORM_FEEDBACK_EXTENSION_NAME))
801 have_tf_ext = true;
802 if (!strcmp(extensions[i].extensionName,
803 VK_EXT_INDEX_TYPE_UINT8_EXTENSION_NAME))
804 have_EXT_index_type_uint8 = true;
805 if (!strcmp(extensions[i].extensionName,
806 VK_EXT_ROBUSTNESS_2_EXTENSION_NAME))
807 have_EXT_robustness2_features = true;
808 if (!strcmp(extensions[i].extensionName,
809 VK_EXT_VERTEX_ATTRIBUTE_DIVISOR_EXTENSION_NAME))
810 have_EXT_vertex_attribute_divisor = true;
811
812 }
813 FREE(extensions);
814 }
815 }
816 VkPhysicalDeviceFeatures2 feats = {};
817 VkPhysicalDeviceTransformFeedbackFeaturesEXT tf_feats = {};
818 VkPhysicalDeviceConditionalRenderingFeaturesEXT cond_render_feats = {};
819 VkPhysicalDeviceIndexTypeUint8FeaturesEXT index_uint8_feats = {};
820
821 feats.sType = VK_STRUCTURE_TYPE_PHYSICAL_DEVICE_FEATURES_2;
822 if (have_tf_ext) {
823 tf_feats.sType = VK_STRUCTURE_TYPE_PHYSICAL_DEVICE_TRANSFORM_FEEDBACK_FEATURES_EXT;
824 tf_feats.pNext = feats.pNext;
825 feats.pNext = &tf_feats;
826 }
827 if (have_cond_render_ext) {
828 cond_render_feats.sType = VK_STRUCTURE_TYPE_PHYSICAL_DEVICE_CONDITIONAL_RENDERING_FEATURES_EXT;
829 cond_render_feats.pNext = feats.pNext;
830 feats.pNext = &cond_render_feats;
831 }
832 if (have_EXT_index_type_uint8) {
833 index_uint8_feats.sType = VK_STRUCTURE_TYPE_PHYSICAL_DEVICE_INDEX_TYPE_UINT8_FEATURES_EXT;
834 index_uint8_feats.pNext = feats.pNext;
835 feats.pNext = &index_uint8_feats;
836 }
837 if (have_EXT_robustness2_features) {
838 screen->rb2_feats.sType = VK_STRUCTURE_TYPE_PHYSICAL_DEVICE_ROBUSTNESS_2_FEATURES_EXT;
839 screen->rb2_feats.pNext = feats.pNext;
840 feats.pNext = &screen->rb2_feats;
841 }
842 if (have_EXT_vertex_attribute_divisor) {
843 screen->vdiv_feats.sType = VK_STRUCTURE_TYPE_PHYSICAL_DEVICE_VERTEX_ATTRIBUTE_DIVISOR_FEATURES_EXT;
844 screen->vdiv_feats.pNext = feats.pNext;
845 feats.pNext = &screen->vdiv_feats;
846 }
847 vkGetPhysicalDeviceFeatures2(screen->pdev, &feats);
848 memcpy(&screen->feats, &feats.features, sizeof(screen->feats));
849 if (have_tf_ext && tf_feats.transformFeedback)
850 screen->have_EXT_transform_feedback = true;
851 if (have_cond_render_ext && cond_render_feats.conditionalRendering)
852 screen->have_EXT_conditional_rendering = true;
853 if (have_EXT_index_type_uint8 && index_uint8_feats.indexTypeUint8)
854 screen->have_EXT_index_type_uint8 = true;
855 screen->have_EXT_robustness2_features = have_EXT_robustness2_features;
856 if (have_EXT_vertex_attribute_divisor && screen->vdiv_feats.vertexAttributeInstanceRateDivisor)
857 screen->have_EXT_vertex_attribute_divisor = true;
858
859 VkPhysicalDeviceProperties2 props = {};
860 VkPhysicalDeviceVertexAttributeDivisorPropertiesEXT vdiv_props = {};
861 props.sType = VK_STRUCTURE_TYPE_PHYSICAL_DEVICE_PROPERTIES_2;
862 if (screen->have_EXT_transform_feedback) {
863 screen->tf_props.sType = VK_STRUCTURE_TYPE_PHYSICAL_DEVICE_TRANSFORM_FEEDBACK_PROPERTIES_EXT;
864 screen->tf_props.pNext = props.pNext;
865 props.pNext = &screen->tf_props;
866 }
867 if (have_EXT_robustness2_features) {
868 screen->rb2_props.sType = VK_STRUCTURE_TYPE_PHYSICAL_DEVICE_ROBUSTNESS_2_PROPERTIES_EXT;
869 screen->rb2_props.pNext = props.pNext;
870 props.pNext = &screen->rb2_props;
871 }
872 if (have_EXT_vertex_attribute_divisor) {
873 vdiv_props.sType = VK_STRUCTURE_TYPE_PHYSICAL_DEVICE_VERTEX_ATTRIBUTE_DIVISOR_PROPERTIES_EXT;
874 vdiv_props.pNext = props.pNext;
875 props.pNext = &vdiv_props;
876 }
877 vkGetPhysicalDeviceProperties2(screen->pdev, &props);
878 memcpy(&screen->props, &props.properties, sizeof(screen->props));
879 screen->max_vertex_attrib_divisor = vdiv_props.maxVertexAttribDivisor;
880
881 if (!screen->have_KHR_maintenance1) {
882 debug_printf("ZINK: VK_KHR_maintenance1 required!\n");
883 goto fail;
884 }
885
886 VkDeviceQueueCreateInfo qci = {};
887 float dummy = 0.0f;
888 qci.sType = VK_STRUCTURE_TYPE_DEVICE_QUEUE_CREATE_INFO;
889 qci.queueFamilyIndex = screen->gfx_queue;
890 qci.queueCount = 1;
891 qci.pQueuePriorities = &dummy;
892
893 VkDeviceCreateInfo dci = {};
894 dci.sType = VK_STRUCTURE_TYPE_DEVICE_CREATE_INFO;
895 dci.queueCreateInfoCount = 1;
896 dci.pQueueCreateInfos = &qci;
897 /* extensions don't have bool members in pEnabledFeatures.
898 * this requires us to pass the whole VkPhysicalDeviceFeatures2 struct
899 */
900 dci.pNext = &feats;
901 const char *extensions[8] = {
902 VK_KHR_MAINTENANCE1_EXTENSION_NAME,
903 };
904 num_extensions = 1;
905
906 if (fd >= 0 && !screen->have_KHR_external_memory_fd) {
907 debug_printf("ZINK: KHR_external_memory_fd required!\n");
908 goto fail;
909 }
910
911 if (screen->have_KHR_external_memory_fd) {
912 extensions[num_extensions++] = VK_KHR_EXTERNAL_MEMORY_EXTENSION_NAME;
913 extensions[num_extensions++] = VK_KHR_EXTERNAL_MEMORY_FD_EXTENSION_NAME;
914 }
915
916 if (screen->have_EXT_conditional_rendering)
917 extensions[num_extensions++] = VK_EXT_CONDITIONAL_RENDERING_EXTENSION_NAME;
918
919 if (screen->have_EXT_index_type_uint8)
920 extensions[num_extensions++] = VK_EXT_INDEX_TYPE_UINT8_EXTENSION_NAME;
921
922 if (screen->have_EXT_transform_feedback)
923 extensions[num_extensions++] = VK_EXT_TRANSFORM_FEEDBACK_EXTENSION_NAME;
924 if (screen->have_EXT_robustness2_features)
925 extensions[num_extensions++] = VK_EXT_ROBUSTNESS_2_EXTENSION_NAME;
926 if (screen->have_EXT_vertex_attribute_divisor)
927 extensions[num_extensions++] = VK_EXT_VERTEX_ATTRIBUTE_DIVISOR_EXTENSION_NAME;
928 assert(num_extensions <= ARRAY_SIZE(extensions));
929
930 dci.ppEnabledExtensionNames = extensions;
931 dci.enabledExtensionCount = num_extensions;
932 if (vkCreateDevice(screen->pdev, &dci, NULL, &screen->dev) != VK_SUCCESS)
933 goto fail;
934
935 if (!load_device_extensions(screen))
936 goto fail;
937
938 screen->winsys = winsys;
939
940 screen->base.get_name = zink_get_name;
941 screen->base.get_vendor = zink_get_vendor;
942 screen->base.get_device_vendor = zink_get_device_vendor;
943 screen->base.get_param = zink_get_param;
944 screen->base.get_paramf = zink_get_paramf;
945 screen->base.get_shader_param = zink_get_shader_param;
946 screen->base.get_compiler_options = zink_get_compiler_options;
947 screen->base.is_format_supported = zink_is_format_supported;
948 screen->base.context_create = zink_context_create;
949 screen->base.flush_frontbuffer = zink_flush_frontbuffer;
950 screen->base.destroy = zink_destroy_screen;
951
952 zink_screen_resource_init(&screen->base);
953 zink_screen_fence_init(&screen->base);
954
955 slab_create_parent(&screen->transfer_pool, sizeof(struct zink_transfer), 16);
956
957 return &screen->base;
958
959 fail:
960 FREE(screen);
961 return NULL;
962 }
963
964 struct pipe_screen *
965 zink_create_screen(struct sw_winsys *winsys)
966 {
967 return zink_internal_create_screen(winsys, -1);
968 }
969
970 struct pipe_screen *
971 zink_drm_create_screen(int fd)
972 {
973 return zink_internal_create_screen(NULL, fd);
974 }