zink: store valid timestamp bits onto zink_screen
[mesa.git] / src / gallium / drivers / zink / zink_screen.c
1 /*
2 * Copyright 2018 Collabora Ltd.
3 *
4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * on the rights to use, copy, modify, merge, publish, distribute, sub
8 * license, and/or sell copies of the Software, and to permit persons to whom
9 * the Software is furnished to do so, subject to the following conditions:
10 *
11 * The above copyright notice and this permission notice (including the next
12 * paragraph) shall be included in all copies or substantial portions of the
13 * Software.
14 *
15 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17 * FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. IN NO EVENT SHALL
18 * THE AUTHOR(S) AND/OR THEIR SUPPLIERS BE LIABLE FOR ANY CLAIM,
19 * DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR
20 * OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE
21 * USE OR OTHER DEALINGS IN THE SOFTWARE.
22 */
23
24 #include "zink_screen.h"
25
26 #include "zink_compiler.h"
27 #include "zink_context.h"
28 #include "zink_fence.h"
29 #include "zink_public.h"
30 #include "zink_resource.h"
31
32 #include "os/os_process.h"
33 #include "util/u_debug.h"
34 #include "util/format/u_format.h"
35 #include "util/u_math.h"
36 #include "util/u_memory.h"
37 #include "util/u_screen.h"
38 #include "util/u_string.h"
39
40 #include "frontend/sw_winsys.h"
41
42 static const struct debug_named_value
43 debug_options[] = {
44 { "nir", ZINK_DEBUG_NIR, "Dump NIR during program compile" },
45 { "spirv", ZINK_DEBUG_SPIRV, "Dump SPIR-V during program compile" },
46 { "tgsi", ZINK_DEBUG_TGSI, "Dump TGSI during program compile" },
47 DEBUG_NAMED_VALUE_END
48 };
49
50 DEBUG_GET_ONCE_FLAGS_OPTION(zink_debug, "ZINK_DEBUG", debug_options, 0)
51
52 uint32_t
53 zink_debug;
54
55 static const char *
56 zink_get_vendor(struct pipe_screen *pscreen)
57 {
58 return "Collabora Ltd";
59 }
60
61 static const char *
62 zink_get_device_vendor(struct pipe_screen *pscreen)
63 {
64 struct zink_screen *screen = zink_screen(pscreen);
65 static char buf[1000];
66 snprintf(buf, sizeof(buf), "Unknown (vendor-id: 0x%04x)", screen->props.vendorID);
67 return buf;
68 }
69
70 static const char *
71 zink_get_name(struct pipe_screen *pscreen)
72 {
73 struct zink_screen *screen = zink_screen(pscreen);
74 static char buf[1000];
75 snprintf(buf, sizeof(buf), "zink (%s)", screen->props.deviceName);
76 return buf;
77 }
78
79 static int
80 get_video_mem(struct zink_screen *screen)
81 {
82 VkDeviceSize size = 0;
83 for (uint32_t i = 0; i < screen->mem_props.memoryHeapCount; ++i) {
84 if (screen->mem_props.memoryHeaps[i].flags &
85 VK_MEMORY_HEAP_DEVICE_LOCAL_BIT)
86 size += screen->mem_props.memoryHeaps[i].size;
87 }
88 return (int)(size >> 20);
89 }
90
91 static int
92 zink_get_param(struct pipe_screen *pscreen, enum pipe_cap param)
93 {
94 struct zink_screen *screen = zink_screen(pscreen);
95
96 switch (param) {
97 case PIPE_CAP_NPOT_TEXTURES:
98 case PIPE_CAP_TGSI_TEXCOORD:
99 return 1;
100
101 case PIPE_CAP_MAX_DUAL_SOURCE_RENDER_TARGETS:
102 if (!screen->feats.dualSrcBlend)
103 return 0;
104 return screen->props.limits.maxFragmentDualSrcAttachments;
105
106 case PIPE_CAP_POINT_SPRITE:
107 return 1;
108
109 case PIPE_CAP_MAX_RENDER_TARGETS:
110 return screen->props.limits.maxColorAttachments;
111
112 case PIPE_CAP_OCCLUSION_QUERY:
113 return 1;
114
115 #if 0 /* TODO: Enable me */
116 case PIPE_CAP_QUERY_TIME_ELAPSED:
117 return 1;
118 #endif
119
120 case PIPE_CAP_TEXTURE_MULTISAMPLE:
121 return 1;
122
123 case PIPE_CAP_TEXTURE_SWIZZLE:
124 return 1;
125
126 case PIPE_CAP_MAX_TEXTURE_2D_SIZE:
127 return screen->props.limits.maxImageDimension2D;
128 case PIPE_CAP_MAX_TEXTURE_3D_LEVELS:
129 return 1 + util_logbase2(screen->props.limits.maxImageDimension3D);
130 case PIPE_CAP_MAX_TEXTURE_CUBE_LEVELS:
131 return 1 + util_logbase2(screen->props.limits.maxImageDimensionCube);
132
133 case PIPE_CAP_BLEND_EQUATION_SEPARATE:
134 case PIPE_CAP_FRAGMENT_SHADER_TEXTURE_LOD:
135 case PIPE_CAP_FRAGMENT_SHADER_DERIVATIVES:
136 case PIPE_CAP_VERTEX_SHADER_SATURATE:
137 return 1;
138
139 case PIPE_CAP_INDEP_BLEND_ENABLE:
140 case PIPE_CAP_INDEP_BLEND_FUNC:
141 return 1;
142
143 case PIPE_CAP_MAX_STREAM_OUTPUT_BUFFERS:
144 return screen->have_EXT_transform_feedback ? screen->tf_props.maxTransformFeedbackBuffers : 0;
145 case PIPE_CAP_STREAM_OUTPUT_PAUSE_RESUME:
146 case PIPE_CAP_STREAM_OUTPUT_INTERLEAVE_BUFFERS:
147 return 1;
148
149 case PIPE_CAP_MAX_TEXTURE_ARRAY_LAYERS:
150 return screen->props.limits.maxImageArrayLayers;
151
152 case PIPE_CAP_DEPTH_CLIP_DISABLE:
153 return screen->feats.depthClamp;
154
155 case PIPE_CAP_TGSI_INSTANCEID:
156 case PIPE_CAP_MIXED_COLORBUFFER_FORMATS:
157 case PIPE_CAP_SEAMLESS_CUBE_MAP:
158 return 1;
159
160 case PIPE_CAP_MIN_TEXEL_OFFSET:
161 return screen->props.limits.minTexelOffset;
162 case PIPE_CAP_MAX_TEXEL_OFFSET:
163 return screen->props.limits.maxTexelOffset;
164
165 case PIPE_CAP_VERTEX_COLOR_UNCLAMPED:
166 return 1;
167
168 case PIPE_CAP_CONDITIONAL_RENDER:
169 return screen->have_EXT_conditional_rendering;
170
171 case PIPE_CAP_GLSL_FEATURE_LEVEL:
172 case PIPE_CAP_GLSL_FEATURE_LEVEL_COMPATIBILITY:
173 return 130;
174
175 #if 0 /* TODO: Enable me */
176 case PIPE_CAP_COMPUTE:
177 return 1;
178 #endif
179
180 case PIPE_CAP_CONSTANT_BUFFER_OFFSET_ALIGNMENT:
181 return screen->props.limits.minUniformBufferOffsetAlignment;
182
183 #if 0 /* TODO: Enable me */
184 case PIPE_CAP_QUERY_TIMESTAMP:
185 return 1;
186 #endif
187
188 case PIPE_CAP_MIN_MAP_BUFFER_ALIGNMENT:
189 return screen->props.limits.minMemoryMapAlignment;
190
191 case PIPE_CAP_CUBE_MAP_ARRAY:
192 return screen->feats.imageCubeArray;
193
194 case PIPE_CAP_TEXTURE_BUFFER_OBJECTS:
195 return 1;
196
197 case PIPE_CAP_TEXTURE_BUFFER_OFFSET_ALIGNMENT:
198 return screen->props.limits.minTexelBufferOffsetAlignment;
199
200 case PIPE_CAP_PREFER_BLIT_BASED_TEXTURE_TRANSFER:
201 return 0; /* unsure */
202
203 case PIPE_CAP_MAX_TEXTURE_BUFFER_SIZE:
204 return screen->props.limits.maxTexelBufferElements;
205
206 case PIPE_CAP_ENDIANNESS:
207 return PIPE_ENDIAN_NATIVE; /* unsure */
208
209 case PIPE_CAP_MAX_VIEWPORTS:
210 return 1; /* TODO: When GS is supported, use screen->props.limits.maxViewports */
211
212 case PIPE_CAP_MIXED_FRAMEBUFFER_SIZES:
213 return 1;
214
215 case PIPE_CAP_MAX_GEOMETRY_OUTPUT_VERTICES:
216 return screen->props.limits.maxGeometryOutputVertices;
217 case PIPE_CAP_MAX_GEOMETRY_TOTAL_OUTPUT_COMPONENTS:
218 return screen->props.limits.maxGeometryOutputComponents;
219
220 #if 0 /* TODO: Enable me. Enables ARB_texture_gather */
221 case PIPE_CAP_MAX_TEXTURE_GATHER_COMPONENTS:
222 return 4;
223 #endif
224
225 case PIPE_CAP_MIN_TEXTURE_GATHER_OFFSET:
226 return screen->props.limits.minTexelGatherOffset;
227 case PIPE_CAP_MAX_TEXTURE_GATHER_OFFSET:
228 return screen->props.limits.maxTexelGatherOffset;
229
230 case PIPE_CAP_TGSI_FS_FINE_DERIVATIVE:
231 return 1;
232
233 case PIPE_CAP_VENDOR_ID:
234 return screen->props.vendorID;
235 case PIPE_CAP_DEVICE_ID:
236 return screen->props.deviceID;
237
238 case PIPE_CAP_ACCELERATED:
239 return 1;
240 case PIPE_CAP_VIDEO_MEMORY:
241 return get_video_mem(screen);
242 case PIPE_CAP_UMA:
243 return screen->props.deviceType == VK_PHYSICAL_DEVICE_TYPE_INTEGRATED_GPU;
244
245 case PIPE_CAP_MAX_VERTEX_ATTRIB_STRIDE:
246 return screen->props.limits.maxVertexInputBindingStride;
247
248 #if 0 /* TODO: Enable me */
249 case PIPE_CAP_SAMPLER_VIEW_TARGET:
250 return 1;
251 #endif
252
253 #if 0 /* TODO: Enable me */
254 case PIPE_CAP_CLIP_HALFZ:
255 return 1;
256 #endif
257
258 #if 0 /* TODO: Enable me */
259 case PIPE_CAP_TEXTURE_FLOAT_LINEAR:
260 case PIPE_CAP_TEXTURE_HALF_FLOAT_LINEAR:
261 return 1;
262 #endif
263
264 case PIPE_CAP_SHAREABLE_SHADERS:
265 return 1;
266
267 #if 0 /* TODO: Enable me. Enables GL_ARB_shader_storage_buffer_object */
268 case PIPE_CAP_SHADER_BUFFER_OFFSET_ALIGNMENT:
269 return screen->props.limits.minStorageBufferOffsetAlignment;
270 #endif
271
272 case PIPE_CAP_PCI_GROUP:
273 case PIPE_CAP_PCI_BUS:
274 case PIPE_CAP_PCI_DEVICE:
275 case PIPE_CAP_PCI_FUNCTION:
276 return 0; /* TODO: figure these out */
277
278 case PIPE_CAP_CULL_DISTANCE:
279 return screen->feats.shaderCullDistance;
280
281 case PIPE_CAP_VIEWPORT_SUBPIXEL_BITS:
282 return screen->props.limits.viewportSubPixelBits;
283
284 case PIPE_CAP_GLSL_OPTIMIZE_CONSERVATIVELY:
285 return 0; /* not sure */
286
287 case PIPE_CAP_MAX_GS_INVOCATIONS:
288 return 0; /* not implemented */
289
290 case PIPE_CAP_MAX_COMBINED_SHADER_BUFFERS:
291 return screen->props.limits.maxDescriptorSetStorageBuffers;
292
293 case PIPE_CAP_MAX_SHADER_BUFFER_SIZE:
294 return screen->props.limits.maxStorageBufferRange; /* unsure */
295
296 case PIPE_CAP_TGSI_FS_COORD_ORIGIN_UPPER_LEFT:
297 case PIPE_CAP_TGSI_FS_COORD_PIXEL_CENTER_HALF_INTEGER:
298 return 1;
299
300 case PIPE_CAP_TGSI_FS_COORD_ORIGIN_LOWER_LEFT:
301 case PIPE_CAP_TGSI_FS_COORD_PIXEL_CENTER_INTEGER:
302 return 0;
303
304 case PIPE_CAP_BUFFER_MAP_PERSISTENT_COHERENT:
305 return 0;
306
307 case PIPE_CAP_NIR_COMPACT_ARRAYS:
308 return 1;
309
310 case PIPE_CAP_TGSI_FS_FACE_IS_INTEGER_SYSVAL:
311 return 1;
312
313 case PIPE_CAP_VIEWPORT_TRANSFORM_LOWERED:
314 return 1;
315
316 case PIPE_CAP_FLATSHADE:
317 case PIPE_CAP_ALPHA_TEST:
318 case PIPE_CAP_CLIP_PLANES:
319 case PIPE_CAP_POINT_SIZE_FIXED:
320 case PIPE_CAP_TWO_SIDED_COLOR:
321 return 0;
322
323 case PIPE_CAP_DMABUF:
324 return screen->have_KHR_external_memory_fd;
325
326 default:
327 return u_pipe_screen_get_param_defaults(pscreen, param);
328 }
329 }
330
331 static float
332 zink_get_paramf(struct pipe_screen *pscreen, enum pipe_capf param)
333 {
334 struct zink_screen *screen = zink_screen(pscreen);
335
336 switch (param) {
337 case PIPE_CAPF_MAX_LINE_WIDTH:
338 case PIPE_CAPF_MAX_LINE_WIDTH_AA:
339 return screen->props.limits.lineWidthRange[1];
340
341 case PIPE_CAPF_MAX_POINT_WIDTH:
342 case PIPE_CAPF_MAX_POINT_WIDTH_AA:
343 return screen->props.limits.pointSizeRange[1];
344
345 case PIPE_CAPF_MAX_TEXTURE_ANISOTROPY:
346 return screen->props.limits.maxSamplerAnisotropy;
347
348 case PIPE_CAPF_MAX_TEXTURE_LOD_BIAS:
349 return screen->props.limits.maxSamplerLodBias;
350
351 case PIPE_CAPF_MIN_CONSERVATIVE_RASTER_DILATE:
352 case PIPE_CAPF_MAX_CONSERVATIVE_RASTER_DILATE:
353 case PIPE_CAPF_CONSERVATIVE_RASTER_DILATE_GRANULARITY:
354 return 0.0f; /* not implemented */
355 }
356
357 /* should only get here on unhandled cases */
358 return 0.0;
359 }
360
361 static int
362 zink_get_shader_param(struct pipe_screen *pscreen,
363 enum pipe_shader_type shader,
364 enum pipe_shader_cap param)
365 {
366 struct zink_screen *screen = zink_screen(pscreen);
367
368 switch (param) {
369 case PIPE_SHADER_CAP_MAX_INSTRUCTIONS:
370 case PIPE_SHADER_CAP_MAX_ALU_INSTRUCTIONS:
371 case PIPE_SHADER_CAP_MAX_TEX_INSTRUCTIONS:
372 case PIPE_SHADER_CAP_MAX_TEX_INDIRECTIONS:
373 case PIPE_SHADER_CAP_MAX_CONTROL_FLOW_DEPTH:
374 if (shader == PIPE_SHADER_VERTEX ||
375 shader == PIPE_SHADER_FRAGMENT)
376 return INT_MAX;
377 return 0;
378
379 case PIPE_SHADER_CAP_MAX_INPUTS:
380 switch (shader) {
381 case PIPE_SHADER_VERTEX:
382 return MIN2(screen->props.limits.maxVertexInputAttributes,
383 PIPE_MAX_SHADER_INPUTS);
384 case PIPE_SHADER_FRAGMENT:
385 return MIN2(screen->props.limits.maxFragmentInputComponents / 4,
386 PIPE_MAX_SHADER_INPUTS);
387 default:
388 return 0; /* unsupported stage */
389 }
390
391 case PIPE_SHADER_CAP_MAX_OUTPUTS:
392 switch (shader) {
393 case PIPE_SHADER_VERTEX:
394 return MIN2(screen->props.limits.maxVertexOutputComponents / 4,
395 PIPE_MAX_SHADER_OUTPUTS);
396 case PIPE_SHADER_FRAGMENT:
397 return MIN2(screen->props.limits.maxColorAttachments,
398 PIPE_MAX_SHADER_OUTPUTS);
399 default:
400 return 0; /* unsupported stage */
401 }
402
403 case PIPE_SHADER_CAP_MAX_TEXTURE_SAMPLERS:
404 switch (shader) {
405 case PIPE_SHADER_VERTEX:
406 case PIPE_SHADER_FRAGMENT:
407 /* this might be a bit simplistic... */
408 return MIN2(screen->props.limits.maxPerStageDescriptorSamplers,
409 PIPE_MAX_SAMPLERS);
410 default:
411 return 0; /* unsupported stage */
412 }
413
414 case PIPE_SHADER_CAP_MAX_CONST_BUFFER_SIZE:
415 return MIN2(screen->props.limits.maxUniformBufferRange, INT_MAX);
416
417 case PIPE_SHADER_CAP_MAX_CONST_BUFFERS:
418 return screen->props.limits.maxPerStageDescriptorUniformBuffers;
419
420 case PIPE_SHADER_CAP_MAX_TEMPS:
421 return INT_MAX;
422
423 case PIPE_SHADER_CAP_INTEGERS:
424 return 1;
425
426 case PIPE_SHADER_CAP_INDIRECT_INPUT_ADDR:
427 case PIPE_SHADER_CAP_INDIRECT_OUTPUT_ADDR:
428 case PIPE_SHADER_CAP_INDIRECT_TEMP_ADDR:
429 case PIPE_SHADER_CAP_INDIRECT_CONST_ADDR:
430 case PIPE_SHADER_CAP_SUBROUTINES:
431 case PIPE_SHADER_CAP_INT64_ATOMICS:
432 case PIPE_SHADER_CAP_FP16:
433 case PIPE_SHADER_CAP_FP16_DERIVATIVES:
434 case PIPE_SHADER_CAP_INT16:
435 case PIPE_SHADER_CAP_GLSL_16BIT_TEMPS:
436 return 0; /* not implemented */
437
438 case PIPE_SHADER_CAP_PREFERRED_IR:
439 return PIPE_SHADER_IR_NIR;
440
441 case PIPE_SHADER_CAP_TGSI_SQRT_SUPPORTED:
442 return 0; /* not implemented */
443
444 case PIPE_SHADER_CAP_MAX_SAMPLER_VIEWS:
445 return MIN2(screen->props.limits.maxPerStageDescriptorSampledImages,
446 PIPE_MAX_SHADER_SAMPLER_VIEWS);
447
448 case PIPE_SHADER_CAP_TGSI_DROUND_SUPPORTED:
449 case PIPE_SHADER_CAP_TGSI_DFRACEXP_DLDEXP_SUPPORTED:
450 case PIPE_SHADER_CAP_TGSI_FMA_SUPPORTED:
451 return 0; /* not implemented */
452
453 case PIPE_SHADER_CAP_TGSI_ANY_INOUT_DECL_RANGE:
454 return 0; /* no idea */
455
456 case PIPE_SHADER_CAP_MAX_UNROLL_ITERATIONS_HINT:
457 return 32; /* arbitrary */
458
459 case PIPE_SHADER_CAP_MAX_SHADER_BUFFERS:
460 /* TODO: this limitation is dumb, and will need some fixes in mesa */
461 return MIN2(screen->props.limits.maxPerStageDescriptorStorageBuffers, PIPE_MAX_SHADER_BUFFERS);
462
463 case PIPE_SHADER_CAP_SUPPORTED_IRS:
464 return (1 << PIPE_SHADER_IR_NIR) | (1 << PIPE_SHADER_IR_TGSI);
465
466 case PIPE_SHADER_CAP_MAX_SHADER_IMAGES:
467 #if 0 /* TODO: needs compiler support */
468 return MIN2(screen->props.limits.maxPerStageDescriptorStorageImages,
469 PIPE_MAX_SHADER_IMAGES);
470 #else
471 return 0;
472 #endif
473
474 case PIPE_SHADER_CAP_LOWER_IF_THRESHOLD:
475 case PIPE_SHADER_CAP_TGSI_SKIP_MERGE_REGISTERS:
476 return 0; /* unsure */
477
478 case PIPE_SHADER_CAP_TGSI_LDEXP_SUPPORTED:
479 case PIPE_SHADER_CAP_MAX_HW_ATOMIC_COUNTERS:
480 case PIPE_SHADER_CAP_MAX_HW_ATOMIC_COUNTER_BUFFERS:
481 case PIPE_SHADER_CAP_TGSI_CONT_SUPPORTED:
482 return 0; /* not implemented */
483 }
484
485 /* should only get here on unhandled cases */
486 return 0;
487 }
488
489 static VkSampleCountFlagBits
490 vk_sample_count_flags(uint32_t sample_count)
491 {
492 switch (sample_count) {
493 case 1: return VK_SAMPLE_COUNT_1_BIT;
494 case 2: return VK_SAMPLE_COUNT_2_BIT;
495 case 4: return VK_SAMPLE_COUNT_4_BIT;
496 case 8: return VK_SAMPLE_COUNT_8_BIT;
497 case 16: return VK_SAMPLE_COUNT_16_BIT;
498 case 32: return VK_SAMPLE_COUNT_32_BIT;
499 case 64: return VK_SAMPLE_COUNT_64_BIT;
500 default:
501 return 0;
502 }
503 }
504
505 static bool
506 zink_is_format_supported(struct pipe_screen *pscreen,
507 enum pipe_format format,
508 enum pipe_texture_target target,
509 unsigned sample_count,
510 unsigned storage_sample_count,
511 unsigned bind)
512 {
513 struct zink_screen *screen = zink_screen(pscreen);
514
515 if (format == PIPE_FORMAT_NONE)
516 return screen->props.limits.framebufferNoAttachmentsSampleCounts &
517 vk_sample_count_flags(sample_count);
518
519 VkFormat vkformat = zink_get_format(screen, format);
520 if (vkformat == VK_FORMAT_UNDEFINED)
521 return false;
522
523 if (sample_count >= 1) {
524 VkSampleCountFlagBits sample_mask = vk_sample_count_flags(sample_count);
525 if (!sample_mask)
526 return false;
527 const struct util_format_description *desc = util_format_description(format);
528 if (util_format_is_depth_or_stencil(format)) {
529 if (util_format_has_depth(desc)) {
530 if (bind & PIPE_BIND_DEPTH_STENCIL &&
531 (screen->props.limits.framebufferDepthSampleCounts & sample_mask) != sample_mask)
532 return false;
533 if (bind & PIPE_BIND_SAMPLER_VIEW &&
534 (screen->props.limits.sampledImageDepthSampleCounts & sample_mask) != sample_mask)
535 return false;
536 }
537 if (util_format_has_stencil(desc)) {
538 if (bind & PIPE_BIND_DEPTH_STENCIL &&
539 (screen->props.limits.framebufferStencilSampleCounts & sample_mask) != sample_mask)
540 return false;
541 if (bind & PIPE_BIND_SAMPLER_VIEW &&
542 (screen->props.limits.sampledImageStencilSampleCounts & sample_mask) != sample_mask)
543 return false;
544 }
545 } else if (util_format_is_pure_integer(format)) {
546 if (bind & PIPE_BIND_RENDER_TARGET &&
547 !(screen->props.limits.framebufferColorSampleCounts & sample_mask))
548 return false;
549 if (bind & PIPE_BIND_SAMPLER_VIEW &&
550 !(screen->props.limits.sampledImageIntegerSampleCounts & sample_mask))
551 return false;
552 } else {
553 if (bind & PIPE_BIND_RENDER_TARGET &&
554 !(screen->props.limits.framebufferColorSampleCounts & sample_mask))
555 return false;
556 if (bind & PIPE_BIND_SAMPLER_VIEW &&
557 !(screen->props.limits.sampledImageColorSampleCounts & sample_mask))
558 return false;
559 }
560 }
561
562 VkFormatProperties props;
563 vkGetPhysicalDeviceFormatProperties(screen->pdev, vkformat, &props);
564
565 if (target == PIPE_BUFFER) {
566 if (bind & PIPE_BIND_VERTEX_BUFFER &&
567 !(props.bufferFeatures & VK_FORMAT_FEATURE_VERTEX_BUFFER_BIT))
568 return false;
569 } else {
570 /* all other targets are texture-targets */
571 if (bind & PIPE_BIND_RENDER_TARGET &&
572 !(props.optimalTilingFeatures & VK_FORMAT_FEATURE_COLOR_ATTACHMENT_BIT))
573 return false;
574
575 if (bind & PIPE_BIND_BLENDABLE &&
576 !(props.optimalTilingFeatures & VK_FORMAT_FEATURE_COLOR_ATTACHMENT_BLEND_BIT))
577 return false;
578
579 if (bind & PIPE_BIND_SAMPLER_VIEW &&
580 !(props.optimalTilingFeatures & VK_FORMAT_FEATURE_SAMPLED_IMAGE_BIT))
581 return false;
582
583 if (bind & PIPE_BIND_DEPTH_STENCIL &&
584 !(props.optimalTilingFeatures & VK_FORMAT_FEATURE_DEPTH_STENCIL_ATTACHMENT_BIT))
585 return false;
586 }
587
588 if (util_format_is_compressed(format)) {
589 const struct util_format_description *desc = util_format_description(format);
590 if (desc->layout == UTIL_FORMAT_LAYOUT_BPTC &&
591 !screen->feats.textureCompressionBC)
592 return false;
593 }
594
595 return true;
596 }
597
598 static void
599 zink_destroy_screen(struct pipe_screen *pscreen)
600 {
601 struct zink_screen *screen = zink_screen(pscreen);
602 slab_destroy_parent(&screen->transfer_pool);
603 FREE(screen);
604 }
605
606 static VkInstance
607 create_instance()
608 {
609 VkApplicationInfo ai = {};
610 ai.sType = VK_STRUCTURE_TYPE_APPLICATION_INFO;
611
612 char proc_name[128];
613 if (os_get_process_name(proc_name, ARRAY_SIZE(proc_name)))
614 ai.pApplicationName = proc_name;
615 else
616 ai.pApplicationName = "unknown";
617
618 ai.pEngineName = "mesa zink";
619 ai.apiVersion = VK_API_VERSION_1_0;
620
621 const char *extensions[] = {
622 VK_KHR_GET_PHYSICAL_DEVICE_PROPERTIES_2_EXTENSION_NAME,
623 VK_KHR_EXTERNAL_MEMORY_CAPABILITIES_EXTENSION_NAME,
624 };
625
626 VkInstanceCreateInfo ici = {};
627 ici.sType = VK_STRUCTURE_TYPE_INSTANCE_CREATE_INFO;
628 ici.pApplicationInfo = &ai;
629 ici.ppEnabledExtensionNames = extensions;
630 ici.enabledExtensionCount = ARRAY_SIZE(extensions);
631
632 VkInstance instance = VK_NULL_HANDLE;
633 VkResult err = vkCreateInstance(&ici, NULL, &instance);
634 if (err != VK_SUCCESS)
635 return VK_NULL_HANDLE;
636
637 return instance;
638 }
639
640 static VkPhysicalDevice
641 choose_pdev(const VkInstance instance)
642 {
643 uint32_t i, pdev_count;
644 VkPhysicalDevice *pdevs, pdev;
645 vkEnumeratePhysicalDevices(instance, &pdev_count, NULL);
646 assert(pdev_count > 0);
647
648 pdevs = malloc(sizeof(*pdevs) * pdev_count);
649 vkEnumeratePhysicalDevices(instance, &pdev_count, pdevs);
650 assert(pdev_count > 0);
651
652 pdev = pdevs[0];
653 for (i = 0; i < pdev_count; ++i) {
654 VkPhysicalDeviceProperties props;
655 vkGetPhysicalDeviceProperties(pdevs[i], &props);
656 if (props.deviceType == VK_PHYSICAL_DEVICE_TYPE_DISCRETE_GPU) {
657 pdev = pdevs[i];
658 break;
659 }
660 }
661 free(pdevs);
662 return pdev;
663 }
664
665 static void
666 update_queue_props(struct zink_screen *screen)
667 {
668 uint32_t num_queues;
669 vkGetPhysicalDeviceQueueFamilyProperties(screen->pdev, &num_queues, NULL);
670 assert(num_queues > 0);
671
672 VkQueueFamilyProperties *props = malloc(sizeof(*props) * num_queues);
673 vkGetPhysicalDeviceQueueFamilyProperties(screen->pdev, &num_queues, props);
674
675 for (uint32_t i = 0; i < num_queues; i++) {
676 if (props[i].queueFlags & VK_QUEUE_GRAPHICS_BIT) {
677 screen->gfx_queue = i;
678 screen->timestamp_valid_bits = props[i].timestampValidBits;
679 assert(screen->timestamp_valid_bits);
680 break;
681 }
682 }
683 free(props);
684 }
685
686 static void
687 zink_flush_frontbuffer(struct pipe_screen *pscreen,
688 struct pipe_resource *pres,
689 unsigned level, unsigned layer,
690 void *winsys_drawable_handle,
691 struct pipe_box *sub_box)
692 {
693 struct zink_screen *screen = zink_screen(pscreen);
694 struct sw_winsys *winsys = screen->winsys;
695 struct zink_resource *res = zink_resource(pres);
696
697 if (!winsys)
698 return;
699 void *map = winsys->displaytarget_map(winsys, res->dt, 0);
700
701 if (map) {
702 VkImageSubresource isr = {};
703 isr.aspectMask = res->aspect;
704 isr.mipLevel = level;
705 isr.arrayLayer = layer;
706 VkSubresourceLayout layout;
707 vkGetImageSubresourceLayout(screen->dev, res->image, &isr, &layout);
708
709 void *ptr;
710 VkResult result = vkMapMemory(screen->dev, res->mem, res->offset, res->size, 0, &ptr);
711 if (result != VK_SUCCESS) {
712 debug_printf("failed to map memory for display\n");
713 return;
714 }
715 for (int i = 0; i < pres->height0; ++i) {
716 uint8_t *src = (uint8_t *)ptr + i * layout.rowPitch;
717 uint8_t *dst = (uint8_t *)map + i * res->dt_stride;
718 memcpy(dst, src, res->dt_stride);
719 }
720 vkUnmapMemory(screen->dev, res->mem);
721 }
722
723 winsys->displaytarget_unmap(winsys, res->dt);
724
725 assert(res->dt);
726 if (res->dt)
727 winsys->displaytarget_display(winsys, res->dt, winsys_drawable_handle, sub_box);
728 }
729
730 static bool
731 load_device_extensions(struct zink_screen *screen)
732 {
733 #define GET_PROC_ADDR(x) do { \
734 screen->vk_##x = (PFN_vk##x)vkGetDeviceProcAddr(screen->dev, "vk"#x); \
735 if (!screen->vk_##x) \
736 return false; \
737 } while (0)
738 if (screen->have_EXT_transform_feedback) {
739 GET_PROC_ADDR(CmdBindTransformFeedbackBuffersEXT);
740 GET_PROC_ADDR(CmdBeginTransformFeedbackEXT);
741 GET_PROC_ADDR(CmdEndTransformFeedbackEXT);
742 GET_PROC_ADDR(CmdBeginQueryIndexedEXT);
743 GET_PROC_ADDR(CmdEndQueryIndexedEXT);
744 GET_PROC_ADDR(CmdDrawIndirectByteCountEXT);
745 }
746 if (screen->have_KHR_external_memory_fd)
747 GET_PROC_ADDR(GetMemoryFdKHR);
748
749 if (screen->have_EXT_conditional_rendering) {
750 GET_PROC_ADDR(CmdBeginConditionalRenderingEXT);
751 GET_PROC_ADDR(CmdEndConditionalRenderingEXT);
752 }
753
754 #undef GET_PROC_ADDR
755
756 return true;
757 }
758
759 static struct pipe_screen *
760 zink_internal_create_screen(struct sw_winsys *winsys, int fd)
761 {
762 struct zink_screen *screen = CALLOC_STRUCT(zink_screen);
763 bool have_tf_ext = false, have_cond_render_ext = false, have_EXT_index_type_uint8 = false,
764 have_EXT_robustness2_features = false, have_EXT_vertex_attribute_divisor = false;
765 if (!screen)
766 return NULL;
767
768 zink_debug = debug_get_option_zink_debug();
769
770 screen->instance = create_instance();
771 screen->pdev = choose_pdev(screen->instance);
772 update_queue_props(screen);
773
774 vkGetPhysicalDeviceMemoryProperties(screen->pdev, &screen->mem_props);
775
776 screen->have_X8_D24_UNORM_PACK32 = zink_is_depth_format_supported(screen,
777 VK_FORMAT_X8_D24_UNORM_PACK32);
778 screen->have_D24_UNORM_S8_UINT = zink_is_depth_format_supported(screen,
779 VK_FORMAT_D24_UNORM_S8_UINT);
780
781 uint32_t num_extensions = 0;
782 if (vkEnumerateDeviceExtensionProperties(screen->pdev, NULL,
783 &num_extensions, NULL) == VK_SUCCESS && num_extensions > 0) {
784 VkExtensionProperties *extensions = MALLOC(sizeof(VkExtensionProperties) *
785 num_extensions);
786 if (extensions) {
787 vkEnumerateDeviceExtensionProperties(screen->pdev, NULL,
788 &num_extensions, extensions);
789
790 for (uint32_t i = 0; i < num_extensions; ++i) {
791 if (!strcmp(extensions[i].extensionName,
792 VK_KHR_MAINTENANCE1_EXTENSION_NAME))
793 screen->have_KHR_maintenance1 = true;
794 if (!strcmp(extensions[i].extensionName,
795 VK_KHR_EXTERNAL_MEMORY_FD_EXTENSION_NAME))
796 screen->have_KHR_external_memory_fd = true;
797 if (!strcmp(extensions[i].extensionName,
798 VK_EXT_CONDITIONAL_RENDERING_EXTENSION_NAME))
799 have_cond_render_ext = true;
800 if (!strcmp(extensions[i].extensionName,
801 VK_EXT_TRANSFORM_FEEDBACK_EXTENSION_NAME))
802 have_tf_ext = true;
803 if (!strcmp(extensions[i].extensionName,
804 VK_EXT_INDEX_TYPE_UINT8_EXTENSION_NAME))
805 have_EXT_index_type_uint8 = true;
806 if (!strcmp(extensions[i].extensionName,
807 VK_EXT_ROBUSTNESS_2_EXTENSION_NAME))
808 have_EXT_robustness2_features = true;
809 if (!strcmp(extensions[i].extensionName,
810 VK_EXT_VERTEX_ATTRIBUTE_DIVISOR_EXTENSION_NAME))
811 have_EXT_vertex_attribute_divisor = true;
812
813 }
814 FREE(extensions);
815 }
816 }
817 VkPhysicalDeviceFeatures2 feats = {};
818 VkPhysicalDeviceTransformFeedbackFeaturesEXT tf_feats = {};
819 VkPhysicalDeviceConditionalRenderingFeaturesEXT cond_render_feats = {};
820 VkPhysicalDeviceIndexTypeUint8FeaturesEXT index_uint8_feats = {};
821
822 feats.sType = VK_STRUCTURE_TYPE_PHYSICAL_DEVICE_FEATURES_2;
823 if (have_tf_ext) {
824 tf_feats.sType = VK_STRUCTURE_TYPE_PHYSICAL_DEVICE_TRANSFORM_FEEDBACK_FEATURES_EXT;
825 tf_feats.pNext = feats.pNext;
826 feats.pNext = &tf_feats;
827 }
828 if (have_cond_render_ext) {
829 cond_render_feats.sType = VK_STRUCTURE_TYPE_PHYSICAL_DEVICE_CONDITIONAL_RENDERING_FEATURES_EXT;
830 cond_render_feats.pNext = feats.pNext;
831 feats.pNext = &cond_render_feats;
832 }
833 if (have_EXT_index_type_uint8) {
834 index_uint8_feats.sType = VK_STRUCTURE_TYPE_PHYSICAL_DEVICE_INDEX_TYPE_UINT8_FEATURES_EXT;
835 index_uint8_feats.pNext = feats.pNext;
836 feats.pNext = &index_uint8_feats;
837 }
838 if (have_EXT_robustness2_features) {
839 screen->rb2_feats.sType = VK_STRUCTURE_TYPE_PHYSICAL_DEVICE_ROBUSTNESS_2_FEATURES_EXT;
840 screen->rb2_feats.pNext = feats.pNext;
841 feats.pNext = &screen->rb2_feats;
842 }
843 if (have_EXT_vertex_attribute_divisor) {
844 screen->vdiv_feats.sType = VK_STRUCTURE_TYPE_PHYSICAL_DEVICE_VERTEX_ATTRIBUTE_DIVISOR_FEATURES_EXT;
845 screen->vdiv_feats.pNext = feats.pNext;
846 feats.pNext = &screen->vdiv_feats;
847 }
848 vkGetPhysicalDeviceFeatures2(screen->pdev, &feats);
849 memcpy(&screen->feats, &feats.features, sizeof(screen->feats));
850 if (have_tf_ext && tf_feats.transformFeedback)
851 screen->have_EXT_transform_feedback = true;
852 if (have_cond_render_ext && cond_render_feats.conditionalRendering)
853 screen->have_EXT_conditional_rendering = true;
854 if (have_EXT_index_type_uint8 && index_uint8_feats.indexTypeUint8)
855 screen->have_EXT_index_type_uint8 = true;
856 screen->have_EXT_robustness2_features = have_EXT_robustness2_features;
857 if (have_EXT_vertex_attribute_divisor && screen->vdiv_feats.vertexAttributeInstanceRateDivisor)
858 screen->have_EXT_vertex_attribute_divisor = true;
859
860 VkPhysicalDeviceProperties2 props = {};
861 VkPhysicalDeviceVertexAttributeDivisorPropertiesEXT vdiv_props = {};
862 props.sType = VK_STRUCTURE_TYPE_PHYSICAL_DEVICE_PROPERTIES_2;
863 if (screen->have_EXT_transform_feedback) {
864 screen->tf_props.sType = VK_STRUCTURE_TYPE_PHYSICAL_DEVICE_TRANSFORM_FEEDBACK_PROPERTIES_EXT;
865 screen->tf_props.pNext = props.pNext;
866 props.pNext = &screen->tf_props;
867 }
868 if (have_EXT_robustness2_features) {
869 screen->rb2_props.sType = VK_STRUCTURE_TYPE_PHYSICAL_DEVICE_ROBUSTNESS_2_PROPERTIES_EXT;
870 screen->rb2_props.pNext = props.pNext;
871 props.pNext = &screen->rb2_props;
872 }
873 if (have_EXT_vertex_attribute_divisor) {
874 vdiv_props.sType = VK_STRUCTURE_TYPE_PHYSICAL_DEVICE_VERTEX_ATTRIBUTE_DIVISOR_PROPERTIES_EXT;
875 vdiv_props.pNext = props.pNext;
876 props.pNext = &vdiv_props;
877 }
878 vkGetPhysicalDeviceProperties2(screen->pdev, &props);
879 memcpy(&screen->props, &props.properties, sizeof(screen->props));
880 screen->max_vertex_attrib_divisor = vdiv_props.maxVertexAttribDivisor;
881
882 if (!screen->have_KHR_maintenance1) {
883 debug_printf("ZINK: VK_KHR_maintenance1 required!\n");
884 goto fail;
885 }
886
887 VkDeviceQueueCreateInfo qci = {};
888 float dummy = 0.0f;
889 qci.sType = VK_STRUCTURE_TYPE_DEVICE_QUEUE_CREATE_INFO;
890 qci.queueFamilyIndex = screen->gfx_queue;
891 qci.queueCount = 1;
892 qci.pQueuePriorities = &dummy;
893
894 VkDeviceCreateInfo dci = {};
895 dci.sType = VK_STRUCTURE_TYPE_DEVICE_CREATE_INFO;
896 dci.queueCreateInfoCount = 1;
897 dci.pQueueCreateInfos = &qci;
898 /* extensions don't have bool members in pEnabledFeatures.
899 * this requires us to pass the whole VkPhysicalDeviceFeatures2 struct
900 */
901 dci.pNext = &feats;
902 const char *extensions[8] = {
903 VK_KHR_MAINTENANCE1_EXTENSION_NAME,
904 };
905 num_extensions = 1;
906
907 if (fd >= 0 && !screen->have_KHR_external_memory_fd) {
908 debug_printf("ZINK: KHR_external_memory_fd required!\n");
909 goto fail;
910 }
911
912 if (screen->have_KHR_external_memory_fd) {
913 extensions[num_extensions++] = VK_KHR_EXTERNAL_MEMORY_EXTENSION_NAME;
914 extensions[num_extensions++] = VK_KHR_EXTERNAL_MEMORY_FD_EXTENSION_NAME;
915 }
916
917 if (screen->have_EXT_conditional_rendering)
918 extensions[num_extensions++] = VK_EXT_CONDITIONAL_RENDERING_EXTENSION_NAME;
919
920 if (screen->have_EXT_index_type_uint8)
921 extensions[num_extensions++] = VK_EXT_INDEX_TYPE_UINT8_EXTENSION_NAME;
922
923 if (screen->have_EXT_transform_feedback)
924 extensions[num_extensions++] = VK_EXT_TRANSFORM_FEEDBACK_EXTENSION_NAME;
925 if (screen->have_EXT_robustness2_features)
926 extensions[num_extensions++] = VK_EXT_ROBUSTNESS_2_EXTENSION_NAME;
927 if (screen->have_EXT_vertex_attribute_divisor)
928 extensions[num_extensions++] = VK_EXT_VERTEX_ATTRIBUTE_DIVISOR_EXTENSION_NAME;
929 assert(num_extensions <= ARRAY_SIZE(extensions));
930
931 dci.ppEnabledExtensionNames = extensions;
932 dci.enabledExtensionCount = num_extensions;
933 if (vkCreateDevice(screen->pdev, &dci, NULL, &screen->dev) != VK_SUCCESS)
934 goto fail;
935
936 if (!load_device_extensions(screen))
937 goto fail;
938
939 screen->winsys = winsys;
940
941 screen->base.get_name = zink_get_name;
942 screen->base.get_vendor = zink_get_vendor;
943 screen->base.get_device_vendor = zink_get_device_vendor;
944 screen->base.get_param = zink_get_param;
945 screen->base.get_paramf = zink_get_paramf;
946 screen->base.get_shader_param = zink_get_shader_param;
947 screen->base.get_compiler_options = zink_get_compiler_options;
948 screen->base.is_format_supported = zink_is_format_supported;
949 screen->base.context_create = zink_context_create;
950 screen->base.flush_frontbuffer = zink_flush_frontbuffer;
951 screen->base.destroy = zink_destroy_screen;
952
953 zink_screen_resource_init(&screen->base);
954 zink_screen_fence_init(&screen->base);
955
956 slab_create_parent(&screen->transfer_pool, sizeof(struct zink_transfer), 16);
957
958 return &screen->base;
959
960 fail:
961 FREE(screen);
962 return NULL;
963 }
964
965 struct pipe_screen *
966 zink_create_screen(struct sw_winsys *winsys)
967 {
968 return zink_internal_create_screen(winsys, -1);
969 }
970
971 struct pipe_screen *
972 zink_drm_create_screen(int fd)
973 {
974 return zink_internal_create_screen(NULL, fd);
975 }