zink/spirv: implement load_front_face
[mesa.git] / src / gallium / drivers / zink / zink_screen.c
1 /*
2 * Copyright 2018 Collabora Ltd.
3 *
4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * on the rights to use, copy, modify, merge, publish, distribute, sub
8 * license, and/or sell copies of the Software, and to permit persons to whom
9 * the Software is furnished to do so, subject to the following conditions:
10 *
11 * The above copyright notice and this permission notice (including the next
12 * paragraph) shall be included in all copies or substantial portions of the
13 * Software.
14 *
15 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17 * FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. IN NO EVENT SHALL
18 * THE AUTHOR(S) AND/OR THEIR SUPPLIERS BE LIABLE FOR ANY CLAIM,
19 * DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR
20 * OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE
21 * USE OR OTHER DEALINGS IN THE SOFTWARE.
22 */
23
24 #include "zink_screen.h"
25
26 #include "zink_compiler.h"
27 #include "zink_context.h"
28 #include "zink_fence.h"
29 #include "zink_public.h"
30 #include "zink_resource.h"
31
32 #include "os/os_process.h"
33 #include "util/u_debug.h"
34 #include "util/u_format.h"
35 #include "util/u_math.h"
36 #include "util/u_memory.h"
37 #include "util/u_screen.h"
38 #include "util/u_string.h"
39
40 #include "state_tracker/sw_winsys.h"
41
42 static const struct debug_named_value
43 debug_options[] = {
44 { "nir", ZINK_DEBUG_NIR, "Dump NIR during program compile" },
45 { "spirv", ZINK_DEBUG_SPIRV, "Dump SPIR-V during program compile" },
46 { "tgsi", ZINK_DEBUG_TGSI, "Dump TGSI during program compile" },
47 DEBUG_NAMED_VALUE_END
48 };
49
50 DEBUG_GET_ONCE_FLAGS_OPTION(zink_debug, "ZINK_DEBUG", debug_options, 0)
51
52 uint32_t
53 zink_debug;
54
/*
 * pipe_screen::get_vendor hook.
 *
 * Returns a constant string naming the driver vendor; pscreen is not used.
 */
static const char *
zink_get_vendor(struct pipe_screen *pscreen)
{
   static const char vendor_name[] = "Collabora Ltd";

   return vendor_name;
}
60
61 static const char *
62 zink_get_device_vendor(struct pipe_screen *pscreen)
63 {
64 struct zink_screen *screen = zink_screen(pscreen);
65 static char buf[1000];
66 snprintf(buf, sizeof(buf), "Unknown (vendor-id: 0x%04x)", screen->props.vendorID);
67 return buf;
68 }
69
70 static const char *
71 zink_get_name(struct pipe_screen *pscreen)
72 {
73 struct zink_screen *screen = zink_screen(pscreen);
74 static char buf[1000];
75 snprintf(buf, sizeof(buf), "zink (%s)", screen->props.deviceName);
76 return buf;
77 }
78
79 static int
80 get_video_mem(struct zink_screen *screen)
81 {
82 VkDeviceSize size = 0;
83 for (uint32_t i = 0; i < screen->mem_props.memoryHeapCount; ++i)
84 size += screen->mem_props.memoryHeaps[i].size;
85 return (int)(size >> 20);
86 }
87
88 static int
89 zink_get_param(struct pipe_screen *pscreen, enum pipe_cap param)
90 {
91 struct zink_screen *screen = zink_screen(pscreen);
92
93 switch (param) {
94 case PIPE_CAP_NPOT_TEXTURES:
95 return 1;
96
97 case PIPE_CAP_MAX_DUAL_SOURCE_RENDER_TARGETS:
98 return screen->props.limits.maxFragmentDualSrcAttachments;
99
100 case PIPE_CAP_POINT_SPRITE:
101 return 1;
102
103 case PIPE_CAP_MAX_RENDER_TARGETS:
104 return screen->props.limits.maxColorAttachments;
105
106 case PIPE_CAP_OCCLUSION_QUERY:
107 return 1;
108
109 #if 0 /* TODO: Enable me */
110 case PIPE_CAP_QUERY_TIME_ELAPSED:
111 return 1;
112 #endif
113
114 case PIPE_CAP_TEXTURE_SWIZZLE:
115 return 1;
116
117 case PIPE_CAP_MAX_TEXTURE_2D_SIZE:
118 return screen->props.limits.maxImageDimension2D;
119 case PIPE_CAP_MAX_TEXTURE_3D_LEVELS:
120 return 1 + util_logbase2(screen->props.limits.maxImageDimension3D);
121 case PIPE_CAP_MAX_TEXTURE_CUBE_LEVELS:
122 return 1 + util_logbase2(screen->props.limits.maxImageDimensionCube);
123
124 case PIPE_CAP_BLEND_EQUATION_SEPARATE:
125 return 1;
126
127 case PIPE_CAP_FRAGMENT_SHADER_TEXTURE_LOD:
128 case PIPE_CAP_FRAGMENT_SHADER_DERIVATIVES:
129 case PIPE_CAP_VERTEX_SHADER_SATURATE:
130 return 1;
131
132 case PIPE_CAP_INDEP_BLEND_ENABLE:
133 case PIPE_CAP_INDEP_BLEND_FUNC:
134 return 1;
135
136 case PIPE_CAP_MAX_TEXTURE_ARRAY_LAYERS:
137 return screen->props.limits.maxImageArrayLayers;
138
139 #if 0 /* TODO: Enable me */
140 case PIPE_CAP_DEPTH_CLIP_DISABLE:
141 return 0;
142 #endif
143
144 #if 0 /* TODO: Enable me */
145 case PIPE_CAP_MIXED_COLORBUFFER_FORMATS:
146 return 1;
147 #endif
148
149 case PIPE_CAP_SEAMLESS_CUBE_MAP:
150 return 1;
151
152 case PIPE_CAP_MIN_TEXEL_OFFSET:
153 return screen->props.limits.minTexelOffset;
154 case PIPE_CAP_MAX_TEXEL_OFFSET:
155 return screen->props.limits.maxTexelOffset;
156
157 case PIPE_CAP_VERTEX_COLOR_UNCLAMPED:
158 return 1;
159
160 case PIPE_CAP_GLSL_FEATURE_LEVEL:
161 case PIPE_CAP_GLSL_FEATURE_LEVEL_COMPATIBILITY:
162 return 120;
163
164 #if 0 /* TODO: Enable me */
165 case PIPE_CAP_COMPUTE:
166 return 1;
167 #endif
168
169 case PIPE_CAP_CONSTANT_BUFFER_OFFSET_ALIGNMENT:
170 return screen->props.limits.minUniformBufferOffsetAlignment;
171
172 #if 0 /* TODO: Enable me */
173 case PIPE_CAP_QUERY_TIMESTAMP:
174 return 1;
175 #endif
176
177 case PIPE_CAP_MIN_MAP_BUFFER_ALIGNMENT:
178 return screen->props.limits.minMemoryMapAlignment;
179
180 case PIPE_CAP_CUBE_MAP_ARRAY:
181 return screen->feats.imageCubeArray;
182
183 case PIPE_CAP_PREFER_BLIT_BASED_TEXTURE_TRANSFER:
184 return 0; /* unsure */
185
186 case PIPE_CAP_MAX_TEXTURE_BUFFER_SIZE:
187 return screen->props.limits.maxTexelBufferElements;
188
189 case PIPE_CAP_ENDIANNESS:
190 return PIPE_ENDIAN_NATIVE; /* unsure */
191
192 case PIPE_CAP_MAX_VIEWPORTS:
193 return screen->props.limits.maxViewports;
194
195 case PIPE_CAP_MIXED_FRAMEBUFFER_SIZES:
196 return 1;
197
198 case PIPE_CAP_MAX_GEOMETRY_OUTPUT_VERTICES:
199 return screen->props.limits.maxGeometryOutputVertices;
200 case PIPE_CAP_MAX_GEOMETRY_TOTAL_OUTPUT_COMPONENTS:
201 return screen->props.limits.maxGeometryOutputComponents;
202
203 #if 0 /* TODO: Enable me. Enables ARB_texture_gather */
204 case PIPE_CAP_MAX_TEXTURE_GATHER_COMPONENTS:
205 return 4;
206 #endif
207
208 case PIPE_CAP_MIN_TEXTURE_GATHER_OFFSET:
209 return screen->props.limits.minTexelGatherOffset;
210 case PIPE_CAP_MAX_TEXTURE_GATHER_OFFSET:
211 return screen->props.limits.maxTexelGatherOffset;
212
213 case PIPE_CAP_VENDOR_ID:
214 return screen->props.vendorID;
215 case PIPE_CAP_DEVICE_ID:
216 return screen->props.deviceID;
217
218 case PIPE_CAP_ACCELERATED:
219 return 1;
220 case PIPE_CAP_VIDEO_MEMORY:
221 return get_video_mem(screen);
222 case PIPE_CAP_UMA:
223 return screen->props.deviceType == VK_PHYSICAL_DEVICE_TYPE_INTEGRATED_GPU;
224
225 case PIPE_CAP_MAX_VERTEX_ATTRIB_STRIDE:
226 return screen->props.limits.maxVertexInputBindingStride;
227
228 #if 0 /* TODO: Enable me */
229 case PIPE_CAP_SAMPLER_VIEW_TARGET:
230 return 1;
231 #endif
232
233 #if 0 /* TODO: Enable me */
234 case PIPE_CAP_CLIP_HALFZ:
235 return 1;
236 #endif
237
238 #if 0 /* TODO: Enable me */
239 case PIPE_CAP_TEXTURE_FLOAT_LINEAR:
240 case PIPE_CAP_TEXTURE_HALF_FLOAT_LINEAR:
241 return 1;
242 #endif
243
244 case PIPE_CAP_SHAREABLE_SHADERS:
245 return 1;
246
247 #if 0 /* TODO: Enable me. Enables GL_ARB_shader_storage_buffer_object */
248 case PIPE_CAP_SHADER_BUFFER_OFFSET_ALIGNMENT:
249 return screen->props.limits.minStorageBufferOffsetAlignment;
250 #endif
251
252 case PIPE_CAP_PCI_GROUP:
253 case PIPE_CAP_PCI_BUS:
254 case PIPE_CAP_PCI_DEVICE:
255 case PIPE_CAP_PCI_FUNCTION:
256 return 0; /* TODO: figure these out */
257
258 #if 0 /* TODO: Enable me */
259 case PIPE_CAP_CULL_DISTANCE:
260 return screen->feats.shaderCullDistance;
261 #endif
262
263 case PIPE_CAP_VIEWPORT_SUBPIXEL_BITS:
264 return screen->props.limits.viewportSubPixelBits;
265
266 case PIPE_CAP_GLSL_OPTIMIZE_CONSERVATIVELY:
267 return 0; /* not sure */
268
269 case PIPE_CAP_MAX_GS_INVOCATIONS:
270 return 0; /* not implemented */
271
272 case PIPE_CAP_MAX_COMBINED_SHADER_BUFFERS:
273 return screen->props.limits.maxDescriptorSetStorageBuffers;
274
275 case PIPE_CAP_MAX_SHADER_BUFFER_SIZE:
276 return screen->props.limits.maxStorageBufferRange; /* unsure */
277
278 case PIPE_CAP_TGSI_FS_COORD_ORIGIN_UPPER_LEFT:
279 case PIPE_CAP_TGSI_FS_COORD_PIXEL_CENTER_HALF_INTEGER:
280 return 1;
281
282 case PIPE_CAP_TGSI_FS_COORD_ORIGIN_LOWER_LEFT:
283 case PIPE_CAP_TGSI_FS_COORD_PIXEL_CENTER_INTEGER:
284 return 0;
285
286 case PIPE_CAP_BUFFER_MAP_PERSISTENT_COHERENT:
287 return 1;
288
289 case PIPE_CAP_NIR_COMPACT_ARRAYS:
290 return 1;
291
292 case PIPE_CAP_TGSI_FS_FACE_IS_INTEGER_SYSVAL:
293 return 1;
294
295 case PIPE_CAP_FLATSHADE:
296 case PIPE_CAP_ALPHA_TEST:
297 case PIPE_CAP_CLIP_PLANES:
298 case PIPE_CAP_POINT_SIZE_FIXED:
299 return 0;
300
301 default:
302 return u_pipe_screen_get_param_defaults(pscreen, param);
303 }
304 }
305
306 static float
307 zink_get_paramf(struct pipe_screen *pscreen, enum pipe_capf param)
308 {
309 struct zink_screen *screen = zink_screen(pscreen);
310
311 switch (param) {
312 case PIPE_CAPF_MAX_LINE_WIDTH:
313 case PIPE_CAPF_MAX_LINE_WIDTH_AA:
314 return screen->props.limits.lineWidthRange[1];
315
316 case PIPE_CAPF_MAX_POINT_WIDTH:
317 case PIPE_CAPF_MAX_POINT_WIDTH_AA:
318 return screen->props.limits.pointSizeRange[1];
319
320 case PIPE_CAPF_MAX_TEXTURE_ANISOTROPY:
321 return screen->props.limits.maxSamplerAnisotropy;
322
323 case PIPE_CAPF_MAX_TEXTURE_LOD_BIAS:
324 return screen->props.limits.maxSamplerLodBias;
325
326 case PIPE_CAPF_MIN_CONSERVATIVE_RASTER_DILATE:
327 case PIPE_CAPF_MAX_CONSERVATIVE_RASTER_DILATE:
328 case PIPE_CAPF_CONSERVATIVE_RASTER_DILATE_GRANULARITY:
329 return 0.0f; /* not implemented */
330 }
331
332 /* should only get here on unhandled cases */
333 return 0.0;
334 }
335
336 static int
337 zink_get_shader_param(struct pipe_screen *pscreen,
338 enum pipe_shader_type shader,
339 enum pipe_shader_cap param)
340 {
341 struct zink_screen *screen = zink_screen(pscreen);
342
343 switch (param) {
344 case PIPE_SHADER_CAP_MAX_INSTRUCTIONS:
345 case PIPE_SHADER_CAP_MAX_ALU_INSTRUCTIONS:
346 case PIPE_SHADER_CAP_MAX_TEX_INSTRUCTIONS:
347 case PIPE_SHADER_CAP_MAX_TEX_INDIRECTIONS:
348 case PIPE_SHADER_CAP_MAX_CONTROL_FLOW_DEPTH:
349 if (shader == PIPE_SHADER_VERTEX ||
350 shader == PIPE_SHADER_FRAGMENT)
351 return INT_MAX;
352 return 0;
353
354 case PIPE_SHADER_CAP_MAX_INPUTS:
355 switch (shader) {
356 case PIPE_SHADER_VERTEX:
357 return MIN2(screen->props.limits.maxVertexInputAttributes,
358 PIPE_MAX_SHADER_INPUTS);
359 case PIPE_SHADER_FRAGMENT:
360 return MIN2(screen->props.limits.maxFragmentInputComponents / 4,
361 PIPE_MAX_SHADER_INPUTS);
362 default:
363 return 0; /* unsupported stage */
364 }
365
366 case PIPE_SHADER_CAP_MAX_OUTPUTS:
367 switch (shader) {
368 case PIPE_SHADER_VERTEX:
369 return MIN2(screen->props.limits.maxVertexOutputComponents / 4,
370 PIPE_MAX_SHADER_OUTPUTS);
371 case PIPE_SHADER_FRAGMENT:
372 return MIN2(screen->props.limits.maxColorAttachments,
373 PIPE_MAX_SHADER_OUTPUTS);
374 default:
375 return 0; /* unsupported stage */
376 }
377
378 case PIPE_SHADER_CAP_MAX_TEXTURE_SAMPLERS:
379 /* this might be a bit simplistic... */
380 return MIN2(screen->props.limits.maxPerStageDescriptorSamplers,
381 PIPE_MAX_SAMPLERS);
382
383 case PIPE_SHADER_CAP_MAX_CONST_BUFFER_SIZE:
384 return MIN2(screen->props.limits.maxUniformBufferRange, INT_MAX);
385
386 case PIPE_SHADER_CAP_MAX_CONST_BUFFERS:
387 return screen->props.limits.maxPerStageDescriptorUniformBuffers;
388
389 case PIPE_SHADER_CAP_MAX_TEMPS:
390 return INT_MAX;
391
392 case PIPE_SHADER_CAP_INDIRECT_INPUT_ADDR:
393 case PIPE_SHADER_CAP_INDIRECT_OUTPUT_ADDR:
394 case PIPE_SHADER_CAP_INDIRECT_TEMP_ADDR:
395 case PIPE_SHADER_CAP_INDIRECT_CONST_ADDR:
396 case PIPE_SHADER_CAP_SUBROUTINES:
397 case PIPE_SHADER_CAP_INTEGERS:
398 case PIPE_SHADER_CAP_INT64_ATOMICS:
399 case PIPE_SHADER_CAP_FP16:
400 return 0; /* not implemented */
401
402 case PIPE_SHADER_CAP_PREFERRED_IR:
403 return PIPE_SHADER_IR_NIR;
404
405 case PIPE_SHADER_CAP_TGSI_SQRT_SUPPORTED:
406 return 0; /* not implemented */
407
408 case PIPE_SHADER_CAP_MAX_SAMPLER_VIEWS:
409 return MIN2(screen->props.limits.maxPerStageDescriptorSampledImages,
410 PIPE_MAX_SHADER_SAMPLER_VIEWS);
411
412 case PIPE_SHADER_CAP_TGSI_DROUND_SUPPORTED:
413 case PIPE_SHADER_CAP_TGSI_DFRACEXP_DLDEXP_SUPPORTED:
414 case PIPE_SHADER_CAP_TGSI_FMA_SUPPORTED:
415 return 0; /* not implemented */
416
417 case PIPE_SHADER_CAP_TGSI_ANY_INOUT_DECL_RANGE:
418 return 0; /* no idea */
419
420 case PIPE_SHADER_CAP_MAX_UNROLL_ITERATIONS_HINT:
421 return 32; /* arbitrary */
422
423 case PIPE_SHADER_CAP_MAX_SHADER_BUFFERS:
424 /* TODO: this limitation is dumb, and will need some fixes in mesa */
425 return MIN2(screen->props.limits.maxPerStageDescriptorStorageBuffers, 8);
426
427 case PIPE_SHADER_CAP_SUPPORTED_IRS:
428 return (1 << PIPE_SHADER_IR_NIR) | (1 << PIPE_SHADER_IR_TGSI);
429
430 case PIPE_SHADER_CAP_MAX_SHADER_IMAGES:
431 return MIN2(screen->props.limits.maxPerStageDescriptorStorageImages,
432 PIPE_MAX_SHADER_IMAGES);
433
434 case PIPE_SHADER_CAP_LOWER_IF_THRESHOLD:
435 case PIPE_SHADER_CAP_TGSI_SKIP_MERGE_REGISTERS:
436 return 0; /* unsure */
437
438 case PIPE_SHADER_CAP_TGSI_LDEXP_SUPPORTED:
439 case PIPE_SHADER_CAP_MAX_HW_ATOMIC_COUNTERS:
440 case PIPE_SHADER_CAP_MAX_HW_ATOMIC_COUNTER_BUFFERS:
441 case PIPE_SHADER_CAP_TGSI_CONT_SUPPORTED:
442 return 0; /* not implemented */
443 }
444
445 /* should only get here on unhandled cases */
446 return 0;
447 }
448
449 static const VkFormat formats[PIPE_FORMAT_COUNT] = {
450 #define MAP_FORMAT_NORM(FMT) \
451 [PIPE_FORMAT_ ## FMT ## _UNORM] = VK_FORMAT_ ## FMT ## _UNORM, \
452 [PIPE_FORMAT_ ## FMT ## _SNORM] = VK_FORMAT_ ## FMT ## _SNORM,
453
454 #define MAP_FORMAT_SCALED(FMT) \
455 [PIPE_FORMAT_ ## FMT ## _USCALED] = VK_FORMAT_ ## FMT ## _USCALED, \
456 [PIPE_FORMAT_ ## FMT ## _SSCALED] = VK_FORMAT_ ## FMT ## _SSCALED,
457
458 #define MAP_FORMAT_INT(FMT) \
459 [PIPE_FORMAT_ ## FMT ## _UINT] = VK_FORMAT_ ## FMT ## _UINT, \
460 [PIPE_FORMAT_ ## FMT ## _SINT] = VK_FORMAT_ ## FMT ## _SINT,
461
462 #define MAP_FORMAT_SRGB(FMT) \
463 [PIPE_FORMAT_ ## FMT ## _SRGB] = VK_FORMAT_ ## FMT ## _SRGB,
464
465 #define MAP_FORMAT_FLOAT(FMT) \
466 [PIPE_FORMAT_ ## FMT ## _FLOAT] = VK_FORMAT_ ## FMT ## _SFLOAT,
467
468 // one component
469
470 // 8-bits
471 MAP_FORMAT_NORM(R8)
472 MAP_FORMAT_SCALED(R8)
473 MAP_FORMAT_INT(R8)
474 // 16-bits
475 MAP_FORMAT_NORM(R16)
476 MAP_FORMAT_SCALED(R16)
477 MAP_FORMAT_INT(R16)
478 MAP_FORMAT_FLOAT(R16)
479 // 32-bits
480 MAP_FORMAT_INT(R32)
481 MAP_FORMAT_FLOAT(R32)
482
483 // two components
484
485 // 8-bits
486 MAP_FORMAT_NORM(R8G8)
487 MAP_FORMAT_SCALED(R8G8)
488 MAP_FORMAT_INT(R8G8)
489 // 16-bits
490 MAP_FORMAT_NORM(R16G16)
491 MAP_FORMAT_SCALED(R16G16)
492 MAP_FORMAT_INT(R16G16)
493 MAP_FORMAT_FLOAT(R16G16)
494 // 32-bits
495 MAP_FORMAT_INT(R32G32)
496 MAP_FORMAT_FLOAT(R32G32)
497
498 // three components
499
500 // 8-bits
501 MAP_FORMAT_NORM(R8G8B8)
502 MAP_FORMAT_SCALED(R8G8B8)
503 MAP_FORMAT_INT(R8G8B8)
504 MAP_FORMAT_SRGB(R8G8B8)
505 // 16-bits
506 MAP_FORMAT_NORM(R16G16B16)
507 MAP_FORMAT_SCALED(R16G16B16)
508 MAP_FORMAT_INT(R16G16B16)
509 MAP_FORMAT_FLOAT(R16G16B16)
510 // 32-bits
511 MAP_FORMAT_INT(R32G32B32)
512 MAP_FORMAT_FLOAT(R32G32B32)
513
514 // four components
515
516 // 8-bits
517 MAP_FORMAT_NORM(R8G8B8A8)
518 MAP_FORMAT_SCALED(R8G8B8A8)
519 MAP_FORMAT_INT(R8G8B8A8)
520 MAP_FORMAT_SRGB(R8G8B8A8)
521 [PIPE_FORMAT_B8G8R8A8_UNORM] = VK_FORMAT_B8G8R8A8_UNORM,
522 MAP_FORMAT_SRGB(B8G8R8A8)
523 [PIPE_FORMAT_A8B8G8R8_SRGB] = VK_FORMAT_A8B8G8R8_SRGB_PACK32,
524 // 16-bits
525 MAP_FORMAT_NORM(R16G16B16A16)
526 MAP_FORMAT_SCALED(R16G16B16A16)
527 MAP_FORMAT_INT(R16G16B16A16)
528 MAP_FORMAT_FLOAT(R16G16B16A16)
529 // 32-bits
530 MAP_FORMAT_INT(R32G32B32A32)
531 MAP_FORMAT_FLOAT(R32G32B32A32)
532
533 // other color formats
534 [PIPE_FORMAT_B5G6R5_UNORM] = VK_FORMAT_R5G6B5_UNORM_PACK16,
535 [PIPE_FORMAT_B5G5R5A1_UNORM] = VK_FORMAT_B5G5R5A1_UNORM_PACK16,
536 [PIPE_FORMAT_R11G11B10_FLOAT] = VK_FORMAT_B10G11R11_UFLOAT_PACK32,
537 [PIPE_FORMAT_R9G9B9E5_FLOAT] = VK_FORMAT_E5B9G9R9_UFLOAT_PACK32,
538 [PIPE_FORMAT_R10G10B10A2_UNORM] = VK_FORMAT_A2B10G10R10_UNORM_PACK32,
539 [PIPE_FORMAT_B10G10R10A2_UNORM] = VK_FORMAT_A2R10G10B10_UNORM_PACK32,
540 [PIPE_FORMAT_R10G10B10A2_UINT] = VK_FORMAT_A2B10G10R10_UINT_PACK32,
541 [PIPE_FORMAT_B10G10R10A2_UINT] = VK_FORMAT_A2R10G10B10_UINT_PACK32,
542
543 // depth/stencil formats
544 [PIPE_FORMAT_Z32_FLOAT] = VK_FORMAT_D32_SFLOAT,
545 [PIPE_FORMAT_Z32_FLOAT_S8X24_UINT] = VK_FORMAT_D32_SFLOAT_S8_UINT,
546 [PIPE_FORMAT_Z16_UNORM] = VK_FORMAT_D16_UNORM,
547 [PIPE_FORMAT_X8Z24_UNORM] = VK_FORMAT_X8_D24_UNORM_PACK32,
548 [PIPE_FORMAT_Z24_UNORM_S8_UINT] = VK_FORMAT_D24_UNORM_S8_UINT,
549
550 // compressed formats
551 [PIPE_FORMAT_DXT1_RGB] = VK_FORMAT_BC1_RGB_UNORM_BLOCK,
552 [PIPE_FORMAT_DXT1_RGBA] = VK_FORMAT_BC1_RGBA_UNORM_BLOCK,
553 [PIPE_FORMAT_DXT3_RGBA] = VK_FORMAT_BC2_UNORM_BLOCK,
554 [PIPE_FORMAT_DXT5_RGBA] = VK_FORMAT_BC3_UNORM_BLOCK,
555 [PIPE_FORMAT_DXT1_SRGB] = VK_FORMAT_BC1_RGB_SRGB_BLOCK,
556 [PIPE_FORMAT_DXT1_SRGBA] = VK_FORMAT_BC1_RGBA_SRGB_BLOCK,
557 [PIPE_FORMAT_DXT3_SRGBA] = VK_FORMAT_BC2_SRGB_BLOCK,
558 [PIPE_FORMAT_DXT5_SRGBA] = VK_FORMAT_BC3_SRGB_BLOCK,
559
560 [PIPE_FORMAT_RGTC1_UNORM] = VK_FORMAT_BC4_UNORM_BLOCK,
561 [PIPE_FORMAT_RGTC1_SNORM] = VK_FORMAT_BC4_SNORM_BLOCK,
562 [PIPE_FORMAT_RGTC2_UNORM] = VK_FORMAT_BC5_UNORM_BLOCK,
563 [PIPE_FORMAT_RGTC2_SNORM] = VK_FORMAT_BC5_SNORM_BLOCK,
564 [PIPE_FORMAT_BPTC_RGBA_UNORM] = VK_FORMAT_BC7_UNORM_BLOCK,
565 [PIPE_FORMAT_BPTC_SRGBA] = VK_FORMAT_BC7_SRGB_BLOCK,
566 [PIPE_FORMAT_BPTC_RGB_FLOAT] = VK_FORMAT_BC6H_SFLOAT_BLOCK,
567 [PIPE_FORMAT_BPTC_RGB_UFLOAT] = VK_FORMAT_BC6H_UFLOAT_BLOCK,
568 };
569
570 VkFormat
571 zink_get_format(enum pipe_format format)
572 {
573 return formats[format];
574 }
575
576 static VkSampleCountFlagBits
577 vk_sample_count_flags(uint32_t sample_count)
578 {
579 switch (sample_count) {
580 case 1: return VK_SAMPLE_COUNT_1_BIT;
581 case 2: return VK_SAMPLE_COUNT_2_BIT;
582 case 4: return VK_SAMPLE_COUNT_4_BIT;
583 case 8: return VK_SAMPLE_COUNT_8_BIT;
584 case 16: return VK_SAMPLE_COUNT_16_BIT;
585 case 32: return VK_SAMPLE_COUNT_32_BIT;
586 case 64: return VK_SAMPLE_COUNT_64_BIT;
587 default:
588 return 0;
589 }
590 }
591
592 static bool
593 zink_is_format_supported(struct pipe_screen *pscreen,
594 enum pipe_format format,
595 enum pipe_texture_target target,
596 unsigned sample_count,
597 unsigned storage_sample_count,
598 unsigned bind)
599 {
600 struct zink_screen *screen = zink_screen(pscreen);
601
602 if (format == PIPE_FORMAT_NONE)
603 return screen->props.limits.framebufferNoAttachmentsSampleCounts &
604 vk_sample_count_flags(sample_count);
605
606 VkFormat vkformat = formats[format];
607 if (vkformat == VK_FORMAT_UNDEFINED)
608 return FALSE;
609
610 if (sample_count >= 1) {
611 VkSampleCountFlagBits sample_mask = vk_sample_count_flags(sample_count);
612 const struct util_format_description *desc = util_format_description(format);
613 if (util_format_is_depth_or_stencil(format)) {
614 if (util_format_has_depth(desc)) {
615 if (bind & PIPE_BIND_DEPTH_STENCIL &&
616 (screen->props.limits.framebufferDepthSampleCounts & sample_mask) != sample_mask)
617 return FALSE;
618 if (bind & PIPE_BIND_SAMPLER_VIEW &&
619 (screen->props.limits.sampledImageDepthSampleCounts & sample_mask) != sample_mask)
620 return FALSE;
621 }
622 if (util_format_has_stencil(desc)) {
623 if (bind & PIPE_BIND_DEPTH_STENCIL &&
624 (screen->props.limits.framebufferStencilSampleCounts & sample_mask) != sample_mask)
625 return FALSE;
626 if (bind & PIPE_BIND_SAMPLER_VIEW &&
627 (screen->props.limits.sampledImageStencilSampleCounts & sample_mask) != sample_mask)
628 return FALSE;
629 }
630 } else if (util_format_is_pure_integer(format)) {
631 if (bind & PIPE_BIND_RENDER_TARGET &&
632 !(screen->props.limits.framebufferColorSampleCounts & sample_mask))
633 return FALSE;
634 if (bind & PIPE_BIND_SAMPLER_VIEW &&
635 !(screen->props.limits.sampledImageIntegerSampleCounts & sample_mask))
636 return FALSE;
637 } else {
638 if (bind & PIPE_BIND_RENDER_TARGET &&
639 !(screen->props.limits.framebufferColorSampleCounts & sample_mask))
640 return FALSE;
641 if (bind & PIPE_BIND_SAMPLER_VIEW &&
642 !(screen->props.limits.sampledImageColorSampleCounts & sample_mask))
643 return FALSE;
644 }
645 }
646
647 VkFormatProperties props;
648 vkGetPhysicalDeviceFormatProperties(screen->pdev, vkformat, &props);
649
650 if (target == PIPE_BUFFER) {
651 if (bind & PIPE_BIND_VERTEX_BUFFER &&
652 !(props.bufferFeatures & VK_FORMAT_FEATURE_VERTEX_BUFFER_BIT))
653 return FALSE;
654 } else {
655 /* all other targets are texture-targets */
656 if (bind & PIPE_BIND_RENDER_TARGET &&
657 !(props.optimalTilingFeatures & VK_FORMAT_FEATURE_COLOR_ATTACHMENT_BIT))
658 return FALSE;
659
660 if (bind & PIPE_BIND_BLENDABLE &&
661 !(props.optimalTilingFeatures & VK_FORMAT_FEATURE_COLOR_ATTACHMENT_BLEND_BIT))
662 return FALSE;
663
664 if (bind & PIPE_BIND_SAMPLER_VIEW &&
665 !(props.optimalTilingFeatures & VK_FORMAT_FEATURE_SAMPLED_IMAGE_BIT))
666 return FALSE;
667
668 if (bind & PIPE_BIND_DEPTH_STENCIL &&
669 !(props.optimalTilingFeatures & VK_FORMAT_FEATURE_DEPTH_STENCIL_ATTACHMENT_BIT))
670 return FALSE;
671 }
672
673 if (util_format_is_compressed(format)) {
674 const struct util_format_description *desc = util_format_description(format);
675 if (desc->layout == UTIL_FORMAT_LAYOUT_BPTC &&
676 !screen->feats.textureCompressionBC)
677 return FALSE;
678 }
679
680 return TRUE;
681 }
682
683 static void
684 zink_destroy_screen(struct pipe_screen *pscreen)
685 {
686 struct zink_screen *screen = zink_screen(pscreen);
687 slab_destroy_parent(&screen->transfer_pool);
688 FREE(screen);
689 }
690
691 static VkInstance
692 create_instance()
693 {
694 VkApplicationInfo ai = {};
695 ai.sType = VK_STRUCTURE_TYPE_APPLICATION_INFO;
696
697 char proc_name[128];
698 if (os_get_process_name(proc_name, ARRAY_SIZE(proc_name)))
699 ai.pApplicationName = proc_name;
700 else
701 ai.pApplicationName = "unknown";
702
703 ai.pEngineName = "mesa zink";
704 ai.apiVersion = VK_API_VERSION_1_0;
705
706 const char *extensions[] = {
707 VK_KHR_GET_PHYSICAL_DEVICE_PROPERTIES_2_EXTENSION_NAME,
708 VK_KHR_EXTERNAL_MEMORY_CAPABILITIES_EXTENSION_NAME,
709 };
710
711 VkInstanceCreateInfo ici = {};
712 ici.sType = VK_STRUCTURE_TYPE_INSTANCE_CREATE_INFO;
713 ici.pApplicationInfo = &ai;
714 ici.ppEnabledExtensionNames = extensions;
715 ici.enabledExtensionCount = ARRAY_SIZE(extensions);
716
717 VkInstance instance = VK_NULL_HANDLE;
718 VkResult err = vkCreateInstance(&ici, NULL, &instance);
719 if (err != VK_SUCCESS)
720 return VK_NULL_HANDLE;
721
722 return instance;
723 }
724
725 static VkPhysicalDevice
726 choose_pdev(const VkInstance instance)
727 {
728 uint32_t i, pdev_count;
729 VkPhysicalDevice *pdevs, pdev;
730 vkEnumeratePhysicalDevices(instance, &pdev_count, NULL);
731 assert(pdev_count > 0);
732
733 pdevs = malloc(sizeof(*pdevs) * pdev_count);
734 vkEnumeratePhysicalDevices(instance, &pdev_count, pdevs);
735 assert(pdev_count > 0);
736
737 pdev = pdevs[0];
738 for (i = 0; i < pdev_count; ++i) {
739 VkPhysicalDeviceProperties props;
740 vkGetPhysicalDeviceProperties(pdevs[i], &props);
741 if (props.deviceType == VK_PHYSICAL_DEVICE_TYPE_DISCRETE_GPU) {
742 pdev = pdevs[i];
743 break;
744 }
745 }
746 free(pdevs);
747 return pdev;
748 }
749
750 static uint32_t
751 find_gfx_queue(const VkPhysicalDevice pdev)
752 {
753 uint32_t num_queues;
754 vkGetPhysicalDeviceQueueFamilyProperties(pdev, &num_queues, NULL);
755 assert(num_queues > 0);
756
757 VkQueueFamilyProperties *props = malloc(sizeof(*props) * num_queues);
758 vkGetPhysicalDeviceQueueFamilyProperties(pdev, &num_queues, props);
759
760 for (uint32_t i = 0; i < num_queues; i++) {
761 if (props[i].queueFlags & VK_QUEUE_GRAPHICS_BIT) {
762 free(props);
763 return i;
764 }
765 }
766
767 return UINT32_MAX;
768 }
769
770 static void
771 zink_flush_frontbuffer(struct pipe_screen *pscreen,
772 struct pipe_resource *pres,
773 unsigned level, unsigned layer,
774 void *winsys_drawable_handle,
775 struct pipe_box *sub_box)
776 {
777 struct zink_screen *screen = zink_screen(pscreen);
778 struct sw_winsys *winsys = screen->winsys;
779 struct zink_resource *res = zink_resource(pres);
780
781 if (!winsys)
782 return;
783 void *map = winsys->displaytarget_map(winsys, res->dt, 0);
784
785 if (map) {
786 VkImageSubresource isr = {};
787 isr.aspectMask = res->aspect;
788 isr.mipLevel = level;
789 isr.arrayLayer = layer;
790 VkSubresourceLayout layout;
791 vkGetImageSubresourceLayout(screen->dev, res->image, &isr, &layout);
792
793 void *ptr;
794 VkResult result = vkMapMemory(screen->dev, res->mem, res->offset, res->size, 0, &ptr);
795 if (result != VK_SUCCESS) {
796 debug_printf("failed to map memory for display\n");
797 return;
798 }
799 for (int i = 0; i < pres->height0; ++i) {
800 uint8_t *src = (uint8_t *)ptr + i * layout.rowPitch;
801 uint8_t *dst = (uint8_t *)map + i * res->dt_stride;
802 memcpy(dst, src, res->dt_stride);
803 }
804 vkUnmapMemory(screen->dev, res->mem);
805 }
806
807 winsys->displaytarget_unmap(winsys, res->dt);
808
809 assert(res->dt);
810 if (res->dt)
811 winsys->displaytarget_display(winsys, res->dt, winsys_drawable_handle, sub_box);
812 }
813
814 static struct pipe_screen *
815 zink_internal_create_screen(struct sw_winsys *winsys, int fd)
816 {
817 struct zink_screen *screen = CALLOC_STRUCT(zink_screen);
818 if (!screen)
819 return NULL;
820
821 zink_debug = debug_get_option_zink_debug();
822
823 screen->instance = create_instance();
824 screen->pdev = choose_pdev(screen->instance);
825 screen->gfx_queue = find_gfx_queue(screen->pdev);
826
827 vkGetPhysicalDeviceProperties(screen->pdev, &screen->props);
828 vkGetPhysicalDeviceFeatures(screen->pdev, &screen->feats);
829 vkGetPhysicalDeviceMemoryProperties(screen->pdev, &screen->mem_props);
830
831 uint32_t num_extensions = 0;
832 if (vkEnumerateDeviceExtensionProperties(screen->pdev, NULL,
833 &num_extensions, NULL) == VK_SUCCESS && num_extensions > 0) {
834 VkExtensionProperties *extensions = MALLOC(sizeof(VkExtensionProperties) *
835 num_extensions);
836 if (extensions) {
837 vkEnumerateDeviceExtensionProperties(screen->pdev, NULL,
838 &num_extensions, extensions);
839
840 for (uint32_t i = 0; i < num_extensions; ++i) {
841 if (!strcmp(extensions[i].extensionName,
842 VK_KHR_MAINTENANCE1_EXTENSION_NAME))
843 screen->have_VK_KHR_maintenance1 = true;
844 }
845 FREE(extensions);
846 }
847 }
848
849 VkDeviceQueueCreateInfo qci = {};
850 float dummy = 0.0f;
851 qci.sType = VK_STRUCTURE_TYPE_DEVICE_QUEUE_CREATE_INFO;
852 qci.queueFamilyIndex = screen->gfx_queue;
853 qci.queueCount = 1;
854 qci.pQueuePriorities = &dummy;
855
856 VkDeviceCreateInfo dci = {};
857 dci.sType = VK_STRUCTURE_TYPE_DEVICE_CREATE_INFO;
858 dci.queueCreateInfoCount = 1;
859 dci.pQueueCreateInfos = &qci;
860 dci.pEnabledFeatures = &screen->feats;
861 const char *extensions[] = {
862 VK_KHR_MAINTENANCE1_EXTENSION_NAME,
863 VK_KHR_EXTERNAL_MEMORY_EXTENSION_NAME,
864 VK_KHR_EXTERNAL_MEMORY_FD_EXTENSION_NAME,
865 };
866 dci.ppEnabledExtensionNames = extensions;
867 dci.enabledExtensionCount = ARRAY_SIZE(extensions);
868 if (vkCreateDevice(screen->pdev, &dci, NULL, &screen->dev) != VK_SUCCESS)
869 goto fail;
870
871 screen->winsys = winsys;
872
873 screen->base.get_name = zink_get_name;
874 screen->base.get_vendor = zink_get_vendor;
875 screen->base.get_device_vendor = zink_get_device_vendor;
876 screen->base.get_param = zink_get_param;
877 screen->base.get_paramf = zink_get_paramf;
878 screen->base.get_shader_param = zink_get_shader_param;
879 screen->base.get_compiler_options = zink_get_compiler_options;
880 screen->base.is_format_supported = zink_is_format_supported;
881 screen->base.context_create = zink_context_create;
882 screen->base.flush_frontbuffer = zink_flush_frontbuffer;
883 screen->base.destroy = zink_destroy_screen;
884
885 zink_screen_resource_init(&screen->base);
886 zink_screen_fence_init(&screen->base);
887
888 slab_create_parent(&screen->transfer_pool, sizeof(struct zink_transfer), 16);
889
890 return &screen->base;
891
892 fail:
893 FREE(screen);
894 return NULL;
895 }
896
/*
 * Create a zink screen that presents through a software winsys.
 *
 * No DRM file descriptor is involved, so -1 is passed for it.
 * Returns NULL on failure.
 */
struct pipe_screen *
zink_create_screen(struct sw_winsys *winsys)
{
   const int no_fd = -1;

   return zink_internal_create_screen(winsys, no_fd);
}
902
/*
 * Create a zink screen for a DRM file descriptor.
 *
 * No software winsys is attached (NULL is passed for it).
 * Returns NULL on failure.
 */
struct pipe_screen *
zink_drm_create_screen(int fd)
{
   struct sw_winsys *no_winsys = NULL;

   return zink_internal_create_screen(no_winsys, fd);
}