tu: Add multiview lowering pass
[mesa.git] / src / freedreno / vulkan / tu_descriptor_set.c
1 /*
2 * Copyright © 2016 Red Hat.
3 * Copyright © 2016 Bas Nieuwenhuizen
4 *
5 * Permission is hereby granted, free of charge, to any person obtaining a
6 * copy of this software and associated documentation files (the "Software"),
7 * to deal in the Software without restriction, including without limitation
8 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
9 * and/or sell copies of the Software, and to permit persons to whom the
10 * Software is furnished to do so, subject to the following conditions:
11 *
12 * The above copyright notice and this permission notice (including the next
13 * paragraph) shall be included in all copies or substantial portions of the
14 * Software.
15 *
16 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
19 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
20 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
21 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
22 * DEALINGS IN THE SOFTWARE.
23 */
24
25 /**
26 * @file
27 *
28 * We use the bindless descriptor model, which maps fairly closely to how
29 * Vulkan descriptor sets work. The two exceptions are input attachments and
30 * dynamic descriptors, which have to be patched when recording command
31 * buffers. We reserve an extra descriptor set for these. This descriptor set
32 * contains all the input attachments in the pipeline, in order, and then all
33 * the dynamic descriptors. The dynamic descriptors are stored in the CPU-side
34 * datastructure for each tu_descriptor_set, and then combined into one big
35 * descriptor set at CmdBindDescriptors time/draw time.
36 */
37
38 #include "tu_private.h"
39
40 #include <assert.h>
41 #include <fcntl.h>
42 #include <stdbool.h>
43 #include <string.h>
44 #include <unistd.h>
45
46 #include "util/mesa-sha1.h"
47 #include "vk_util.h"
48
49 static int
50 binding_compare(const void *av, const void *bv)
51 {
52 const VkDescriptorSetLayoutBinding *a =
53 (const VkDescriptorSetLayoutBinding *) av;
54 const VkDescriptorSetLayoutBinding *b =
55 (const VkDescriptorSetLayoutBinding *) bv;
56
57 return (a->binding < b->binding) ? -1 : (a->binding > b->binding) ? 1 : 0;
58 }
59
60 static VkDescriptorSetLayoutBinding *
61 create_sorted_bindings(const VkDescriptorSetLayoutBinding *bindings,
62 unsigned count)
63 {
64 VkDescriptorSetLayoutBinding *sorted_bindings =
65 malloc(count * sizeof(VkDescriptorSetLayoutBinding));
66 if (!sorted_bindings)
67 return NULL;
68
69 memcpy(sorted_bindings, bindings,
70 count * sizeof(VkDescriptorSetLayoutBinding));
71
72 qsort(sorted_bindings, count, sizeof(VkDescriptorSetLayoutBinding),
73 binding_compare);
74
75 return sorted_bindings;
76 }
77
78 static uint32_t
79 descriptor_size(VkDescriptorType type)
80 {
81 switch (type) {
82 case VK_DESCRIPTOR_TYPE_UNIFORM_BUFFER_DYNAMIC:
83 case VK_DESCRIPTOR_TYPE_STORAGE_BUFFER_DYNAMIC:
84 case VK_DESCRIPTOR_TYPE_INPUT_ATTACHMENT:
85 /* These are remapped to the special driver-managed descriptor set,
86 * hence they don't take up any space in the original descriptor set:
87 * Input attachment doesn't use descriptor sets at all
88 */
89 return 0;
90 case VK_DESCRIPTOR_TYPE_COMBINED_IMAGE_SAMPLER:
91 /* We make offsets and sizes all 16 dwords, to match how the hardware
92 * interprets indices passed to sample/load/store instructions in
93 * multiples of 16 dwords. This means that "normal" descriptors are all
94 * of size 16, with padding for smaller descriptors like uniform storage
95 * descriptors which are less than 16 dwords. However combined images
96 * and samplers are actually two descriptors, so they have size 2.
97 */
98 return A6XX_TEX_CONST_DWORDS * 4 * 2;
99 default:
100 return A6XX_TEX_CONST_DWORDS * 4;
101 }
102 }
103
104 VkResult
105 tu_CreateDescriptorSetLayout(
106 VkDevice _device,
107 const VkDescriptorSetLayoutCreateInfo *pCreateInfo,
108 const VkAllocationCallbacks *pAllocator,
109 VkDescriptorSetLayout *pSetLayout)
110 {
111 TU_FROM_HANDLE(tu_device, device, _device);
112 struct tu_descriptor_set_layout *set_layout;
113
114 assert(pCreateInfo->sType ==
115 VK_STRUCTURE_TYPE_DESCRIPTOR_SET_LAYOUT_CREATE_INFO);
116 const VkDescriptorSetLayoutBindingFlagsCreateInfoEXT *variable_flags =
117 vk_find_struct_const(
118 pCreateInfo->pNext,
119 DESCRIPTOR_SET_LAYOUT_BINDING_FLAGS_CREATE_INFO_EXT);
120
121 uint32_t max_binding = 0;
122 uint32_t immutable_sampler_count = 0;
123 uint32_t ycbcr_sampler_count = 0;
124 for (uint32_t j = 0; j < pCreateInfo->bindingCount; j++) {
125 max_binding = MAX2(max_binding, pCreateInfo->pBindings[j].binding);
126 if ((pCreateInfo->pBindings[j].descriptorType == VK_DESCRIPTOR_TYPE_COMBINED_IMAGE_SAMPLER ||
127 pCreateInfo->pBindings[j].descriptorType == VK_DESCRIPTOR_TYPE_SAMPLER) &&
128 pCreateInfo->pBindings[j].pImmutableSamplers) {
129 immutable_sampler_count += pCreateInfo->pBindings[j].descriptorCount;
130
131 bool has_ycbcr_sampler = false;
132 for (unsigned i = 0; i < pCreateInfo->pBindings[j].descriptorCount; ++i) {
133 if (tu_sampler_from_handle(pCreateInfo->pBindings[j].pImmutableSamplers[i])->ycbcr_sampler)
134 has_ycbcr_sampler = true;
135 }
136
137 if (has_ycbcr_sampler)
138 ycbcr_sampler_count += pCreateInfo->pBindings[j].descriptorCount;
139 }
140 }
141
142 uint32_t samplers_offset =
143 offsetof(struct tu_descriptor_set_layout, binding[max_binding + 1]);
144
145 /* note: only need to store TEX_SAMP_DWORDS for immutable samples,
146 * but using struct tu_sampler makes things simpler */
147 uint32_t size = samplers_offset +
148 immutable_sampler_count * sizeof(struct tu_sampler) +
149 ycbcr_sampler_count * sizeof(struct tu_sampler_ycbcr_conversion);
150
151 set_layout = vk_object_zalloc(&device->vk, pAllocator, size,
152 VK_OBJECT_TYPE_DESCRIPTOR_SET_LAYOUT);
153 if (!set_layout)
154 return vk_error(device->instance, VK_ERROR_OUT_OF_HOST_MEMORY);
155
156 set_layout->flags = pCreateInfo->flags;
157
158 /* We just allocate all the immutable samplers at the end of the struct */
159 struct tu_sampler *samplers = (void*) &set_layout->binding[max_binding + 1];
160 struct tu_sampler_ycbcr_conversion *ycbcr_samplers =
161 (void*) &samplers[immutable_sampler_count];
162
163 VkDescriptorSetLayoutBinding *bindings = create_sorted_bindings(
164 pCreateInfo->pBindings, pCreateInfo->bindingCount);
165 if (!bindings) {
166 vk_object_free(&device->vk, pAllocator, set_layout);
167 return vk_error(device->instance, VK_ERROR_OUT_OF_HOST_MEMORY);
168 }
169
170 set_layout->binding_count = max_binding + 1;
171 set_layout->shader_stages = 0;
172 set_layout->has_immutable_samplers = false;
173 set_layout->size = 0;
174 set_layout->dynamic_ubo = 0;
175
176 uint32_t dynamic_offset_count = 0;
177 uint32_t buffer_count = 0;
178
179 for (uint32_t j = 0; j < pCreateInfo->bindingCount; j++) {
180 const VkDescriptorSetLayoutBinding *binding = bindings + j;
181 uint32_t b = binding->binding;
182
183 set_layout->binding[b].type = binding->descriptorType;
184 set_layout->binding[b].array_size = binding->descriptorCount;
185 set_layout->binding[b].offset = set_layout->size;
186 set_layout->binding[b].buffer_offset = buffer_count;
187 set_layout->binding[b].dynamic_offset_offset = dynamic_offset_count;
188 set_layout->binding[b].size = descriptor_size(binding->descriptorType);
189 set_layout->binding[b].shader_stages = binding->stageFlags;
190
191 if (variable_flags && binding->binding < variable_flags->bindingCount &&
192 (variable_flags->pBindingFlags[binding->binding] &
193 VK_DESCRIPTOR_BINDING_VARIABLE_DESCRIPTOR_COUNT_BIT_EXT)) {
194 assert(!binding->pImmutableSamplers); /* Terribly ill defined how
195 many samplers are valid */
196 assert(binding->binding == max_binding);
197
198 set_layout->has_variable_descriptors = true;
199 }
200
201 if ((binding->descriptorType == VK_DESCRIPTOR_TYPE_COMBINED_IMAGE_SAMPLER ||
202 binding->descriptorType == VK_DESCRIPTOR_TYPE_SAMPLER) &&
203 binding->pImmutableSamplers) {
204 set_layout->binding[b].immutable_samplers_offset = samplers_offset;
205 set_layout->has_immutable_samplers = true;
206
207 for (uint32_t i = 0; i < binding->descriptorCount; i++)
208 samplers[i] = *tu_sampler_from_handle(binding->pImmutableSamplers[i]);
209
210 samplers += binding->descriptorCount;
211 samplers_offset += sizeof(struct tu_sampler) * binding->descriptorCount;
212
213 bool has_ycbcr_sampler = false;
214 for (unsigned i = 0; i < pCreateInfo->pBindings[j].descriptorCount; ++i) {
215 if (tu_sampler_from_handle(binding->pImmutableSamplers[i])->ycbcr_sampler)
216 has_ycbcr_sampler = true;
217 }
218
219 if (has_ycbcr_sampler) {
220 set_layout->binding[b].ycbcr_samplers_offset =
221 (const char*)ycbcr_samplers - (const char*)set_layout;
222 for (uint32_t i = 0; i < binding->descriptorCount; i++) {
223 struct tu_sampler *sampler = tu_sampler_from_handle(binding->pImmutableSamplers[i]);
224 if (sampler->ycbcr_sampler)
225 ycbcr_samplers[i] = *sampler->ycbcr_sampler;
226 else
227 ycbcr_samplers[i].ycbcr_model = VK_SAMPLER_YCBCR_MODEL_CONVERSION_RGB_IDENTITY;
228 }
229 ycbcr_samplers += binding->descriptorCount;
230 } else {
231 set_layout->binding[b].ycbcr_samplers_offset = 0;
232 }
233 }
234
235 set_layout->size +=
236 binding->descriptorCount * set_layout->binding[b].size;
237 if (binding->descriptorType != VK_DESCRIPTOR_TYPE_SAMPLER &&
238 binding->descriptorType != VK_DESCRIPTOR_TYPE_INLINE_UNIFORM_BLOCK_EXT)
239 buffer_count += binding->descriptorCount;
240 if (binding->descriptorType == VK_DESCRIPTOR_TYPE_STORAGE_BUFFER_DYNAMIC ||
241 binding->descriptorType == VK_DESCRIPTOR_TYPE_UNIFORM_BUFFER_DYNAMIC) {
242 if (binding->descriptorType == VK_DESCRIPTOR_TYPE_UNIFORM_BUFFER_DYNAMIC) {
243 STATIC_ASSERT(MAX_DYNAMIC_BUFFERS <= 8 * sizeof(set_layout->dynamic_ubo));
244 set_layout->dynamic_ubo |=
245 ((1u << binding->descriptorCount) - 1) << dynamic_offset_count;
246 }
247
248 dynamic_offset_count += binding->descriptorCount;
249 }
250
251 set_layout->shader_stages |= binding->stageFlags;
252 }
253
254 free(bindings);
255
256 set_layout->dynamic_offset_count = dynamic_offset_count;
257 set_layout->buffer_count = buffer_count;
258
259 *pSetLayout = tu_descriptor_set_layout_to_handle(set_layout);
260
261 return VK_SUCCESS;
262 }
263
264 void
265 tu_DestroyDescriptorSetLayout(VkDevice _device,
266 VkDescriptorSetLayout _set_layout,
267 const VkAllocationCallbacks *pAllocator)
268 {
269 TU_FROM_HANDLE(tu_device, device, _device);
270 TU_FROM_HANDLE(tu_descriptor_set_layout, set_layout, _set_layout);
271
272 if (!set_layout)
273 return;
274
275 vk_object_free(&device->vk, pAllocator, set_layout);
276 }
277
278 void
279 tu_GetDescriptorSetLayoutSupport(
280 VkDevice device,
281 const VkDescriptorSetLayoutCreateInfo *pCreateInfo,
282 VkDescriptorSetLayoutSupport *pSupport)
283 {
284 VkDescriptorSetLayoutBinding *bindings = create_sorted_bindings(
285 pCreateInfo->pBindings, pCreateInfo->bindingCount);
286 if (!bindings) {
287 pSupport->supported = false;
288 return;
289 }
290
291 const VkDescriptorSetLayoutBindingFlagsCreateInfoEXT *variable_flags =
292 vk_find_struct_const(
293 pCreateInfo->pNext,
294 DESCRIPTOR_SET_LAYOUT_BINDING_FLAGS_CREATE_INFO_EXT);
295 VkDescriptorSetVariableDescriptorCountLayoutSupportEXT *variable_count =
296 vk_find_struct(
297 (void *) pCreateInfo->pNext,
298 DESCRIPTOR_SET_VARIABLE_DESCRIPTOR_COUNT_LAYOUT_SUPPORT_EXT);
299 if (variable_count) {
300 variable_count->maxVariableDescriptorCount = 0;
301 }
302
303 bool supported = true;
304 uint64_t size = 0;
305 for (uint32_t i = 0; i < pCreateInfo->bindingCount; i++) {
306 const VkDescriptorSetLayoutBinding *binding = bindings + i;
307
308 uint64_t descriptor_sz = descriptor_size(binding->descriptorType);
309 uint64_t descriptor_alignment = 8;
310
311 if (size && !ALIGN_POT(size, descriptor_alignment)) {
312 supported = false;
313 }
314 size = ALIGN_POT(size, descriptor_alignment);
315
316 uint64_t max_count = UINT64_MAX;
317 if (descriptor_sz)
318 max_count = (UINT64_MAX - size) / descriptor_sz;
319
320 if (max_count < binding->descriptorCount) {
321 supported = false;
322 }
323 if (variable_flags && binding->binding < variable_flags->bindingCount &&
324 variable_count &&
325 (variable_flags->pBindingFlags[binding->binding] &
326 VK_DESCRIPTOR_BINDING_VARIABLE_DESCRIPTOR_COUNT_BIT_EXT)) {
327 variable_count->maxVariableDescriptorCount =
328 MIN2(UINT32_MAX, max_count);
329 }
330 size += binding->descriptorCount * descriptor_sz;
331 }
332
333 free(bindings);
334
335 pSupport->supported = supported;
336 }
337
338 /*
339 * Pipeline layouts. These have nothing to do with the pipeline. They are
340 * just multiple descriptor set layouts pasted together.
341 */
342
343 VkResult
344 tu_CreatePipelineLayout(VkDevice _device,
345 const VkPipelineLayoutCreateInfo *pCreateInfo,
346 const VkAllocationCallbacks *pAllocator,
347 VkPipelineLayout *pPipelineLayout)
348 {
349 TU_FROM_HANDLE(tu_device, device, _device);
350 struct tu_pipeline_layout *layout;
351 struct mesa_sha1 ctx;
352
353 assert(pCreateInfo->sType ==
354 VK_STRUCTURE_TYPE_PIPELINE_LAYOUT_CREATE_INFO);
355
356 layout = vk_object_alloc(&device->vk, pAllocator, sizeof(*layout),
357 VK_OBJECT_TYPE_PIPELINE_LAYOUT);
358 if (layout == NULL)
359 return vk_error(device->instance, VK_ERROR_OUT_OF_HOST_MEMORY);
360
361 layout->num_sets = pCreateInfo->setLayoutCount;
362 layout->dynamic_offset_count = 0;
363
364 unsigned dynamic_offset_count = 0;
365
366 _mesa_sha1_init(&ctx);
367 for (uint32_t set = 0; set < pCreateInfo->setLayoutCount; set++) {
368 TU_FROM_HANDLE(tu_descriptor_set_layout, set_layout,
369 pCreateInfo->pSetLayouts[set]);
370 layout->set[set].layout = set_layout;
371 layout->set[set].dynamic_offset_start = dynamic_offset_count;
372 dynamic_offset_count += set_layout->dynamic_offset_count;
373
374 for (uint32_t b = 0; b < set_layout->binding_count; b++) {
375 if (set_layout->binding[b].immutable_samplers_offset)
376 _mesa_sha1_update(
377 &ctx,
378 tu_immutable_samplers(set_layout, set_layout->binding + b),
379 set_layout->binding[b].array_size * 4 * sizeof(uint32_t));
380 }
381 _mesa_sha1_update(
382 &ctx, set_layout->binding,
383 sizeof(set_layout->binding[0]) * set_layout->binding_count);
384 }
385
386 layout->dynamic_offset_count = dynamic_offset_count;
387 layout->push_constant_size = 0;
388
389 for (unsigned i = 0; i < pCreateInfo->pushConstantRangeCount; ++i) {
390 const VkPushConstantRange *range = pCreateInfo->pPushConstantRanges + i;
391 layout->push_constant_size =
392 MAX2(layout->push_constant_size, range->offset + range->size);
393 }
394
395 layout->push_constant_size = align(layout->push_constant_size, 16);
396 _mesa_sha1_update(&ctx, &layout->push_constant_size,
397 sizeof(layout->push_constant_size));
398 _mesa_sha1_final(&ctx, layout->sha1);
399 *pPipelineLayout = tu_pipeline_layout_to_handle(layout);
400
401 return VK_SUCCESS;
402 }
403
404 void
405 tu_DestroyPipelineLayout(VkDevice _device,
406 VkPipelineLayout _pipelineLayout,
407 const VkAllocationCallbacks *pAllocator)
408 {
409 TU_FROM_HANDLE(tu_device, device, _device);
410 TU_FROM_HANDLE(tu_pipeline_layout, pipeline_layout, _pipelineLayout);
411
412 if (!pipeline_layout)
413 return;
414
415 vk_object_free(&device->vk, pAllocator, pipeline_layout);
416 }
417
418 #define EMPTY 1
419
420 static VkResult
421 tu_descriptor_set_create(struct tu_device *device,
422 struct tu_descriptor_pool *pool,
423 const struct tu_descriptor_set_layout *layout,
424 const uint32_t *variable_count,
425 struct tu_descriptor_set **out_set)
426 {
427 struct tu_descriptor_set *set;
428 uint32_t buffer_count = layout->buffer_count;
429 if (variable_count) {
430 unsigned stride = 1;
431 if (layout->binding[layout->binding_count - 1].type == VK_DESCRIPTOR_TYPE_SAMPLER ||
432 layout->binding[layout->binding_count - 1].type == VK_DESCRIPTOR_TYPE_INLINE_UNIFORM_BLOCK_EXT)
433 stride = 0;
434 buffer_count = layout->binding[layout->binding_count - 1].buffer_offset +
435 *variable_count * stride;
436 }
437 unsigned dynamic_offset = sizeof(struct tu_descriptor_set) +
438 sizeof(struct tu_bo *) * buffer_count;
439 unsigned mem_size = dynamic_offset +
440 A6XX_TEX_CONST_DWORDS * 4 * layout->dynamic_offset_count;
441
442 if (pool->host_memory_base) {
443 if (pool->host_memory_end - pool->host_memory_ptr < mem_size)
444 return vk_error(device->instance, VK_ERROR_OUT_OF_POOL_MEMORY);
445
446 set = (struct tu_descriptor_set*)pool->host_memory_ptr;
447 pool->host_memory_ptr += mem_size;
448 } else {
449 set = vk_alloc2(&device->vk.alloc, NULL, mem_size, 8,
450 VK_SYSTEM_ALLOCATION_SCOPE_OBJECT);
451
452 if (!set)
453 return vk_error(device->instance, VK_ERROR_OUT_OF_HOST_MEMORY);
454 }
455
456 memset(set, 0, mem_size);
457 vk_object_base_init(&device->vk, &set->base, VK_OBJECT_TYPE_DESCRIPTOR_SET);
458
459 if (layout->dynamic_offset_count) {
460 set->dynamic_descriptors = (uint32_t *)((uint8_t*)set + dynamic_offset);
461 }
462
463 set->layout = layout;
464 set->pool = pool;
465 uint32_t layout_size = layout->size;
466 if (variable_count) {
467 assert(layout->has_variable_descriptors);
468 uint32_t stride = layout->binding[layout->binding_count - 1].size;
469 layout_size = layout->binding[layout->binding_count - 1].offset +
470 *variable_count * stride;
471 }
472
473 if (layout_size) {
474 set->size = layout_size;
475
476 if (!pool->host_memory_base && pool->entry_count == pool->max_entry_count) {
477 vk_object_free(&device->vk, NULL, set);
478 return vk_error(device->instance, VK_ERROR_OUT_OF_POOL_MEMORY);
479 }
480
481 /* try to allocate linearly first, so that we don't spend
482 * time looking for gaps if the app only allocates &
483 * resets via the pool. */
484 if (pool->current_offset + layout_size <= pool->size) {
485 set->mapped_ptr = (uint32_t*)(pool->bo.map + pool->current_offset);
486 set->va = pool->bo.iova + pool->current_offset;
487 if (!pool->host_memory_base) {
488 pool->entries[pool->entry_count].offset = pool->current_offset;
489 pool->entries[pool->entry_count].size = layout_size;
490 pool->entries[pool->entry_count].set = set;
491 pool->entry_count++;
492 }
493 pool->current_offset += layout_size;
494 } else if (!pool->host_memory_base) {
495 uint64_t offset = 0;
496 int index;
497
498 for (index = 0; index < pool->entry_count; ++index) {
499 if (pool->entries[index].offset - offset >= layout_size)
500 break;
501 offset = pool->entries[index].offset + pool->entries[index].size;
502 }
503
504 if (pool->size - offset < layout_size) {
505 vk_object_free(&device->vk, NULL, set);
506 return vk_error(device->instance, VK_ERROR_OUT_OF_POOL_MEMORY);
507 }
508
509 set->mapped_ptr = (uint32_t*)(pool->bo.map + offset);
510 set->va = pool->bo.iova + offset;
511 memmove(&pool->entries[index + 1], &pool->entries[index],
512 sizeof(pool->entries[0]) * (pool->entry_count - index));
513 pool->entries[index].offset = offset;
514 pool->entries[index].size = layout_size;
515 pool->entries[index].set = set;
516 pool->entry_count++;
517 } else
518 return vk_error(device->instance, VK_ERROR_OUT_OF_POOL_MEMORY);
519 }
520
521 if (layout->has_immutable_samplers) {
522 for (unsigned i = 0; i < layout->binding_count; ++i) {
523 if (!layout->binding[i].immutable_samplers_offset)
524 continue;
525
526 unsigned offset = layout->binding[i].offset / 4;
527 if (layout->binding[i].type == VK_DESCRIPTOR_TYPE_COMBINED_IMAGE_SAMPLER)
528 offset += A6XX_TEX_CONST_DWORDS;
529
530 const struct tu_sampler *samplers =
531 (const struct tu_sampler *)((const char *)layout +
532 layout->binding[i].immutable_samplers_offset);
533 for (unsigned j = 0; j < layout->binding[i].array_size; ++j) {
534 memcpy(set->mapped_ptr + offset, samplers[j].descriptor,
535 sizeof(samplers[j].descriptor));
536 offset += layout->binding[i].size / 4;
537 }
538 }
539 }
540
541 *out_set = set;
542 return VK_SUCCESS;
543 }
544
545 static void
546 tu_descriptor_set_destroy(struct tu_device *device,
547 struct tu_descriptor_pool *pool,
548 struct tu_descriptor_set *set,
549 bool free_bo)
550 {
551 assert(!pool->host_memory_base);
552
553 if (free_bo && set->size && !pool->host_memory_base) {
554 uint32_t offset = (uint8_t*)set->mapped_ptr - (uint8_t*)pool->bo.map;
555 for (int i = 0; i < pool->entry_count; ++i) {
556 if (pool->entries[i].offset == offset) {
557 memmove(&pool->entries[i], &pool->entries[i+1],
558 sizeof(pool->entries[i]) * (pool->entry_count - i - 1));
559 --pool->entry_count;
560 break;
561 }
562 }
563 }
564
565 vk_object_free(&device->vk, NULL, set);
566 }
567
568 VkResult
569 tu_CreateDescriptorPool(VkDevice _device,
570 const VkDescriptorPoolCreateInfo *pCreateInfo,
571 const VkAllocationCallbacks *pAllocator,
572 VkDescriptorPool *pDescriptorPool)
573 {
574 TU_FROM_HANDLE(tu_device, device, _device);
575 struct tu_descriptor_pool *pool;
576 uint64_t size = sizeof(struct tu_descriptor_pool);
577 uint64_t bo_size = 0, bo_count = 0, dynamic_count = 0;
578
579 for (unsigned i = 0; i < pCreateInfo->poolSizeCount; ++i) {
580 if (pCreateInfo->pPoolSizes[i].type != VK_DESCRIPTOR_TYPE_SAMPLER)
581 bo_count += pCreateInfo->pPoolSizes[i].descriptorCount;
582
583 switch(pCreateInfo->pPoolSizes[i].type) {
584 case VK_DESCRIPTOR_TYPE_UNIFORM_BUFFER_DYNAMIC:
585 case VK_DESCRIPTOR_TYPE_STORAGE_BUFFER_DYNAMIC:
586 dynamic_count += pCreateInfo->pPoolSizes[i].descriptorCount;
587 default:
588 break;
589 }
590
591 bo_size += descriptor_size(pCreateInfo->pPoolSizes[i].type) *
592 pCreateInfo->pPoolSizes[i].descriptorCount;
593 }
594
595 if (!(pCreateInfo->flags & VK_DESCRIPTOR_POOL_CREATE_FREE_DESCRIPTOR_SET_BIT)) {
596 uint64_t host_size = pCreateInfo->maxSets * sizeof(struct tu_descriptor_set);
597 host_size += sizeof(struct tu_bo*) * bo_count;
598 host_size += A6XX_TEX_CONST_DWORDS * 4 * dynamic_count;
599 size += host_size;
600 } else {
601 size += sizeof(struct tu_descriptor_pool_entry) * pCreateInfo->maxSets;
602 }
603
604 pool = vk_object_zalloc(&device->vk, pAllocator, size,
605 VK_OBJECT_TYPE_DESCRIPTOR_POOL);
606 if (!pool)
607 return vk_error(device->instance, VK_ERROR_OUT_OF_HOST_MEMORY);
608
609 if (!(pCreateInfo->flags & VK_DESCRIPTOR_POOL_CREATE_FREE_DESCRIPTOR_SET_BIT)) {
610 pool->host_memory_base = (uint8_t*)pool + sizeof(struct tu_descriptor_pool);
611 pool->host_memory_ptr = pool->host_memory_base;
612 pool->host_memory_end = (uint8_t*)pool + size;
613 }
614
615 if (bo_size) {
616 VkResult ret;
617
618 ret = tu_bo_init_new(device, &pool->bo, bo_size);
619 assert(ret == VK_SUCCESS);
620
621 ret = tu_bo_map(device, &pool->bo);
622 assert(ret == VK_SUCCESS);
623 }
624 pool->size = bo_size;
625 pool->max_entry_count = pCreateInfo->maxSets;
626
627 *pDescriptorPool = tu_descriptor_pool_to_handle(pool);
628 return VK_SUCCESS;
629 }
630
631 void
632 tu_DestroyDescriptorPool(VkDevice _device,
633 VkDescriptorPool _pool,
634 const VkAllocationCallbacks *pAllocator)
635 {
636 TU_FROM_HANDLE(tu_device, device, _device);
637 TU_FROM_HANDLE(tu_descriptor_pool, pool, _pool);
638
639 if (!pool)
640 return;
641
642 if (!pool->host_memory_base) {
643 for(int i = 0; i < pool->entry_count; ++i) {
644 tu_descriptor_set_destroy(device, pool, pool->entries[i].set, false);
645 }
646 }
647
648 if (pool->size)
649 tu_bo_finish(device, &pool->bo);
650
651 vk_object_free(&device->vk, pAllocator, pool);
652 }
653
654 VkResult
655 tu_ResetDescriptorPool(VkDevice _device,
656 VkDescriptorPool descriptorPool,
657 VkDescriptorPoolResetFlags flags)
658 {
659 TU_FROM_HANDLE(tu_device, device, _device);
660 TU_FROM_HANDLE(tu_descriptor_pool, pool, descriptorPool);
661
662 if (!pool->host_memory_base) {
663 for(int i = 0; i < pool->entry_count; ++i) {
664 tu_descriptor_set_destroy(device, pool, pool->entries[i].set, false);
665 }
666 pool->entry_count = 0;
667 }
668
669 pool->current_offset = 0;
670 pool->host_memory_ptr = pool->host_memory_base;
671
672 return VK_SUCCESS;
673 }
674
675 VkResult
676 tu_AllocateDescriptorSets(VkDevice _device,
677 const VkDescriptorSetAllocateInfo *pAllocateInfo,
678 VkDescriptorSet *pDescriptorSets)
679 {
680 TU_FROM_HANDLE(tu_device, device, _device);
681 TU_FROM_HANDLE(tu_descriptor_pool, pool, pAllocateInfo->descriptorPool);
682
683 VkResult result = VK_SUCCESS;
684 uint32_t i;
685 struct tu_descriptor_set *set = NULL;
686
687 const VkDescriptorSetVariableDescriptorCountAllocateInfoEXT *variable_counts =
688 vk_find_struct_const(pAllocateInfo->pNext, DESCRIPTOR_SET_VARIABLE_DESCRIPTOR_COUNT_ALLOCATE_INFO_EXT);
689 const uint32_t zero = 0;
690
691 /* allocate a set of buffers for each shader to contain descriptors */
692 for (i = 0; i < pAllocateInfo->descriptorSetCount; i++) {
693 TU_FROM_HANDLE(tu_descriptor_set_layout, layout,
694 pAllocateInfo->pSetLayouts[i]);
695
696 const uint32_t *variable_count = NULL;
697 if (variable_counts) {
698 if (i < variable_counts->descriptorSetCount)
699 variable_count = variable_counts->pDescriptorCounts + i;
700 else
701 variable_count = &zero;
702 }
703
704 assert(!(layout->flags & VK_DESCRIPTOR_SET_LAYOUT_CREATE_PUSH_DESCRIPTOR_BIT_KHR));
705
706 result = tu_descriptor_set_create(device, pool, layout, variable_count, &set);
707 if (result != VK_SUCCESS)
708 break;
709
710 pDescriptorSets[i] = tu_descriptor_set_to_handle(set);
711 }
712
713 if (result != VK_SUCCESS) {
714 tu_FreeDescriptorSets(_device, pAllocateInfo->descriptorPool,
715 i, pDescriptorSets);
716 for (i = 0; i < pAllocateInfo->descriptorSetCount; i++) {
717 pDescriptorSets[i] = VK_NULL_HANDLE;
718 }
719 }
720 return result;
721 }
722
723 VkResult
724 tu_FreeDescriptorSets(VkDevice _device,
725 VkDescriptorPool descriptorPool,
726 uint32_t count,
727 const VkDescriptorSet *pDescriptorSets)
728 {
729 TU_FROM_HANDLE(tu_device, device, _device);
730 TU_FROM_HANDLE(tu_descriptor_pool, pool, descriptorPool);
731
732 for (uint32_t i = 0; i < count; i++) {
733 TU_FROM_HANDLE(tu_descriptor_set, set, pDescriptorSets[i]);
734
735 if (set && !pool->host_memory_base)
736 tu_descriptor_set_destroy(device, pool, set, true);
737 }
738 return VK_SUCCESS;
739 }
740
741 static void write_texel_buffer_descriptor(struct tu_device *device,
742 struct tu_cmd_buffer *cmd_buffer,
743 unsigned *dst,
744 struct tu_bo **buffer_list,
745 const VkBufferView buffer_view)
746 {
747 TU_FROM_HANDLE(tu_buffer_view, view, buffer_view);
748
749 memcpy(dst, view->descriptor, sizeof(view->descriptor));
750
751 if (cmd_buffer)
752 tu_bo_list_add(&cmd_buffer->bo_list, view->buffer->bo, MSM_SUBMIT_BO_READ);
753 else
754 *buffer_list = view->buffer->bo;
755 }
756
757 static uint32_t get_range(struct tu_buffer *buf, VkDeviceSize offset,
758 VkDeviceSize range)
759 {
760 if (range == VK_WHOLE_SIZE) {
761 return buf->size - offset;
762 } else {
763 return range;
764 }
765 }
766
767 static void write_buffer_descriptor(struct tu_device *device,
768 struct tu_cmd_buffer *cmd_buffer,
769 unsigned *dst,
770 struct tu_bo **buffer_list,
771 const VkDescriptorBufferInfo *buffer_info)
772 {
773 TU_FROM_HANDLE(tu_buffer, buffer, buffer_info->buffer);
774
775 uint64_t va = tu_buffer_iova(buffer) + buffer_info->offset;
776 uint32_t range = get_range(buffer, buffer_info->offset, buffer_info->range);
777 range = ALIGN_POT(range, 4) / 4;
778 dst[0] =
779 A6XX_IBO_0_TILE_MODE(TILE6_LINEAR) | A6XX_IBO_0_FMT(FMT6_32_UINT);
780 dst[1] = range;
781 dst[2] =
782 A6XX_IBO_2_UNK4 | A6XX_IBO_2_TYPE(A6XX_TEX_1D) | A6XX_IBO_2_UNK31;
783 dst[3] = 0;
784 dst[4] = A6XX_IBO_4_BASE_LO(va);
785 dst[5] = A6XX_IBO_5_BASE_HI(va >> 32);
786 for (int i = 6; i < A6XX_TEX_CONST_DWORDS; i++)
787 dst[i] = 0;
788
789 if (cmd_buffer)
790 tu_bo_list_add(&cmd_buffer->bo_list, buffer->bo, MSM_SUBMIT_BO_READ);
791 else
792 *buffer_list = buffer->bo;
793 }
794
795 static void write_ubo_descriptor(struct tu_device *device,
796 struct tu_cmd_buffer *cmd_buffer,
797 unsigned *dst,
798 struct tu_bo **buffer_list,
799 const VkDescriptorBufferInfo *buffer_info)
800 {
801 TU_FROM_HANDLE(tu_buffer, buffer, buffer_info->buffer);
802
803 uint32_t range = get_range(buffer, buffer_info->offset, buffer_info->range);
804 /* The HW range is in vec4 units */
805 range = ALIGN_POT(range, 16) / 16;
806 uint64_t va = tu_buffer_iova(buffer) + buffer_info->offset;
807 dst[0] = A6XX_UBO_0_BASE_LO(va);
808 dst[1] = A6XX_UBO_1_BASE_HI(va >> 32) | A6XX_UBO_1_SIZE(range);
809
810 if (cmd_buffer)
811 tu_bo_list_add(&cmd_buffer->bo_list, buffer->bo, MSM_SUBMIT_BO_READ);
812 else
813 *buffer_list = buffer->bo;
814 }
815
816 static void
817 write_image_descriptor(struct tu_device *device,
818 struct tu_cmd_buffer *cmd_buffer,
819 unsigned *dst,
820 struct tu_bo **buffer_list,
821 VkDescriptorType descriptor_type,
822 const VkDescriptorImageInfo *image_info)
823 {
824 TU_FROM_HANDLE(tu_image_view, iview, image_info->imageView);
825
826 if (descriptor_type == VK_DESCRIPTOR_TYPE_STORAGE_IMAGE) {
827 memcpy(dst, iview->storage_descriptor, sizeof(iview->storage_descriptor));
828 } else {
829 memcpy(dst, iview->descriptor, sizeof(iview->descriptor));
830 }
831
832 if (cmd_buffer)
833 tu_bo_list_add(&cmd_buffer->bo_list, iview->image->bo, MSM_SUBMIT_BO_READ);
834 else
835 *buffer_list = iview->image->bo;
836 }
837
838 static void
839 write_combined_image_sampler_descriptor(struct tu_device *device,
840 struct tu_cmd_buffer *cmd_buffer,
841 unsigned sampler_offset,
842 unsigned *dst,
843 struct tu_bo **buffer_list,
844 VkDescriptorType descriptor_type,
845 const VkDescriptorImageInfo *image_info,
846 bool has_sampler)
847 {
848 TU_FROM_HANDLE(tu_sampler, sampler, image_info->sampler);
849
850 write_image_descriptor(device, cmd_buffer, dst, buffer_list,
851 descriptor_type, image_info);
852 /* copy over sampler state */
853 if (has_sampler) {
854 memcpy(dst + A6XX_TEX_CONST_DWORDS, sampler->descriptor, sizeof(sampler->descriptor));
855 }
856 }
857
858 static void
859 write_sampler_descriptor(struct tu_device *device,
860 unsigned *dst,
861 const VkDescriptorImageInfo *image_info)
862 {
863 TU_FROM_HANDLE(tu_sampler, sampler, image_info->sampler);
864
865 memcpy(dst, sampler->descriptor, sizeof(sampler->descriptor));
866 }
867
868 void
869 tu_update_descriptor_sets(struct tu_device *device,
870 struct tu_cmd_buffer *cmd_buffer,
871 VkDescriptorSet dstSetOverride,
872 uint32_t descriptorWriteCount,
873 const VkWriteDescriptorSet *pDescriptorWrites,
874 uint32_t descriptorCopyCount,
875 const VkCopyDescriptorSet *pDescriptorCopies)
876 {
877 uint32_t i, j;
878 for (i = 0; i < descriptorWriteCount; i++) {
879 const VkWriteDescriptorSet *writeset = &pDescriptorWrites[i];
880 TU_FROM_HANDLE(tu_descriptor_set, set,
881 dstSetOverride ? dstSetOverride : writeset->dstSet);
882 const struct tu_descriptor_set_binding_layout *binding_layout =
883 set->layout->binding + writeset->dstBinding;
884 uint32_t *ptr = set->mapped_ptr;
885 struct tu_bo **buffer_list = set->buffers;
886
887 ptr += binding_layout->offset / 4;
888
889 ptr += (binding_layout->size / 4) * writeset->dstArrayElement;
890 buffer_list += binding_layout->buffer_offset;
891 buffer_list += writeset->dstArrayElement;
892 for (j = 0; j < writeset->descriptorCount; ++j) {
893 switch(writeset->descriptorType) {
894 case VK_DESCRIPTOR_TYPE_UNIFORM_BUFFER_DYNAMIC: {
895 assert(!(set->layout->flags & VK_DESCRIPTOR_SET_LAYOUT_CREATE_PUSH_DESCRIPTOR_BIT_KHR));
896 unsigned idx = writeset->dstArrayElement + j;
897 idx += binding_layout->dynamic_offset_offset;
898 write_ubo_descriptor(device, cmd_buffer,
899 set->dynamic_descriptors + A6XX_TEX_CONST_DWORDS * idx,
900 buffer_list, writeset->pBufferInfo + j);
901 break;
902 }
903 case VK_DESCRIPTOR_TYPE_UNIFORM_BUFFER:
904 write_ubo_descriptor(device, cmd_buffer, ptr, buffer_list,
905 writeset->pBufferInfo + j);
906 break;
907 case VK_DESCRIPTOR_TYPE_STORAGE_BUFFER_DYNAMIC: {
908 assert(!(set->layout->flags & VK_DESCRIPTOR_SET_LAYOUT_CREATE_PUSH_DESCRIPTOR_BIT_KHR));
909 unsigned idx = writeset->dstArrayElement + j;
910 idx += binding_layout->dynamic_offset_offset;
911 write_buffer_descriptor(device, cmd_buffer,
912 set->dynamic_descriptors + A6XX_TEX_CONST_DWORDS * idx,
913 buffer_list, writeset->pBufferInfo + j);
914 break;
915 }
916 case VK_DESCRIPTOR_TYPE_STORAGE_BUFFER:
917 write_buffer_descriptor(device, cmd_buffer, ptr, buffer_list,
918 writeset->pBufferInfo + j);
919 break;
920 case VK_DESCRIPTOR_TYPE_UNIFORM_TEXEL_BUFFER:
921 case VK_DESCRIPTOR_TYPE_STORAGE_TEXEL_BUFFER:
922 write_texel_buffer_descriptor(device, cmd_buffer, ptr, buffer_list,
923 writeset->pTexelBufferView[j]);
924 break;
925 case VK_DESCRIPTOR_TYPE_SAMPLED_IMAGE:
926 case VK_DESCRIPTOR_TYPE_STORAGE_IMAGE:
927 write_image_descriptor(device, cmd_buffer, ptr, buffer_list,
928 writeset->descriptorType,
929 writeset->pImageInfo + j);
930 break;
931 case VK_DESCRIPTOR_TYPE_COMBINED_IMAGE_SAMPLER:
932 write_combined_image_sampler_descriptor(device, cmd_buffer,
933 A6XX_TEX_CONST_DWORDS * 4,
934 ptr, buffer_list,
935 writeset->descriptorType,
936 writeset->pImageInfo + j,
937 !binding_layout->immutable_samplers_offset);
938 break;
939 case VK_DESCRIPTOR_TYPE_SAMPLER:
940 write_sampler_descriptor(device, ptr, writeset->pImageInfo + j);
941 break;
942 case VK_DESCRIPTOR_TYPE_INPUT_ATTACHMENT:
943 /* nothing in descriptor set - framebuffer state is used instead */
944 break;
945 default:
946 unreachable("unimplemented descriptor type");
947 break;
948 }
949 ptr += binding_layout->size / 4;
950 ++buffer_list;
951 }
952 }
953
954 for (i = 0; i < descriptorCopyCount; i++) {
955 const VkCopyDescriptorSet *copyset = &pDescriptorCopies[i];
956 TU_FROM_HANDLE(tu_descriptor_set, src_set,
957 copyset->srcSet);
958 TU_FROM_HANDLE(tu_descriptor_set, dst_set,
959 copyset->dstSet);
960 const struct tu_descriptor_set_binding_layout *src_binding_layout =
961 src_set->layout->binding + copyset->srcBinding;
962 const struct tu_descriptor_set_binding_layout *dst_binding_layout =
963 dst_set->layout->binding + copyset->dstBinding;
964 uint32_t *src_ptr = src_set->mapped_ptr;
965 uint32_t *dst_ptr = dst_set->mapped_ptr;
966 struct tu_bo **src_buffer_list = src_set->buffers;
967 struct tu_bo **dst_buffer_list = dst_set->buffers;
968
969 src_ptr += src_binding_layout->offset / 4;
970 dst_ptr += dst_binding_layout->offset / 4;
971
972 src_ptr += src_binding_layout->size * copyset->srcArrayElement / 4;
973 dst_ptr += dst_binding_layout->size * copyset->dstArrayElement / 4;
974
975 src_buffer_list += src_binding_layout->buffer_offset;
976 src_buffer_list += copyset->srcArrayElement;
977
978 dst_buffer_list += dst_binding_layout->buffer_offset;
979 dst_buffer_list += copyset->dstArrayElement;
980
981 for (j = 0; j < copyset->descriptorCount; ++j) {
982 switch (src_binding_layout->type) {
983 case VK_DESCRIPTOR_TYPE_UNIFORM_BUFFER_DYNAMIC:
984 case VK_DESCRIPTOR_TYPE_STORAGE_BUFFER_DYNAMIC: {
985 unsigned src_idx = copyset->srcArrayElement + j;
986 unsigned dst_idx = copyset->dstArrayElement + j;
987 src_idx += src_binding_layout->dynamic_offset_offset;
988 dst_idx += dst_binding_layout->dynamic_offset_offset;
989
990 uint32_t *src_dynamic, *dst_dynamic;
991 src_dynamic = src_set->dynamic_descriptors + src_idx * A6XX_TEX_CONST_DWORDS;
992 dst_dynamic = dst_set->dynamic_descriptors + dst_idx * A6XX_TEX_CONST_DWORDS;
993 memcpy(dst_dynamic, src_dynamic, A6XX_TEX_CONST_DWORDS * 4);
994 break;
995 }
996 default:
997 memcpy(dst_ptr, src_ptr, src_binding_layout->size);
998 }
999
1000 src_ptr += src_binding_layout->size / 4;
1001 dst_ptr += dst_binding_layout->size / 4;
1002
1003 if (src_binding_layout->type != VK_DESCRIPTOR_TYPE_SAMPLER) {
1004 /* Sampler descriptors don't have a buffer list. */
1005 dst_buffer_list[j] = src_buffer_list[j];
1006 }
1007 }
1008 }
1009 }
1010
1011 void
1012 tu_UpdateDescriptorSets(VkDevice _device,
1013 uint32_t descriptorWriteCount,
1014 const VkWriteDescriptorSet *pDescriptorWrites,
1015 uint32_t descriptorCopyCount,
1016 const VkCopyDescriptorSet *pDescriptorCopies)
1017 {
1018 TU_FROM_HANDLE(tu_device, device, _device);
1019
1020 tu_update_descriptor_sets(device, NULL, VK_NULL_HANDLE,
1021 descriptorWriteCount, pDescriptorWrites,
1022 descriptorCopyCount, pDescriptorCopies);
1023 }
1024
1025 VkResult
1026 tu_CreateDescriptorUpdateTemplate(
1027 VkDevice _device,
1028 const VkDescriptorUpdateTemplateCreateInfo *pCreateInfo,
1029 const VkAllocationCallbacks *pAllocator,
1030 VkDescriptorUpdateTemplate *pDescriptorUpdateTemplate)
1031 {
1032 TU_FROM_HANDLE(tu_device, device, _device);
1033 TU_FROM_HANDLE(tu_descriptor_set_layout, set_layout,
1034 pCreateInfo->descriptorSetLayout);
1035 const uint32_t entry_count = pCreateInfo->descriptorUpdateEntryCount;
1036 const size_t size =
1037 sizeof(struct tu_descriptor_update_template) +
1038 sizeof(struct tu_descriptor_update_template_entry) * entry_count;
1039 struct tu_descriptor_update_template *templ;
1040
1041 templ = vk_object_alloc(&device->vk, pAllocator, size,
1042 VK_OBJECT_TYPE_DESCRIPTOR_UPDATE_TEMPLATE);
1043 if (!templ)
1044 return vk_error(device->instance, VK_ERROR_OUT_OF_HOST_MEMORY);
1045
1046 templ->entry_count = entry_count;
1047
1048 if (pCreateInfo->templateType == VK_DESCRIPTOR_UPDATE_TEMPLATE_TYPE_PUSH_DESCRIPTORS_KHR) {
1049 TU_FROM_HANDLE(tu_pipeline_layout, pipeline_layout, pCreateInfo->pipelineLayout);
1050
1051 /* descriptorSetLayout should be ignored for push descriptors
1052 * and instead it refers to pipelineLayout and set.
1053 */
1054 assert(pCreateInfo->set < MAX_SETS);
1055 set_layout = pipeline_layout->set[pCreateInfo->set].layout;
1056 }
1057
1058 for (uint32_t i = 0; i < entry_count; i++) {
1059 const VkDescriptorUpdateTemplateEntry *entry = &pCreateInfo->pDescriptorUpdateEntries[i];
1060
1061 const struct tu_descriptor_set_binding_layout *binding_layout =
1062 set_layout->binding + entry->dstBinding;
1063 const uint32_t buffer_offset = binding_layout->buffer_offset +
1064 entry->dstArrayElement;
1065 uint32_t dst_offset, dst_stride;
1066
1067 /* dst_offset is an offset into dynamic_descriptors when the descriptor
1068 * is dynamic, and an offset into mapped_ptr otherwise.
1069 */
1070 switch (entry->descriptorType) {
1071 case VK_DESCRIPTOR_TYPE_UNIFORM_BUFFER_DYNAMIC:
1072 case VK_DESCRIPTOR_TYPE_STORAGE_BUFFER_DYNAMIC:
1073 dst_offset = (binding_layout->dynamic_offset_offset +
1074 entry->dstArrayElement) * A6XX_TEX_CONST_DWORDS;
1075 dst_stride = A6XX_TEX_CONST_DWORDS;
1076 break;
1077 default:
1078 dst_offset = binding_layout->offset / 4;
1079 dst_offset += (binding_layout->size * entry->dstArrayElement) / 4;
1080 dst_stride = binding_layout->size / 4;
1081 }
1082
1083 templ->entry[i] = (struct tu_descriptor_update_template_entry) {
1084 .descriptor_type = entry->descriptorType,
1085 .descriptor_count = entry->descriptorCount,
1086 .src_offset = entry->offset,
1087 .src_stride = entry->stride,
1088 .dst_offset = dst_offset,
1089 .dst_stride = dst_stride,
1090 .buffer_offset = buffer_offset,
1091 .has_sampler = !binding_layout->immutable_samplers_offset,
1092 };
1093 }
1094
1095 *pDescriptorUpdateTemplate =
1096 tu_descriptor_update_template_to_handle(templ);
1097
1098 return VK_SUCCESS;
1099 }
1100
1101 void
1102 tu_DestroyDescriptorUpdateTemplate(
1103 VkDevice _device,
1104 VkDescriptorUpdateTemplate descriptorUpdateTemplate,
1105 const VkAllocationCallbacks *pAllocator)
1106 {
1107 TU_FROM_HANDLE(tu_device, device, _device);
1108 TU_FROM_HANDLE(tu_descriptor_update_template, templ,
1109 descriptorUpdateTemplate);
1110
1111 if (!templ)
1112 return;
1113
1114 vk_object_free(&device->vk, pAllocator, templ);
1115 }
1116
1117 void
1118 tu_update_descriptor_set_with_template(
1119 struct tu_device *device,
1120 struct tu_cmd_buffer *cmd_buffer,
1121 struct tu_descriptor_set *set,
1122 VkDescriptorUpdateTemplate descriptorUpdateTemplate,
1123 const void *pData)
1124 {
1125 TU_FROM_HANDLE(tu_descriptor_update_template, templ,
1126 descriptorUpdateTemplate);
1127
1128 for (uint32_t i = 0; i < templ->entry_count; i++) {
1129 uint32_t *ptr = set->mapped_ptr;
1130 const void *src = ((const char *) pData) + templ->entry[i].src_offset;
1131 struct tu_bo **buffer_list = set->buffers;
1132
1133 ptr += templ->entry[i].dst_offset;
1134 buffer_list += templ->entry[i].buffer_offset;
1135 unsigned dst_offset = templ->entry[i].dst_offset;
1136 for (unsigned j = 0; j < templ->entry[i].descriptor_count; ++j) {
1137 switch(templ->entry[i].descriptor_type) {
1138 case VK_DESCRIPTOR_TYPE_UNIFORM_BUFFER_DYNAMIC: {
1139 assert(!(set->layout->flags & VK_DESCRIPTOR_SET_LAYOUT_CREATE_PUSH_DESCRIPTOR_BIT_KHR));
1140 write_ubo_descriptor(device, cmd_buffer,
1141 set->dynamic_descriptors + dst_offset,
1142 buffer_list, src);
1143 break;
1144 }
1145 case VK_DESCRIPTOR_TYPE_UNIFORM_BUFFER:
1146 write_ubo_descriptor(device, cmd_buffer, ptr, buffer_list, src);
1147 break;
1148 case VK_DESCRIPTOR_TYPE_STORAGE_BUFFER_DYNAMIC: {
1149 assert(!(set->layout->flags & VK_DESCRIPTOR_SET_LAYOUT_CREATE_PUSH_DESCRIPTOR_BIT_KHR));
1150 write_buffer_descriptor(device, cmd_buffer,
1151 set->dynamic_descriptors + dst_offset,
1152 buffer_list, src);
1153 break;
1154 }
1155 case VK_DESCRIPTOR_TYPE_STORAGE_BUFFER:
1156 write_buffer_descriptor(device, cmd_buffer, ptr, buffer_list, src);
1157 break;
1158 case VK_DESCRIPTOR_TYPE_UNIFORM_TEXEL_BUFFER:
1159 case VK_DESCRIPTOR_TYPE_STORAGE_TEXEL_BUFFER:
1160 write_texel_buffer_descriptor(device, cmd_buffer, ptr,
1161 buffer_list, *(VkBufferView *) src);
1162 break;
1163 case VK_DESCRIPTOR_TYPE_SAMPLED_IMAGE:
1164 case VK_DESCRIPTOR_TYPE_STORAGE_IMAGE: {
1165 write_image_descriptor(device, cmd_buffer, ptr, buffer_list,
1166 templ->entry[i].descriptor_type,
1167 src);
1168 break;
1169 }
1170 case VK_DESCRIPTOR_TYPE_COMBINED_IMAGE_SAMPLER:
1171 write_combined_image_sampler_descriptor(device, cmd_buffer,
1172 A6XX_TEX_CONST_DWORDS * 4,
1173 ptr, buffer_list,
1174 templ->entry[i].descriptor_type,
1175 src,
1176 templ->entry[i].has_sampler);
1177 break;
1178 case VK_DESCRIPTOR_TYPE_SAMPLER:
1179 write_sampler_descriptor(device, ptr, src);
1180 break;
1181 case VK_DESCRIPTOR_TYPE_INPUT_ATTACHMENT:
1182 /* nothing in descriptor set - framebuffer state is used instead */
1183 break;
1184 default:
1185 unreachable("unimplemented descriptor type");
1186 break;
1187 }
1188 src = (char *) src + templ->entry[i].src_stride;
1189 ptr += templ->entry[i].dst_stride;
1190 dst_offset += templ->entry[i].dst_stride;
1191 ++buffer_list;
1192 }
1193 }
1194 }
1195
1196 void
1197 tu_UpdateDescriptorSetWithTemplate(
1198 VkDevice _device,
1199 VkDescriptorSet descriptorSet,
1200 VkDescriptorUpdateTemplate descriptorUpdateTemplate,
1201 const void *pData)
1202 {
1203 TU_FROM_HANDLE(tu_device, device, _device);
1204 TU_FROM_HANDLE(tu_descriptor_set, set, descriptorSet);
1205
1206 tu_update_descriptor_set_with_template(device, NULL, set,
1207 descriptorUpdateTemplate, pData);
1208 }
1209
1210 VkResult
1211 tu_CreateSamplerYcbcrConversion(
1212 VkDevice _device,
1213 const VkSamplerYcbcrConversionCreateInfo *pCreateInfo,
1214 const VkAllocationCallbacks *pAllocator,
1215 VkSamplerYcbcrConversion *pYcbcrConversion)
1216 {
1217 TU_FROM_HANDLE(tu_device, device, _device);
1218 struct tu_sampler_ycbcr_conversion *conversion;
1219
1220 conversion = vk_object_alloc(&device->vk, pAllocator, sizeof(*conversion),
1221 VK_OBJECT_TYPE_SAMPLER_YCBCR_CONVERSION);
1222 if (!conversion)
1223 return vk_error(device->instance, VK_ERROR_OUT_OF_HOST_MEMORY);
1224
1225 conversion->format = pCreateInfo->format;
1226 conversion->ycbcr_model = pCreateInfo->ycbcrModel;
1227 conversion->ycbcr_range = pCreateInfo->ycbcrRange;
1228 conversion->components = pCreateInfo->components;
1229 conversion->chroma_offsets[0] = pCreateInfo->xChromaOffset;
1230 conversion->chroma_offsets[1] = pCreateInfo->yChromaOffset;
1231 conversion->chroma_filter = pCreateInfo->chromaFilter;
1232
1233 *pYcbcrConversion = tu_sampler_ycbcr_conversion_to_handle(conversion);
1234 return VK_SUCCESS;
1235 }
1236
1237 void
1238 tu_DestroySamplerYcbcrConversion(VkDevice _device,
1239 VkSamplerYcbcrConversion ycbcrConversion,
1240 const VkAllocationCallbacks *pAllocator)
1241 {
1242 TU_FROM_HANDLE(tu_device, device, _device);
1243 TU_FROM_HANDLE(tu_sampler_ycbcr_conversion, ycbcr_conversion, ycbcrConversion);
1244
1245 if (!ycbcr_conversion)
1246 return;
1247
1248 vk_object_free(&device->vk, pAllocator, ycbcr_conversion);
1249 }