radv: Don't allocate dynamic descriptors separately.
[mesa.git] / src / amd / vulkan / radv_descriptor_set.c
1 /*
2 * Copyright © 2016 Red Hat.
3 * Copyright © 2016 Bas Nieuwenhuizen
4 *
5 * Permission is hereby granted, free of charge, to any person obtaining a
6 * copy of this software and associated documentation files (the "Software"),
7 * to deal in the Software without restriction, including without limitation
8 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
9 * and/or sell copies of the Software, and to permit persons to whom the
10 * Software is furnished to do so, subject to the following conditions:
11 *
12 * The above copyright notice and this permission notice (including the next
13 * paragraph) shall be included in all copies or substantial portions of the
14 * Software.
15 *
16 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
19 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
20 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
21 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
22 * IN THE SOFTWARE.
23 */
24 #include <assert.h>
25 #include <stdbool.h>
26 #include <string.h>
27 #include <unistd.h>
28 #include <fcntl.h>
29
30 #include "util/mesa-sha1.h"
31 #include "radv_private.h"
32 #include "sid.h"
33
34 VkResult radv_CreateDescriptorSetLayout(
35 VkDevice _device,
36 const VkDescriptorSetLayoutCreateInfo* pCreateInfo,
37 const VkAllocationCallbacks* pAllocator,
38 VkDescriptorSetLayout* pSetLayout)
39 {
40 RADV_FROM_HANDLE(radv_device, device, _device);
41 struct radv_descriptor_set_layout *set_layout;
42
43 assert(pCreateInfo->sType == VK_STRUCTURE_TYPE_DESCRIPTOR_SET_LAYOUT_CREATE_INFO);
44
45 uint32_t max_binding = 0;
46 uint32_t immutable_sampler_count = 0;
47 for (uint32_t j = 0; j < pCreateInfo->bindingCount; j++) {
48 max_binding = MAX2(max_binding, pCreateInfo->pBindings[j].binding);
49 if (pCreateInfo->pBindings[j].pImmutableSamplers)
50 immutable_sampler_count += pCreateInfo->pBindings[j].descriptorCount;
51 }
52
53 uint32_t samplers_offset = sizeof(struct radv_descriptor_set_layout) +
54 (max_binding + 1) * sizeof(set_layout->binding[0]);
55 size_t size = samplers_offset + immutable_sampler_count * 4 * sizeof(uint32_t);
56
57 set_layout = vk_alloc2(&device->alloc, pAllocator, size, 8,
58 VK_SYSTEM_ALLOCATION_SCOPE_OBJECT);
59 if (!set_layout)
60 return vk_error(VK_ERROR_OUT_OF_HOST_MEMORY);
61
62 set_layout->flags = pCreateInfo->flags;
63
64 /* We just allocate all the samplers at the end of the struct */
65 uint32_t *samplers = (uint32_t*)&set_layout->binding[max_binding + 1];
66
67 set_layout->binding_count = max_binding + 1;
68 set_layout->shader_stages = 0;
69 set_layout->size = 0;
70
71 memset(set_layout->binding, 0, size - sizeof(struct radv_descriptor_set_layout));
72
73 uint32_t buffer_count = 0;
74 uint32_t dynamic_offset_count = 0;
75
76 for (uint32_t j = 0; j < pCreateInfo->bindingCount; j++) {
77 const VkDescriptorSetLayoutBinding *binding = &pCreateInfo->pBindings[j];
78 uint32_t b = binding->binding;
79 uint32_t alignment;
80
81 switch (binding->descriptorType) {
82 case VK_DESCRIPTOR_TYPE_UNIFORM_BUFFER_DYNAMIC:
83 case VK_DESCRIPTOR_TYPE_STORAGE_BUFFER_DYNAMIC:
84 assert(!(pCreateInfo->flags & VK_DESCRIPTOR_SET_LAYOUT_CREATE_PUSH_DESCRIPTOR_BIT_KHR));
85 set_layout->binding[b].dynamic_offset_count = 1;
86 set_layout->dynamic_shader_stages |= binding->stageFlags;
87 set_layout->binding[b].size = 0;
88 set_layout->binding[b].buffer_count = 1;
89 alignment = 1;
90 break;
91 case VK_DESCRIPTOR_TYPE_UNIFORM_BUFFER:
92 case VK_DESCRIPTOR_TYPE_STORAGE_BUFFER:
93 case VK_DESCRIPTOR_TYPE_UNIFORM_TEXEL_BUFFER:
94 case VK_DESCRIPTOR_TYPE_STORAGE_TEXEL_BUFFER:
95 set_layout->binding[b].size = 16;
96 set_layout->binding[b].buffer_count = 1;
97 alignment = 16;
98 break;
99 case VK_DESCRIPTOR_TYPE_STORAGE_IMAGE:
100 case VK_DESCRIPTOR_TYPE_SAMPLED_IMAGE:
101 case VK_DESCRIPTOR_TYPE_INPUT_ATTACHMENT:
102 /* main descriptor + fmask descriptor */
103 set_layout->binding[b].size = 64;
104 set_layout->binding[b].buffer_count = 1;
105 alignment = 32;
106 break;
107 case VK_DESCRIPTOR_TYPE_COMBINED_IMAGE_SAMPLER:
108 /* main descriptor + fmask descriptor + sampler */
109 set_layout->binding[b].size = 96;
110 set_layout->binding[b].buffer_count = 1;
111 alignment = 32;
112 break;
113 case VK_DESCRIPTOR_TYPE_SAMPLER:
114 set_layout->binding[b].size = 16;
115 alignment = 16;
116 break;
117 default:
118 unreachable("unknown descriptor type\n");
119 break;
120 }
121
122 set_layout->size = align(set_layout->size, alignment);
123 assert(binding->descriptorCount > 0);
124 set_layout->binding[b].type = binding->descriptorType;
125 set_layout->binding[b].array_size = binding->descriptorCount;
126 set_layout->binding[b].offset = set_layout->size;
127 set_layout->binding[b].buffer_offset = buffer_count;
128 set_layout->binding[b].dynamic_offset_offset = dynamic_offset_count;
129
130 if (binding->pImmutableSamplers) {
131 set_layout->binding[b].immutable_samplers_offset = samplers_offset;
132 set_layout->binding[b].immutable_samplers_equal = true;
133
134
135 for (uint32_t i = 0; i < binding->descriptorCount; i++)
136 memcpy(samplers + 4 * i, &radv_sampler_from_handle(binding->pImmutableSamplers[i])->state, 16);
137 for (uint32_t i = 1; i < binding->descriptorCount; i++)
138 if (memcmp(samplers + 4 * i, samplers, 16) != 0)
139 set_layout->binding[b].immutable_samplers_equal = false;
140
141 /* Don't reserve space for the samplers if they're not accessed. */
142 if (set_layout->binding[b].immutable_samplers_equal) {
143 if (binding->descriptorType == VK_DESCRIPTOR_TYPE_COMBINED_IMAGE_SAMPLER)
144 set_layout->binding[b].size -= 32;
145 else if (binding->descriptorType == VK_DESCRIPTOR_TYPE_SAMPLER)
146 set_layout->binding[b].size -= 16;
147 }
148 samplers += 4 * binding->descriptorCount;
149 samplers_offset += 4 * sizeof(uint32_t) * binding->descriptorCount;
150 }
151
152 set_layout->size += binding->descriptorCount * set_layout->binding[b].size;
153 buffer_count += binding->descriptorCount * set_layout->binding[b].buffer_count;
154 dynamic_offset_count += binding->descriptorCount *
155 set_layout->binding[b].dynamic_offset_count;
156 set_layout->shader_stages |= binding->stageFlags;
157 }
158
159 set_layout->buffer_count = buffer_count;
160 set_layout->dynamic_offset_count = dynamic_offset_count;
161
162 *pSetLayout = radv_descriptor_set_layout_to_handle(set_layout);
163
164 return VK_SUCCESS;
165 }
166
167 void radv_DestroyDescriptorSetLayout(
168 VkDevice _device,
169 VkDescriptorSetLayout _set_layout,
170 const VkAllocationCallbacks* pAllocator)
171 {
172 RADV_FROM_HANDLE(radv_device, device, _device);
173 RADV_FROM_HANDLE(radv_descriptor_set_layout, set_layout, _set_layout);
174
175 if (!set_layout)
176 return;
177
178 vk_free2(&device->alloc, pAllocator, set_layout);
179 }
180
181 /*
182 * Pipeline layouts. These have nothing to do with the pipeline. They are
183 * just muttiple descriptor set layouts pasted together
184 */
185
186 VkResult radv_CreatePipelineLayout(
187 VkDevice _device,
188 const VkPipelineLayoutCreateInfo* pCreateInfo,
189 const VkAllocationCallbacks* pAllocator,
190 VkPipelineLayout* pPipelineLayout)
191 {
192 RADV_FROM_HANDLE(radv_device, device, _device);
193 struct radv_pipeline_layout *layout;
194 struct mesa_sha1 ctx;
195
196 assert(pCreateInfo->sType == VK_STRUCTURE_TYPE_PIPELINE_LAYOUT_CREATE_INFO);
197
198 layout = vk_alloc2(&device->alloc, pAllocator, sizeof(*layout), 8,
199 VK_SYSTEM_ALLOCATION_SCOPE_OBJECT);
200 if (layout == NULL)
201 return vk_error(VK_ERROR_OUT_OF_HOST_MEMORY);
202
203 layout->num_sets = pCreateInfo->setLayoutCount;
204
205 unsigned dynamic_offset_count = 0;
206
207
208 _mesa_sha1_init(&ctx);
209 for (uint32_t set = 0; set < pCreateInfo->setLayoutCount; set++) {
210 RADV_FROM_HANDLE(radv_descriptor_set_layout, set_layout,
211 pCreateInfo->pSetLayouts[set]);
212 layout->set[set].layout = set_layout;
213
214 layout->set[set].dynamic_offset_start = dynamic_offset_count;
215 for (uint32_t b = 0; b < set_layout->binding_count; b++) {
216 dynamic_offset_count += set_layout->binding[b].array_size * set_layout->binding[b].dynamic_offset_count;
217 if (set_layout->binding[b].immutable_samplers_offset)
218 _mesa_sha1_update(&ctx, radv_immutable_samplers(set_layout, set_layout->binding + b),
219 set_layout->binding[b].array_size * 4 * sizeof(uint32_t));
220 }
221 _mesa_sha1_update(&ctx, set_layout->binding,
222 sizeof(set_layout->binding[0]) * set_layout->binding_count);
223 }
224
225 layout->dynamic_offset_count = dynamic_offset_count;
226 layout->push_constant_size = 0;
227 for (unsigned i = 0; i < pCreateInfo->pushConstantRangeCount; ++i) {
228 const VkPushConstantRange *range = pCreateInfo->pPushConstantRanges + i;
229 layout->push_constant_size = MAX2(layout->push_constant_size,
230 range->offset + range->size);
231 }
232
233 layout->push_constant_size = align(layout->push_constant_size, 16);
234 _mesa_sha1_update(&ctx, &layout->push_constant_size,
235 sizeof(layout->push_constant_size));
236 _mesa_sha1_final(&ctx, layout->sha1);
237 *pPipelineLayout = radv_pipeline_layout_to_handle(layout);
238
239 return VK_SUCCESS;
240 }
241
242 void radv_DestroyPipelineLayout(
243 VkDevice _device,
244 VkPipelineLayout _pipelineLayout,
245 const VkAllocationCallbacks* pAllocator)
246 {
247 RADV_FROM_HANDLE(radv_device, device, _device);
248 RADV_FROM_HANDLE(radv_pipeline_layout, pipeline_layout, _pipelineLayout);
249
250 if (!pipeline_layout)
251 return;
252 vk_free2(&device->alloc, pAllocator, pipeline_layout);
253 }
254
255 #define EMPTY 1
256
257 static VkResult
258 radv_descriptor_set_create(struct radv_device *device,
259 struct radv_descriptor_pool *pool,
260 const struct radv_descriptor_set_layout *layout,
261 struct radv_descriptor_set **out_set)
262 {
263 struct radv_descriptor_set *set;
264 unsigned range_offset = sizeof(struct radv_descriptor_set) +
265 sizeof(struct radeon_winsys_bo *) * layout->buffer_count;
266 unsigned mem_size = range_offset +
267 sizeof(struct radv_descriptor_range) * layout->dynamic_offset_count;
268 set = vk_alloc2(&device->alloc, NULL, mem_size, 8,
269 VK_SYSTEM_ALLOCATION_SCOPE_OBJECT);
270
271 if (!set)
272 return vk_error(VK_ERROR_OUT_OF_HOST_MEMORY);
273
274 memset(set, 0, mem_size);
275
276 if (layout->dynamic_offset_count) {
277 set->dynamic_descriptors = (struct radv_descriptor_range*)((uint8_t*)set + range_offset);
278 }
279
280 set->layout = layout;
281 if (layout->size) {
282 uint32_t layout_size = align_u32(layout->size, 32);
283 set->size = layout->size;
284
285 /* try to allocate linearly first, so that we don't spend
286 * time looking for gaps if the app only allocates &
287 * resets via the pool. */
288 if (pool->current_offset + layout_size <= pool->size) {
289 set->bo = pool->bo;
290 set->mapped_ptr = (uint32_t*)(pool->mapped_ptr + pool->current_offset);
291 set->va = device->ws->buffer_get_va(set->bo) + pool->current_offset;
292 pool->current_offset += layout_size;
293 list_addtail(&set->vram_list, &pool->vram_list);
294 } else {
295 uint64_t offset = 0;
296 struct list_head *prev = &pool->vram_list;
297 struct radv_descriptor_set *cur;
298 LIST_FOR_EACH_ENTRY(cur, &pool->vram_list, vram_list) {
299 uint64_t start = (uint8_t*)cur->mapped_ptr - pool->mapped_ptr;
300 if (start - offset >= layout_size)
301 break;
302
303 offset = start + cur->size;
304 prev = &cur->vram_list;
305 }
306
307 if (pool->size - offset < layout_size) {
308 vk_free2(&device->alloc, NULL, set->dynamic_descriptors);
309 vk_free2(&device->alloc, NULL, set);
310 return vk_error(VK_ERROR_OUT_OF_POOL_MEMORY_KHR);
311 }
312 set->bo = pool->bo;
313 set->mapped_ptr = (uint32_t*)(pool->mapped_ptr + offset);
314 set->va = device->ws->buffer_get_va(set->bo) + offset;
315 list_add(&set->vram_list, prev);
316 }
317 }
318
319 for (unsigned i = 0; i < layout->binding_count; ++i) {
320 if (!layout->binding[i].immutable_samplers_offset ||
321 layout->binding[i].immutable_samplers_equal)
322 continue;
323
324 unsigned offset = layout->binding[i].offset / 4;
325 if (layout->binding[i].type == VK_DESCRIPTOR_TYPE_COMBINED_IMAGE_SAMPLER)
326 offset += 16;
327
328 const uint32_t *samplers = (const uint32_t*)((const char*)layout + layout->binding[i].immutable_samplers_offset);
329 for (unsigned j = 0; j < layout->binding[i].array_size; ++j) {
330 memcpy(set->mapped_ptr + offset, samplers + 4 * j, 16);
331 offset += layout->binding[i].size / 4;
332 }
333
334 }
335 *out_set = set;
336 return VK_SUCCESS;
337 }
338
339 static void
340 radv_descriptor_set_destroy(struct radv_device *device,
341 struct radv_descriptor_pool *pool,
342 struct radv_descriptor_set *set,
343 bool free_bo)
344 {
345 if (free_bo && set->size)
346 list_del(&set->vram_list);
347 vk_free2(&device->alloc, NULL, set);
348 }
349
350 VkResult radv_CreateDescriptorPool(
351 VkDevice _device,
352 const VkDescriptorPoolCreateInfo* pCreateInfo,
353 const VkAllocationCallbacks* pAllocator,
354 VkDescriptorPool* pDescriptorPool)
355 {
356 RADV_FROM_HANDLE(radv_device, device, _device);
357 struct radv_descriptor_pool *pool;
358 int size = sizeof(struct radv_descriptor_pool);
359 uint64_t bo_size = 0;
360 pool = vk_alloc2(&device->alloc, pAllocator, size, 8,
361 VK_SYSTEM_ALLOCATION_SCOPE_OBJECT);
362 if (!pool)
363 return vk_error(VK_ERROR_OUT_OF_HOST_MEMORY);
364
365 memset(pool, 0, sizeof(*pool));
366
367 for (unsigned i = 0; i < pCreateInfo->poolSizeCount; ++i) {
368 switch(pCreateInfo->pPoolSizes[i].type) {
369 case VK_DESCRIPTOR_TYPE_UNIFORM_BUFFER_DYNAMIC:
370 case VK_DESCRIPTOR_TYPE_STORAGE_BUFFER_DYNAMIC:
371 break;
372 case VK_DESCRIPTOR_TYPE_UNIFORM_BUFFER:
373 case VK_DESCRIPTOR_TYPE_STORAGE_BUFFER:
374 case VK_DESCRIPTOR_TYPE_UNIFORM_TEXEL_BUFFER:
375 case VK_DESCRIPTOR_TYPE_STORAGE_TEXEL_BUFFER:
376 case VK_DESCRIPTOR_TYPE_SAMPLER:
377 /* 32 as we may need to align for images */
378 bo_size += 32 * pCreateInfo->pPoolSizes[i].descriptorCount;
379 break;
380 case VK_DESCRIPTOR_TYPE_SAMPLED_IMAGE:
381 case VK_DESCRIPTOR_TYPE_STORAGE_IMAGE:
382 case VK_DESCRIPTOR_TYPE_INPUT_ATTACHMENT:
383 bo_size += 64 * pCreateInfo->pPoolSizes[i].descriptorCount;
384 break;
385 case VK_DESCRIPTOR_TYPE_COMBINED_IMAGE_SAMPLER:
386 bo_size += 96 * pCreateInfo->pPoolSizes[i].descriptorCount;
387 break;
388 default:
389 unreachable("unknown descriptor type\n");
390 break;
391 }
392 }
393
394 if (bo_size) {
395 pool->bo = device->ws->buffer_create(device->ws, bo_size,
396 32, RADEON_DOMAIN_VRAM, 0);
397 pool->mapped_ptr = (uint8_t*)device->ws->buffer_map(pool->bo);
398 }
399 pool->size = bo_size;
400
401 list_inithead(&pool->vram_list);
402 *pDescriptorPool = radv_descriptor_pool_to_handle(pool);
403 return VK_SUCCESS;
404 }
405
406 void radv_DestroyDescriptorPool(
407 VkDevice _device,
408 VkDescriptorPool _pool,
409 const VkAllocationCallbacks* pAllocator)
410 {
411 RADV_FROM_HANDLE(radv_device, device, _device);
412 RADV_FROM_HANDLE(radv_descriptor_pool, pool, _pool);
413
414 if (!pool)
415 return;
416
417 list_for_each_entry_safe(struct radv_descriptor_set, set,
418 &pool->vram_list, vram_list) {
419 radv_descriptor_set_destroy(device, pool, set, false);
420 }
421
422 if (pool->bo)
423 device->ws->buffer_destroy(pool->bo);
424 vk_free2(&device->alloc, pAllocator, pool);
425 }
426
427 VkResult radv_ResetDescriptorPool(
428 VkDevice _device,
429 VkDescriptorPool descriptorPool,
430 VkDescriptorPoolResetFlags flags)
431 {
432 RADV_FROM_HANDLE(radv_device, device, _device);
433 RADV_FROM_HANDLE(radv_descriptor_pool, pool, descriptorPool);
434
435 list_for_each_entry_safe(struct radv_descriptor_set, set,
436 &pool->vram_list, vram_list) {
437 radv_descriptor_set_destroy(device, pool, set, false);
438 }
439
440 list_inithead(&pool->vram_list);
441
442 pool->current_offset = 0;
443
444 return VK_SUCCESS;
445 }
446
447 VkResult radv_AllocateDescriptorSets(
448 VkDevice _device,
449 const VkDescriptorSetAllocateInfo* pAllocateInfo,
450 VkDescriptorSet* pDescriptorSets)
451 {
452 RADV_FROM_HANDLE(radv_device, device, _device);
453 RADV_FROM_HANDLE(radv_descriptor_pool, pool, pAllocateInfo->descriptorPool);
454
455 VkResult result = VK_SUCCESS;
456 uint32_t i;
457 struct radv_descriptor_set *set;
458
459 /* allocate a set of buffers for each shader to contain descriptors */
460 for (i = 0; i < pAllocateInfo->descriptorSetCount; i++) {
461 RADV_FROM_HANDLE(radv_descriptor_set_layout, layout,
462 pAllocateInfo->pSetLayouts[i]);
463
464 assert(!(layout->flags & VK_DESCRIPTOR_SET_LAYOUT_CREATE_PUSH_DESCRIPTOR_BIT_KHR));
465
466 result = radv_descriptor_set_create(device, pool, layout, &set);
467 if (result != VK_SUCCESS)
468 break;
469
470 pDescriptorSets[i] = radv_descriptor_set_to_handle(set);
471 }
472
473 if (result != VK_SUCCESS)
474 radv_FreeDescriptorSets(_device, pAllocateInfo->descriptorPool,
475 i, pDescriptorSets);
476 return result;
477 }
478
479 VkResult radv_FreeDescriptorSets(
480 VkDevice _device,
481 VkDescriptorPool descriptorPool,
482 uint32_t count,
483 const VkDescriptorSet* pDescriptorSets)
484 {
485 RADV_FROM_HANDLE(radv_device, device, _device);
486 RADV_FROM_HANDLE(radv_descriptor_pool, pool, descriptorPool);
487
488 for (uint32_t i = 0; i < count; i++) {
489 RADV_FROM_HANDLE(radv_descriptor_set, set, pDescriptorSets[i]);
490
491 if (set)
492 radv_descriptor_set_destroy(device, pool, set, true);
493 }
494 return VK_SUCCESS;
495 }
496
497 static void write_texel_buffer_descriptor(struct radv_device *device,
498 struct radv_cmd_buffer *cmd_buffer,
499 unsigned *dst,
500 struct radeon_winsys_bo **buffer_list,
501 const VkBufferView _buffer_view)
502 {
503 RADV_FROM_HANDLE(radv_buffer_view, buffer_view, _buffer_view);
504
505 memcpy(dst, buffer_view->state, 4 * 4);
506
507 if (cmd_buffer)
508 device->ws->cs_add_buffer(cmd_buffer->cs, buffer_view->bo, 7);
509 else
510 *buffer_list = buffer_view->bo;
511 }
512
513 static void write_buffer_descriptor(struct radv_device *device,
514 struct radv_cmd_buffer *cmd_buffer,
515 unsigned *dst,
516 struct radeon_winsys_bo **buffer_list,
517 const VkDescriptorBufferInfo *buffer_info)
518 {
519 RADV_FROM_HANDLE(radv_buffer, buffer, buffer_info->buffer);
520 uint64_t va = device->ws->buffer_get_va(buffer->bo);
521 uint32_t range = buffer_info->range;
522
523 if (buffer_info->range == VK_WHOLE_SIZE)
524 range = buffer->size - buffer_info->offset;
525
526 va += buffer_info->offset + buffer->offset;
527 dst[0] = va;
528 dst[1] = S_008F04_BASE_ADDRESS_HI(va >> 32);
529 dst[2] = range;
530 dst[3] = S_008F0C_DST_SEL_X(V_008F0C_SQ_SEL_X) |
531 S_008F0C_DST_SEL_Y(V_008F0C_SQ_SEL_Y) |
532 S_008F0C_DST_SEL_Z(V_008F0C_SQ_SEL_Z) |
533 S_008F0C_DST_SEL_W(V_008F0C_SQ_SEL_W) |
534 S_008F0C_NUM_FORMAT(V_008F0C_BUF_NUM_FORMAT_FLOAT) |
535 S_008F0C_DATA_FORMAT(V_008F0C_BUF_DATA_FORMAT_32);
536
537 if (cmd_buffer)
538 device->ws->cs_add_buffer(cmd_buffer->cs, buffer->bo, 7);
539 else
540 *buffer_list = buffer->bo;
541 }
542
543 static void write_dynamic_buffer_descriptor(struct radv_device *device,
544 struct radv_descriptor_range *range,
545 struct radeon_winsys_bo **buffer_list,
546 const VkDescriptorBufferInfo *buffer_info)
547 {
548 RADV_FROM_HANDLE(radv_buffer, buffer, buffer_info->buffer);
549 uint64_t va = device->ws->buffer_get_va(buffer->bo);
550 unsigned size = buffer_info->range;
551
552 if (buffer_info->range == VK_WHOLE_SIZE)
553 size = buffer->size - buffer_info->offset;
554
555 va += buffer_info->offset + buffer->offset;
556 range->va = va;
557 range->size = size;
558
559 *buffer_list = buffer->bo;
560 }
561
562 static void
563 write_image_descriptor(struct radv_device *device,
564 struct radv_cmd_buffer *cmd_buffer,
565 unsigned *dst,
566 struct radeon_winsys_bo **buffer_list,
567 const VkDescriptorImageInfo *image_info)
568 {
569 RADV_FROM_HANDLE(radv_image_view, iview, image_info->imageView);
570 memcpy(dst, iview->descriptor, 8 * 4);
571 memcpy(dst + 8, iview->fmask_descriptor, 8 * 4);
572
573 if (cmd_buffer)
574 device->ws->cs_add_buffer(cmd_buffer->cs, iview->bo, 7);
575 else
576 *buffer_list = iview->bo;
577 }
578
579 static void
580 write_combined_image_sampler_descriptor(struct radv_device *device,
581 struct radv_cmd_buffer *cmd_buffer,
582 unsigned *dst,
583 struct radeon_winsys_bo **buffer_list,
584 const VkDescriptorImageInfo *image_info,
585 bool has_sampler)
586 {
587 RADV_FROM_HANDLE(radv_sampler, sampler, image_info->sampler);
588
589 write_image_descriptor(device, cmd_buffer, dst, buffer_list, image_info);
590 /* copy over sampler state */
591 if (has_sampler)
592 memcpy(dst + 16, sampler->state, 16);
593 }
594
595 static void
596 write_sampler_descriptor(struct radv_device *device,
597 unsigned *dst,
598 const VkDescriptorImageInfo *image_info)
599 {
600 RADV_FROM_HANDLE(radv_sampler, sampler, image_info->sampler);
601
602 memcpy(dst, sampler->state, 16);
603 }
604
605 void radv_update_descriptor_sets(
606 struct radv_device* device,
607 struct radv_cmd_buffer* cmd_buffer,
608 VkDescriptorSet dstSetOverride,
609 uint32_t descriptorWriteCount,
610 const VkWriteDescriptorSet* pDescriptorWrites,
611 uint32_t descriptorCopyCount,
612 const VkCopyDescriptorSet* pDescriptorCopies)
613 {
614 uint32_t i, j;
615 for (i = 0; i < descriptorWriteCount; i++) {
616 const VkWriteDescriptorSet *writeset = &pDescriptorWrites[i];
617 RADV_FROM_HANDLE(radv_descriptor_set, set,
618 dstSetOverride ? dstSetOverride : writeset->dstSet);
619 const struct radv_descriptor_set_binding_layout *binding_layout =
620 set->layout->binding + writeset->dstBinding;
621 uint32_t *ptr = set->mapped_ptr;
622 struct radeon_winsys_bo **buffer_list = set->descriptors;
623 /* Immutable samplers are not copied into push descriptors when they are
624 * allocated, so if we are writing push descriptors we have to copy the
625 * immutable samplers into them now.
626 */
627 const bool copy_immutable_samplers = cmd_buffer &&
628 binding_layout->immutable_samplers_offset && !binding_layout->immutable_samplers_equal;
629 const uint32_t *samplers = radv_immutable_samplers(set->layout, binding_layout);
630
631 ptr += binding_layout->offset / 4;
632 ptr += binding_layout->size * writeset->dstArrayElement / 4;
633 buffer_list += binding_layout->buffer_offset;
634 buffer_list += binding_layout->buffer_count * writeset->dstArrayElement;
635 for (j = 0; j < writeset->descriptorCount; ++j) {
636 switch(writeset->descriptorType) {
637 case VK_DESCRIPTOR_TYPE_UNIFORM_BUFFER_DYNAMIC:
638 case VK_DESCRIPTOR_TYPE_STORAGE_BUFFER_DYNAMIC: {
639 unsigned idx = writeset->dstArrayElement + j;
640 idx += binding_layout->dynamic_offset_offset;
641 assert(!(set->layout->flags & VK_DESCRIPTOR_SET_LAYOUT_CREATE_PUSH_DESCRIPTOR_BIT_KHR));
642 write_dynamic_buffer_descriptor(device, set->dynamic_descriptors + idx,
643 buffer_list, writeset->pBufferInfo + j);
644 break;
645 }
646 case VK_DESCRIPTOR_TYPE_UNIFORM_BUFFER:
647 case VK_DESCRIPTOR_TYPE_STORAGE_BUFFER:
648 write_buffer_descriptor(device, cmd_buffer, ptr, buffer_list,
649 writeset->pBufferInfo + j);
650 break;
651 case VK_DESCRIPTOR_TYPE_UNIFORM_TEXEL_BUFFER:
652 case VK_DESCRIPTOR_TYPE_STORAGE_TEXEL_BUFFER:
653 write_texel_buffer_descriptor(device, cmd_buffer, ptr, buffer_list,
654 writeset->pTexelBufferView[j]);
655 break;
656 case VK_DESCRIPTOR_TYPE_SAMPLED_IMAGE:
657 case VK_DESCRIPTOR_TYPE_STORAGE_IMAGE:
658 case VK_DESCRIPTOR_TYPE_INPUT_ATTACHMENT:
659 write_image_descriptor(device, cmd_buffer, ptr, buffer_list,
660 writeset->pImageInfo + j);
661 break;
662 case VK_DESCRIPTOR_TYPE_COMBINED_IMAGE_SAMPLER:
663 write_combined_image_sampler_descriptor(device, cmd_buffer, ptr, buffer_list,
664 writeset->pImageInfo + j,
665 !binding_layout->immutable_samplers_offset);
666 if (copy_immutable_samplers) {
667 const unsigned idx = writeset->dstArrayElement + j;
668 memcpy(ptr + 16, samplers + 4 * idx, 16);
669 }
670 break;
671 case VK_DESCRIPTOR_TYPE_SAMPLER:
672 if (!binding_layout->immutable_samplers_offset) {
673 write_sampler_descriptor(device, ptr,
674 writeset->pImageInfo + j);
675 } else if (copy_immutable_samplers) {
676 unsigned idx = writeset->dstArrayElement + j;
677 memcpy(ptr, samplers + 4 * idx, 16);
678 }
679 break;
680 default:
681 unreachable("unimplemented descriptor type");
682 break;
683 }
684 ptr += binding_layout->size / 4;
685 buffer_list += binding_layout->buffer_count;
686 }
687
688 }
689 if (descriptorCopyCount)
690 radv_finishme("copy descriptors");
691 }
692
693 void radv_UpdateDescriptorSets(
694 VkDevice _device,
695 uint32_t descriptorWriteCount,
696 const VkWriteDescriptorSet* pDescriptorWrites,
697 uint32_t descriptorCopyCount,
698 const VkCopyDescriptorSet* pDescriptorCopies)
699 {
700 RADV_FROM_HANDLE(radv_device, device, _device);
701
702 radv_update_descriptor_sets(device, NULL, VK_NULL_HANDLE, descriptorWriteCount, pDescriptorWrites,
703 descriptorCopyCount, pDescriptorCopies);
704 }
705
706 VkResult radv_CreateDescriptorUpdateTemplateKHR(VkDevice _device,
707 const VkDescriptorUpdateTemplateCreateInfoKHR *pCreateInfo,
708 const VkAllocationCallbacks *pAllocator,
709 VkDescriptorUpdateTemplateKHR *pDescriptorUpdateTemplate)
710 {
711 RADV_FROM_HANDLE(radv_device, device, _device);
712 RADV_FROM_HANDLE(radv_descriptor_set_layout, set_layout, pCreateInfo->descriptorSetLayout);
713 const uint32_t entry_count = pCreateInfo->descriptorUpdateEntryCount;
714 const size_t size = sizeof(struct radv_descriptor_update_template) +
715 sizeof(struct radv_descriptor_update_template_entry) * entry_count;
716 struct radv_descriptor_update_template *templ;
717 uint32_t i;
718
719 templ = vk_alloc2(&device->alloc, pAllocator, size, 8, VK_SYSTEM_ALLOCATION_SCOPE_OBJECT);
720 if (!templ)
721 return vk_error(VK_ERROR_OUT_OF_HOST_MEMORY);
722
723 templ->entry_count = entry_count;
724
725 for (i = 0; i < entry_count; i++) {
726 const VkDescriptorUpdateTemplateEntryKHR *entry = &pCreateInfo->pDescriptorUpdateEntries[i];
727 const struct radv_descriptor_set_binding_layout *binding_layout =
728 set_layout->binding + entry->dstBinding;
729 const uint32_t buffer_offset = binding_layout->buffer_offset +
730 binding_layout->buffer_count * entry->dstArrayElement;
731 const uint32_t *immutable_samplers = NULL;
732 uint32_t dst_offset;
733 uint32_t dst_stride;
734
735 /* dst_offset is an offset into dynamic_descriptors when the descriptor
736 is dynamic, and an offset into mapped_ptr otherwise */
737 switch (entry->descriptorType) {
738 case VK_DESCRIPTOR_TYPE_UNIFORM_BUFFER_DYNAMIC:
739 case VK_DESCRIPTOR_TYPE_STORAGE_BUFFER_DYNAMIC:
740 assert(pCreateInfo->templateType == VK_DESCRIPTOR_UPDATE_TEMPLATE_TYPE_DESCRIPTOR_SET_KHR);
741 dst_offset = binding_layout->dynamic_offset_offset + entry->dstArrayElement;
742 dst_stride = 0; /* Not used */
743 break;
744 default:
745 switch (entry->descriptorType) {
746 case VK_DESCRIPTOR_TYPE_COMBINED_IMAGE_SAMPLER:
747 case VK_DESCRIPTOR_TYPE_SAMPLER:
748 /* Immutable samplers are copied into push descriptors when they are pushed */
749 if (pCreateInfo->templateType == VK_DESCRIPTOR_UPDATE_TEMPLATE_TYPE_PUSH_DESCRIPTORS_KHR &&
750 binding_layout->immutable_samplers_offset && !binding_layout->immutable_samplers_equal) {
751 immutable_samplers = radv_immutable_samplers(set_layout, binding_layout) + entry->dstArrayElement * 4;
752 }
753 break;
754 default:
755 break;
756 }
757 dst_offset = binding_layout->offset / 4 + binding_layout->size * entry->dstArrayElement / 4;
758 dst_stride = binding_layout->size / 4;
759 break;
760 }
761
762 templ->entry[i] = (struct radv_descriptor_update_template_entry) {
763 .descriptor_type = entry->descriptorType,
764 .descriptor_count = entry->descriptorCount,
765 .src_offset = entry->offset,
766 .src_stride = entry->stride,
767 .dst_offset = dst_offset,
768 .dst_stride = dst_stride,
769 .buffer_offset = buffer_offset,
770 .buffer_count = binding_layout->buffer_count,
771 .has_sampler = !binding_layout->immutable_samplers_offset,
772 .immutable_samplers = immutable_samplers
773 };
774 }
775
776 *pDescriptorUpdateTemplate = radv_descriptor_update_template_to_handle(templ);
777 return VK_SUCCESS;
778 }
779
780 void radv_DestroyDescriptorUpdateTemplateKHR(VkDevice _device,
781 VkDescriptorUpdateTemplateKHR descriptorUpdateTemplate,
782 const VkAllocationCallbacks *pAllocator)
783 {
784 RADV_FROM_HANDLE(radv_device, device, _device);
785 RADV_FROM_HANDLE(radv_descriptor_update_template, templ, descriptorUpdateTemplate);
786
787 if (!templ)
788 return;
789
790 vk_free2(&device->alloc, pAllocator, templ);
791 }
792
793 void radv_update_descriptor_set_with_template(struct radv_device *device,
794 struct radv_cmd_buffer *cmd_buffer,
795 struct radv_descriptor_set *set,
796 VkDescriptorUpdateTemplateKHR descriptorUpdateTemplate,
797 const void *pData)
798 {
799 RADV_FROM_HANDLE(radv_descriptor_update_template, templ, descriptorUpdateTemplate);
800 uint32_t i;
801
802 for (i = 0; i < templ->entry_count; ++i) {
803 struct radeon_winsys_bo **buffer_list = set->descriptors + templ->entry[i].buffer_offset;
804 uint32_t *pDst = set->mapped_ptr + templ->entry[i].dst_offset;
805 const uint8_t *pSrc = ((const uint8_t *) pData) + templ->entry[i].src_offset;
806 uint32_t j;
807
808 for (j = 0; j < templ->entry[i].descriptor_count; ++j) {
809 switch (templ->entry[i].descriptor_type) {
810 case VK_DESCRIPTOR_TYPE_UNIFORM_BUFFER_DYNAMIC:
811 case VK_DESCRIPTOR_TYPE_STORAGE_BUFFER_DYNAMIC: {
812 const unsigned idx = templ->entry[i].dst_offset + j;
813 assert(!(set->layout->flags & VK_DESCRIPTOR_SET_LAYOUT_CREATE_PUSH_DESCRIPTOR_BIT_KHR));
814 write_dynamic_buffer_descriptor(device, set->dynamic_descriptors + idx,
815 buffer_list, (struct VkDescriptorBufferInfo *) pSrc);
816 break;
817 }
818 case VK_DESCRIPTOR_TYPE_UNIFORM_BUFFER:
819 case VK_DESCRIPTOR_TYPE_STORAGE_BUFFER:
820 write_buffer_descriptor(device, cmd_buffer, pDst, buffer_list,
821 (struct VkDescriptorBufferInfo *) pSrc);
822 break;
823 case VK_DESCRIPTOR_TYPE_UNIFORM_TEXEL_BUFFER:
824 case VK_DESCRIPTOR_TYPE_STORAGE_TEXEL_BUFFER:
825 write_texel_buffer_descriptor(device, cmd_buffer, pDst, buffer_list,
826 *(VkBufferView *) pSrc);
827 break;
828 case VK_DESCRIPTOR_TYPE_SAMPLED_IMAGE:
829 case VK_DESCRIPTOR_TYPE_STORAGE_IMAGE:
830 case VK_DESCRIPTOR_TYPE_INPUT_ATTACHMENT:
831 write_image_descriptor(device, cmd_buffer, pDst, buffer_list,
832 (struct VkDescriptorImageInfo *) pSrc);
833 break;
834 case VK_DESCRIPTOR_TYPE_COMBINED_IMAGE_SAMPLER:
835 write_combined_image_sampler_descriptor(device, cmd_buffer, pDst, buffer_list,
836 (struct VkDescriptorImageInfo *) pSrc,
837 templ->entry[i].has_sampler);
838 if (templ->entry[i].immutable_samplers)
839 memcpy(pDst + 16, templ->entry[i].immutable_samplers + 4 * j, 16);
840 break;
841 case VK_DESCRIPTOR_TYPE_SAMPLER:
842 if (templ->entry[i].has_sampler)
843 write_sampler_descriptor(device, pDst,
844 (struct VkDescriptorImageInfo *) pSrc);
845 else if (templ->entry[i].immutable_samplers)
846 memcpy(pDst, templ->entry[i].immutable_samplers + 4 * j, 16);
847 break;
848 default:
849 unreachable("unimplemented descriptor type");
850 break;
851 }
852 pSrc += templ->entry[i].src_stride;
853 pDst += templ->entry[i].dst_stride;
854 buffer_list += templ->entry[i].buffer_count;
855 }
856 }
857 }
858
859 void radv_UpdateDescriptorSetWithTemplateKHR(VkDevice _device,
860 VkDescriptorSet descriptorSet,
861 VkDescriptorUpdateTemplateKHR descriptorUpdateTemplate,
862 const void *pData)
863 {
864 RADV_FROM_HANDLE(radv_device, device, _device);
865 RADV_FROM_HANDLE(radv_descriptor_set, set, descriptorSet);
866
867 radv_update_descriptor_set_with_template(device, NULL, set, descriptorUpdateTemplate, pData);
868 }