radv: implement VK_KHR_descriptor_update_template
[mesa.git] / src / amd / vulkan / radv_descriptor_set.c
1 /*
2 * Copyright © 2016 Red Hat.
3 * Copyright © 2016 Bas Nieuwenhuizen
4 *
5 * Permission is hereby granted, free of charge, to any person obtaining a
6 * copy of this software and associated documentation files (the "Software"),
7 * to deal in the Software without restriction, including without limitation
8 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
9 * and/or sell copies of the Software, and to permit persons to whom the
10 * Software is furnished to do so, subject to the following conditions:
11 *
12 * The above copyright notice and this permission notice (including the next
13 * paragraph) shall be included in all copies or substantial portions of the
14 * Software.
15 *
16 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
19 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
20 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
21 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
22 * IN THE SOFTWARE.
23 */
24 #include <assert.h>
25 #include <stdbool.h>
26 #include <string.h>
27 #include <unistd.h>
28 #include <fcntl.h>
29
30 #include "util/mesa-sha1.h"
31 #include "radv_private.h"
32 #include "sid.h"
33
34 VkResult radv_CreateDescriptorSetLayout(
35 VkDevice _device,
36 const VkDescriptorSetLayoutCreateInfo* pCreateInfo,
37 const VkAllocationCallbacks* pAllocator,
38 VkDescriptorSetLayout* pSetLayout)
39 {
40 RADV_FROM_HANDLE(radv_device, device, _device);
41 struct radv_descriptor_set_layout *set_layout;
42
43 assert(pCreateInfo->sType == VK_STRUCTURE_TYPE_DESCRIPTOR_SET_LAYOUT_CREATE_INFO);
44
45 uint32_t max_binding = 0;
46 uint32_t immutable_sampler_count = 0;
47 for (uint32_t j = 0; j < pCreateInfo->bindingCount; j++) {
48 max_binding = MAX2(max_binding, pCreateInfo->pBindings[j].binding);
49 if (pCreateInfo->pBindings[j].pImmutableSamplers)
50 immutable_sampler_count += pCreateInfo->pBindings[j].descriptorCount;
51 }
52
53 size_t size = sizeof(struct radv_descriptor_set_layout) +
54 (max_binding + 1) * sizeof(set_layout->binding[0]) +
55 immutable_sampler_count * 4 * sizeof(uint32_t);
56
57 set_layout = vk_alloc2(&device->alloc, pAllocator, size, 8,
58 VK_SYSTEM_ALLOCATION_SCOPE_OBJECT);
59 if (!set_layout)
60 return vk_error(VK_ERROR_OUT_OF_HOST_MEMORY);
61
62 set_layout->flags = pCreateInfo->flags;
63
64 /* We just allocate all the samplers at the end of the struct */
65 uint32_t *samplers = (uint32_t*)&set_layout->binding[max_binding + 1];
66
67 set_layout->binding_count = max_binding + 1;
68 set_layout->shader_stages = 0;
69 set_layout->size = 0;
70
71 memset(set_layout->binding, 0, size - sizeof(struct radv_descriptor_set_layout));
72
73 uint32_t buffer_count = 0;
74 uint32_t dynamic_offset_count = 0;
75
76 for (uint32_t j = 0; j < pCreateInfo->bindingCount; j++) {
77 const VkDescriptorSetLayoutBinding *binding = &pCreateInfo->pBindings[j];
78 uint32_t b = binding->binding;
79 uint32_t alignment;
80
81 switch (binding->descriptorType) {
82 case VK_DESCRIPTOR_TYPE_UNIFORM_BUFFER_DYNAMIC:
83 case VK_DESCRIPTOR_TYPE_STORAGE_BUFFER_DYNAMIC:
84 assert(!(pCreateInfo->flags & VK_DESCRIPTOR_SET_LAYOUT_CREATE_PUSH_DESCRIPTOR_BIT_KHR));
85 set_layout->binding[b].dynamic_offset_count = 1;
86 set_layout->dynamic_shader_stages |= binding->stageFlags;
87 set_layout->binding[b].size = 0;
88 set_layout->binding[b].buffer_count = 1;
89 alignment = 1;
90 break;
91 case VK_DESCRIPTOR_TYPE_UNIFORM_BUFFER:
92 case VK_DESCRIPTOR_TYPE_STORAGE_BUFFER:
93 case VK_DESCRIPTOR_TYPE_UNIFORM_TEXEL_BUFFER:
94 case VK_DESCRIPTOR_TYPE_STORAGE_TEXEL_BUFFER:
95 set_layout->binding[b].size = 16;
96 set_layout->binding[b].buffer_count = 1;
97 alignment = 16;
98 break;
99 case VK_DESCRIPTOR_TYPE_STORAGE_IMAGE:
100 case VK_DESCRIPTOR_TYPE_SAMPLED_IMAGE:
101 case VK_DESCRIPTOR_TYPE_INPUT_ATTACHMENT:
102 /* main descriptor + fmask descriptor */
103 set_layout->binding[b].size = 64;
104 set_layout->binding[b].buffer_count = 1;
105 alignment = 32;
106 break;
107 case VK_DESCRIPTOR_TYPE_COMBINED_IMAGE_SAMPLER:
108 /* main descriptor + fmask descriptor + sampler */
109 set_layout->binding[b].size = 96;
110 set_layout->binding[b].buffer_count = 1;
111 alignment = 32;
112 break;
113 case VK_DESCRIPTOR_TYPE_SAMPLER:
114 set_layout->binding[b].size = 16;
115 alignment = 16;
116 break;
117 default:
118 unreachable("unknown descriptor type\n");
119 break;
120 }
121
122 set_layout->size = align(set_layout->size, alignment);
123 assert(binding->descriptorCount > 0);
124 set_layout->binding[b].type = binding->descriptorType;
125 set_layout->binding[b].array_size = binding->descriptorCount;
126 set_layout->binding[b].offset = set_layout->size;
127 set_layout->binding[b].buffer_offset = buffer_count;
128 set_layout->binding[b].dynamic_offset_offset = dynamic_offset_count;
129
130 if (binding->pImmutableSamplers) {
131 set_layout->binding[b].immutable_samplers = samplers;
132 set_layout->binding[b].immutable_samplers_equal = true;
133 samplers += 4 * binding->descriptorCount;
134
135 for (uint32_t i = 0; i < binding->descriptorCount; i++)
136 memcpy(set_layout->binding[b].immutable_samplers + 4 * i, &radv_sampler_from_handle(binding->pImmutableSamplers[i])->state, 16);
137 for (uint32_t i = 1; i < binding->descriptorCount; i++)
138 if (memcmp(set_layout->binding[b].immutable_samplers + 4 * i,
139 set_layout->binding[b].immutable_samplers, 16) != 0)
140 set_layout->binding[b].immutable_samplers_equal = false;
141
142 /* Don't reserve space for the samplers if they're not accessed. */
143 if (set_layout->binding[b].immutable_samplers_equal) {
144 if (binding->descriptorType == VK_DESCRIPTOR_TYPE_COMBINED_IMAGE_SAMPLER)
145 set_layout->binding[b].size -= 32;
146 else if (binding->descriptorType == VK_DESCRIPTOR_TYPE_SAMPLER)
147 set_layout->binding[b].size -= 16;
148 }
149 }
150
151 set_layout->size += binding->descriptorCount * set_layout->binding[b].size;
152 buffer_count += binding->descriptorCount * set_layout->binding[b].buffer_count;
153 dynamic_offset_count += binding->descriptorCount *
154 set_layout->binding[b].dynamic_offset_count;
155 set_layout->shader_stages |= binding->stageFlags;
156 }
157
158 set_layout->buffer_count = buffer_count;
159 set_layout->dynamic_offset_count = dynamic_offset_count;
160
161 *pSetLayout = radv_descriptor_set_layout_to_handle(set_layout);
162
163 return VK_SUCCESS;
164 }
165
166 void radv_DestroyDescriptorSetLayout(
167 VkDevice _device,
168 VkDescriptorSetLayout _set_layout,
169 const VkAllocationCallbacks* pAllocator)
170 {
171 RADV_FROM_HANDLE(radv_device, device, _device);
172 RADV_FROM_HANDLE(radv_descriptor_set_layout, set_layout, _set_layout);
173
174 if (!set_layout)
175 return;
176
177 vk_free2(&device->alloc, pAllocator, set_layout);
178 }
179
180 /*
181 * Pipeline layouts. These have nothing to do with the pipeline. They are
182 * just multiple descriptor set layouts pasted together
183 */
184
185 VkResult radv_CreatePipelineLayout(
186 VkDevice _device,
187 const VkPipelineLayoutCreateInfo* pCreateInfo,
188 const VkAllocationCallbacks* pAllocator,
189 VkPipelineLayout* pPipelineLayout)
190 {
191 RADV_FROM_HANDLE(radv_device, device, _device);
192 struct radv_pipeline_layout *layout;
193 struct mesa_sha1 ctx;
194
195 assert(pCreateInfo->sType == VK_STRUCTURE_TYPE_PIPELINE_LAYOUT_CREATE_INFO);
196
197 layout = vk_alloc2(&device->alloc, pAllocator, sizeof(*layout), 8,
198 VK_SYSTEM_ALLOCATION_SCOPE_OBJECT);
199 if (layout == NULL)
200 return vk_error(VK_ERROR_OUT_OF_HOST_MEMORY);
201
202 layout->num_sets = pCreateInfo->setLayoutCount;
203
204 unsigned dynamic_offset_count = 0;
205
206
207 _mesa_sha1_init(&ctx);
208 for (uint32_t set = 0; set < pCreateInfo->setLayoutCount; set++) {
209 RADV_FROM_HANDLE(radv_descriptor_set_layout, set_layout,
210 pCreateInfo->pSetLayouts[set]);
211 layout->set[set].layout = set_layout;
212
213 layout->set[set].dynamic_offset_start = dynamic_offset_count;
214 for (uint32_t b = 0; b < set_layout->binding_count; b++) {
215 dynamic_offset_count += set_layout->binding[b].array_size * set_layout->binding[b].dynamic_offset_count;
216 }
217 _mesa_sha1_update(&ctx, set_layout->binding,
218 sizeof(set_layout->binding[0]) * set_layout->binding_count);
219 }
220
221 layout->dynamic_offset_count = dynamic_offset_count;
222 layout->push_constant_size = 0;
223 for (unsigned i = 0; i < pCreateInfo->pushConstantRangeCount; ++i) {
224 const VkPushConstantRange *range = pCreateInfo->pPushConstantRanges + i;
225 layout->push_constant_size = MAX2(layout->push_constant_size,
226 range->offset + range->size);
227 }
228
229 layout->push_constant_size = align(layout->push_constant_size, 16);
230 _mesa_sha1_update(&ctx, &layout->push_constant_size,
231 sizeof(layout->push_constant_size));
232 _mesa_sha1_final(&ctx, layout->sha1);
233 *pPipelineLayout = radv_pipeline_layout_to_handle(layout);
234
235 return VK_SUCCESS;
236 }
237
238 void radv_DestroyPipelineLayout(
239 VkDevice _device,
240 VkPipelineLayout _pipelineLayout,
241 const VkAllocationCallbacks* pAllocator)
242 {
243 RADV_FROM_HANDLE(radv_device, device, _device);
244 RADV_FROM_HANDLE(radv_pipeline_layout, pipeline_layout, _pipelineLayout);
245
246 if (!pipeline_layout)
247 return;
248 vk_free2(&device->alloc, pAllocator, pipeline_layout);
249 }
250
251 #define EMPTY 1
252
253 static VkResult
254 radv_descriptor_set_create(struct radv_device *device,
255 struct radv_descriptor_pool *pool,
256 struct radv_cmd_buffer *cmd_buffer,
257 const struct radv_descriptor_set_layout *layout,
258 struct radv_descriptor_set **out_set)
259 {
260 struct radv_descriptor_set *set;
261 unsigned mem_size = sizeof(struct radv_descriptor_set) +
262 sizeof(struct radeon_winsys_bo *) * layout->buffer_count;
263 set = vk_alloc2(&device->alloc, NULL, mem_size, 8,
264 VK_SYSTEM_ALLOCATION_SCOPE_OBJECT);
265
266 if (!set)
267 return vk_error(VK_ERROR_OUT_OF_HOST_MEMORY);
268
269 memset(set, 0, mem_size);
270
271 if (layout->dynamic_offset_count) {
272 unsigned size = sizeof(struct radv_descriptor_range) *
273 layout->dynamic_offset_count;
274 set->dynamic_descriptors = vk_alloc2(&device->alloc, NULL, size, 8,
275 VK_SYSTEM_ALLOCATION_SCOPE_OBJECT);
276
277 if (!set->dynamic_descriptors) {
278 vk_free2(&device->alloc, NULL, set);
279 return vk_error(VK_ERROR_OUT_OF_HOST_MEMORY);
280 }
281 }
282
283 set->layout = layout;
284 if (layout->size) {
285 uint32_t layout_size = align_u32(layout->size, 32);
286 set->size = layout->size;
287 if (!cmd_buffer) {
288 /* try to allocate linearly first, so that we don't spend
289 * time looking for gaps if the app only allocates &
290 * resets via the pool. */
291 if (pool->current_offset + layout_size <= pool->size) {
292 set->bo = pool->bo;
293 set->mapped_ptr = (uint32_t*)(pool->mapped_ptr + pool->current_offset);
294 set->va = device->ws->buffer_get_va(set->bo) + pool->current_offset;
295 pool->current_offset += layout_size;
296 list_addtail(&set->vram_list, &pool->vram_list);
297 } else {
298 uint64_t offset = 0;
299 struct list_head *prev = &pool->vram_list;
300 struct radv_descriptor_set *cur;
301 LIST_FOR_EACH_ENTRY(cur, &pool->vram_list, vram_list) {
302 uint64_t start = (uint8_t*)cur->mapped_ptr - pool->mapped_ptr;
303 if (start - offset >= layout_size)
304 break;
305
306 offset = start + cur->size;
307 prev = &cur->vram_list;
308 }
309
310 if (pool->size - offset < layout_size) {
311 vk_free2(&device->alloc, NULL, set->dynamic_descriptors);
312 vk_free2(&device->alloc, NULL, set);
313 return vk_error(VK_ERROR_OUT_OF_POOL_MEMORY_KHR);
314 }
315 set->bo = pool->bo;
316 set->mapped_ptr = (uint32_t*)(pool->mapped_ptr + offset);
317 set->va = device->ws->buffer_get_va(set->bo) + offset;
318 list_add(&set->vram_list, prev);
319 }
320 } else {
321 unsigned bo_offset;
322 if (!radv_cmd_buffer_upload_alloc(cmd_buffer, set->size, 32,
323 &bo_offset,
324 (void**)&set->mapped_ptr)) {
325 vk_free2(&device->alloc, NULL, set->dynamic_descriptors);
326 vk_free2(&device->alloc, NULL, set);
327 return vk_error(VK_ERROR_OUT_OF_HOST_MEMORY);
328 }
329
330 set->va = device->ws->buffer_get_va(cmd_buffer->upload.upload_bo);
331 set->va += bo_offset;
332 }
333 }
334
335 for (unsigned i = 0; i < layout->binding_count; ++i) {
336 if (!layout->binding[i].immutable_samplers ||
337 layout->binding[i].immutable_samplers_equal)
338 continue;
339
340 unsigned offset = layout->binding[i].offset / 4;
341 if (layout->binding[i].type == VK_DESCRIPTOR_TYPE_COMBINED_IMAGE_SAMPLER)
342 offset += 16;
343
344 for (unsigned j = 0; j < layout->binding[i].array_size; ++j) {
345 memcpy(set->mapped_ptr + offset, layout->binding[i].immutable_samplers + 4 * j, 16);
346 offset += layout->binding[i].size / 4;
347 }
348
349 }
350 *out_set = set;
351 return VK_SUCCESS;
352 }
353
354 static void
355 radv_descriptor_set_destroy(struct radv_device *device,
356 struct radv_descriptor_pool *pool,
357 struct radv_descriptor_set *set,
358 bool free_bo)
359 {
360 if (free_bo && set->size)
361 list_del(&set->vram_list);
362 if (set->dynamic_descriptors)
363 vk_free2(&device->alloc, NULL, set->dynamic_descriptors);
364 vk_free2(&device->alloc, NULL, set);
365 }
366
367 VkResult
368 radv_temp_descriptor_set_create(struct radv_device *device,
369 struct radv_cmd_buffer *cmd_buffer,
370 VkDescriptorSetLayout _layout,
371 VkDescriptorSet *_set)
372 {
373 RADV_FROM_HANDLE(radv_descriptor_set_layout, layout, _layout);
374 struct radv_descriptor_set *set = NULL;
375 VkResult ret;
376
377 ret = radv_descriptor_set_create(device, NULL, cmd_buffer, layout, &set);
378 *_set = radv_descriptor_set_to_handle(set);
379 return ret;
380 }
381
382 void
383 radv_temp_descriptor_set_destroy(struct radv_device *device,
384 VkDescriptorSet _set)
385 {
386 RADV_FROM_HANDLE(radv_descriptor_set, set, _set);
387
388 radv_descriptor_set_destroy(device, NULL, set, false);
389 }
390
391 VkResult radv_CreateDescriptorPool(
392 VkDevice _device,
393 const VkDescriptorPoolCreateInfo* pCreateInfo,
394 const VkAllocationCallbacks* pAllocator,
395 VkDescriptorPool* pDescriptorPool)
396 {
397 RADV_FROM_HANDLE(radv_device, device, _device);
398 struct radv_descriptor_pool *pool;
399 int size = sizeof(struct radv_descriptor_pool);
400 uint64_t bo_size = 0;
401 pool = vk_alloc2(&device->alloc, pAllocator, size, 8,
402 VK_SYSTEM_ALLOCATION_SCOPE_OBJECT);
403 if (!pool)
404 return vk_error(VK_ERROR_OUT_OF_HOST_MEMORY);
405
406 memset(pool, 0, sizeof(*pool));
407
408 for (unsigned i = 0; i < pCreateInfo->poolSizeCount; ++i) {
409 switch(pCreateInfo->pPoolSizes[i].type) {
410 case VK_DESCRIPTOR_TYPE_UNIFORM_BUFFER_DYNAMIC:
411 case VK_DESCRIPTOR_TYPE_STORAGE_BUFFER_DYNAMIC:
412 break;
413 case VK_DESCRIPTOR_TYPE_UNIFORM_BUFFER:
414 case VK_DESCRIPTOR_TYPE_STORAGE_BUFFER:
415 case VK_DESCRIPTOR_TYPE_UNIFORM_TEXEL_BUFFER:
416 case VK_DESCRIPTOR_TYPE_STORAGE_TEXEL_BUFFER:
417 case VK_DESCRIPTOR_TYPE_SAMPLER:
418 /* 32 as we may need to align for images */
419 bo_size += 32 * pCreateInfo->pPoolSizes[i].descriptorCount;
420 break;
421 case VK_DESCRIPTOR_TYPE_SAMPLED_IMAGE:
422 case VK_DESCRIPTOR_TYPE_STORAGE_IMAGE:
423 case VK_DESCRIPTOR_TYPE_INPUT_ATTACHMENT:
424 bo_size += 64 * pCreateInfo->pPoolSizes[i].descriptorCount;
425 break;
426 case VK_DESCRIPTOR_TYPE_COMBINED_IMAGE_SAMPLER:
427 bo_size += 96 * pCreateInfo->pPoolSizes[i].descriptorCount;
428 break;
429 default:
430 unreachable("unknown descriptor type\n");
431 break;
432 }
433 }
434
435 if (bo_size) {
436 pool->bo = device->ws->buffer_create(device->ws, bo_size,
437 32, RADEON_DOMAIN_VRAM, 0);
438 pool->mapped_ptr = (uint8_t*)device->ws->buffer_map(pool->bo);
439 }
440 pool->size = bo_size;
441
442 list_inithead(&pool->vram_list);
443 *pDescriptorPool = radv_descriptor_pool_to_handle(pool);
444 return VK_SUCCESS;
445 }
446
447 void radv_DestroyDescriptorPool(
448 VkDevice _device,
449 VkDescriptorPool _pool,
450 const VkAllocationCallbacks* pAllocator)
451 {
452 RADV_FROM_HANDLE(radv_device, device, _device);
453 RADV_FROM_HANDLE(radv_descriptor_pool, pool, _pool);
454
455 if (!pool)
456 return;
457
458 list_for_each_entry_safe(struct radv_descriptor_set, set,
459 &pool->vram_list, vram_list) {
460 radv_descriptor_set_destroy(device, pool, set, false);
461 }
462
463 if (pool->bo)
464 device->ws->buffer_destroy(pool->bo);
465 vk_free2(&device->alloc, pAllocator, pool);
466 }
467
468 VkResult radv_ResetDescriptorPool(
469 VkDevice _device,
470 VkDescriptorPool descriptorPool,
471 VkDescriptorPoolResetFlags flags)
472 {
473 RADV_FROM_HANDLE(radv_device, device, _device);
474 RADV_FROM_HANDLE(radv_descriptor_pool, pool, descriptorPool);
475
476 list_for_each_entry_safe(struct radv_descriptor_set, set,
477 &pool->vram_list, vram_list) {
478 radv_descriptor_set_destroy(device, pool, set, false);
479 }
480
481 list_inithead(&pool->vram_list);
482
483 pool->current_offset = 0;
484
485 return VK_SUCCESS;
486 }
487
488 VkResult radv_AllocateDescriptorSets(
489 VkDevice _device,
490 const VkDescriptorSetAllocateInfo* pAllocateInfo,
491 VkDescriptorSet* pDescriptorSets)
492 {
493 RADV_FROM_HANDLE(radv_device, device, _device);
494 RADV_FROM_HANDLE(radv_descriptor_pool, pool, pAllocateInfo->descriptorPool);
495
496 VkResult result = VK_SUCCESS;
497 uint32_t i;
498 struct radv_descriptor_set *set;
499
500 /* allocate a set of buffers for each shader to contain descriptors */
501 for (i = 0; i < pAllocateInfo->descriptorSetCount; i++) {
502 RADV_FROM_HANDLE(radv_descriptor_set_layout, layout,
503 pAllocateInfo->pSetLayouts[i]);
504
505 assert(!(layout->flags & VK_DESCRIPTOR_SET_LAYOUT_CREATE_PUSH_DESCRIPTOR_BIT_KHR));
506
507 result = radv_descriptor_set_create(device, pool, NULL, layout, &set);
508 if (result != VK_SUCCESS)
509 break;
510
511 pDescriptorSets[i] = radv_descriptor_set_to_handle(set);
512 }
513
514 if (result != VK_SUCCESS)
515 radv_FreeDescriptorSets(_device, pAllocateInfo->descriptorPool,
516 i, pDescriptorSets);
517 return result;
518 }
519
520 VkResult radv_FreeDescriptorSets(
521 VkDevice _device,
522 VkDescriptorPool descriptorPool,
523 uint32_t count,
524 const VkDescriptorSet* pDescriptorSets)
525 {
526 RADV_FROM_HANDLE(radv_device, device, _device);
527 RADV_FROM_HANDLE(radv_descriptor_pool, pool, descriptorPool);
528
529 for (uint32_t i = 0; i < count; i++) {
530 RADV_FROM_HANDLE(radv_descriptor_set, set, pDescriptorSets[i]);
531
532 if (set)
533 radv_descriptor_set_destroy(device, pool, set, true);
534 }
535 return VK_SUCCESS;
536 }
537
538 static void write_texel_buffer_descriptor(struct radv_device *device,
539 struct radv_cmd_buffer *cmd_buffer,
540 unsigned *dst,
541 struct radeon_winsys_bo **buffer_list,
542 const VkBufferView _buffer_view)
543 {
544 RADV_FROM_HANDLE(radv_buffer_view, buffer_view, _buffer_view);
545
546 memcpy(dst, buffer_view->state, 4 * 4);
547
548 if (cmd_buffer)
549 device->ws->cs_add_buffer(cmd_buffer->cs, buffer_view->bo, 7);
550 else
551 *buffer_list = buffer_view->bo;
552 }
553
554 static void write_buffer_descriptor(struct radv_device *device,
555 struct radv_cmd_buffer *cmd_buffer,
556 unsigned *dst,
557 struct radeon_winsys_bo **buffer_list,
558 const VkDescriptorBufferInfo *buffer_info)
559 {
560 RADV_FROM_HANDLE(radv_buffer, buffer, buffer_info->buffer);
561 uint64_t va = device->ws->buffer_get_va(buffer->bo);
562 uint32_t range = buffer_info->range;
563
564 if (buffer_info->range == VK_WHOLE_SIZE)
565 range = buffer->size - buffer_info->offset;
566
567 va += buffer_info->offset + buffer->offset;
568 dst[0] = va;
569 dst[1] = S_008F04_BASE_ADDRESS_HI(va >> 32);
570 dst[2] = range;
571 dst[3] = S_008F0C_DST_SEL_X(V_008F0C_SQ_SEL_X) |
572 S_008F0C_DST_SEL_Y(V_008F0C_SQ_SEL_Y) |
573 S_008F0C_DST_SEL_Z(V_008F0C_SQ_SEL_Z) |
574 S_008F0C_DST_SEL_W(V_008F0C_SQ_SEL_W) |
575 S_008F0C_NUM_FORMAT(V_008F0C_BUF_NUM_FORMAT_FLOAT) |
576 S_008F0C_DATA_FORMAT(V_008F0C_BUF_DATA_FORMAT_32);
577
578 if (cmd_buffer)
579 device->ws->cs_add_buffer(cmd_buffer->cs, buffer->bo, 7);
580 else
581 *buffer_list = buffer->bo;
582 }
583
584 static void write_dynamic_buffer_descriptor(struct radv_device *device,
585 struct radv_descriptor_range *range,
586 struct radeon_winsys_bo **buffer_list,
587 const VkDescriptorBufferInfo *buffer_info)
588 {
589 RADV_FROM_HANDLE(radv_buffer, buffer, buffer_info->buffer);
590 uint64_t va = device->ws->buffer_get_va(buffer->bo);
591 unsigned size = buffer_info->range;
592
593 if (buffer_info->range == VK_WHOLE_SIZE)
594 size = buffer->size - buffer_info->offset;
595
596 va += buffer_info->offset + buffer->offset;
597 range->va = va;
598 range->size = size;
599
600 *buffer_list = buffer->bo;
601 }
602
603 static void
604 write_image_descriptor(struct radv_device *device,
605 struct radv_cmd_buffer *cmd_buffer,
606 unsigned *dst,
607 struct radeon_winsys_bo **buffer_list,
608 const VkDescriptorImageInfo *image_info)
609 {
610 RADV_FROM_HANDLE(radv_image_view, iview, image_info->imageView);
611 memcpy(dst, iview->descriptor, 8 * 4);
612 memcpy(dst + 8, iview->fmask_descriptor, 8 * 4);
613
614 if (cmd_buffer)
615 device->ws->cs_add_buffer(cmd_buffer->cs, iview->bo, 7);
616 else
617 *buffer_list = iview->bo;
618 }
619
620 static void
621 write_combined_image_sampler_descriptor(struct radv_device *device,
622 struct radv_cmd_buffer *cmd_buffer,
623 unsigned *dst,
624 struct radeon_winsys_bo **buffer_list,
625 const VkDescriptorImageInfo *image_info,
626 bool has_sampler)
627 {
628 RADV_FROM_HANDLE(radv_sampler, sampler, image_info->sampler);
629
630 write_image_descriptor(device, cmd_buffer, dst, buffer_list, image_info);
631 /* copy over sampler state */
632 if (has_sampler)
633 memcpy(dst + 16, sampler->state, 16);
634 }
635
636 static void
637 write_sampler_descriptor(struct radv_device *device,
638 unsigned *dst,
639 const VkDescriptorImageInfo *image_info)
640 {
641 RADV_FROM_HANDLE(radv_sampler, sampler, image_info->sampler);
642
643 memcpy(dst, sampler->state, 16);
644 }
645
646 void radv_update_descriptor_sets(
647 struct radv_device* device,
648 struct radv_cmd_buffer* cmd_buffer,
649 VkDescriptorSet dstSetOverride,
650 uint32_t descriptorWriteCount,
651 const VkWriteDescriptorSet* pDescriptorWrites,
652 uint32_t descriptorCopyCount,
653 const VkCopyDescriptorSet* pDescriptorCopies)
654 {
655 uint32_t i, j;
656 for (i = 0; i < descriptorWriteCount; i++) {
657 const VkWriteDescriptorSet *writeset = &pDescriptorWrites[i];
658 RADV_FROM_HANDLE(radv_descriptor_set, set,
659 dstSetOverride ? dstSetOverride : writeset->dstSet);
660 const struct radv_descriptor_set_binding_layout *binding_layout =
661 set->layout->binding + writeset->dstBinding;
662 uint32_t *ptr = set->mapped_ptr;
663 struct radeon_winsys_bo **buffer_list = set->descriptors;
664 /* Immutable samplers are not copied into push descriptors when they are
665 * allocated, so if we are writing push descriptors we have to copy the
666 * immutable samplers into them now.
667 */
668 const bool copy_immutable_samplers = cmd_buffer &&
669 binding_layout->immutable_samplers && !binding_layout->immutable_samplers_equal;
670
671 ptr += binding_layout->offset / 4;
672 ptr += binding_layout->size * writeset->dstArrayElement / 4;
673 buffer_list += binding_layout->buffer_offset;
674 buffer_list += binding_layout->buffer_count * writeset->dstArrayElement;
675 for (j = 0; j < writeset->descriptorCount; ++j) {
676 switch(writeset->descriptorType) {
677 case VK_DESCRIPTOR_TYPE_UNIFORM_BUFFER_DYNAMIC:
678 case VK_DESCRIPTOR_TYPE_STORAGE_BUFFER_DYNAMIC: {
679 unsigned idx = writeset->dstArrayElement + j;
680 idx += binding_layout->dynamic_offset_offset;
681 assert(!(set->layout->flags & VK_DESCRIPTOR_SET_LAYOUT_CREATE_PUSH_DESCRIPTOR_BIT_KHR));
682 write_dynamic_buffer_descriptor(device, set->dynamic_descriptors + idx,
683 buffer_list, writeset->pBufferInfo + j);
684 break;
685 }
686 case VK_DESCRIPTOR_TYPE_UNIFORM_BUFFER:
687 case VK_DESCRIPTOR_TYPE_STORAGE_BUFFER:
688 write_buffer_descriptor(device, cmd_buffer, ptr, buffer_list,
689 writeset->pBufferInfo + j);
690 break;
691 case VK_DESCRIPTOR_TYPE_UNIFORM_TEXEL_BUFFER:
692 case VK_DESCRIPTOR_TYPE_STORAGE_TEXEL_BUFFER:
693 write_texel_buffer_descriptor(device, cmd_buffer, ptr, buffer_list,
694 writeset->pTexelBufferView[j]);
695 break;
696 case VK_DESCRIPTOR_TYPE_SAMPLED_IMAGE:
697 case VK_DESCRIPTOR_TYPE_STORAGE_IMAGE:
698 case VK_DESCRIPTOR_TYPE_INPUT_ATTACHMENT:
699 write_image_descriptor(device, cmd_buffer, ptr, buffer_list,
700 writeset->pImageInfo + j);
701 break;
702 case VK_DESCRIPTOR_TYPE_COMBINED_IMAGE_SAMPLER:
703 write_combined_image_sampler_descriptor(device, cmd_buffer, ptr, buffer_list,
704 writeset->pImageInfo + j,
705 !binding_layout->immutable_samplers);
706 if (copy_immutable_samplers) {
707 const unsigned idx = writeset->dstArrayElement + j;
708 memcpy(ptr + 16, binding_layout->immutable_samplers + 4 * idx, 16);
709 }
710 break;
711 case VK_DESCRIPTOR_TYPE_SAMPLER:
712 if (!binding_layout->immutable_samplers) {
713 write_sampler_descriptor(device, ptr,
714 writeset->pImageInfo + j);
715 } else if (copy_immutable_samplers) {
716 unsigned idx = writeset->dstArrayElement + j;
717 memcpy(ptr, binding_layout->immutable_samplers + 4 * idx, 16);
718 }
719 break;
720 default:
721 unreachable("unimplemented descriptor type");
722 break;
723 }
724 ptr += binding_layout->size / 4;
725 buffer_list += binding_layout->buffer_count;
726 }
727
728 }
729 if (descriptorCopyCount)
730 radv_finishme("copy descriptors");
731 }
732
733 void radv_UpdateDescriptorSets(
734 VkDevice _device,
735 uint32_t descriptorWriteCount,
736 const VkWriteDescriptorSet* pDescriptorWrites,
737 uint32_t descriptorCopyCount,
738 const VkCopyDescriptorSet* pDescriptorCopies)
739 {
740 RADV_FROM_HANDLE(radv_device, device, _device);
741
742 radv_update_descriptor_sets(device, NULL, VK_NULL_HANDLE, descriptorWriteCount, pDescriptorWrites,
743 descriptorCopyCount, pDescriptorCopies);
744 }
745
746 VkResult radv_CreateDescriptorUpdateTemplateKHR(VkDevice _device,
747 const VkDescriptorUpdateTemplateCreateInfoKHR *pCreateInfo,
748 const VkAllocationCallbacks *pAllocator,
749 VkDescriptorUpdateTemplateKHR *pDescriptorUpdateTemplate)
750 {
751 RADV_FROM_HANDLE(radv_device, device, _device);
752 RADV_FROM_HANDLE(radv_descriptor_set_layout, set_layout, pCreateInfo->descriptorSetLayout);
753 const uint32_t entry_count = pCreateInfo->descriptorUpdateEntryCount;
754 const size_t size = sizeof(struct radv_descriptor_update_template) +
755 sizeof(struct radv_descriptor_update_template_entry) * entry_count;
756 struct radv_descriptor_update_template *templ;
757 uint32_t i;
758
759 templ = vk_alloc2(&device->alloc, pAllocator, size, 8, VK_SYSTEM_ALLOCATION_SCOPE_OBJECT);
760 if (!templ)
761 return vk_error(VK_ERROR_OUT_OF_HOST_MEMORY);
762
763 templ->entry_count = entry_count;
764
765 for (i = 0; i < entry_count; i++) {
766 const VkDescriptorUpdateTemplateEntryKHR *entry = &pCreateInfo->pDescriptorUpdateEntries[i];
767 const struct radv_descriptor_set_binding_layout *binding_layout =
768 set_layout->binding + entry->dstBinding;
769 const uint32_t buffer_offset = binding_layout->buffer_offset +
770 binding_layout->buffer_count * entry->dstArrayElement;
771 uint32_t *immutable_samplers = NULL;
772 uint16_t dst_offset;
773 uint16_t dst_stride;
774
775 /* dst_offset is an offset into dynamic_descriptors when the descriptor
776 is dynamic, and an offset into mapped_ptr otherwise */
777 switch (entry->descriptorType) {
778 case VK_DESCRIPTOR_TYPE_UNIFORM_BUFFER_DYNAMIC:
779 case VK_DESCRIPTOR_TYPE_STORAGE_BUFFER_DYNAMIC:
780 assert(pCreateInfo->templateType == VK_DESCRIPTOR_UPDATE_TEMPLATE_TYPE_DESCRIPTOR_SET_KHR);
781 dst_offset = binding_layout->dynamic_offset_offset + entry->dstArrayElement;
782 dst_stride = 0; /* Not used */
783 break;
784 default:
785 switch (entry->descriptorType) {
786 case VK_DESCRIPTOR_TYPE_COMBINED_IMAGE_SAMPLER:
787 case VK_DESCRIPTOR_TYPE_SAMPLER:
788 /* Immutable samplers are copied into push descriptors when they are pushed */
789 if (pCreateInfo->templateType == VK_DESCRIPTOR_UPDATE_TEMPLATE_TYPE_PUSH_DESCRIPTORS_KHR &&
790 binding_layout->immutable_samplers && !binding_layout->immutable_samplers_equal)
791 immutable_samplers = binding_layout->immutable_samplers + entry->dstArrayElement * 4;
792 break;
793 default:
794 break;
795 }
796 dst_offset = binding_layout->offset / 4 + binding_layout->size * entry->dstArrayElement / 4;
797 dst_stride = binding_layout->size / 4;
798 break;
799 }
800
801 templ->entry[i] = (struct radv_descriptor_update_template_entry) {
802 .descriptor_type = entry->descriptorType,
803 .descriptor_count = entry->descriptorCount,
804 .src_offset = entry->offset,
805 .src_stride = entry->stride,
806 .dst_offset = dst_offset,
807 .dst_stride = dst_stride,
808 .buffer_offset = buffer_offset,
809 .buffer_count = binding_layout->buffer_count,
810 .has_sampler = !binding_layout->immutable_samplers,
811 .immutable_samplers = immutable_samplers
812 };
813 }
814
815 *pDescriptorUpdateTemplate = radv_descriptor_update_template_to_handle(templ);
816 return VK_SUCCESS;
817 }
818
819 void radv_DestroyDescriptorUpdateTemplateKHR(VkDevice _device,
820 VkDescriptorUpdateTemplateKHR descriptorUpdateTemplate,
821 const VkAllocationCallbacks *pAllocator)
822 {
823 RADV_FROM_HANDLE(radv_device, device, _device);
824 RADV_FROM_HANDLE(radv_descriptor_update_template, templ, descriptorUpdateTemplate);
825
826 if (!templ)
827 return;
828
829 vk_free2(&device->alloc, pAllocator, templ);
830 }
831
832 void radv_update_descriptor_set_with_template(struct radv_device *device,
833 struct radv_cmd_buffer *cmd_buffer,
834 struct radv_descriptor_set *set,
835 VkDescriptorUpdateTemplateKHR descriptorUpdateTemplate,
836 const void *pData)
837 {
838 RADV_FROM_HANDLE(radv_descriptor_update_template, templ, descriptorUpdateTemplate);
839 uint32_t i;
840
841 for (i = 0; i < templ->entry_count; ++i) {
842 struct radeon_winsys_bo **buffer_list = set->descriptors + templ->entry[i].buffer_offset;
843 uint32_t *pDst = set->mapped_ptr + templ->entry[i].dst_offset;
844 const uint8_t *pSrc = ((const uint8_t *) pData) + templ->entry[i].src_offset;
845 uint32_t j;
846
847 for (j = 0; j < templ->entry[i].descriptor_count; ++j) {
848 switch (templ->entry[i].descriptor_type) {
849 case VK_DESCRIPTOR_TYPE_UNIFORM_BUFFER_DYNAMIC:
850 case VK_DESCRIPTOR_TYPE_STORAGE_BUFFER_DYNAMIC: {
851 const unsigned idx = templ->entry[i].dst_offset + j;
852 assert(!(set->layout->flags & VK_DESCRIPTOR_SET_LAYOUT_CREATE_PUSH_DESCRIPTOR_BIT_KHR));
853 write_dynamic_buffer_descriptor(device, set->dynamic_descriptors + idx,
854 buffer_list, (struct VkDescriptorBufferInfo *) pSrc);
855 break;
856 }
857 case VK_DESCRIPTOR_TYPE_UNIFORM_BUFFER:
858 case VK_DESCRIPTOR_TYPE_STORAGE_BUFFER:
859 write_buffer_descriptor(device, cmd_buffer, pDst, buffer_list,
860 (struct VkDescriptorBufferInfo *) pSrc);
861 break;
862 case VK_DESCRIPTOR_TYPE_UNIFORM_TEXEL_BUFFER:
863 case VK_DESCRIPTOR_TYPE_STORAGE_TEXEL_BUFFER:
864 write_texel_buffer_descriptor(device, cmd_buffer, pDst, buffer_list,
865 *(VkBufferView *) pSrc);
866 break;
867 case VK_DESCRIPTOR_TYPE_SAMPLED_IMAGE:
868 case VK_DESCRIPTOR_TYPE_STORAGE_IMAGE:
869 case VK_DESCRIPTOR_TYPE_INPUT_ATTACHMENT:
870 write_image_descriptor(device, cmd_buffer, pDst, buffer_list,
871 (struct VkDescriptorImageInfo *) pSrc);
872 break;
873 case VK_DESCRIPTOR_TYPE_COMBINED_IMAGE_SAMPLER:
874 write_combined_image_sampler_descriptor(device, cmd_buffer, pDst, buffer_list,
875 (struct VkDescriptorImageInfo *) pSrc,
876 templ->entry[i].has_sampler);
877 if (templ->entry[i].immutable_samplers)
878 memcpy(pDst + 16, templ->entry[i].immutable_samplers + 4 * j, 16);
879 break;
880 case VK_DESCRIPTOR_TYPE_SAMPLER:
881 if (templ->entry[i].has_sampler)
882 write_sampler_descriptor(device, pDst,
883 (struct VkDescriptorImageInfo *) pSrc);
884 else if (templ->entry[i].immutable_samplers)
885 memcpy(pDst, templ->entry[i].immutable_samplers + 4 * j, 16);
886 break;
887 default:
888 unreachable("unimplemented descriptor type");
889 break;
890 }
891 pSrc += templ->entry[i].src_stride;
892 pDst += templ->entry[i].dst_stride;
893 buffer_list += templ->entry[i].buffer_count;
894 }
895 }
896 }
897
898 void radv_UpdateDescriptorSetWithTemplateKHR(VkDevice _device,
899 VkDescriptorSet descriptorSet,
900 VkDescriptorUpdateTemplateKHR descriptorUpdateTemplate,
901 const void *pData)
902 {
903 RADV_FROM_HANDLE(radv_device, device, _device);
904 RADV_FROM_HANDLE(radv_descriptor_set, set, descriptorSet);
905
906 radv_update_descriptor_set_with_template(device, NULL, set, descriptorUpdateTemplate, pData);
907 }