radv: remove radv_pipeline_layout::push_constant_stages field
[mesa.git] / src / amd / vulkan / radv_descriptor_set.c
index 7cee9d4dedd3cff3a5ed8a6e0f38eed159d04c36..b1ef66308d6d9e61d69e506a760b0727695c3158 100644 (file)
@@ -66,6 +66,8 @@ VkResult radv_CreateDescriptorSetLayout(
 
        set_layout->binding_count = max_binding + 1;
        set_layout->shader_stages = 0;
+       set_layout->dynamic_shader_stages = 0;
+       set_layout->has_immutable_samplers = false;
        set_layout->size = 0;
 
        memset(set_layout->binding, 0, size - sizeof(struct radv_descriptor_set_layout));
@@ -131,6 +133,7 @@ VkResult radv_CreateDescriptorSetLayout(
                if (binding->pImmutableSamplers) {
                        set_layout->binding[b].immutable_samplers_offset = samplers_offset;
                        set_layout->binding[b].immutable_samplers_equal = true;
+                       set_layout->has_immutable_samplers = true;
 
 
                        for (uint32_t i = 0; i < binding->descriptorCount; i++)
@@ -225,6 +228,7 @@ VkResult radv_CreatePipelineLayout(
 
        layout->dynamic_offset_count = dynamic_offset_count;
        layout->push_constant_size = 0;
+
        for (unsigned i = 0; i < pCreateInfo->pushConstantRangeCount; ++i) {
                const VkPushConstantRange *range = pCreateInfo->pPushConstantRanges + i;
                layout->push_constant_size = MAX2(layout->push_constant_size,
@@ -292,28 +296,33 @@ radv_descriptor_set_create(struct radv_device *device,
                uint32_t layout_size = align_u32(layout->size, 32);
                set->size = layout->size;
 
+               if (!pool->host_memory_base && pool->entry_count == pool->max_entry_count) {
+                       vk_free2(&device->alloc, NULL, set);
+                       return vk_error(VK_ERROR_OUT_OF_POOL_MEMORY_KHR);
+               }
+
                /* try to allocate linearly first, so that we don't spend
                 * time looking for gaps if the app only allocates &
                 * resets via the pool. */
                if (pool->current_offset + layout_size <= pool->size) {
                        set->bo = pool->bo;
                        set->mapped_ptr = (uint32_t*)(pool->mapped_ptr + pool->current_offset);
-                       set->va = device->ws->buffer_get_va(set->bo) + pool->current_offset;
+                       set->va = radv_buffer_get_va(set->bo) + pool->current_offset;
+                       if (!pool->host_memory_base) {
+                               pool->entries[pool->entry_count].offset = pool->current_offset;
+                               pool->entries[pool->entry_count].size = layout_size;
+                               pool->entries[pool->entry_count].set = set;
+                               pool->entry_count++;
+                       }
                        pool->current_offset += layout_size;
-                       list_addtail(&set->vram_list, &pool->vram_list);
                } else if (!pool->host_memory_base) {
                        uint64_t offset = 0;
-                       struct list_head *prev = &pool->vram_list;
-                       struct radv_descriptor_set *cur;
+                       int index;
 
-                       assert(!pool->host_memory_base);
-                       LIST_FOR_EACH_ENTRY(cur, &pool->vram_list, vram_list) {
-                               uint64_t start = (uint8_t*)cur->mapped_ptr - pool->mapped_ptr;
-                               if (start - offset >= layout_size)
+                       for (index = 0; index < pool->entry_count; ++index) {
+                               if (pool->entries[index].offset - offset >= layout_size)
                                        break;
-
-                               offset = start + cur->size;
-                               prev = &cur->vram_list;
+                               offset = pool->entries[index].offset + pool->entries[index].size;
                        }
 
                        if (pool->size - offset < layout_size) {
@@ -322,27 +331,34 @@ radv_descriptor_set_create(struct radv_device *device,
                        }
                        set->bo = pool->bo;
                        set->mapped_ptr = (uint32_t*)(pool->mapped_ptr + offset);
-                       set->va = device->ws->buffer_get_va(set->bo) + offset;
-                       list_add(&set->vram_list, prev);
+                       set->va = radv_buffer_get_va(set->bo) + offset;
+                       memmove(&pool->entries[index + 1], &pool->entries[index],
+                               sizeof(pool->entries[0]) * (pool->entry_count - index));
+                       pool->entries[index].offset = offset;
+                       pool->entries[index].size = layout_size;
+                       pool->entries[index].set = set;
+                       pool->entry_count++;
                } else
                        return vk_error(VK_ERROR_OUT_OF_POOL_MEMORY_KHR);
        }
 
-       for (unsigned i = 0; i < layout->binding_count; ++i) {
-               if (!layout->binding[i].immutable_samplers_offset ||
-                   layout->binding[i].immutable_samplers_equal)
-                       continue;
+       if (layout->has_immutable_samplers) {
+               for (unsigned i = 0; i < layout->binding_count; ++i) {
+                       if (!layout->binding[i].immutable_samplers_offset ||
+                       layout->binding[i].immutable_samplers_equal)
+                               continue;
 
-               unsigned offset = layout->binding[i].offset / 4;
-               if (layout->binding[i].type == VK_DESCRIPTOR_TYPE_COMBINED_IMAGE_SAMPLER)
-                       offset += 16;
+                       unsigned offset = layout->binding[i].offset / 4;
+                       if (layout->binding[i].type == VK_DESCRIPTOR_TYPE_COMBINED_IMAGE_SAMPLER)
+                               offset += 16;
 
-               const uint32_t *samplers = (const uint32_t*)((const char*)layout + layout->binding[i].immutable_samplers_offset);
-               for (unsigned j = 0; j < layout->binding[i].array_size; ++j) {
-                       memcpy(set->mapped_ptr + offset, samplers + 4 * j, 16);
-                       offset += layout->binding[i].size / 4;
-               }
+                       const uint32_t *samplers = (const uint32_t*)((const char*)layout + layout->binding[i].immutable_samplers_offset);
+                       for (unsigned j = 0; j < layout->binding[i].array_size; ++j) {
+                               memcpy(set->mapped_ptr + offset, samplers + 4 * j, 16);
+                               offset += layout->binding[i].size / 4;
+                       }
 
+               }
        }
        *out_set = set;
        return VK_SUCCESS;
@@ -356,8 +372,17 @@ radv_descriptor_set_destroy(struct radv_device *device,
 {
        assert(!pool->host_memory_base);
 
-       if (free_bo && set->size)
-               list_del(&set->vram_list);
+       if (free_bo && set->size && !pool->host_memory_base) {
+               uint32_t offset = (uint8_t*)set->mapped_ptr - pool->mapped_ptr;
+               for (int i = 0; i < pool->entry_count; ++i) {
+                       if (pool->entries[i].offset == offset) {
+                               memmove(&pool->entries[i], &pool->entries[i+1],
+                                       sizeof(pool->entries[i]) * (pool->entry_count - i - 1));
+                               --pool->entry_count;
+                               break;
+                       }
+               }
+       }
        vk_free2(&device->alloc, NULL, set);
 }
 
@@ -409,6 +434,8 @@ VkResult radv_CreateDescriptorPool(
                host_size += sizeof(struct radeon_winsys_bo*) * bo_count;
                host_size += sizeof(struct radv_descriptor_range) * range_count;
                size += host_size;
+       } else {
+               size += sizeof(struct radv_descriptor_pool_entry) * pCreateInfo->maxSets;
        }
 
        pool = vk_alloc2(&device->alloc, pAllocator, size, 8,
@@ -425,13 +452,15 @@ VkResult radv_CreateDescriptorPool(
        }
 
        if (bo_size) {
-               pool->bo = device->ws->buffer_create(device->ws, bo_size,
-                                                       32, RADEON_DOMAIN_VRAM, 0);
+               pool->bo = device->ws->buffer_create(device->ws, bo_size, 32,
+                                                    RADEON_DOMAIN_VRAM,
+                                                    RADEON_FLAG_NO_INTERPROCESS_SHARING |
+                                                    RADEON_FLAG_READ_ONLY);
                pool->mapped_ptr = (uint8_t*)device->ws->buffer_map(pool->bo);
        }
        pool->size = bo_size;
+       pool->max_entry_count = pCreateInfo->maxSets;
 
-       list_inithead(&pool->vram_list);
        *pDescriptorPool = radv_descriptor_pool_to_handle(pool);
        return VK_SUCCESS;
 }
@@ -448,9 +477,8 @@ void radv_DestroyDescriptorPool(
                return;
 
        if (!pool->host_memory_base) {
-               list_for_each_entry_safe(struct radv_descriptor_set, set,
-                                        &pool->vram_list, vram_list) {
-                       radv_descriptor_set_destroy(device, pool, set, false);
+               for(int i = 0; i < pool->entry_count; ++i) {
+                       radv_descriptor_set_destroy(device, pool, pool->entries[i].set, false);
                }
        }
 
@@ -468,14 +496,12 @@ VkResult radv_ResetDescriptorPool(
        RADV_FROM_HANDLE(radv_descriptor_pool, pool, descriptorPool);
 
        if (!pool->host_memory_base) {
-               list_for_each_entry_safe(struct radv_descriptor_set, set,
-                                        &pool->vram_list, vram_list) {
-                       radv_descriptor_set_destroy(device, pool, set, false);
+               for(int i = 0; i < pool->entry_count; ++i) {
+                       radv_descriptor_set_destroy(device, pool, pool->entries[i].set, false);
                }
+               pool->entry_count = 0;
        }
 
-       list_inithead(&pool->vram_list);
-
        pool->current_offset = 0;
        pool->host_memory_ptr = pool->host_memory_base;
 
@@ -543,7 +569,7 @@ static void write_texel_buffer_descriptor(struct radv_device *device,
        memcpy(dst, buffer_view->state, 4 * 4);
 
        if (cmd_buffer)
-               device->ws->cs_add_buffer(cmd_buffer->cs, buffer_view->bo, 7);
+               radv_cs_add_buffer(device->ws, cmd_buffer->cs, buffer_view->bo, 7);
        else
                *buffer_list = buffer_view->bo;
 }
@@ -555,7 +581,7 @@ static void write_buffer_descriptor(struct radv_device *device,
                                     const VkDescriptorBufferInfo *buffer_info)
 {
        RADV_FROM_HANDLE(radv_buffer, buffer, buffer_info->buffer);
-       uint64_t va = device->ws->buffer_get_va(buffer->bo);
+       uint64_t va = radv_buffer_get_va(buffer->bo);
        uint32_t range = buffer_info->range;
 
        if (buffer_info->range == VK_WHOLE_SIZE)
@@ -573,7 +599,7 @@ static void write_buffer_descriptor(struct radv_device *device,
                S_008F0C_DATA_FORMAT(V_008F0C_BUF_DATA_FORMAT_32);
 
        if (cmd_buffer)
-               device->ws->cs_add_buffer(cmd_buffer->cs, buffer->bo, 7);
+               radv_cs_add_buffer(device->ws, cmd_buffer->cs, buffer->bo, 7);
        else
                *buffer_list = buffer->bo;
 }
@@ -584,7 +610,7 @@ static void write_dynamic_buffer_descriptor(struct radv_device *device,
                                             const VkDescriptorBufferInfo *buffer_info)
 {
        RADV_FROM_HANDLE(radv_buffer, buffer, buffer_info->buffer);
-       uint64_t va = device->ws->buffer_get_va(buffer->bo);
+       uint64_t va = radv_buffer_get_va(buffer->bo);
        unsigned size = buffer_info->range;
 
        if (buffer_info->range == VK_WHOLE_SIZE)
@@ -606,17 +632,18 @@ write_image_descriptor(struct radv_device *device,
                       const VkDescriptorImageInfo *image_info)
 {
        RADV_FROM_HANDLE(radv_image_view, iview, image_info->imageView);
+       uint32_t *descriptor;
 
        if (descriptor_type == VK_DESCRIPTOR_TYPE_STORAGE_IMAGE) {
-               memcpy(dst, iview->storage_descriptor, 8 * 4);
-               memcpy(dst + 8, iview->storage_fmask_descriptor, 8 * 4);
+               descriptor = iview->storage_descriptor;
        } else {
-               memcpy(dst, iview->descriptor, 8 * 4);
-               memcpy(dst + 8, iview->fmask_descriptor, 8 * 4);
+               descriptor = iview->descriptor;
        }
 
+       memcpy(dst, descriptor, 16 * 4);
+
        if (cmd_buffer)
-               device->ws->cs_add_buffer(cmd_buffer->cs, iview->bo, 7);
+               radv_cs_add_buffer(device->ws, cmd_buffer->cs, iview->bo, 7);
        else
                *buffer_list = iview->bo;
 }
@@ -734,8 +761,59 @@ void radv_update_descriptor_sets(
                }
 
        }
-       if (descriptorCopyCount)
-               radv_finishme("copy descriptors");
+
+       for (i = 0; i < descriptorCopyCount; i++) {
+               const VkCopyDescriptorSet *copyset = &pDescriptorCopies[i];
+               RADV_FROM_HANDLE(radv_descriptor_set, src_set,
+                                copyset->srcSet);
+               RADV_FROM_HANDLE(radv_descriptor_set, dst_set,
+                                copyset->dstSet);
+               const struct radv_descriptor_set_binding_layout *src_binding_layout =
+                       src_set->layout->binding + copyset->srcBinding;
+               const struct radv_descriptor_set_binding_layout *dst_binding_layout =
+                       dst_set->layout->binding + copyset->dstBinding;
+               uint32_t *src_ptr = src_set->mapped_ptr;
+               uint32_t *dst_ptr = dst_set->mapped_ptr;
+               struct radeon_winsys_bo **src_buffer_list = src_set->descriptors;
+               struct radeon_winsys_bo **dst_buffer_list = dst_set->descriptors;
+
+               src_ptr += src_binding_layout->offset / 4;
+               dst_ptr += dst_binding_layout->offset / 4;
+
+               src_ptr += src_binding_layout->size * copyset->srcArrayElement / 4;
+               dst_ptr += dst_binding_layout->size * copyset->dstArrayElement / 4;
+
+               src_buffer_list += src_binding_layout->buffer_offset;
+               src_buffer_list += copyset->srcArrayElement;
+
+               dst_buffer_list += dst_binding_layout->buffer_offset;
+               dst_buffer_list += copyset->dstArrayElement;
+
+               for (j = 0; j < copyset->descriptorCount; ++j) {
+                       switch (src_binding_layout->type) {
+                       case VK_DESCRIPTOR_TYPE_UNIFORM_BUFFER_DYNAMIC:
+                       case VK_DESCRIPTOR_TYPE_STORAGE_BUFFER_DYNAMIC: {
+                               unsigned src_idx = copyset->srcArrayElement + j;
+                               unsigned dst_idx = copyset->dstArrayElement + j;
+                               struct radv_descriptor_range *src_range, *dst_range;
+                               src_idx += src_binding_layout->dynamic_offset_offset;
+                               dst_idx += dst_binding_layout->dynamic_offset_offset;
+
+                               src_range = src_set->dynamic_descriptors + src_idx;
+                               dst_range = dst_set->dynamic_descriptors + dst_idx;
+                               *dst_range = *src_range;
+                               break;
+                       }
+                       default:
+                               memcpy(dst_ptr, src_ptr, src_binding_layout->size);
+                       }
+                       src_ptr += src_binding_layout->size / 4;
+                       dst_ptr += dst_binding_layout->size / 4;
+                       dst_buffer_list[j] = src_buffer_list[j];
+                       ++src_buffer_list;
+                       ++dst_buffer_list;
+               }
+       }
 }
 
 void radv_UpdateDescriptorSets(