radv: get rid of buffer object priorities
[mesa.git] / src / amd / vulkan / radv_descriptor_set.c
index 55b4aaa388cc83e2c286a51a094bfc5bf45afb1c..c4341f6ac52288b0f38918f1d302978f04b58767 100644 (file)
@@ -95,7 +95,7 @@ VkResult radv_CreateDescriptorSetLayout(
        set_layout = vk_alloc2(&device->alloc, pAllocator, size, 8,
                                 VK_SYSTEM_ALLOCATION_SCOPE_OBJECT);
        if (!set_layout)
-               return vk_error(VK_ERROR_OUT_OF_HOST_MEMORY);
+               return vk_error(device->instance, VK_ERROR_OUT_OF_HOST_MEMORY);
 
        set_layout->flags = pCreateInfo->flags;
 
@@ -106,7 +106,7 @@ VkResult radv_CreateDescriptorSetLayout(
                                                                        pCreateInfo->bindingCount);
        if (!bindings) {
                vk_free2(&device->alloc, pAllocator, set_layout);
-               return vk_error(VK_ERROR_OUT_OF_HOST_MEMORY);
+               return vk_error(device->instance, VK_ERROR_OUT_OF_HOST_MEMORY);
        }
 
        set_layout->binding_count = max_binding + 1;
@@ -117,12 +117,14 @@ VkResult radv_CreateDescriptorSetLayout(
 
        memset(set_layout->binding, 0, size - sizeof(struct radv_descriptor_set_layout));
 
+       uint32_t buffer_count = 0;
        uint32_t dynamic_offset_count = 0;
 
        for (uint32_t j = 0; j < pCreateInfo->bindingCount; j++) {
                const VkDescriptorSetLayoutBinding *binding = bindings + j;
                uint32_t b = binding->binding;
                uint32_t alignment;
+               unsigned binding_buffer_count = 0;
 
                switch (binding->descriptorType) {
                case VK_DESCRIPTOR_TYPE_UNIFORM_BUFFER_DYNAMIC:
@@ -131,6 +133,7 @@ VkResult radv_CreateDescriptorSetLayout(
                        set_layout->binding[b].dynamic_offset_count = 1;
                        set_layout->dynamic_shader_stages |= binding->stageFlags;
                        set_layout->binding[b].size = 0;
+                       binding_buffer_count = 1;
                        alignment = 1;
                        break;
                case VK_DESCRIPTOR_TYPE_UNIFORM_BUFFER:
@@ -138,6 +141,7 @@ VkResult radv_CreateDescriptorSetLayout(
                case VK_DESCRIPTOR_TYPE_UNIFORM_TEXEL_BUFFER:
                case VK_DESCRIPTOR_TYPE_STORAGE_TEXEL_BUFFER:
                        set_layout->binding[b].size = 16;
+                       binding_buffer_count = 1;
                        alignment = 16;
                        break;
                case VK_DESCRIPTOR_TYPE_STORAGE_IMAGE:
@@ -145,11 +149,13 @@ VkResult radv_CreateDescriptorSetLayout(
                case VK_DESCRIPTOR_TYPE_INPUT_ATTACHMENT:
                        /* main descriptor + fmask descriptor */
                        set_layout->binding[b].size = 64;
+                       binding_buffer_count = 1;
                        alignment = 32;
                        break;
                case VK_DESCRIPTOR_TYPE_COMBINED_IMAGE_SAMPLER:
                        /* main descriptor + fmask descriptor + sampler */
                        set_layout->binding[b].size = 96;
+                       binding_buffer_count = 1;
                        alignment = 32;
                        break;
                case VK_DESCRIPTOR_TYPE_SAMPLER:
@@ -165,6 +171,7 @@ VkResult radv_CreateDescriptorSetLayout(
                set_layout->binding[b].type = binding->descriptorType;
                set_layout->binding[b].array_size = binding->descriptorCount;
                set_layout->binding[b].offset = set_layout->size;
+               set_layout->binding[b].buffer_offset = buffer_count;
                set_layout->binding[b].dynamic_offset_offset = dynamic_offset_count;
 
                if (variable_flags && binding->binding < variable_flags->bindingCount &&
@@ -197,6 +204,7 @@ VkResult radv_CreateDescriptorSetLayout(
                }
 
                set_layout->size += binding->descriptorCount * set_layout->binding[b].size;
+               buffer_count += binding->descriptorCount * binding_buffer_count;
                dynamic_offset_count += binding->descriptorCount *
                        set_layout->binding[b].dynamic_offset_count;
                set_layout->shader_stages |= binding->stageFlags;
@@ -204,6 +212,7 @@ VkResult radv_CreateDescriptorSetLayout(
 
        free(bindings);
 
+       set_layout->buffer_count = buffer_count;
        set_layout->dynamic_offset_count = dynamic_offset_count;
 
        *pSetLayout = radv_descriptor_set_layout_to_handle(set_layout);
@@ -313,7 +322,7 @@ void radv_GetDescriptorSetLayoutSupport(VkDevice device,
 
 /*
  * Pipeline layouts.  These have nothing to do with the pipeline.  They are
- * just muttiple descriptor set layouts pasted together
+ * just multiple descriptor set layouts pasted together.
  */
 
 VkResult radv_CreatePipelineLayout(
@@ -331,7 +340,7 @@ VkResult radv_CreatePipelineLayout(
        layout = vk_alloc2(&device->alloc, pAllocator, sizeof(*layout), 8,
                             VK_SYSTEM_ALLOCATION_SCOPE_OBJECT);
        if (layout == NULL)
-               return vk_error(VK_ERROR_OUT_OF_HOST_MEMORY);
+               return vk_error(device->instance, VK_ERROR_OUT_OF_HOST_MEMORY);
 
        layout->num_sets = pCreateInfo->setLayoutCount;
 
@@ -396,13 +405,14 @@ radv_descriptor_set_create(struct radv_device *device,
                           struct radv_descriptor_set **out_set)
 {
        struct radv_descriptor_set *set;
-       unsigned range_offset = sizeof(struct radv_descriptor_set);
+       unsigned range_offset = sizeof(struct radv_descriptor_set) +
+               sizeof(struct radeon_winsys_bo *) * layout->buffer_count;
        unsigned mem_size = range_offset +
                sizeof(struct radv_descriptor_range) * layout->dynamic_offset_count;
 
        if (pool->host_memory_base) {
                if (pool->host_memory_end - pool->host_memory_ptr < mem_size)
-                       return vk_error(VK_ERROR_OUT_OF_POOL_MEMORY_KHR);
+                       return vk_error(device->instance, VK_ERROR_OUT_OF_POOL_MEMORY_KHR);
 
                set = (struct radv_descriptor_set*)pool->host_memory_ptr;
                pool->host_memory_ptr += mem_size;
@@ -411,7 +421,7 @@ radv_descriptor_set_create(struct radv_device *device,
                                VK_SYSTEM_ALLOCATION_SCOPE_OBJECT);
 
                if (!set)
-                       return vk_error(VK_ERROR_OUT_OF_HOST_MEMORY);
+                       return vk_error(device->instance, VK_ERROR_OUT_OF_HOST_MEMORY);
        }
 
        memset(set, 0, mem_size);
@@ -427,7 +437,7 @@ radv_descriptor_set_create(struct radv_device *device,
 
                if (!pool->host_memory_base && pool->entry_count == pool->max_entry_count) {
                        vk_free2(&device->alloc, NULL, set);
-                       return vk_error(VK_ERROR_OUT_OF_POOL_MEMORY_KHR);
+                       return vk_error(device->instance, VK_ERROR_OUT_OF_POOL_MEMORY_KHR);
                }
 
                /* try to allocate linearly first, so that we don't spend
@@ -456,7 +466,7 @@ radv_descriptor_set_create(struct radv_device *device,
 
                        if (pool->size - offset < layout_size) {
                                vk_free2(&device->alloc, NULL, set);
-                               return vk_error(VK_ERROR_OUT_OF_POOL_MEMORY_KHR);
+                               return vk_error(device->instance, VK_ERROR_OUT_OF_POOL_MEMORY_KHR);
                        }
                        set->bo = pool->bo;
                        set->mapped_ptr = (uint32_t*)(pool->mapped_ptr + offset);
@@ -468,7 +478,7 @@ radv_descriptor_set_create(struct radv_device *device,
                        pool->entries[index].set = set;
                        pool->entry_count++;
                } else
-                       return vk_error(VK_ERROR_OUT_OF_POOL_MEMORY_KHR);
+                       return vk_error(device->instance, VK_ERROR_OUT_OF_POOL_MEMORY_KHR);
        }
 
        if (layout->has_immutable_samplers) {
@@ -570,7 +580,7 @@ VkResult radv_CreateDescriptorPool(
        pool = vk_alloc2(&device->alloc, pAllocator, size, 8,
                         VK_SYSTEM_ALLOCATION_SCOPE_OBJECT);
        if (!pool)
-               return vk_error(VK_ERROR_OUT_OF_HOST_MEMORY);
+               return vk_error(device->instance, VK_ERROR_OUT_OF_HOST_MEMORY);
 
        memset(pool, 0, sizeof(*pool));
 
@@ -584,7 +594,8 @@ VkResult radv_CreateDescriptorPool(
                pool->bo = device->ws->buffer_create(device->ws, bo_size, 32,
                                                     RADEON_DOMAIN_VRAM,
                                                     RADEON_FLAG_NO_INTERPROCESS_SHARING |
-                                                    RADEON_FLAG_READ_ONLY);
+                                                    RADEON_FLAG_READ_ONLY |
+                                                    RADEON_FLAG_32BIT);
                pool->mapped_ptr = (uint8_t*)device->ws->buffer_map(pool->bo);
        }
        pool->size = bo_size;
@@ -700,16 +711,25 @@ VkResult radv_FreeDescriptorSets(
 }
 
 static void write_texel_buffer_descriptor(struct radv_device *device,
+                                         struct radv_cmd_buffer *cmd_buffer,
                                          unsigned *dst,
+                                         struct radeon_winsys_bo **buffer_list,
                                          const VkBufferView _buffer_view)
 {
        RADV_FROM_HANDLE(radv_buffer_view, buffer_view, _buffer_view);
 
        memcpy(dst, buffer_view->state, 4 * 4);
+
+       if (cmd_buffer)
+               radv_cs_add_buffer(device->ws, cmd_buffer->cs, buffer_view->bo);
+       else
+               *buffer_list = buffer_view->bo;
 }
 
 static void write_buffer_descriptor(struct radv_device *device,
+                                    struct radv_cmd_buffer *cmd_buffer,
                                     unsigned *dst,
+                                    struct radeon_winsys_bo **buffer_list,
                                     const VkDescriptorBufferInfo *buffer_info)
 {
        RADV_FROM_HANDLE(radv_buffer, buffer, buffer_info->buffer);
@@ -730,10 +750,15 @@ static void write_buffer_descriptor(struct radv_device *device,
                S_008F0C_NUM_FORMAT(V_008F0C_BUF_NUM_FORMAT_FLOAT) |
                S_008F0C_DATA_FORMAT(V_008F0C_BUF_DATA_FORMAT_32);
 
+       if (cmd_buffer)
+               radv_cs_add_buffer(device->ws, cmd_buffer->cs, buffer->bo);
+       else
+               *buffer_list = buffer->bo;
 }
 
 static void write_dynamic_buffer_descriptor(struct radv_device *device,
                                             struct radv_descriptor_range *range,
+                                            struct radeon_winsys_bo **buffer_list,
                                             const VkDescriptorBufferInfo *buffer_info)
 {
        RADV_FROM_HANDLE(radv_buffer, buffer, buffer_info->buffer);
@@ -746,11 +771,15 @@ static void write_dynamic_buffer_descriptor(struct radv_device *device,
        va += buffer_info->offset + buffer->offset;
        range->va = va;
        range->size = size;
+
+       *buffer_list = buffer->bo;
 }
 
 static void
 write_image_descriptor(struct radv_device *device,
+                      struct radv_cmd_buffer *cmd_buffer,
                       unsigned *dst,
+                      struct radeon_winsys_bo **buffer_list,
                       VkDescriptorType descriptor_type,
                       const VkDescriptorImageInfo *image_info)
 {
@@ -764,18 +793,25 @@ write_image_descriptor(struct radv_device *device,
        }
 
        memcpy(dst, descriptor, 16 * 4);
+
+       if (cmd_buffer)
+               radv_cs_add_buffer(device->ws, cmd_buffer->cs, iview->bo);
+       else
+               *buffer_list = iview->bo;
 }
 
 static void
 write_combined_image_sampler_descriptor(struct radv_device *device,
+                                       struct radv_cmd_buffer *cmd_buffer,
                                        unsigned *dst,
+                                       struct radeon_winsys_bo **buffer_list,
                                        VkDescriptorType descriptor_type,
                                        const VkDescriptorImageInfo *image_info,
                                        bool has_sampler)
 {
        RADV_FROM_HANDLE(radv_sampler, sampler, image_info->sampler);
 
-       write_image_descriptor(device, dst, descriptor_type, image_info);
+       write_image_descriptor(device, cmd_buffer, dst, buffer_list, descriptor_type, image_info);
        /* copy over sampler state */
        if (has_sampler)
                memcpy(dst + 16, sampler->state, 16);
@@ -808,7 +844,7 @@ void radv_update_descriptor_sets(
                const struct radv_descriptor_set_binding_layout *binding_layout =
                        set->layout->binding + writeset->dstBinding;
                uint32_t *ptr = set->mapped_ptr;
-
+               struct radeon_winsys_bo **buffer_list =  set->descriptors;
                /* Immutable samplers are not copied into push descriptors when they are
                 * allocated, so if we are writing push descriptors we have to copy the
                 * immutable samplers into them now.
@@ -819,6 +855,8 @@ void radv_update_descriptor_sets(
 
                ptr += binding_layout->offset / 4;
                ptr += binding_layout->size * writeset->dstArrayElement / 4;
+               buffer_list += binding_layout->buffer_offset;
+               buffer_list += writeset->dstArrayElement;
                for (j = 0; j < writeset->descriptorCount; ++j) {
                        switch(writeset->descriptorType) {
                        case VK_DESCRIPTOR_TYPE_UNIFORM_BUFFER_DYNAMIC:
@@ -827,25 +865,28 @@ void radv_update_descriptor_sets(
                                idx += binding_layout->dynamic_offset_offset;
                                assert(!(set->layout->flags & VK_DESCRIPTOR_SET_LAYOUT_CREATE_PUSH_DESCRIPTOR_BIT_KHR));
                                write_dynamic_buffer_descriptor(device, set->dynamic_descriptors + idx,
-                                                               writeset->pBufferInfo + j);
+                                                               buffer_list, writeset->pBufferInfo + j);
                                break;
                        }
                        case VK_DESCRIPTOR_TYPE_UNIFORM_BUFFER:
                        case VK_DESCRIPTOR_TYPE_STORAGE_BUFFER:
-                               write_buffer_descriptor(device, ptr, writeset->pBufferInfo + j);
+                               write_buffer_descriptor(device, cmd_buffer, ptr, buffer_list,
+                                                       writeset->pBufferInfo + j);
                                break;
                        case VK_DESCRIPTOR_TYPE_UNIFORM_TEXEL_BUFFER:
                        case VK_DESCRIPTOR_TYPE_STORAGE_TEXEL_BUFFER:
-                               write_texel_buffer_descriptor(device, ptr, writeset->pTexelBufferView[j]);
+                               write_texel_buffer_descriptor(device, cmd_buffer, ptr, buffer_list,
+                                                             writeset->pTexelBufferView[j]);
                                break;
                        case VK_DESCRIPTOR_TYPE_SAMPLED_IMAGE:
                        case VK_DESCRIPTOR_TYPE_STORAGE_IMAGE:
                        case VK_DESCRIPTOR_TYPE_INPUT_ATTACHMENT:
-                               write_image_descriptor(device, ptr, writeset->descriptorType,
+                               write_image_descriptor(device, cmd_buffer, ptr, buffer_list,
+                                                      writeset->descriptorType,
                                                       writeset->pImageInfo + j);
                                break;
                        case VK_DESCRIPTOR_TYPE_COMBINED_IMAGE_SAMPLER:
-                               write_combined_image_sampler_descriptor(device, ptr,
+                               write_combined_image_sampler_descriptor(device, cmd_buffer, ptr, buffer_list,
                                                                        writeset->descriptorType,
                                                                        writeset->pImageInfo + j,
                                                                        !binding_layout->immutable_samplers_offset);
@@ -868,6 +909,7 @@ void radv_update_descriptor_sets(
                                break;
                        }
                        ptr += binding_layout->size / 4;
+                       ++buffer_list;
                }
 
        }
@@ -884,6 +926,8 @@ void radv_update_descriptor_sets(
                        dst_set->layout->binding + copyset->dstBinding;
                uint32_t *src_ptr = src_set->mapped_ptr;
                uint32_t *dst_ptr = dst_set->mapped_ptr;
+               struct radeon_winsys_bo **src_buffer_list = src_set->descriptors;
+               struct radeon_winsys_bo **dst_buffer_list = dst_set->descriptors;
 
                src_ptr += src_binding_layout->offset / 4;
                dst_ptr += dst_binding_layout->offset / 4;
@@ -891,6 +935,12 @@ void radv_update_descriptor_sets(
                src_ptr += src_binding_layout->size * copyset->srcArrayElement / 4;
                dst_ptr += dst_binding_layout->size * copyset->dstArrayElement / 4;
 
+               src_buffer_list += src_binding_layout->buffer_offset;
+               src_buffer_list += copyset->srcArrayElement;
+
+               dst_buffer_list += dst_binding_layout->buffer_offset;
+               dst_buffer_list += copyset->dstArrayElement;
+
                for (j = 0; j < copyset->descriptorCount; ++j) {
                        switch (src_binding_layout->type) {
                        case VK_DESCRIPTOR_TYPE_UNIFORM_BUFFER_DYNAMIC:
@@ -911,6 +961,9 @@ void radv_update_descriptor_sets(
                        }
                        src_ptr += src_binding_layout->size / 4;
                        dst_ptr += dst_binding_layout->size / 4;
+                       dst_buffer_list[j] = src_buffer_list[j];
+                       ++src_buffer_list;
+                       ++dst_buffer_list;
                }
        }
 }
@@ -943,7 +996,7 @@ VkResult radv_CreateDescriptorUpdateTemplate(VkDevice _device,
 
        templ = vk_alloc2(&device->alloc, pAllocator, size, 8, VK_SYSTEM_ALLOCATION_SCOPE_OBJECT);
        if (!templ)
-               return vk_error(VK_ERROR_OUT_OF_HOST_MEMORY);
+               return vk_error(device->instance, VK_ERROR_OUT_OF_HOST_MEMORY);
 
        templ->entry_count = entry_count;
        templ->bind_point = pCreateInfo->pipelineBindPoint;
@@ -952,6 +1005,7 @@ VkResult radv_CreateDescriptorUpdateTemplate(VkDevice _device,
                const VkDescriptorUpdateTemplateEntryKHR *entry = &pCreateInfo->pDescriptorUpdateEntries[i];
                const struct radv_descriptor_set_binding_layout *binding_layout =
                        set_layout->binding + entry->dstBinding;
+               const uint32_t buffer_offset = binding_layout->buffer_offset + entry->dstArrayElement;
                const uint32_t *immutable_samplers = NULL;
                uint32_t dst_offset;
                uint32_t dst_stride;
@@ -990,6 +1044,7 @@ VkResult radv_CreateDescriptorUpdateTemplate(VkDevice _device,
                        .src_stride = entry->stride,
                        .dst_offset = dst_offset,
                        .dst_stride = dst_stride,
+                       .buffer_offset = buffer_offset,
                        .has_sampler = !binding_layout->immutable_samplers_offset,
                        .immutable_samplers = immutable_samplers
                };
@@ -1022,6 +1077,7 @@ void radv_update_descriptor_set_with_template(struct radv_device *device,
        uint32_t i;
 
        for (i = 0; i < templ->entry_count; ++i) {
+               struct radeon_winsys_bo **buffer_list = set->descriptors + templ->entry[i].buffer_offset;
                uint32_t *pDst = set->mapped_ptr + templ->entry[i].dst_offset;
                const uint8_t *pSrc = ((const uint8_t *) pData) + templ->entry[i].src_offset;
                uint32_t j;
@@ -1033,28 +1089,28 @@ void radv_update_descriptor_set_with_template(struct radv_device *device,
                                const unsigned idx = templ->entry[i].dst_offset + j;
                                assert(!(set->layout->flags & VK_DESCRIPTOR_SET_LAYOUT_CREATE_PUSH_DESCRIPTOR_BIT_KHR));
                                write_dynamic_buffer_descriptor(device, set->dynamic_descriptors + idx,
-                                                               (struct VkDescriptorBufferInfo *) pSrc);
+                                                               buffer_list, (struct VkDescriptorBufferInfo *) pSrc);
                                break;
                        }
                        case VK_DESCRIPTOR_TYPE_UNIFORM_BUFFER:
                        case VK_DESCRIPTOR_TYPE_STORAGE_BUFFER:
-                               write_buffer_descriptor(device, pDst,
+                               write_buffer_descriptor(device, cmd_buffer, pDst, buffer_list,
                                                        (struct VkDescriptorBufferInfo *) pSrc);
                                break;
                        case VK_DESCRIPTOR_TYPE_UNIFORM_TEXEL_BUFFER:
                        case VK_DESCRIPTOR_TYPE_STORAGE_TEXEL_BUFFER:
-                               write_texel_buffer_descriptor(device, pDst,
+                               write_texel_buffer_descriptor(device, cmd_buffer, pDst, buffer_list,
                                                              *(VkBufferView *) pSrc);
                                break;
                        case VK_DESCRIPTOR_TYPE_SAMPLED_IMAGE:
                        case VK_DESCRIPTOR_TYPE_STORAGE_IMAGE:
                        case VK_DESCRIPTOR_TYPE_INPUT_ATTACHMENT:
-                               write_image_descriptor(device, pDst,
+                               write_image_descriptor(device, cmd_buffer, pDst, buffer_list,
                                                       templ->entry[i].descriptor_type,
                                                       (struct VkDescriptorImageInfo *) pSrc);
                                break;
                        case VK_DESCRIPTOR_TYPE_COMBINED_IMAGE_SAMPLER:
-                               write_combined_image_sampler_descriptor(device, pDst,
+                               write_combined_image_sampler_descriptor(device, cmd_buffer, pDst, buffer_list,
                                                                        templ->entry[i].descriptor_type,
                                                                        (struct VkDescriptorImageInfo *) pSrc,
                                                                        templ->entry[i].has_sampler);
@@ -1074,6 +1130,7 @@ void radv_update_descriptor_set_with_template(struct radv_device *device,
                        }
                        pSrc += templ->entry[i].src_stride;
                        pDst += templ->entry[i].dst_stride;
+                       ++buffer_list;
                }
        }
 }