amd/common: cleanup DATA_FORMAT/NUM_FORMAT field names
[mesa.git] / src / amd / vulkan / radv_meta_resolve.c
index d4d3552f317a1676bb331a28c4e1dc15ebbdcc84..2b97c42fc6937127d5b5c4d11af5827f3a59ad3c 100644 (file)
@@ -251,24 +251,12 @@ radv_device_finish_meta_resolve_state(struct radv_device *device)
 
 }
 
-static VkFormat pipeline_formats[] = {
-       VK_FORMAT_R8G8B8A8_UNORM,
-       VK_FORMAT_R8G8B8A8_UINT,
-       VK_FORMAT_R8G8B8A8_SINT,
-       VK_FORMAT_A2R10G10B10_UINT_PACK32,
-       VK_FORMAT_A2R10G10B10_SINT_PACK32,
-       VK_FORMAT_R16G16B16A16_UNORM,
-       VK_FORMAT_R16G16B16A16_SNORM,
-       VK_FORMAT_R16G16B16A16_UINT,
-       VK_FORMAT_R16G16B16A16_SINT,
-       VK_FORMAT_R32_SFLOAT,
-       VK_FORMAT_R32G32_SFLOAT,
-       VK_FORMAT_R32G32B32A32_SFLOAT
-};
-
 VkResult
-radv_device_init_meta_resolve_state(struct radv_device *device)
+radv_device_init_meta_resolve_state(struct radv_device *device, bool on_demand)
 {
+       if (on_demand)
+               return VK_SUCCESS;
+
        VkResult res = VK_SUCCESS;
        struct radv_meta_state *state = &device->meta_state;
        struct radv_shader_module vs_module = { .nir = radv_meta_build_nir_vs_generate_vertices() };
@@ -278,8 +266,8 @@ radv_device_init_meta_resolve_state(struct radv_device *device)
                goto fail;
        }
 
-       for (uint32_t i = 0; i < ARRAY_SIZE(pipeline_formats); ++i) {
-               VkFormat format = pipeline_formats[i];
+       for (uint32_t i = 0; i < NUM_META_FS_KEYS; ++i) {
+               VkFormat format = radv_fs_key_format_exemplars[i];
                unsigned fs_key = radv_format_meta_fs_key(format);
                res = create_pass(device, format, &state->resolve.pass[fs_key]);
                if (res != VK_SUCCESS)
@@ -343,6 +331,7 @@ enum radv_resolve_method {
 };
 
 static void radv_pick_resolve_method_images(struct radv_image *src_image,
+                                           VkFormat src_format,
                                            struct radv_image *dest_image,
                                            VkImageLayout dest_image_layout,
                                            struct radv_cmd_buffer *cmd_buffer,
@@ -353,21 +342,53 @@ static void radv_pick_resolve_method_images(struct radv_image *src_image,
                                                           cmd_buffer->queue_family_index,
                                                           cmd_buffer->queue_family_index);
 
-       if (src_image->vk_format == VK_FORMAT_R16G16_UNORM ||
-           src_image->vk_format == VK_FORMAT_R16G16_SNORM)
+       if (src_format == VK_FORMAT_R16G16_UNORM ||
+           src_format == VK_FORMAT_R16G16_SNORM)
                *method = RESOLVE_COMPUTE;
-       else if (vk_format_is_int(src_image->vk_format))
+       else if (vk_format_is_int(src_format))
                *method = RESOLVE_COMPUTE;
-       else if (src_image->info.array_size > 1)
+       else if (src_image->info.array_size > 1 ||
+                dest_image->info.array_size > 1)
                *method = RESOLVE_COMPUTE;
        
        if (radv_layout_dcc_compressed(dest_image, dest_image_layout, queue_mask)) {
                *method = RESOLVE_FRAGMENT;
-       } else if (dest_image->surface.micro_tile_mode != src_image->surface.micro_tile_mode) {
+       } else if (dest_image->planes[0].surface.micro_tile_mode !=
+                  src_image->planes[0].surface.micro_tile_mode) {
                *method = RESOLVE_COMPUTE;
        }
 }
 
+static VkResult
+build_resolve_pipeline(struct radv_device *device,
+                       unsigned fs_key)
+{
+       VkResult result = VK_SUCCESS;
+
+       if (device->meta_state.resolve.pipeline[fs_key])
+               return result;
+
+       mtx_lock(&device->meta_state.mtx);
+       if (device->meta_state.resolve.pipeline[fs_key]) {
+               mtx_unlock(&device->meta_state.mtx);
+               return result;
+       }
+
+       struct radv_shader_module vs_module = { .nir = radv_meta_build_nir_vs_generate_vertices() };
+
+       result = create_pass(device, radv_fs_key_format_exemplars[fs_key], &device->meta_state.resolve.pass[fs_key]);
+       if (result != VK_SUCCESS)
+               goto fail;
+
+       VkShaderModule vs_module_h = radv_shader_module_to_handle(&vs_module);
+       result = create_pipeline(device, vs_module_h, &device->meta_state.resolve.pipeline[fs_key], device->meta_state.resolve.pass[fs_key]);
+
+fail:
+       ralloc_free(vs_module.nir);
+       mtx_unlock(&device->meta_state.mtx);
+       return result;
+}
+
 void radv_CmdResolveImage(
        VkCommandBuffer                             cmd_buffer_h,
        VkImage                                     src_image_h,
@@ -402,9 +423,9 @@ void radv_CmdResolveImage(
        } else
                resolve_method = RESOLVE_COMPUTE;
 
-       radv_pick_resolve_method_images(src_image, dest_image,
-                                       dest_image_layout, cmd_buffer,
-                                       &resolve_method);
+       radv_pick_resolve_method_images(src_image, src_image->vk_format,
+                                       dest_image, dest_image_layout,
+                                       cmd_buffer, &resolve_method);
 
        if (resolve_method == RESOLVE_FRAGMENT) {
                radv_meta_resolve_fragment_image(cmd_buffer,
@@ -419,8 +440,10 @@ void radv_CmdResolveImage(
        if (resolve_method == RESOLVE_COMPUTE) {
                radv_meta_resolve_compute_image(cmd_buffer,
                                                src_image,
+                                               src_image->vk_format,
                                                src_image_layout,
                                                dest_image,
+                                               dest_image->vk_format,
                                                dest_image_layout,
                                                region_count, regions);
                return;
@@ -437,14 +460,6 @@ void radv_CmdResolveImage(
        }
        assert(dest_image->info.samples == 1);
 
-       if (src_image->info.samples >= 16) {
-               /* See commit aa3f9aaf31e9056a255f9e0472ebdfdaa60abe54 for the
-                * glBlitFramebuffer workaround for samples >= 16.
-                */
-               radv_finishme("vkCmdResolveImage: need interpolation workaround when "
-                             "samples >= 16");
-       }
-
        if (src_image->info.array_size > 1)
                radv_finishme("vkCmdResolveImage: multisample array images");
 
@@ -498,6 +513,12 @@ void radv_CmdResolveImage(
                for (uint32_t layer = 0; layer < region->srcSubresource.layerCount;
                     ++layer) {
 
+                       VkResult ret = build_resolve_pipeline(device, fs_key);
+                       if (ret != VK_SUCCESS) {
+                               cmd_buffer->record_result = ret;
+                               break;
+                       }
+
                        struct radv_image_view src_iview;
                        radv_image_view_init(&src_iview, cmd_buffer->device,
                                             &(VkImageViewCreateInfo) {
@@ -600,30 +621,27 @@ radv_cmd_buffer_resolve_subpass(struct radv_cmd_buffer *cmd_buffer)
        struct radv_meta_saved_state saved_state;
        enum radv_resolve_method resolve_method = RESOLVE_HW;
 
-       /* FINISHME(perf): Skip clears for resolve attachments.
-        *
-        * From the Vulkan 1.0 spec:
-        *
-        *    If the first use of an attachment in a render pass is as a resolve
-        *    attachment, then the loadOp is effectively ignored as the resolve is
-        *    guaranteed to overwrite all pixels in the render area.
-        */
-
        if (!subpass->has_resolve)
                return;
 
        for (uint32_t i = 0; i < subpass->color_count; ++i) {
-               VkAttachmentReference src_att = subpass->color_attachments[i];
-               VkAttachmentReference dest_att = subpass->resolve_attachments[i];
+               struct radv_subpass_attachment src_att = subpass->color_attachments[i];
+               struct radv_subpass_attachment dest_att = subpass->resolve_attachments[i];
 
-               if (src_att.attachment == VK_ATTACHMENT_UNUSED ||
-                   dest_att.attachment == VK_ATTACHMENT_UNUSED)
+               if (dest_att.attachment == VK_ATTACHMENT_UNUSED)
                        continue;
 
+               /* Make sure to not clear color attachments after resolves. */
+               cmd_buffer->state.attachments[dest_att.attachment].pending_clear_aspects = 0;
+
                struct radv_image *dst_img = cmd_buffer->state.framebuffer->attachments[dest_att.attachment].attachment->image;
-               struct radv_image *src_img = cmd_buffer->state.framebuffer->attachments[src_att.attachment].attachment->image;
+               struct radv_image_view *src_iview= cmd_buffer->state.framebuffer->attachments[src_att.attachment].attachment;
+               struct radv_image *src_img = src_iview->image;
+
+               radv_pick_resolve_method_images(src_img, src_iview->vk_format,
+                                               dst_img, dest_att.layout,
+                                               cmd_buffer, &resolve_method);
 
-               radv_pick_resolve_method_images(src_img, dst_img, dest_att.layout, cmd_buffer, &resolve_method);
                if (resolve_method == RESOLVE_FRAGMENT) {
                        break;
                }
@@ -641,14 +659,14 @@ radv_cmd_buffer_resolve_subpass(struct radv_cmd_buffer *cmd_buffer)
                       RADV_META_SAVE_GRAPHICS_PIPELINE);
 
        for (uint32_t i = 0; i < subpass->color_count; ++i) {
-               VkAttachmentReference src_att = subpass->color_attachments[i];
-               VkAttachmentReference dest_att = subpass->resolve_attachments[i];
+               struct radv_subpass_attachment src_att = subpass->color_attachments[i];
+               struct radv_subpass_attachment dest_att = subpass->resolve_attachments[i];
 
-               if (src_att.attachment == VK_ATTACHMENT_UNUSED ||
-                   dest_att.attachment == VK_ATTACHMENT_UNUSED)
+               if (dest_att.attachment == VK_ATTACHMENT_UNUSED)
                        continue;
 
-               struct radv_image *dst_img = cmd_buffer->state.framebuffer->attachments[dest_att.attachment].attachment->image;
+               struct radv_image_view *dest_iview = cmd_buffer->state.framebuffer->attachments[dest_att.attachment].attachment;
+               struct radv_image *dst_img = dest_iview->image;
 
                if (radv_image_has_dcc(dst_img)) {
                        radv_initialize_dcc(cmd_buffer, dst_img, 0xffffffff);
@@ -657,19 +675,26 @@ radv_cmd_buffer_resolve_subpass(struct radv_cmd_buffer *cmd_buffer)
 
                struct radv_subpass resolve_subpass = {
                        .color_count = 2,
-                       .color_attachments = (VkAttachmentReference[]) { src_att, dest_att },
-                       .depth_stencil_attachment = { .attachment = VK_ATTACHMENT_UNUSED },
+                       .color_attachments = (struct radv_subpass_attachment[]) { src_att, dest_att },
+                       .depth_stencil_attachment = NULL,
                };
 
-               radv_cmd_buffer_set_subpass(cmd_buffer, &resolve_subpass, false);
+               radv_cmd_buffer_set_subpass(cmd_buffer, &resolve_subpass);
+
+               VkResult ret = build_resolve_pipeline(cmd_buffer->device, radv_format_meta_fs_key(dest_iview->vk_format));
+               if (ret != VK_SUCCESS) {
+                       cmd_buffer->record_result = ret;
+                       continue;
+               }
 
                emit_resolve(cmd_buffer,
-                            dst_img->vk_format,
+                            dest_iview->vk_format,
                             &(VkOffset2D) { 0, 0 },
                             &(VkExtent2D) { fb->width, fb->height });
        }
 
-       cmd_buffer->state.subpass = subpass;
+       radv_cmd_buffer_set_subpass(cmd_buffer, subpass);
+
        radv_meta_restore(&saved_state, cmd_buffer);
 }
 
@@ -684,11 +709,10 @@ radv_decompress_resolve_subpass_src(struct radv_cmd_buffer *cmd_buffer)
        struct radv_framebuffer *fb = cmd_buffer->state.framebuffer;
 
        for (uint32_t i = 0; i < subpass->color_count; ++i) {
-               VkAttachmentReference src_att = subpass->color_attachments[i];
-               VkAttachmentReference dest_att = subpass->resolve_attachments[i];
+               struct radv_subpass_attachment src_att = subpass->color_attachments[i];
+               struct radv_subpass_attachment dest_att = subpass->resolve_attachments[i];
 
-               if (src_att.attachment == VK_ATTACHMENT_UNUSED ||
-                   dest_att.attachment == VK_ATTACHMENT_UNUSED)
+               if (dest_att.attachment == VK_ATTACHMENT_UNUSED)
                        continue;
 
                struct radv_image *src_image =