radv: Don't expose heaps with 0 memory.
[mesa.git] / src / amd / vulkan / radv_device.c
index e6d595dfbe5e33a45cf597c83fa44136112de69e..e34b19c648a033ffddfcdfe856a5fba0a74db040 100644 (file)
@@ -76,178 +76,6 @@ radv_get_device_uuid(struct radeon_info *info, void *uuid)
        ac_compute_device_uuid(info, uuid, VK_UUID_SIZE);
 }
 
-static const VkExtensionProperties instance_extensions[] = {
-       {
-               .extensionName = VK_KHR_SURFACE_EXTENSION_NAME,
-               .specVersion = 25,
-       },
-#ifdef VK_USE_PLATFORM_XCB_KHR
-       {
-               .extensionName = VK_KHR_XCB_SURFACE_EXTENSION_NAME,
-               .specVersion = 6,
-       },
-#endif
-#ifdef VK_USE_PLATFORM_XLIB_KHR
-       {
-               .extensionName = VK_KHR_XLIB_SURFACE_EXTENSION_NAME,
-               .specVersion = 6,
-       },
-#endif
-#ifdef VK_USE_PLATFORM_WAYLAND_KHR
-       {
-               .extensionName = VK_KHR_WAYLAND_SURFACE_EXTENSION_NAME,
-               .specVersion = 6,
-       },
-#endif
-       {
-               .extensionName = VK_KHR_GET_PHYSICAL_DEVICE_PROPERTIES_2_EXTENSION_NAME,
-               .specVersion = 1,
-       },
-       {
-               .extensionName = VK_KHR_EXTERNAL_MEMORY_CAPABILITIES_EXTENSION_NAME,
-               .specVersion = 1,
-       },
-       {
-               .extensionName = VK_KHR_EXTERNAL_SEMAPHORE_CAPABILITIES_EXTENSION_NAME,
-               .specVersion = 1,
-       },
-};
-
-static const VkExtensionProperties common_device_extensions[] = {
-       {
-               .extensionName = VK_KHR_DESCRIPTOR_UPDATE_TEMPLATE_EXTENSION_NAME,
-               .specVersion = 1,
-       },
-       {
-               .extensionName = VK_KHR_INCREMENTAL_PRESENT_EXTENSION_NAME,
-               .specVersion = 1,
-       },
-       {
-               .extensionName = VK_KHR_MAINTENANCE1_EXTENSION_NAME,
-               .specVersion = 1,
-       },
-       {
-               .extensionName = VK_KHR_PUSH_DESCRIPTOR_EXTENSION_NAME,
-               .specVersion = 1,
-       },
-       {
-               .extensionName = VK_KHR_SAMPLER_MIRROR_CLAMP_TO_EDGE_EXTENSION_NAME,
-               .specVersion = 1,
-       },
-       {
-               .extensionName = VK_KHR_SWAPCHAIN_EXTENSION_NAME,
-               .specVersion = 68,
-       },
-       {
-               .extensionName = VK_AMD_DRAW_INDIRECT_COUNT_EXTENSION_NAME,
-               .specVersion = 1,
-       },
-       {
-               .extensionName = VK_KHR_SHADER_DRAW_PARAMETERS_EXTENSION_NAME,
-               .specVersion = 1,
-       },
-       {
-               .extensionName = VK_KHR_GET_MEMORY_REQUIREMENTS_2_EXTENSION_NAME,
-               .specVersion = 1,
-       },
-       {
-               .extensionName = VK_KHR_DEDICATED_ALLOCATION_EXTENSION_NAME,
-               .specVersion = 1,
-       },
-       {
-               .extensionName = VK_KHR_EXTERNAL_MEMORY_EXTENSION_NAME,
-               .specVersion = 1,
-       },
-       {
-               .extensionName = VK_KHR_EXTERNAL_MEMORY_FD_EXTENSION_NAME,
-               .specVersion = 1,
-       },
-       {
-               .extensionName = VK_KHR_STORAGE_BUFFER_STORAGE_CLASS_EXTENSION_NAME,
-               .specVersion = 1,
-       },
-       {
-               .extensionName = VK_KHR_VARIABLE_POINTERS_EXTENSION_NAME,
-               .specVersion = 1,
-       },
-       {
-               .extensionName = VK_KHR_IMAGE_FORMAT_LIST_EXTENSION_NAME,
-               .specVersion = 1,
-       },
-};
-static const VkExtensionProperties ext_sema_device_extensions[] = {
-       {
-               .extensionName = VK_KHR_EXTERNAL_SEMAPHORE_EXTENSION_NAME,
-               .specVersion = 1,
-       },
-       {
-               .extensionName = VK_KHR_EXTERNAL_SEMAPHORE_FD_EXTENSION_NAME,
-               .specVersion = 1,
-       },
-       {
-               .extensionName = VK_KHX_MULTIVIEW_EXTENSION_NAME,
-               .specVersion = 1,
-       },
-};
-
-static VkResult
-radv_extensions_register(struct radv_instance *instance,
-                       struct radv_extensions *extensions,
-                       const VkExtensionProperties *new_ext,
-                       uint32_t num_ext)
-{
-       size_t new_size;
-       VkExtensionProperties *new_ptr;
-
-       assert(new_ext && num_ext > 0);
-
-       if (!new_ext)
-               return VK_ERROR_INITIALIZATION_FAILED;
-
-       new_size = (extensions->num_ext + num_ext) * sizeof(VkExtensionProperties);
-       new_ptr = vk_realloc(&instance->alloc, extensions->ext_array,
-                               new_size, 8, VK_SYSTEM_ALLOCATION_SCOPE_INSTANCE);
-
-       /* Old array continues to be valid, update nothing */
-       if (!new_ptr)
-               return VK_ERROR_OUT_OF_HOST_MEMORY;
-
-       memcpy(&new_ptr[extensions->num_ext], new_ext,
-               num_ext * sizeof(VkExtensionProperties));
-       extensions->ext_array = new_ptr;
-       extensions->num_ext += num_ext;
-
-       return VK_SUCCESS;
-}
-
-static void
-radv_extensions_finish(struct radv_instance *instance,
-                       struct radv_extensions *extensions)
-{
-       assert(extensions);
-
-       if (!extensions)
-               radv_loge("Attemted to free invalid extension struct\n");
-
-       if (extensions->ext_array)
-               vk_free(&instance->alloc, extensions->ext_array);
-}
-
-static bool
-is_extension_enabled(const VkExtensionProperties *extensions,
-                       size_t num_ext,
-                       const char *name)
-{
-       assert(extensions && name);
-
-       for (uint32_t i = 0; i < num_ext; i++) {
-               if (strcmp(name, extensions[i].extensionName) == 0)
-                       return true;
-       }
-
-       return false;
-}
-
 static const char *
 get_chip_name(enum radeon_family family)
 {
@@ -276,6 +104,75 @@ get_chip_name(enum radeon_family family)
        }
 }
 
+static void
+radv_physical_device_init_mem_types(struct radv_physical_device *device)
+{
+       STATIC_ASSERT(RADV_MEM_HEAP_COUNT <= VK_MAX_MEMORY_HEAPS);
+       uint64_t visible_vram_size = MIN2(device->rad_info.vram_size,
+                                         device->rad_info.vram_vis_size);
+
+       int vram_index = -1, visible_vram_index = -1, gart_index = -1;
+       device->memory_properties.memoryHeapCount = 0;
+       if (device->rad_info.vram_size - visible_vram_size > 0) {
+               vram_index = device->memory_properties.memoryHeapCount++;
+               device->memory_properties.memoryHeaps[vram_index] = (VkMemoryHeap) {
+                       .size = device->rad_info.vram_size - visible_vram_size,
+                       .flags = VK_MEMORY_HEAP_DEVICE_LOCAL_BIT,
+               };
+       }
+       if (visible_vram_size) {
+               visible_vram_index = device->memory_properties.memoryHeapCount++;
+               device->memory_properties.memoryHeaps[visible_vram_index] = (VkMemoryHeap) {
+                       .size = visible_vram_size,
+                       .flags = VK_MEMORY_HEAP_DEVICE_LOCAL_BIT,
+               };
+       }
+       if (device->rad_info.gart_size > 0) {
+               gart_index = device->memory_properties.memoryHeapCount++;
+               device->memory_properties.memoryHeaps[gart_index] = (VkMemoryHeap) {
+                       .size = device->rad_info.gart_size,
+                       .flags = 0,
+               };
+       }
+
+       STATIC_ASSERT(RADV_MEM_TYPE_COUNT <= VK_MAX_MEMORY_TYPES);
+       unsigned type_count = 0;
+       if (vram_index >= 0) {
+               device->mem_type_indices[type_count] = RADV_MEM_TYPE_VRAM;
+               device->memory_properties.memoryTypes[type_count++] = (VkMemoryType) {
+                       .propertyFlags = VK_MEMORY_PROPERTY_DEVICE_LOCAL_BIT,
+                       .heapIndex = vram_index,
+               };
+       }
+       if (gart_index >= 0) {
+               device->mem_type_indices[type_count] = RADV_MEM_TYPE_GTT_WRITE_COMBINE;
+               device->memory_properties.memoryTypes[type_count++] = (VkMemoryType) {
+                       .propertyFlags = VK_MEMORY_PROPERTY_HOST_VISIBLE_BIT |
+                       VK_MEMORY_PROPERTY_HOST_COHERENT_BIT,
+                       .heapIndex = gart_index,
+               };
+       }
+       if (visible_vram_index >= 0) {
+               device->mem_type_indices[type_count] = RADV_MEM_TYPE_VRAM_CPU_ACCESS;
+               device->memory_properties.memoryTypes[type_count++] = (VkMemoryType) {
+                       .propertyFlags = VK_MEMORY_PROPERTY_DEVICE_LOCAL_BIT |
+                       VK_MEMORY_PROPERTY_HOST_VISIBLE_BIT |
+                       VK_MEMORY_PROPERTY_HOST_COHERENT_BIT,
+                       .heapIndex = visible_vram_index,
+               };
+       }
+       if (gart_index >= 0) {
+               device->mem_type_indices[type_count] = RADV_MEM_TYPE_GTT_CACHED;
+               device->memory_properties.memoryTypes[type_count++] = (VkMemoryType) {
+                       .propertyFlags = VK_MEMORY_PROPERTY_HOST_VISIBLE_BIT |
+                       VK_MEMORY_PROPERTY_HOST_COHERENT_BIT |
+                       VK_MEMORY_PROPERTY_HOST_CACHED_BIT,
+                       .heapIndex = gart_index,
+               };
+       }
+       device->memory_properties.memoryTypeCount = type_count;
+}
+
 static VkResult
 radv_physical_device_init(struct radv_physical_device *device,
                          struct radv_instance *instance,
@@ -324,6 +221,8 @@ radv_physical_device_init(struct radv_physical_device *device,
                goto fail;
        }
 
+       device->name = get_chip_name(device->rad_info.family);
+
        if (radv_device_get_cache_uuid(device->rad_info.family, device->cache_uuid)) {
                radv_finish_wsi(device);
                device->ws->destroy(device->ws);
@@ -332,24 +231,19 @@ radv_physical_device_init(struct radv_physical_device *device,
                goto fail;
        }
 
-       result = radv_extensions_register(instance,
-                                       &device->extensions,
-                                       common_device_extensions,
-                                       ARRAY_SIZE(common_device_extensions));
-       if (result != VK_SUCCESS)
-               goto fail;
+       /* These flags affect shader compilation. */
+       uint64_t shader_env_flags =
+               (device->instance->perftest_flags & RADV_PERFTEST_SISCHED ? 0x1 : 0) |
+               (device->instance->debug_flags & RADV_DEBUG_UNSAFE_MATH ? 0x2 : 0);
 
-       if (device->rad_info.has_syncobj) {
-               result = radv_extensions_register(instance,
-                                                 &device->extensions,
-                                                 ext_sema_device_extensions,
-                                                 ARRAY_SIZE(ext_sema_device_extensions));
-               if (result != VK_SUCCESS)
-                       goto fail;
-       }
+       /* The gpu id is already embeded in the uuid so we just pass "radv"
+        * when creating the cache.
+        */
+       char buf[VK_UUID_SIZE * 2 + 1];
+       disk_cache_format_hex_id(buf, device->cache_uuid, VK_UUID_SIZE * 2);
+       device->disk_cache = disk_cache_create(device->name, buf, shader_env_flags);
 
        fprintf(stderr, "WARNING: radv is not a conformant vulkan implementation, testing use only.\n");
-       device->name = get_chip_name(device->rad_info.family);
 
        radv_get_driver_uuid(&device->device_uuid);
        radv_get_device_uuid(&device->rad_info, &device->device_uuid);
@@ -360,6 +254,12 @@ radv_physical_device_init(struct radv_physical_device *device,
                device->rbplus_allowed = device->rad_info.family == CHIP_STONEY;
        }
 
+       /* The mere presense of CLEAR_STATE in the IB causes random GPU hangs
+        * on SI.
+        */
+       device->has_clear_state = device->rad_info.chip_class >= CIK;
+
+       radv_physical_device_init_mem_types(device);
        return VK_SUCCESS;
 
 fail:
@@ -370,9 +270,9 @@ fail:
 static void
 radv_physical_device_finish(struct radv_physical_device *device)
 {
-       radv_extensions_finish(device->instance, &device->extensions);
        radv_finish_wsi(device);
        device->ws->destroy(device->ws);
+       disk_cache_destroy(device->disk_cache);
        close(device->local_fd);
 }
 
@@ -468,9 +368,8 @@ VkResult radv_CreateInstance(
        }
 
        for (uint32_t i = 0; i < pCreateInfo->enabledExtensionCount; i++) {
-               if (!is_extension_enabled(instance_extensions,
-                                       ARRAY_SIZE(instance_extensions),
-                                       pCreateInfo->ppEnabledExtensionNames[i]))
+               const char *ext_name = pCreateInfo->ppEnabledExtensionNames[i];
+               if (!radv_instance_extension_supported(ext_name))
                        return vk_error(VK_ERROR_EXTENSION_NOT_PRESENT);
        }
 
@@ -543,7 +442,7 @@ radv_enumerate_devices(struct radv_instance *instance)
        for (unsigned i = 0; i < (unsigned)max_devices; i++) {
                if (devices[i]->available_nodes & 1 << DRM_NODE_RENDER &&
                    devices[i]->bustype == DRM_BUS_PCI &&
-                   devices[i]->deviceinfo.pci->vendor_id == 0x1002) {
+                   devices[i]->deviceinfo.pci->vendor_id == ATI_VENDOR_ID) {
 
                        result = radv_physical_device_init(instance->physicalDevices +
                                                           instance->physicalDeviceCount,
@@ -591,8 +490,6 @@ void radv_GetPhysicalDeviceFeatures(
        VkPhysicalDevice                            physicalDevice,
        VkPhysicalDeviceFeatures*                   pFeatures)
 {
-       RADV_FROM_HANDLE(radv_physical_device, pdevice, physicalDevice);
-       bool is_gfx9 = pdevice->rad_info.chip_class >= GFX9;
        memset(pFeatures, 0, sizeof(*pFeatures));
 
        *pFeatures = (VkPhysicalDeviceFeatures) {
@@ -600,8 +497,8 @@ void radv_GetPhysicalDeviceFeatures(
                .fullDrawIndexUint32                      = true,
                .imageCubeArray                           = true,
                .independentBlend                         = true,
-               .geometryShader                           = !is_gfx9,
-               .tessellationShader                       = !is_gfx9,
+               .geometryShader                           = true,
+               .tessellationShader                       = true,
                .sampleRateShading                        = true,
                .dualSrcBlend                             = true,
                .logicOp                                  = true,
@@ -804,9 +701,9 @@ void radv_GetPhysicalDeviceProperties(
        };
 
        *pProperties = (VkPhysicalDeviceProperties) {
-               .apiVersion = VK_MAKE_VERSION(1, 0, 42),
+               .apiVersion = radv_physical_device_api_version(pdevice),
                .driverVersion = vk_get_driver_version(),
-               .vendorID = 0x1002,
+               .vendorID = ATI_VENDOR_ID,
                .deviceID = pdevice->rad_info.pci_id,
                .deviceType = pdevice->rad_info.has_dedicated_vram ? VK_PHYSICAL_DEVICE_TYPE_DISCRETE_GPU : VK_PHYSICAL_DEVICE_TYPE_INTEGRATED_GPU,
                .limits = limits,
@@ -845,6 +742,12 @@ void radv_GetPhysicalDeviceProperties2KHR(
                        properties->maxMultiviewInstanceIndex = INT_MAX;
                        break;
                }
+               case VK_STRUCTURE_TYPE_PHYSICAL_DEVICE_POINT_CLIPPING_PROPERTIES_KHR: {
+                       VkPhysicalDevicePointClippingPropertiesKHR *properties =
+                           (VkPhysicalDevicePointClippingPropertiesKHR*)ext;
+                       properties->pointClippingBehavior = VK_POINT_CLIPPING_BEHAVIOR_ALL_CLIP_PLANES_KHR;
+                       break;
+               }
                default:
                        break;
                }
@@ -947,49 +850,7 @@ void radv_GetPhysicalDeviceMemoryProperties(
 {
        RADV_FROM_HANDLE(radv_physical_device, physical_device, physicalDevice);
 
-       STATIC_ASSERT(RADV_MEM_TYPE_COUNT <= VK_MAX_MEMORY_TYPES);
-
-       pMemoryProperties->memoryTypeCount = RADV_MEM_TYPE_COUNT;
-       pMemoryProperties->memoryTypes[RADV_MEM_TYPE_VRAM] = (VkMemoryType) {
-               .propertyFlags = VK_MEMORY_PROPERTY_DEVICE_LOCAL_BIT,
-               .heapIndex = RADV_MEM_HEAP_VRAM,
-       };
-       pMemoryProperties->memoryTypes[RADV_MEM_TYPE_GTT_WRITE_COMBINE] = (VkMemoryType) {
-               .propertyFlags = VK_MEMORY_PROPERTY_HOST_VISIBLE_BIT |
-               VK_MEMORY_PROPERTY_HOST_COHERENT_BIT,
-               .heapIndex = RADV_MEM_HEAP_GTT,
-       };
-       pMemoryProperties->memoryTypes[RADV_MEM_TYPE_VRAM_CPU_ACCESS] = (VkMemoryType) {
-               .propertyFlags = VK_MEMORY_PROPERTY_DEVICE_LOCAL_BIT |
-               VK_MEMORY_PROPERTY_HOST_VISIBLE_BIT |
-               VK_MEMORY_PROPERTY_HOST_COHERENT_BIT,
-               .heapIndex = RADV_MEM_HEAP_VRAM_CPU_ACCESS,
-       };
-       pMemoryProperties->memoryTypes[RADV_MEM_TYPE_GTT_CACHED] = (VkMemoryType) {
-               .propertyFlags = VK_MEMORY_PROPERTY_HOST_VISIBLE_BIT |
-               VK_MEMORY_PROPERTY_HOST_COHERENT_BIT |
-               VK_MEMORY_PROPERTY_HOST_CACHED_BIT,
-               .heapIndex = RADV_MEM_HEAP_GTT,
-       };
-
-       STATIC_ASSERT(RADV_MEM_HEAP_COUNT <= VK_MAX_MEMORY_HEAPS);
-       uint64_t visible_vram_size = MIN2(physical_device->rad_info.vram_size,
-                                         physical_device->rad_info.vram_vis_size);
-
-       pMemoryProperties->memoryHeapCount = RADV_MEM_HEAP_COUNT;
-       pMemoryProperties->memoryHeaps[RADV_MEM_HEAP_VRAM] = (VkMemoryHeap) {
-               .size = physical_device->rad_info.vram_size -
-                               visible_vram_size,
-               .flags = VK_MEMORY_HEAP_DEVICE_LOCAL_BIT,
-       };
-       pMemoryProperties->memoryHeaps[RADV_MEM_HEAP_VRAM_CPU_ACCESS] = (VkMemoryHeap) {
-               .size = visible_vram_size,
-               .flags = VK_MEMORY_HEAP_DEVICE_LOCAL_BIT,
-       };
-       pMemoryProperties->memoryHeaps[RADV_MEM_HEAP_GTT] = (VkMemoryHeap) {
-               .size = physical_device->rad_info.gart_size,
-               .flags = 0,
-       };
+       *pMemoryProperties = physical_device->memory_properties;
 }
 
 void radv_GetPhysicalDeviceMemoryProperties2KHR(
@@ -1000,16 +861,40 @@ void radv_GetPhysicalDeviceMemoryProperties2KHR(
                                                      &pMemoryProperties->memoryProperties);
 }
 
+static enum radeon_ctx_priority
+radv_get_queue_global_priority(const VkDeviceQueueGlobalPriorityCreateInfoEXT *pObj)
+{
+       /* Default to MEDIUM when a specific global priority isn't requested */
+       if (!pObj)
+               return RADEON_CTX_PRIORITY_MEDIUM;
+
+       switch(pObj->globalPriority) {
+       case VK_QUEUE_GLOBAL_PRIORITY_REALTIME:
+               return RADEON_CTX_PRIORITY_REALTIME;
+       case VK_QUEUE_GLOBAL_PRIORITY_HIGH:
+               return RADEON_CTX_PRIORITY_HIGH;
+       case VK_QUEUE_GLOBAL_PRIORITY_MEDIUM:
+               return RADEON_CTX_PRIORITY_MEDIUM;
+       case VK_QUEUE_GLOBAL_PRIORITY_LOW:
+               return RADEON_CTX_PRIORITY_LOW;
+       default:
+               unreachable("Illegal global priority value");
+               return RADEON_CTX_PRIORITY_INVALID;
+       }
+}
+
 static int
 radv_queue_init(struct radv_device *device, struct radv_queue *queue,
-               int queue_family_index, int idx)
+               int queue_family_index, int idx,
+               const VkDeviceQueueGlobalPriorityCreateInfoEXT *global_priority)
 {
        queue->_loader_data.loaderMagic = ICD_LOADER_MAGIC;
        queue->device = device;
        queue->queue_family_index = queue_family_index;
        queue->queue_idx = idx;
+       queue->priority = radv_get_queue_global_priority(global_priority);
 
-       queue->hw_ctx = device->ws->ctx_create(device->ws);
+       queue->hw_ctx = device->ws->ctx_create(device->ws, queue->priority);
        if (!queue->hw_ctx)
                return VK_ERROR_OUT_OF_HOST_MEMORY;
 
@@ -1087,11 +972,15 @@ VkResult radv_CreateDevice(
        VkResult result;
        struct radv_device *device;
 
+       bool keep_shader_info = false;
+
        for (uint32_t i = 0; i < pCreateInfo->enabledExtensionCount; i++) {
-               if (!is_extension_enabled(physical_device->extensions.ext_array,
-                                       physical_device->extensions.num_ext,
-                                       pCreateInfo->ppEnabledExtensionNames[i]))
+               const char *ext_name = pCreateInfo->ppEnabledExtensionNames[i];
+               if (!radv_physical_device_extension_supported(physical_device, ext_name))
                        return vk_error(VK_ERROR_EXTENSION_NOT_PRESENT);
+
+               if (strcmp(ext_name, VK_AMD_SHADER_INFO_EXTENSION_NAME) == 0)
+                       keep_shader_info = true;
        }
 
        /* Check enabled features */
@@ -1119,8 +1008,6 @@ VkResult radv_CreateDevice(
        device->instance = physical_device->instance;
        device->physical_device = physical_device;
 
-       device->debug_flags = device->instance->debug_flags;
-
        device->ws = physical_device->ws;
        if (pAllocator)
                device->alloc = *pAllocator;
@@ -1133,6 +1020,10 @@ VkResult radv_CreateDevice(
        for (unsigned i = 0; i < pCreateInfo->queueCreateInfoCount; i++) {
                const VkDeviceQueueCreateInfo *queue_create = &pCreateInfo->pQueueCreateInfos[i];
                uint32_t qfi = queue_create->queueFamilyIndex;
+               const VkDeviceQueueGlobalPriorityCreateInfoEXT *global_priority =
+                       vk_find_struct_const(queue_create->pNext, DEVICE_QUEUE_GLOBAL_PRIORITY_CREATE_INFO_EXT);
+
+               assert(!global_priority || device->physical_device->rad_info.has_ctx_priority);
 
                device->queues[qfi] = vk_alloc(&device->alloc,
                                               queue_create->queueCount * sizeof(struct radv_queue), 8, VK_SYSTEM_ALLOCATION_SCOPE_DEVICE);
@@ -1146,7 +1037,7 @@ VkResult radv_CreateDevice(
                device->queue_count[qfi] = queue_create->queueCount;
 
                for (unsigned q = 0; q < queue_create->queueCount; q++) {
-                       result = radv_queue_init(device, &device->queues[qfi][q], qfi, q);
+                       result = radv_queue_init(device, &device->queues[qfi][q], qfi, q, global_priority);
                        if (result != VK_SUCCESS)
                                goto fail;
                }
@@ -1182,6 +1073,15 @@ VkResult radv_CreateDevice(
                device->physical_device->rad_info.chip_class >= VI &&
                device->physical_device->rad_info.max_se >= 2;
 
+       if (getenv("RADV_TRACE_FILE")) {
+               keep_shader_info = true;
+
+               if (!radv_init_trace(device))
+                       goto fail;
+       }
+
+       device->keep_shader_info = keep_shader_info;
+
        result = radv_device_init_meta(device);
        if (result != VK_SUCCESS)
                goto fail;
@@ -1204,11 +1104,6 @@ VkResult radv_CreateDevice(
                device->ws->cs_finalize(device->empty_cs[family]);
        }
 
-       if (getenv("RADV_TRACE_FILE")) {
-               if (!radv_init_trace(device))
-                       goto fail;
-       }
-
        if (device->physical_device->rad_info.chip_class >= CIK)
                cik_create_gfx_config(device);
 
@@ -1280,47 +1175,6 @@ void radv_DestroyDevice(
        vk_free(&device->alloc, device);
 }
 
-VkResult radv_EnumerateInstanceExtensionProperties(
-       const char*                                 pLayerName,
-       uint32_t*                                   pPropertyCount,
-       VkExtensionProperties*                      pProperties)
-{
-       if (pProperties == NULL) {
-               *pPropertyCount = ARRAY_SIZE(instance_extensions);
-               return VK_SUCCESS;
-       }
-
-       *pPropertyCount = MIN2(*pPropertyCount, ARRAY_SIZE(instance_extensions));
-       typed_memcpy(pProperties, instance_extensions, *pPropertyCount);
-
-       if (*pPropertyCount < ARRAY_SIZE(instance_extensions))
-               return VK_INCOMPLETE;
-
-       return VK_SUCCESS;
-}
-
-VkResult radv_EnumerateDeviceExtensionProperties(
-       VkPhysicalDevice                            physicalDevice,
-       const char*                                 pLayerName,
-       uint32_t*                                   pPropertyCount,
-       VkExtensionProperties*                      pProperties)
-{
-       RADV_FROM_HANDLE(radv_physical_device, pdevice, physicalDevice);
-
-       if (pProperties == NULL) {
-               *pPropertyCount = pdevice->extensions.num_ext;
-               return VK_SUCCESS;
-       }
-
-       *pPropertyCount = MIN2(*pPropertyCount, pdevice->extensions.num_ext);
-       typed_memcpy(pProperties, pdevice->extensions.ext_array, *pPropertyCount);
-
-       if (*pPropertyCount < pdevice->extensions.num_ext)
-               return VK_INCOMPLETE;
-
-       return VK_SUCCESS;
-}
-
 VkResult radv_EnumerateInstanceLayerProperties(
        uint32_t*                                   pPropertyCount,
        VkLayerProperties*                          pProperties)
@@ -1377,13 +1231,13 @@ fill_geom_tess_rings(struct radv_queue *queue,
        uint32_t *desc = &map[4];
 
        if (esgs_ring_bo)
-               esgs_va = queue->device->ws->buffer_get_va(esgs_ring_bo);
+               esgs_va = radv_buffer_get_va(esgs_ring_bo);
        if (gsvs_ring_bo)
-               gsvs_va = queue->device->ws->buffer_get_va(gsvs_ring_bo);
+               gsvs_va = radv_buffer_get_va(gsvs_ring_bo);
        if (tess_factor_ring_bo)
-               tess_factor_va = queue->device->ws->buffer_get_va(tess_factor_ring_bo);
+               tess_factor_va = radv_buffer_get_va(tess_factor_ring_bo);
        if (tess_offchip_ring_bo)
-               tess_offchip_va = queue->device->ws->buffer_get_va(tess_offchip_ring_bo);
+               tess_offchip_va = radv_buffer_get_va(tess_offchip_ring_bo);
 
        /* stride 0, num records - size, add tid, swizzle, elsize4,
           index stride 64 */
@@ -1577,6 +1431,7 @@ radv_get_preamble_cs(struct radv_queue *queue,
        unsigned tess_factor_ring_size = 0, tess_offchip_ring_size = 0;
        unsigned max_offchip_buffers;
        unsigned hs_offchip_param = 0;
+       uint32_t ring_bo_flags = RADEON_FLAG_NO_CPU_ACCESS | RADEON_FLAG_NO_INTERPROCESS_SHARING;
        if (!queue->has_tess_rings) {
                if (needs_tess_rings)
                        add_tess_rings = true;
@@ -1610,7 +1465,7 @@ radv_get_preamble_cs(struct radv_queue *queue,
                                                              scratch_size,
                                                              4096,
                                                              RADEON_DOMAIN_VRAM,
-                                                             RADEON_FLAG_NO_CPU_ACCESS);
+                                                             ring_bo_flags);
                if (!scratch_bo)
                        goto fail;
        } else
@@ -1621,7 +1476,7 @@ radv_get_preamble_cs(struct radv_queue *queue,
                                                                      compute_scratch_size,
                                                                      4096,
                                                                      RADEON_DOMAIN_VRAM,
-                                                                     RADEON_FLAG_NO_CPU_ACCESS);
+                                                                     ring_bo_flags);
                if (!compute_scratch_bo)
                        goto fail;
 
@@ -1633,7 +1488,7 @@ radv_get_preamble_cs(struct radv_queue *queue,
                                                                esgs_ring_size,
                                                                4096,
                                                                RADEON_DOMAIN_VRAM,
-                                                               RADEON_FLAG_NO_CPU_ACCESS);
+                                                               ring_bo_flags);
                if (!esgs_ring_bo)
                        goto fail;
        } else {
@@ -1646,7 +1501,7 @@ radv_get_preamble_cs(struct radv_queue *queue,
                                                                gsvs_ring_size,
                                                                4096,
                                                                RADEON_DOMAIN_VRAM,
-                                                               RADEON_FLAG_NO_CPU_ACCESS);
+                                                               ring_bo_flags);
                if (!gsvs_ring_bo)
                        goto fail;
        } else {
@@ -1659,14 +1514,14 @@ radv_get_preamble_cs(struct radv_queue *queue,
                                                                       tess_factor_ring_size,
                                                                       256,
                                                                       RADEON_DOMAIN_VRAM,
-                                                                      RADEON_FLAG_NO_CPU_ACCESS);
+                                                                      ring_bo_flags);
                if (!tess_factor_ring_bo)
                        goto fail;
                tess_offchip_ring_bo = queue->device->ws->buffer_create(queue->device->ws,
                                                                       tess_offchip_ring_size,
                                                                       256,
                                                                       RADEON_DOMAIN_VRAM,
-                                                                      RADEON_FLAG_NO_CPU_ACCESS);
+                                                                       ring_bo_flags);
                if (!tess_offchip_ring_bo)
                        goto fail;
        } else {
@@ -1693,7 +1548,7 @@ radv_get_preamble_cs(struct radv_queue *queue,
                                                                 size,
                                                                 4096,
                                                                 RADEON_DOMAIN_VRAM,
-                                                                RADEON_FLAG_CPU_ACCESS);
+                                                                RADEON_FLAG_CPU_ACCESS|RADEON_FLAG_NO_INTERPROCESS_SHARING);
                if (!descriptor_bo)
                        goto fail;
        } else
@@ -1730,7 +1585,7 @@ radv_get_preamble_cs(struct radv_queue *queue,
                        uint32_t *map = (uint32_t*)queue->device->ws->buffer_map(descriptor_bo);
 
                        if (scratch_bo) {
-                               uint64_t scratch_va = queue->device->ws->buffer_get_va(scratch_bo);
+                               uint64_t scratch_va = radv_buffer_get_va(scratch_bo);
                                uint32_t rsrc1 = S_008F04_BASE_ADDRESS_HI(scratch_va >> 32) |
                                                 S_008F04_SWIZZLE_ENABLE(1);
                                map[0] = scratch_va;
@@ -1768,7 +1623,7 @@ radv_get_preamble_cs(struct radv_queue *queue,
                }
 
                if (tess_factor_ring_bo) {
-                       uint64_t tf_va = queue->device->ws->buffer_get_va(tess_factor_ring_bo);
+                       uint64_t tf_va = radv_buffer_get_va(tess_factor_ring_bo);
                        if (queue->device->physical_device->rad_info.chip_class >= CIK) {
                                radeon_set_uconfig_reg(cs, R_030938_VGT_TF_RING_SIZE,
                                                       S_030938_SIZE(tess_factor_ring_size / 4));
@@ -1790,24 +1645,36 @@ radv_get_preamble_cs(struct radv_queue *queue,
                }
 
                if (descriptor_bo) {
-                       uint32_t regs[] = {R_00B030_SPI_SHADER_USER_DATA_PS_0,
-                                          R_00B130_SPI_SHADER_USER_DATA_VS_0,
-                                          R_00B230_SPI_SHADER_USER_DATA_GS_0,
-                                          R_00B330_SPI_SHADER_USER_DATA_ES_0,
-                                          R_00B430_SPI_SHADER_USER_DATA_HS_0,
-                                          R_00B530_SPI_SHADER_USER_DATA_LS_0};
-
-                       uint64_t va = queue->device->ws->buffer_get_va(descriptor_bo);
-
-                       for (int i = 0; i < ARRAY_SIZE(regs); ++i) {
-                               radeon_set_sh_reg_seq(cs, regs[i], 2);
-                               radeon_emit(cs, va);
-                               radeon_emit(cs, va >> 32);
+                       uint64_t va = radv_buffer_get_va(descriptor_bo);
+                       if (queue->device->physical_device->rad_info.chip_class >= GFX9) {
+                               uint32_t regs[] = {R_00B030_SPI_SHADER_USER_DATA_PS_0,
+                                               R_00B130_SPI_SHADER_USER_DATA_VS_0,
+                                               R_00B208_SPI_SHADER_USER_DATA_ADDR_LO_GS,
+                                               R_00B408_SPI_SHADER_USER_DATA_ADDR_LO_HS};
+
+                               for (int i = 0; i < ARRAY_SIZE(regs); ++i) {
+                                       radeon_set_sh_reg_seq(cs, regs[i], 2);
+                                       radeon_emit(cs, va);
+                                       radeon_emit(cs, va >> 32);
+                               }
+                       } else {
+                               uint32_t regs[] = {R_00B030_SPI_SHADER_USER_DATA_PS_0,
+                                               R_00B130_SPI_SHADER_USER_DATA_VS_0,
+                                               R_00B230_SPI_SHADER_USER_DATA_GS_0,
+                                               R_00B330_SPI_SHADER_USER_DATA_ES_0,
+                                               R_00B430_SPI_SHADER_USER_DATA_HS_0,
+                                               R_00B530_SPI_SHADER_USER_DATA_LS_0};
+
+                               for (int i = 0; i < ARRAY_SIZE(regs); ++i) {
+                                       radeon_set_sh_reg_seq(cs, regs[i], 2);
+                                       radeon_emit(cs, va);
+                                       radeon_emit(cs, va >> 32);
+                               }
                        }
                }
 
                if (compute_scratch_bo) {
-                       uint64_t scratch_va = queue->device->ws->buffer_get_va(compute_scratch_bo);
+                       uint64_t scratch_va = radv_buffer_get_va(compute_scratch_bo);
                        uint32_t rsrc1 = S_008F04_BASE_ADDRESS_HI(scratch_va >> 32) |
                                         S_008F04_SWIZZLE_ENABLE(1);
 
@@ -2220,17 +2087,18 @@ bool radv_get_memory_fd(struct radv_device *device,
                                         pFD);
 }
 
-VkResult radv_AllocateMemory(
-       VkDevice                                    _device,
-       const VkMemoryAllocateInfo*                 pAllocateInfo,
-       const VkAllocationCallbacks*                pAllocator,
-       VkDeviceMemory*                             pMem)
+VkResult radv_alloc_memory(VkDevice                        _device,
+                          const VkMemoryAllocateInfo*     pAllocateInfo,
+                          const VkAllocationCallbacks*    pAllocator,
+                          enum radv_mem_flags_bits        mem_flags,
+                          VkDeviceMemory*                 pMem)
 {
        RADV_FROM_HANDLE(radv_device, device, _device);
        struct radv_device_memory *mem;
        VkResult result;
        enum radeon_bo_domain domain;
        uint32_t flags = 0;
+       enum radv_mem_type mem_type_index = device->physical_device->mem_type_indices[pAllocateInfo->memoryTypeIndex];
 
        assert(pAllocateInfo->sType == VK_STRUCTURE_TYPE_MEMORY_ALLOCATE_INFO);
 
@@ -2273,20 +2141,26 @@ VkResult radv_AllocateMemory(
        }
 
        uint64_t alloc_size = align_u64(pAllocateInfo->allocationSize, 4096);
-       if (pAllocateInfo->memoryTypeIndex == RADV_MEM_TYPE_GTT_WRITE_COMBINE ||
-           pAllocateInfo->memoryTypeIndex == RADV_MEM_TYPE_GTT_CACHED)
+       if (mem_type_index == RADV_MEM_TYPE_GTT_WRITE_COMBINE ||
+           mem_type_index == RADV_MEM_TYPE_GTT_CACHED)
                domain = RADEON_DOMAIN_GTT;
        else
                domain = RADEON_DOMAIN_VRAM;
 
-       if (pAllocateInfo->memoryTypeIndex == RADV_MEM_TYPE_VRAM)
+       if (mem_type_index == RADV_MEM_TYPE_VRAM)
                flags |= RADEON_FLAG_NO_CPU_ACCESS;
        else
                flags |= RADEON_FLAG_CPU_ACCESS;
 
-       if (pAllocateInfo->memoryTypeIndex == RADV_MEM_TYPE_GTT_WRITE_COMBINE)
+       if (mem_type_index == RADV_MEM_TYPE_GTT_WRITE_COMBINE)
                flags |= RADEON_FLAG_GTT_WC;
 
+       if (mem_flags & RADV_MEM_IMPLICIT_SYNC)
+               flags |= RADEON_FLAG_IMPLICIT_SYNC;
+
+       if (!dedicate_info && !import_info)
+               flags |= RADEON_FLAG_NO_INTERPROCESS_SHARING;
+
        mem->bo = device->ws->buffer_create(device->ws, alloc_size, device->physical_device->rad_info.max_alignment,
                                               domain, flags);
 
@@ -2294,7 +2168,7 @@ VkResult radv_AllocateMemory(
                result = VK_ERROR_OUT_OF_DEVICE_MEMORY;
                goto fail;
        }
-       mem->type_index = pAllocateInfo->memoryTypeIndex;
+       mem->type_index = mem_type_index;
 out_success:
        *pMem = radv_device_memory_to_handle(mem);
 
@@ -2306,6 +2180,15 @@ fail:
        return result;
 }
 
+VkResult radv_AllocateMemory(
+       VkDevice                                    _device,
+       const VkMemoryAllocateInfo*                 pAllocateInfo,
+       const VkAllocationCallbacks*                pAllocator,
+       VkDeviceMemory*                             pMem)
+{
+       return radv_alloc_memory(_device, pAllocateInfo, pAllocator, 0, pMem);
+}
+
 void radv_FreeMemory(
        VkDevice                                    _device,
        VkDeviceMemory                              _mem,
@@ -2378,13 +2261,14 @@ VkResult radv_InvalidateMappedMemoryRanges(
 }
 
 void radv_GetBufferMemoryRequirements(
-       VkDevice                                    device,
+       VkDevice                                    _device,
        VkBuffer                                    _buffer,
        VkMemoryRequirements*                       pMemoryRequirements)
 {
+       RADV_FROM_HANDLE(radv_device, device, _device);
        RADV_FROM_HANDLE(radv_buffer, buffer, _buffer);
 
-       pMemoryRequirements->memoryTypeBits = (1u << RADV_MEM_TYPE_COUNT) - 1;
+       pMemoryRequirements->memoryTypeBits = (1u << device->physical_device->memory_properties.memoryTypeCount) - 1;
 
        if (buffer->flags & VK_BUFFER_CREATE_SPARSE_BINDING_BIT)
                pMemoryRequirements->alignment = 4096;
@@ -2401,13 +2285,13 @@ void radv_GetBufferMemoryRequirements2KHR(
 {
        radv_GetBufferMemoryRequirements(device, pInfo->buffer,
                                         &pMemoryRequirements->memoryRequirements);
-
+       RADV_FROM_HANDLE(radv_buffer, buffer, pInfo->buffer);
        vk_foreach_struct(ext, pMemoryRequirements->pNext) {
                switch (ext->sType) {
                case VK_STRUCTURE_TYPE_MEMORY_DEDICATED_REQUIREMENTS_KHR: {
                        VkMemoryDedicatedRequirementsKHR *req =
                                       (VkMemoryDedicatedRequirementsKHR *) ext;
-                       req->requiresDedicatedAllocation = false;
+                       req->requiresDedicatedAllocation = buffer->shareable;
                        req->prefersDedicatedAllocation = req->requiresDedicatedAllocation;
                        break;
                }
@@ -2418,13 +2302,14 @@ void radv_GetBufferMemoryRequirements2KHR(
 }
 
 void radv_GetImageMemoryRequirements(
-       VkDevice                                    device,
+       VkDevice                                    _device,
        VkImage                                     _image,
        VkMemoryRequirements*                       pMemoryRequirements)
 {
+       RADV_FROM_HANDLE(radv_device, device, _device);
        RADV_FROM_HANDLE(radv_image, image, _image);
 
-       pMemoryRequirements->memoryTypeBits = (1u << RADV_MEM_TYPE_COUNT) - 1;
+       pMemoryRequirements->memoryTypeBits = (1u << device->physical_device->memory_properties.memoryTypeCount) - 1;
 
        pMemoryRequirements->size = image->size;
        pMemoryRequirements->alignment = image->alignment;
@@ -2481,44 +2366,74 @@ void radv_GetDeviceMemoryCommitment(
        *pCommittedMemoryInBytes = 0;
 }
 
+VkResult radv_BindBufferMemory2KHR(VkDevice device,
+                                   uint32_t bindInfoCount,
+                                   const VkBindBufferMemoryInfoKHR *pBindInfos)
+{
+       for (uint32_t i = 0; i < bindInfoCount; ++i) {
+               RADV_FROM_HANDLE(radv_device_memory, mem, pBindInfos[i].memory);
+               RADV_FROM_HANDLE(radv_buffer, buffer, pBindInfos[i].buffer);
+
+               if (mem) {
+                       buffer->bo = mem->bo;
+                       buffer->offset = pBindInfos[i].memoryOffset;
+               } else {
+                       buffer->bo = NULL;
+               }
+       }
+       return VK_SUCCESS;
+}
+
 VkResult radv_BindBufferMemory(
        VkDevice                                    device,
-       VkBuffer                                    _buffer,
-       VkDeviceMemory                              _memory,
+       VkBuffer                                    buffer,
+       VkDeviceMemory                              memory,
        VkDeviceSize                                memoryOffset)
 {
-       RADV_FROM_HANDLE(radv_device_memory, mem, _memory);
-       RADV_FROM_HANDLE(radv_buffer, buffer, _buffer);
+       const VkBindBufferMemoryInfoKHR info = {
+               .sType = VK_STRUCTURE_TYPE_BIND_BUFFER_MEMORY_INFO_KHR,
+               .buffer = buffer,
+               .memory = memory,
+               .memoryOffset = memoryOffset
+       };
 
-       if (mem) {
-               buffer->bo = mem->bo;
-               buffer->offset = memoryOffset;
-       } else {
-               buffer->bo = NULL;
-               buffer->offset = 0;
-       }
+       return radv_BindBufferMemory2KHR(device, 1, &info);
+}
+
+VkResult radv_BindImageMemory2KHR(VkDevice device,
+                                  uint32_t bindInfoCount,
+                                  const VkBindImageMemoryInfoKHR *pBindInfos)
+{
+       for (uint32_t i = 0; i < bindInfoCount; ++i) {
+               RADV_FROM_HANDLE(radv_device_memory, mem, pBindInfos[i].memory);
+               RADV_FROM_HANDLE(radv_image, image, pBindInfos[i].image);
 
+               if (mem) {
+                       image->bo = mem->bo;
+                       image->offset = pBindInfos[i].memoryOffset;
+               } else {
+                       image->bo = NULL;
+                       image->offset = 0;
+               }
+       }
        return VK_SUCCESS;
 }
 
+
 VkResult radv_BindImageMemory(
        VkDevice                                    device,
-       VkImage                                     _image,
-       VkDeviceMemory                              _memory,
+       VkImage                                     image,
+       VkDeviceMemory                              memory,
        VkDeviceSize                                memoryOffset)
 {
-       RADV_FROM_HANDLE(radv_device_memory, mem, _memory);
-       RADV_FROM_HANDLE(radv_image, image, _image);
-
-       if (mem) {
-               image->bo = mem->bo;
-               image->offset = memoryOffset;
-       } else {
-               image->bo = NULL;
-               image->offset = 0;
-       }
+       const VkBindImageMemoryInfoKHR info = {
+               .sType = VK_STRUCTURE_TYPE_BIND_BUFFER_MEMORY_INFO_KHR,
+               .image = image,
+               .memory = memory,
+               .memoryOffset = memoryOffset
+       };
 
-       return VK_SUCCESS;
+       return radv_BindImageMemory2KHR(device, 1, &info);
 }
 
 
@@ -2811,7 +2726,7 @@ VkResult radv_CreateEvent(
 
        event->bo = device->ws->buffer_create(device->ws, 8, 8,
                                              RADEON_DOMAIN_GTT,
-                                             RADEON_FLAG_VA_UNCACHED | RADEON_FLAG_CPU_ACCESS);
+                                             RADEON_FLAG_VA_UNCACHED | RADEON_FLAG_CPU_ACCESS | RADEON_FLAG_NO_INTERPROCESS_SHARING);
        if (!event->bo) {
                vk_free2(&device->alloc, pAllocator, event);
                return VK_ERROR_OUT_OF_DEVICE_MEMORY;
@@ -2891,6 +2806,9 @@ VkResult radv_CreateBuffer(
        buffer->offset = 0;
        buffer->flags = pCreateInfo->flags;
 
+       buffer->shareable = vk_find_struct_const(pCreateInfo->pNext,
+                                                EXTERNAL_MEMORY_BUFFER_CREATE_INFO_KHR) != NULL;
+
        if (pCreateInfo->flags & VK_BUFFER_CREATE_SPARSE_BINDING_BIT) {
                buffer->bo = device->ws->buffer_create(device->ws,
                                                       align64(buffer->size, 4096),
@@ -2955,7 +2873,7 @@ radv_initialise_color_surface(struct radv_device *device,
        /* Intensity is implemented as Red, so treat it that way. */
        cb->cb_color_attrib = S_028C74_FORCE_DST_ALPHA_1(desc->swizzle[3] == VK_SWIZZLE_1);
 
-       va = device->ws->buffer_get_va(iview->bo) + iview->image->offset;
+       va = radv_buffer_get_va(iview->bo) + iview->image->offset;
 
        cb->cb_color_base = va >> 8;
 
@@ -3007,11 +2925,11 @@ radv_initialise_color_surface(struct radv_device *device,
        }
 
        /* CMASK variables */
-       va = device->ws->buffer_get_va(iview->bo) + iview->image->offset;
+       va = radv_buffer_get_va(iview->bo) + iview->image->offset;
        va += iview->image->cmask.offset;
        cb->cb_color_cmask = va >> 8;
 
-       va = device->ws->buffer_get_va(iview->bo) + iview->image->offset;
+       va = radv_buffer_get_va(iview->bo) + iview->image->offset;
        va += iview->image->dcc_offset;
        cb->cb_dcc_base = va >> 8;
        cb->cb_dcc_base |= iview->image->surface.tile_swizzle;
@@ -3028,7 +2946,7 @@ radv_initialise_color_surface(struct radv_device *device,
        }
 
        if (iview->image->fmask.size) {
-               va = device->ws->buffer_get_va(iview->bo) + iview->image->offset + iview->image->fmask.offset;
+               va = radv_buffer_get_va(iview->bo) + iview->image->offset + iview->image->fmask.offset;
                cb->cb_color_fmask = va >> 8;
                cb->cb_color_fmask |= iview->image->fmask.tile_swizzle;
        } else {
@@ -3086,10 +3004,10 @@ radv_initialise_color_surface(struct radv_device *device,
        }
 
        if (iview->image->cmask.size &&
-           !(device->debug_flags & RADV_DEBUG_NO_FAST_CLEARS))
+           !(device->instance->debug_flags & RADV_DEBUG_NO_FAST_CLEARS))
                cb->cb_color_info |= S_028C70_FAST_CLEAR(1);
 
-       if (iview->image->surface.dcc_size && iview->base_mip < surf->num_dcc_levels)
+       if (radv_vi_dcc_enabled(iview->image, iview->base_mip))
                cb->cb_color_info |= S_028C70_DCC_ENABLE(1);
 
        if (device->physical_device->rad_info.chip_class >= VI) {
@@ -3173,7 +3091,7 @@ radv_initialise_ds_surface(struct radv_device *device,
        ds->db_htile_data_base = 0;
        ds->db_htile_surface = 0;
 
-       va = device->ws->buffer_get_va(iview->bo) + iview->image->offset;
+       va = radv_buffer_get_va(iview->bo) + iview->image->offset;
        s_offs = z_offs = va;
 
        if (device->physical_device->rad_info.chip_class >= GFX9) {
@@ -3194,14 +3112,25 @@ radv_initialise_ds_surface(struct radv_device *device,
                ds->db_depth_size = S_02801C_X_MAX(iview->image->info.width - 1) |
                        S_02801C_Y_MAX(iview->image->info.height - 1);
 
-               /* Only use HTILE for the first level. */
-               if (iview->image->surface.htile_size && !level) {
+               if (radv_htile_enabled(iview->image, level)) {
                        ds->db_z_info |= S_028038_TILE_SURFACE_ENABLE(1);
 
+                       if (iview->image->tc_compatible_htile) {
+                               unsigned max_zplanes = 4;
+
+                               if (iview->vk_format == VK_FORMAT_D16_UNORM  &&
+                                   iview->image->info.samples > 1)
+                                       max_zplanes = 2;
+
+                               ds->db_z_info |= S_028038_DECOMPRESS_ON_N_ZPLANES(max_zplanes + 1) |
+                                         S_028038_ITERATE_FLUSH(1);
+                               ds->db_stencil_info |= S_02803C_ITERATE_FLUSH(1);
+                       }
+
                        if (!iview->image->surface.has_stencil)
                                /* Use all of the htile_buffer for depth if there's no stencil. */
                                ds->db_stencil_info |= S_02803C_TILE_STENCIL_DISABLE(1);
-                       va = device->ws->buffer_get_va(iview->bo) + iview->image->offset +
+                       va = radv_buffer_get_va(iview->bo) + iview->image->offset +
                                iview->image->htile_offset;
                        ds->db_htile_data_base = va >> 8;
                        ds->db_htile_surface = S_028ABC_FULL_CACHE(1) |
@@ -3217,7 +3146,7 @@ radv_initialise_ds_surface(struct radv_device *device,
                z_offs += iview->image->surface.u.legacy.level[level].offset;
                s_offs += iview->image->surface.u.legacy.stencil_level[level].offset;
 
-               ds->db_depth_info = S_02803C_ADDR5_SWIZZLE_MASK(1);
+               ds->db_depth_info = S_02803C_ADDR5_SWIZZLE_MASK(!iview->image->tc_compatible_htile);
                ds->db_z_info = S_028040_FORMAT(format) | S_028040_ZRANGE_PRECISION(1);
                ds->db_stencil_info = S_028044_FORMAT(stencil_format);
 
@@ -3258,17 +3187,29 @@ radv_initialise_ds_surface(struct radv_device *device,
                        S_028058_HEIGHT_TILE_MAX((level_info->nblk_y / 8) - 1);
                ds->db_depth_slice = S_02805C_SLICE_TILE_MAX((level_info->nblk_x * level_info->nblk_y) / 64 - 1);
 
-               if (iview->image->surface.htile_size && !level) {
+               if (radv_htile_enabled(iview->image, level)) {
                        ds->db_z_info |= S_028040_TILE_SURFACE_ENABLE(1);
 
-                       if (!iview->image->surface.has_stencil)
+                       if (!iview->image->surface.has_stencil &&
+                           !iview->image->tc_compatible_htile)
                                /* Use all of the htile_buffer for depth if there's no stencil. */
                                ds->db_stencil_info |= S_028044_TILE_STENCIL_DISABLE(1);
 
-                       va = device->ws->buffer_get_va(iview->bo) + iview->image->offset +
+                       va = radv_buffer_get_va(iview->bo) + iview->image->offset +
                                iview->image->htile_offset;
                        ds->db_htile_data_base = va >> 8;
                        ds->db_htile_surface = S_028ABC_FULL_CACHE(1);
+
+                       if (iview->image->tc_compatible_htile) {
+                               ds->db_htile_surface |= S_028ABC_TC_COMPATIBLE(1);
+
+                               if (iview->image->info.samples <= 1)
+                                       ds->db_z_info |= S_028040_DECOMPRESS_ON_N_ZPLANES(5);
+                               else if (iview->image->info.samples <= 4)
+                                       ds->db_z_info |= S_028040_DECOMPRESS_ON_N_ZPLANES(3);
+                               else
+                                       ds->db_z_info|= S_028040_DECOMPRESS_ON_N_ZPLANES(2);
+                       }
                }
        }