radeonsi: update copyrights
[mesa.git] / src / gallium / drivers / radeon / r600_texture.c
index 2aa47b55d592bacd78485e35c295b5ccef3592d8..a41811a576d8f792c369d554f069e0cd3d68bae3 100644 (file)
@@ -1,5 +1,7 @@
 /*
  * Copyright 2010 Jerome Glisse <glisse@freedesktop.org>
+ * Copyright 2018 Advanced Micro Devices, Inc.
+ * All Rights Reserved.
  *
  * Permission is hereby granted, free of charge, to any person obtaining a
  * copy of this software and associated documentation files (the "Software"),
 #include "state_tracker/drm_driver.h"
 #include "amd/common/sid.h"
 
-static void r600_texture_discard_cmask(struct si_screen *sscreen,
-                                      struct r600_texture *rtex);
 static enum radeon_surf_mode
 r600_choose_tiling(struct si_screen *sscreen,
                   const struct pipe_resource *templ);
 
 
-bool si_prepare_for_dma_blit(struct r600_common_context *rctx,
+bool si_prepare_for_dma_blit(struct si_context *sctx,
                             struct r600_texture *rdst,
                             unsigned dst_level, unsigned dstx,
                             unsigned dsty, unsigned dstz,
@@ -51,7 +51,7 @@ bool si_prepare_for_dma_blit(struct r600_common_context *rctx,
                             unsigned src_level,
                             const struct pipe_box *src_box)
 {
-       if (!rctx->dma.cs)
+       if (!sctx->b.dma_cs)
                return false;
 
        if (rdst->surface.bpe != rsrc->surface.bpe)
@@ -90,12 +90,12 @@ bool si_prepare_for_dma_blit(struct r600_common_context *rctx,
                                                      src_box->height, src_box->depth))
                        return false;
 
-               r600_texture_discard_cmask(rctx->screen, rdst);
+               si_texture_discard_cmask(sctx->screen, rdst);
        }
 
        /* All requirements are met. Prepare textures for SDMA. */
        if (rsrc->cmask.size && rsrc->dirty_level_mask & (1 << src_level))
-               rctx->b.flush_resource(&rctx->b, &rsrc->resource.b.b);
+               sctx->b.b.flush_resource(&sctx->b.b, &rsrc->resource.b.b);
 
        assert(!(rsrc->dirty_level_mask & (1 << src_level)));
        assert(!(rdst->dirty_level_mask & (1 << dst_level)));
@@ -140,7 +140,7 @@ static void r600_copy_region_with_blit(struct pipe_context *pipe,
 /* Copy from a full GPU texture to a transfer's staging one. */
 static void r600_copy_to_staging_texture(struct pipe_context *ctx, struct r600_transfer *rtransfer)
 {
-       struct r600_common_context *rctx = (struct r600_common_context*)ctx;
+       struct si_context *sctx = (struct si_context*)ctx;
        struct pipe_transfer *transfer = (struct pipe_transfer*)rtransfer;
        struct pipe_resource *dst = &rtransfer->staging->b.b;
        struct pipe_resource *src = transfer->resource;
@@ -151,14 +151,14 @@ static void r600_copy_to_staging_texture(struct pipe_context *ctx, struct r600_t
                return;
        }
 
-       rctx->dma_copy(ctx, dst, 0, 0, 0, 0, src, transfer->level,
+       sctx->b.dma_copy(ctx, dst, 0, 0, 0, 0, src, transfer->level,
                       &transfer->box);
 }
 
 /* Copy from a transfer's staging texture to a full GPU one. */
 static void r600_copy_from_staging_texture(struct pipe_context *ctx, struct r600_transfer *rtransfer)
 {
-       struct r600_common_context *rctx = (struct r600_common_context*)ctx;
+       struct si_context *sctx = (struct si_context*)ctx;
        struct pipe_transfer *transfer = (struct pipe_transfer*)rtransfer;
        struct pipe_resource *dst = transfer->resource;
        struct pipe_resource *src = &rtransfer->staging->b.b;
@@ -173,7 +173,7 @@ static void r600_copy_from_staging_texture(struct pipe_context *ctx, struct r600
                return;
        }
 
-       rctx->dma_copy(ctx, dst, transfer->level,
+       sctx->b.dma_copy(ctx, dst, transfer->level,
                       transfer->box.x, transfer->box.y, transfer->box.z,
                       src, 0, &sbox);
 }
@@ -242,7 +242,7 @@ static int r600_init_surface(struct si_screen *sscreen,
                bpe = 4; /* stencil is allocated separately on evergreen */
        } else {
                bpe = util_format_get_blocksize(ptex->format);
-               assert(util_is_power_of_two(bpe));
+               assert(util_is_power_of_two_or_zero(bpe));
        }
 
        if (!is_flushed_depth && is_depth) {
@@ -298,11 +298,21 @@ static int r600_init_surface(struct si_screen *sscreen,
                return r;
        }
 
+       unsigned pitch = pitch_in_bytes_override / bpe;
+
        if (sscreen->info.chip_class >= GFX9) {
-               assert(!pitch_in_bytes_override ||
-                      pitch_in_bytes_override == surface->u.gfx9.surf_pitch * bpe);
+               if (pitch) {
+                       surface->u.gfx9.surf_pitch = pitch;
+                       surface->u.gfx9.surf_slice_size =
+                               (uint64_t)pitch * surface->u.gfx9.surf_height * bpe;
+               }
                surface->u.gfx9.surf_offset = offset;
        } else {
+               if (pitch) {
+                       surface->u.legacy.level[0].nblk_x = pitch;
+                       surface->u.legacy.level[0].slice_size_dw =
+                               ((uint64_t)pitch * surface->u.legacy.level[0].nblk_y * bpe) / 4;
+               }
                if (offset) {
                        for (i = 0; i < ARRAY_SIZE(surface->u.legacy.level); ++i)
                                surface->u.legacy.level[i].offset += offset;
@@ -372,24 +382,28 @@ static void r600_surface_import_metadata(struct si_screen *sscreen,
        }
 }
 
-static void r600_eliminate_fast_color_clear(struct r600_common_context *rctx,
-                                           struct r600_texture *rtex)
+void si_eliminate_fast_color_clear(struct si_context *sctx,
+                                  struct r600_texture *rtex)
 {
-       struct si_screen *sscreen = rctx->screen;
-       struct pipe_context *ctx = &rctx->b;
+       struct si_screen *sscreen = sctx->screen;
+       struct pipe_context *ctx = &sctx->b.b;
 
        if (ctx == sscreen->aux_context)
                mtx_lock(&sscreen->aux_context_lock);
 
+       unsigned n = sctx->b.num_decompress_calls;
        ctx->flush_resource(ctx, &rtex->resource.b.b);
-       ctx->flush(ctx, NULL, 0);
+
+       /* Flush only if any fast clear elimination took place. */
+       if (n != sctx->b.num_decompress_calls)
+               ctx->flush(ctx, NULL, 0);
 
        if (ctx == sscreen->aux_context)
                mtx_unlock(&sscreen->aux_context_lock);
 }
 
-static void r600_texture_discard_cmask(struct si_screen *sscreen,
-                                      struct r600_texture *rtex)
+void si_texture_discard_cmask(struct si_screen *sscreen,
+                             struct r600_texture *rtex)
 {
        if (!rtex->cmask.size)
                return;
@@ -453,36 +467,36 @@ static bool r600_texture_discard_dcc(struct si_screen *sscreen,
  *   context 1 & 2 read garbage, because DCC is disabled, yet there are
  *   compressed tiled
  *
- * \param rctx  the current context if you have one, or rscreen->aux_context
+ * \param sctx  the current context if you have one, or rscreen->aux_context
  *              if you don't.
  */
-bool si_texture_disable_dcc(struct r600_common_context *rctx,
+bool si_texture_disable_dcc(struct si_context *sctx,
                            struct r600_texture *rtex)
 {
-       struct si_screen *sscreen = rctx->screen;
+       struct si_screen *sscreen = sctx->screen;
 
        if (!r600_can_disable_dcc(rtex))
                return false;
 
-       if (&rctx->b == sscreen->aux_context)
+       if (&sctx->b.b == sscreen->aux_context)
                mtx_lock(&sscreen->aux_context_lock);
 
        /* Decompress DCC. */
-       rctx->decompress_dcc(&rctx->b, rtex);
-       rctx->b.flush(&rctx->b, NULL, 0);
+       si_decompress_dcc(&sctx->b.b, rtex);
+       sctx->b.b.flush(&sctx->b.b, NULL, 0);
 
-       if (&rctx->b == sscreen->aux_context)
+       if (&sctx->b.b == sscreen->aux_context)
                mtx_unlock(&sscreen->aux_context_lock);
 
        return r600_texture_discard_dcc(sscreen, rtex);
 }
 
-static void r600_reallocate_texture_inplace(struct r600_common_context *rctx,
+static void r600_reallocate_texture_inplace(struct si_context *sctx,
                                            struct r600_texture *rtex,
                                            unsigned new_bind_flag,
                                            bool invalidate_storage)
 {
-       struct pipe_screen *screen = rctx->b.screen;
+       struct pipe_screen *screen = sctx->b.b.screen;
        struct r600_texture *new_tex;
        struct pipe_resource templ = rtex->resource.b.b;
        unsigned i;
@@ -497,7 +511,7 @@ static void r600_reallocate_texture_inplace(struct r600_common_context *rctx,
                        return;
 
                /* This fails with MSAA, depth, and compressed textures. */
-               if (r600_choose_tiling(rctx->screen, &templ) !=
+               if (r600_choose_tiling(sctx->screen, &templ) !=
                    RADEON_SURF_MODE_LINEAR_ALIGNED)
                        return;
        }
@@ -513,16 +527,16 @@ static void r600_reallocate_texture_inplace(struct r600_common_context *rctx,
 
                        u_box_3d(0, 0, 0,
                                 u_minify(templ.width0, i), u_minify(templ.height0, i),
-                                util_max_layer(&templ, i) + 1, &box);
+                                util_num_layers(&templ, i), &box);
 
-                       rctx->dma_copy(&rctx->b, &new_tex->resource.b.b, i, 0, 0, 0,
+                       sctx->b.dma_copy(&sctx->b.b, &new_tex->resource.b.b, i, 0, 0, 0,
                                       &rtex->resource.b.b, i, &box);
                }
        }
 
        if (new_bind_flag == PIPE_BIND_LINEAR) {
-               r600_texture_discard_cmask(rctx->screen, rtex);
-               r600_texture_discard_dcc(rctx->screen, rtex);
+               si_texture_discard_cmask(sctx->screen, rtex);
+               r600_texture_discard_dcc(sctx->screen, rtex);
        }
 
        /* Replace the structure fields of rtex. */
@@ -562,7 +576,7 @@ static void r600_reallocate_texture_inplace(struct r600_common_context *rctx,
 
        r600_texture_reference(&new_tex, NULL);
 
-       p_atomic_inc(&rctx->screen->dirty_tex_counter);
+       p_atomic_inc(&sctx->screen->dirty_tex_counter);
 }
 
 static uint32_t si_get_bo_metadata_word1(struct si_screen *sscreen)
@@ -582,7 +596,7 @@ static void si_query_opaque_metadata(struct si_screen *sscreen,
                PIPE_SWIZZLE_W
        };
        uint32_t desc[8], i;
-       bool is_array = util_resource_is_array_texture(res);
+       bool is_array = util_texture_is_array(res->target);
 
        /* DRM 2.x.x doesn't support this. */
        if (sscreen->info.drm_major != 3)
@@ -667,7 +681,7 @@ static boolean r600_texture_get_handle(struct pipe_screen* screen,
                                        unsigned usage)
 {
        struct si_screen *sscreen = (struct si_screen*)screen;
-       struct r600_common_context *rctx;
+       struct si_context *sctx;
        struct r600_resource *res = (struct r600_resource*)resource;
        struct r600_texture *rtex = (struct r600_texture*)resource;
        struct radeon_bo_metadata metadata;
@@ -676,7 +690,7 @@ static boolean r600_texture_get_handle(struct pipe_screen* screen,
        bool flush = false;
 
        ctx = threaded_context_unwrap_sync(ctx);
-       rctx = (struct r600_common_context*)(ctx ? ctx : sscreen->aux_context);
+       sctx = (struct si_context*)(ctx ? ctx : sscreen->aux_context);
 
        if (resource->target != PIPE_BUFFER) {
                /* This is not supported now, but it might be required for OpenCL
@@ -689,9 +703,10 @@ static boolean r600_texture_get_handle(struct pipe_screen* screen,
                if (sscreen->ws->buffer_is_suballocated(res->buf) ||
                    rtex->surface.tile_swizzle ||
                    (rtex->resource.flags & RADEON_FLAG_NO_INTERPROCESS_SHARING &&
+                    sscreen->info.has_local_buffers &&
                     whandle->type != DRM_API_HANDLE_TYPE_KMS)) {
                        assert(!res->b.is_shared);
-                       r600_reallocate_texture_inplace(rctx, rtex,
+                       r600_reallocate_texture_inplace(sctx, rtex,
                                                        PIPE_BIND_SHARED, false);
                        flush = true;
                        assert(res->b.b.bind & PIPE_BIND_SHARED);
@@ -705,7 +720,7 @@ static boolean r600_texture_get_handle(struct pipe_screen* screen,
                 * access.
                 */
                if (usage & PIPE_HANDLE_USAGE_WRITE && rtex->dcc_offset) {
-                       if (si_texture_disable_dcc(rctx, rtex)) {
+                       if (si_texture_disable_dcc(sctx, rtex)) {
                                update_metadata = true;
                                /* si_texture_disable_dcc flushes the context */
                                flush = false;
@@ -715,7 +730,7 @@ static boolean r600_texture_get_handle(struct pipe_screen* screen,
                if (!(usage & PIPE_HANDLE_USAGE_EXPLICIT_FLUSH) &&
                    (rtex->cmask.size || rtex->dcc_offset)) {
                        /* Eliminate fast clear (both CMASK and DCC) */
-                       r600_eliminate_fast_color_clear(rctx, rtex);
+                       si_eliminate_fast_color_clear(sctx, rtex);
                        /* eliminate_fast_color_clear flushes the context */
                        flush = false;
 
@@ -723,7 +738,7 @@ static boolean r600_texture_get_handle(struct pipe_screen* screen,
                         * to be called.
                         */
                        if (rtex->cmask.size)
-                               r600_texture_discard_cmask(sscreen, rtex);
+                               si_texture_discard_cmask(sscreen, rtex);
                }
 
                /* Set metadata. */
@@ -746,8 +761,12 @@ static boolean r600_texture_get_handle(struct pipe_screen* screen,
                        slice_size = (uint64_t)rtex->surface.u.legacy.level[0].slice_size_dw * 4;
                }
        } else {
+               /* Buffer exports are for the OpenCL interop. */
                /* Move a suballocated buffer into a non-suballocated allocation. */
-               if (sscreen->ws->buffer_is_suballocated(res->buf)) {
+               if (sscreen->ws->buffer_is_suballocated(res->buf) ||
+                   /* A DMABUF export always fails if the BO is local. */
+                   (rtex->resource.flags & RADEON_FLAG_NO_INTERPROCESS_SHARING &&
+                    sscreen->info.has_local_buffers)) {
                        assert(!res->b.is_shared);
 
                        /* Allocate a new buffer with PIPE_BIND_SHARED. */
@@ -762,11 +781,11 @@ static boolean r600_texture_get_handle(struct pipe_screen* screen,
                        /* Copy the old buffer contents to the new one. */
                        struct pipe_box box;
                        u_box_1d(0, newb->width0, &box);
-                       rctx->b.resource_copy_region(&rctx->b, newb, 0, 0, 0, 0,
+                       sctx->b.b.resource_copy_region(&sctx->b.b, newb, 0, 0, 0, 0,
                                                     &res->b.b, 0, &box);
                        flush = true;
                        /* Move the new buffer storage to the old pipe_resource. */
-                       si_replace_buffer_storage(&rctx->b, &res->b.b, newb);
+                       si_replace_buffer_storage(&sctx->b.b, &res->b.b, newb);
                        pipe_resource_reference(&newb, NULL);
 
                        assert(res->b.b.bind & PIPE_BIND_SHARED);
@@ -780,7 +799,7 @@ static boolean r600_texture_get_handle(struct pipe_screen* screen,
        }
 
        if (flush)
-               rctx->b.flush(&rctx->b, NULL, 0);
+               sctx->b.b.flush(&sctx->b.b, NULL, 0);
 
        if (res->b.is_shared) {
                /* USAGE_EXPLICIT_FLUSH must be cleared if at least one user
@@ -833,6 +852,7 @@ void si_texture_get_fmask_info(struct si_screen *sscreen,
        if (sscreen->info.chip_class >= GFX9) {
                out->alignment = rtex->surface.u.gfx9.fmask_alignment;
                out->size = rtex->surface.u.gfx9.fmask_size;
+               out->tile_swizzle = rtex->surface.u.gfx9.fmask_tile_swizzle;
                return;
        }
 
@@ -932,7 +952,7 @@ void si_texture_get_cmask_info(struct si_screen *sscreen,
                out->slice_tile_max -= 1;
 
        out->alignment = MAX2(256, base_align);
-       out->size = (util_max_layer(&rtex->resource.b.b, 0) + 1) *
+       out->size = util_num_layers(&rtex->resource.b.b, 0) *
                    align(slice_bytes, base_align);
 }
 
@@ -1011,7 +1031,7 @@ static void r600_texture_get_htile_size(struct si_screen *sscreen,
 
        rtex->surface.htile_alignment = base_align;
        rtex->surface.htile_size =
-               (util_max_layer(&rtex->resource.b.b, 0) + 1) *
+               util_num_layers(&rtex->resource.b.b, 0) *
                align(slice_bytes, base_align);
 }
 
@@ -1250,12 +1270,13 @@ r600_texture_create_object(struct pipe_screen *screen,
                                r600_texture_allocate_htile(sscreen, rtex);
                }
        } else {
-               if (base->nr_samples > 1) {
-                       if (!buf) {
-                               r600_texture_allocate_fmask(sscreen, rtex);
-                               r600_texture_allocate_cmask(sscreen, rtex);
-                               rtex->cmask_buffer = &rtex->resource;
-                       }
+               if (base->nr_samples > 1 &&
+                   !buf &&
+                   !(sscreen->debug_flags & DBG(NO_FMASK))) {
+                       r600_texture_allocate_fmask(sscreen, rtex);
+                       r600_texture_allocate_cmask(sscreen, rtex);
+                       rtex->cmask_buffer = &rtex->resource;
+
                        if (!rtex->fmask.size || !rtex->cmask.size) {
                                FREE(rtex);
                                return NULL;
@@ -1330,7 +1351,7 @@ r600_texture_create_object(struct pipe_screen *screen,
                fprintf(stderr, "VM start=0x%"PRIX64"  end=0x%"PRIX64" | Texture %ix%ix%i, %i levels, %i samples, %s\n",
                        rtex->resource.gpu_address,
                        rtex->resource.gpu_address + rtex->resource.buf->size,
-                       base->width0, base->height0, util_max_layer(base, 0)+1, base->last_level+1,
+                       base->width0, base->height0, util_num_layers(base, 0), base->last_level+1,
                        base->nr_samples ? base->nr_samples : 1, util_format_short_name(base->format));
        }
 
@@ -1600,10 +1621,10 @@ static bool r600_can_invalidate_texture(struct si_screen *sscreen,
                                                 box->depth);
 }
 
-static void r600_texture_invalidate_storage(struct r600_common_context *rctx,
+static void r600_texture_invalidate_storage(struct si_context *sctx,
                                            struct r600_texture *rtex)
 {
-       struct si_screen *sscreen = rctx->screen;
+       struct si_screen *sscreen = sctx->screen;
 
        /* There is no point in discarding depth and tiled buffers. */
        assert(!rtex->is_depth);
@@ -1618,7 +1639,7 @@ static void r600_texture_invalidate_storage(struct r600_common_context *rctx,
 
        p_atomic_inc(&sscreen->dirty_tex_counter);
 
-       rctx->num_alloc_tex_transfer_bytes += rtex->size;
+       sctx->b.num_alloc_tex_transfer_bytes += rtex->size;
 }
 
 static void *r600_texture_transfer_map(struct pipe_context *ctx,
@@ -1628,7 +1649,7 @@ static void *r600_texture_transfer_map(struct pipe_context *ctx,
                                       const struct pipe_box *box,
                                       struct pipe_transfer **ptransfer)
 {
-       struct r600_common_context *rctx = (struct r600_common_context*)ctx;
+       struct si_context *sctx = (struct si_context*)ctx;
        struct r600_texture *rtex = (struct r600_texture*)texture;
        struct r600_transfer *trans;
        struct r600_resource *buf;
@@ -1645,15 +1666,15 @@ static void *r600_texture_transfer_map(struct pipe_context *ctx,
                 * On dGPUs, the staging texture is always faster.
                 * Only count uploads that are at least 4x4 pixels large.
                 */
-               if (!rctx->screen->info.has_dedicated_vram &&
+               if (!sctx->screen->info.has_dedicated_vram &&
                    level == 0 &&
                    box->width >= 4 && box->height >= 4 &&
                    p_atomic_inc_return(&rtex->num_level0_transfers) == 10) {
                        bool can_invalidate =
-                               r600_can_invalidate_texture(rctx->screen, rtex,
+                               r600_can_invalidate_texture(sctx->screen, rtex,
                                                            usage, box);
 
-                       r600_reallocate_texture_inplace(rctx, rtex,
+                       r600_reallocate_texture_inplace(sctx, rtex,
                                                        PIPE_BIND_LINEAR,
                                                        can_invalidate);
                }
@@ -1674,14 +1695,14 @@ static void *r600_texture_transfer_map(struct pipe_context *ctx,
                                rtex->resource.domains & RADEON_DOMAIN_VRAM ||
                                rtex->resource.flags & RADEON_FLAG_GTT_WC;
                /* Write & linear only: */
-               else if (si_rings_is_buffer_referenced(rctx, rtex->resource.buf,
-                                                        RADEON_USAGE_READWRITE) ||
-                        !rctx->ws->buffer_wait(rtex->resource.buf, 0,
+               else if (si_rings_is_buffer_referenced(sctx, rtex->resource.buf,
+                                                      RADEON_USAGE_READWRITE) ||
+                        !sctx->b.ws->buffer_wait(rtex->resource.buf, 0,
                                                RADEON_USAGE_READWRITE)) {
                        /* It's busy. */
-                       if (r600_can_invalidate_texture(rctx->screen, rtex,
+                       if (r600_can_invalidate_texture(sctx->screen, rtex,
                                                        usage, box))
-                               r600_texture_invalidate_storage(rctx, rtex);
+                               r600_texture_invalidate_storage(sctx, rtex);
                        else
                                use_staging_texture = true;
                }
@@ -1728,13 +1749,13 @@ static void *r600_texture_transfer_map(struct pipe_context *ctx,
                                }
 
                                r600_copy_region_with_blit(ctx, temp, 0, 0, 0, 0, texture, level, box);
-                               rctx->blit_decompress_depth(ctx, (struct r600_texture*)temp, staging_depth,
-                                                           0, 0, 0, box->depth, 0, 0);
+                               si_blit_decompress_depth(ctx, (struct r600_texture*)temp, staging_depth,
+                                                        0, 0, 0, box->depth, 0, 0);
                                pipe_resource_reference(&temp, NULL);
                        }
 
                        /* Just get the strides. */
-                       r600_texture_get_offset(rctx->screen, staging_depth, level, NULL,
+                       r600_texture_get_offset(sctx->screen, staging_depth, level, NULL,
                                                &trans->b.b.stride,
                                                &trans->b.b.layer_stride);
                } else {
@@ -1746,12 +1767,12 @@ static void *r600_texture_transfer_map(struct pipe_context *ctx,
                                return NULL;
                        }
 
-                       rctx->blit_decompress_depth(ctx, rtex, staging_depth,
-                                                   level, level,
-                                                   box->z, box->z + box->depth - 1,
-                                                   0, 0);
+                       si_blit_decompress_depth(ctx, rtex, staging_depth,
+                                                level, level,
+                                                box->z, box->z + box->depth - 1,
+                                                0, 0);
 
-                       offset = r600_texture_get_offset(rctx->screen, staging_depth,
+                       offset = r600_texture_get_offset(sctx->screen, staging_depth,
                                                         level, box,
                                                         &trans->b.b.stride,
                                                         &trans->b.b.layer_stride);
@@ -1778,7 +1799,7 @@ static void *r600_texture_transfer_map(struct pipe_context *ctx,
                trans->staging = &staging->resource;
 
                /* Just get the strides. */
-               r600_texture_get_offset(rctx->screen, staging, 0, NULL,
+               r600_texture_get_offset(sctx->screen, staging, 0, NULL,
                                        &trans->b.b.stride,
                                        &trans->b.b.layer_stride);
 
@@ -1790,13 +1811,13 @@ static void *r600_texture_transfer_map(struct pipe_context *ctx,
                buf = trans->staging;
        } else {
                /* the resource is mapped directly */
-               offset = r600_texture_get_offset(rctx->screen, rtex, level, box,
+               offset = r600_texture_get_offset(sctx->screen, rtex, level, box,
                                                 &trans->b.b.stride,
                                                 &trans->b.b.layer_stride);
                buf = &rtex->resource;
        }
 
-       if (!(map = si_buffer_map_sync_with_rings(rctx, buf, usage))) {
+       if (!(map = si_buffer_map_sync_with_rings(sctx, buf, usage))) {
                r600_resource_reference(&trans->staging, NULL);
                FREE(trans);
                return NULL;
@@ -1809,7 +1830,7 @@ static void *r600_texture_transfer_map(struct pipe_context *ctx,
 static void r600_texture_transfer_unmap(struct pipe_context *ctx,
                                        struct pipe_transfer* transfer)
 {
-       struct r600_common_context *rctx = (struct r600_common_context*)ctx;
+       struct si_context *sctx = (struct si_context*)ctx;
        struct r600_transfer *rtransfer = (struct r600_transfer*)transfer;
        struct pipe_resource *texture = transfer->resource;
        struct r600_texture *rtex = (struct r600_texture*)texture;
@@ -1826,7 +1847,7 @@ static void r600_texture_transfer_unmap(struct pipe_context *ctx,
        }
 
        if (rtransfer->staging) {
-               rctx->num_alloc_tex_transfer_bytes += rtransfer->staging->buf->size;
+               sctx->b.num_alloc_tex_transfer_bytes += rtransfer->staging->buf->size;
                r600_resource_reference(&rtransfer->staging, NULL);
        }
 
@@ -1843,9 +1864,9 @@ static void r600_texture_transfer_unmap(struct pipe_context *ctx,
         *
         * The result is that the kernel memory manager is never a bottleneck.
         */
-       if (rctx->num_alloc_tex_transfer_bytes > rctx->screen->info.gart_size / 4) {
-               rctx->gfx.flush(rctx, PIPE_FLUSH_ASYNC, NULL);
-               rctx->num_alloc_tex_transfer_bytes = 0;
+       if (sctx->b.num_alloc_tex_transfer_bytes > sctx->screen->info.gart_size / 4) {
+               si_flush_gfx_cs(sctx, PIPE_FLUSH_ASYNC, NULL);
+               sctx->b.num_alloc_tex_transfer_bytes = 0;
        }
 
        pipe_resource_reference(&transfer->resource, NULL);
@@ -1864,15 +1885,12 @@ static const struct u_resource_vtbl r600_texture_vtbl =
 /* DCC channel type categories within which formats can be reinterpreted
  * while keeping the same DCC encoding. The swizzle must also match. */
 enum dcc_channel_type {
-       dcc_channel_float32,
-       dcc_channel_uint32,
-       dcc_channel_sint32,
-       dcc_channel_float16,
-       dcc_channel_uint16,
-       dcc_channel_sint16,
+       dcc_channel_float,
+       /* uint and sint can be merged if we never use TC-compatible DCC clear
+        * encoding with the clear value of 1. */
+       dcc_channel_uint,
+       dcc_channel_sint,
        dcc_channel_uint_10_10_10_2,
-       dcc_channel_uint8,
-       dcc_channel_sint8,
        dcc_channel_incompatible,
 };
 
@@ -1891,23 +1909,15 @@ vi_get_dcc_channel_type(const struct util_format_description *desc)
 
        switch (desc->channel[i].size) {
        case 32:
-               if (desc->channel[i].type == UTIL_FORMAT_TYPE_FLOAT)
-                       return dcc_channel_float32;
-               if (desc->channel[i].type == UTIL_FORMAT_TYPE_UNSIGNED)
-                       return dcc_channel_uint32;
-               return dcc_channel_sint32;
        case 16:
+       case 8:
                if (desc->channel[i].type == UTIL_FORMAT_TYPE_FLOAT)
-                       return dcc_channel_float16;
+                       return dcc_channel_float;
                if (desc->channel[i].type == UTIL_FORMAT_TYPE_UNSIGNED)
-                       return dcc_channel_uint16;
-               return dcc_channel_sint16;
+                       return dcc_channel_uint;
+               return dcc_channel_sint;
        case 10:
                return dcc_channel_uint_10_10_10_2;
-       case 8:
-               if (desc->channel[i].type == UTIL_FORMAT_TYPE_UNSIGNED)
-                       return dcc_channel_uint8;
-               return dcc_channel_sint8;
        default:
                return dcc_channel_incompatible;
        }
@@ -1957,7 +1967,7 @@ bool vi_dcc_formats_are_incompatible(struct pipe_resource *tex,
 
 /* This can't be merged with the above function, because
  * vi_dcc_formats_compatible should be called only when DCC is enabled. */
-void vi_disable_dcc_if_incompatible_format(struct r600_common_context *rctx,
+void vi_disable_dcc_if_incompatible_format(struct si_context *sctx,
                                           struct pipe_resource *tex,
                                           unsigned level,
                                           enum pipe_format view_format)
@@ -1965,8 +1975,8 @@ void vi_disable_dcc_if_incompatible_format(struct r600_common_context *rctx,
        struct r600_texture *rtex = (struct r600_texture *)tex;
 
        if (vi_dcc_formats_are_incompatible(tex, level, view_format))
-               if (!si_texture_disable_dcc(rctx, (struct r600_texture*)tex))
-                       rctx->decompress_dcc(&rctx->b, rtex);
+               if (!si_texture_disable_dcc(sctx, (struct r600_texture*)tex))
+                       si_decompress_dcc(&sctx->b.b, rtex);
 }
 
 struct pipe_surface *si_create_surface_custom(struct pipe_context *pipe,
@@ -2108,49 +2118,49 @@ unsigned si_translate_colorswap(enum pipe_format format, bool do_endian_swap)
 
 /* PIPELINE_STAT-BASED DCC ENABLEMENT FOR DISPLAYABLE SURFACES */
 
-static void vi_dcc_clean_up_context_slot(struct r600_common_context *rctx,
+static void vi_dcc_clean_up_context_slot(struct si_context *sctx,
                                         int slot)
 {
        int i;
 
-       if (rctx->dcc_stats[slot].query_active)
-               vi_separate_dcc_stop_query(&rctx->b,
-                                          rctx->dcc_stats[slot].tex);
+       if (sctx->b.dcc_stats[slot].query_active)
+               vi_separate_dcc_stop_query(&sctx->b.b,
+                                          sctx->b.dcc_stats[slot].tex);
 
-       for (i = 0; i < ARRAY_SIZE(rctx->dcc_stats[slot].ps_stats); i++)
-               if (rctx->dcc_stats[slot].ps_stats[i]) {
-                       rctx->b.destroy_query(&rctx->b,
-                                             rctx->dcc_stats[slot].ps_stats[i]);
-                       rctx->dcc_stats[slot].ps_stats[i] = NULL;
+       for (i = 0; i < ARRAY_SIZE(sctx->b.dcc_stats[slot].ps_stats); i++)
+               if (sctx->b.dcc_stats[slot].ps_stats[i]) {
+                       sctx->b.b.destroy_query(&sctx->b.b,
+                                             sctx->b.dcc_stats[slot].ps_stats[i]);
+                       sctx->b.dcc_stats[slot].ps_stats[i] = NULL;
                }
 
-       r600_texture_reference(&rctx->dcc_stats[slot].tex, NULL);
+       r600_texture_reference(&sctx->b.dcc_stats[slot].tex, NULL);
 }
 
 /**
  * Return the per-context slot where DCC statistics queries for the texture live.
  */
-static unsigned vi_get_context_dcc_stats_index(struct r600_common_context *rctx,
+static unsigned vi_get_context_dcc_stats_index(struct si_context *sctx,
                                               struct r600_texture *tex)
 {
        int i, empty_slot = -1;
 
        /* Remove zombie textures (textures kept alive by this array only). */
-       for (i = 0; i < ARRAY_SIZE(rctx->dcc_stats); i++)
-               if (rctx->dcc_stats[i].tex &&
-                   rctx->dcc_stats[i].tex->resource.b.b.reference.count == 1)
-                       vi_dcc_clean_up_context_slot(rctx, i);
+       for (i = 0; i < ARRAY_SIZE(sctx->b.dcc_stats); i++)
+               if (sctx->b.dcc_stats[i].tex &&
+                   sctx->b.dcc_stats[i].tex->resource.b.b.reference.count == 1)
+                       vi_dcc_clean_up_context_slot(sctx, i);
 
        /* Find the texture. */
-       for (i = 0; i < ARRAY_SIZE(rctx->dcc_stats); i++) {
+       for (i = 0; i < ARRAY_SIZE(sctx->b.dcc_stats); i++) {
                /* Return if found. */
-               if (rctx->dcc_stats[i].tex == tex) {
-                       rctx->dcc_stats[i].last_use_timestamp = os_time_get();
+               if (sctx->b.dcc_stats[i].tex == tex) {
+                       sctx->b.dcc_stats[i].last_use_timestamp = os_time_get();
                        return i;
                }
 
                /* Record the first seen empty slot. */
-               if (empty_slot == -1 && !rctx->dcc_stats[i].tex)
+               if (empty_slot == -1 && !sctx->b.dcc_stats[i].tex)
                        empty_slot = i;
        }
 
@@ -2159,19 +2169,19 @@ static unsigned vi_get_context_dcc_stats_index(struct r600_common_context *rctx,
                int oldest_slot = 0;
 
                /* Find the oldest slot. */
-               for (i = 1; i < ARRAY_SIZE(rctx->dcc_stats); i++)
-                       if (rctx->dcc_stats[oldest_slot].last_use_timestamp >
-                           rctx->dcc_stats[i].last_use_timestamp)
+               for (i = 1; i < ARRAY_SIZE(sctx->b.dcc_stats); i++)
+                       if (sctx->b.dcc_stats[oldest_slot].last_use_timestamp >
+                           sctx->b.dcc_stats[i].last_use_timestamp)
                                oldest_slot = i;
 
                /* Clean up the oldest slot. */
-               vi_dcc_clean_up_context_slot(rctx, oldest_slot);
+               vi_dcc_clean_up_context_slot(sctx, oldest_slot);
                empty_slot = oldest_slot;
        }
 
        /* Add the texture to the new slot. */
-       r600_texture_reference(&rctx->dcc_stats[empty_slot].tex, tex);
-       rctx->dcc_stats[empty_slot].last_use_timestamp = os_time_get();
+       r600_texture_reference(&sctx->b.dcc_stats[empty_slot].tex, tex);
+       sctx->b.dcc_stats[empty_slot].last_use_timestamp = os_time_get();
        return empty_slot;
 }
 
@@ -2191,17 +2201,17 @@ vi_create_resuming_pipestats_query(struct pipe_context *ctx)
 void vi_separate_dcc_start_query(struct pipe_context *ctx,
                                 struct r600_texture *tex)
 {
-       struct r600_common_context *rctx = (struct r600_common_context*)ctx;
-       unsigned i = vi_get_context_dcc_stats_index(rctx, tex);
+       struct si_context *sctx = (struct si_context*)ctx;
+       unsigned i = vi_get_context_dcc_stats_index(sctx, tex);
 
-       assert(!rctx->dcc_stats[i].query_active);
+       assert(!sctx->b.dcc_stats[i].query_active);
 
-       if (!rctx->dcc_stats[i].ps_stats[0])
-               rctx->dcc_stats[i].ps_stats[0] = vi_create_resuming_pipestats_query(ctx);
+       if (!sctx->b.dcc_stats[i].ps_stats[0])
+               sctx->b.dcc_stats[i].ps_stats[0] = vi_create_resuming_pipestats_query(ctx);
 
        /* begin or resume the query */
-       ctx->begin_query(ctx, rctx->dcc_stats[i].ps_stats[0]);
-       rctx->dcc_stats[i].query_active = true;
+       ctx->begin_query(ctx, sctx->b.dcc_stats[i].ps_stats[0]);
+       sctx->b.dcc_stats[i].query_active = true;
 }
 
 /**
@@ -2210,15 +2220,15 @@ void vi_separate_dcc_start_query(struct pipe_context *ctx,
 void vi_separate_dcc_stop_query(struct pipe_context *ctx,
                                struct r600_texture *tex)
 {
-       struct r600_common_context *rctx = (struct r600_common_context*)ctx;
-       unsigned i = vi_get_context_dcc_stats_index(rctx, tex);
+       struct si_context *sctx = (struct si_context*)ctx;
+       unsigned i = vi_get_context_dcc_stats_index(sctx, tex);
 
-       assert(rctx->dcc_stats[i].query_active);
-       assert(rctx->dcc_stats[i].ps_stats[0]);
+       assert(sctx->b.dcc_stats[i].query_active);
+       assert(sctx->b.dcc_stats[i].ps_stats[0]);
 
        /* pause or end the query */
-       ctx->end_query(ctx, rctx->dcc_stats[i].ps_stats[0]);
-       rctx->dcc_stats[i].query_active = false;
+       ctx->end_query(ctx, sctx->b.dcc_stats[i].ps_stats[0]);
+       sctx->b.dcc_stats[i].query_active = false;
 }
 
 static bool vi_should_enable_separate_dcc(struct r600_texture *tex)
@@ -2229,7 +2239,7 @@ static bool vi_should_enable_separate_dcc(struct r600_texture *tex)
 }
 
 /* Called by fast clear. */
-void vi_separate_dcc_try_enable(struct r600_common_context *rctx,
+void vi_separate_dcc_try_enable(struct si_context *sctx,
                                struct r600_texture *tex)
 {
        /* The intent is to use this with shared displayable back buffers,
@@ -2248,7 +2258,7 @@ void vi_separate_dcc_try_enable(struct r600_common_context *rctx,
        /* Enable the DCC stat gathering. */
        if (!tex->dcc_gather_statistics) {
                tex->dcc_gather_statistics = true;
-               vi_separate_dcc_start_query(&rctx->b, tex);
+               vi_separate_dcc_start_query(&sctx->b.b, tex);
        }
 
        if (!vi_should_enable_separate_dcc(tex))
@@ -2257,7 +2267,7 @@ void vi_separate_dcc_try_enable(struct r600_common_context *rctx,
        assert(tex->surface.num_dcc_levels);
        assert(!tex->dcc_separate_buffer);
 
-       r600_texture_discard_cmask(rctx->screen, tex);
+       si_texture_discard_cmask(sctx->screen, tex);
 
        /* Get a DCC buffer. */
        if (tex->last_dcc_separate_buffer) {
@@ -2267,7 +2277,7 @@ void vi_separate_dcc_try_enable(struct r600_common_context *rctx,
                tex->last_dcc_separate_buffer = NULL;
        } else {
                tex->dcc_separate_buffer = (struct r600_resource*)
-                       si_aligned_buffer_create(rctx->b.screen,
+                       si_aligned_buffer_create(sctx->b.b.screen,
                                                   R600_RESOURCE_FLAG_UNMAPPABLE,
                                                   PIPE_USAGE_DEFAULT,
                                                   tex->surface.dcc_size,
@@ -2291,27 +2301,27 @@ void vi_separate_dcc_try_enable(struct r600_common_context *rctx,
 void vi_separate_dcc_process_and_reset_stats(struct pipe_context *ctx,
                                             struct r600_texture *tex)
 {
-       struct r600_common_context *rctx = (struct r600_common_context*)ctx;
+       struct si_context *sctx = (struct si_context*)ctx;
        struct pipe_query *tmp;
-       unsigned i = vi_get_context_dcc_stats_index(rctx, tex);
-       bool query_active = rctx->dcc_stats[i].query_active;
+       unsigned i = vi_get_context_dcc_stats_index(sctx, tex);
+       bool query_active = sctx->b.dcc_stats[i].query_active;
        bool disable = false;
 
-       if (rctx->dcc_stats[i].ps_stats[2]) {
+       if (sctx->b.dcc_stats[i].ps_stats[2]) {
                union pipe_query_result result;
 
                /* Read the results. */
-               ctx->get_query_result(ctx, rctx->dcc_stats[i].ps_stats[2],
+               ctx->get_query_result(ctx, sctx->b.dcc_stats[i].ps_stats[2],
                                      true, &result);
-               si_query_hw_reset_buffers(rctx,
-                                           (struct r600_query_hw*)
-                                           rctx->dcc_stats[i].ps_stats[2]);
+               si_query_hw_reset_buffers(sctx,
+                                         (struct r600_query_hw*)
+                                         sctx->b.dcc_stats[i].ps_stats[2]);
 
                /* Compute the approximate number of fullscreen draws. */
                tex->ps_draw_ratio =
                        result.pipeline_statistics.ps_invocations /
                        (tex->resource.b.b.width0 * tex->resource.b.b.height0);
-               rctx->last_tex_ps_draw_ratio = tex->ps_draw_ratio;
+               sctx->b.last_tex_ps_draw_ratio = tex->ps_draw_ratio;
 
                disable = tex->dcc_separate_buffer &&
                          !vi_should_enable_separate_dcc(tex);
@@ -2324,10 +2334,10 @@ void vi_separate_dcc_process_and_reset_stats(struct pipe_context *ctx,
                vi_separate_dcc_stop_query(ctx, tex);
 
        /* Move the queries in the queue by one. */
-       tmp = rctx->dcc_stats[i].ps_stats[2];
-       rctx->dcc_stats[i].ps_stats[2] = rctx->dcc_stats[i].ps_stats[1];
-       rctx->dcc_stats[i].ps_stats[1] = rctx->dcc_stats[i].ps_stats[0];
-       rctx->dcc_stats[i].ps_stats[0] = tmp;
+       tmp = sctx->b.dcc_stats[i].ps_stats[2];
+       sctx->b.dcc_stats[i].ps_stats[2] = sctx->b.dcc_stats[i].ps_stats[1];
+       sctx->b.dcc_stats[i].ps_stats[1] = sctx->b.dcc_stats[i].ps_stats[0];
+       sctx->b.dcc_stats[i].ps_stats[0] = tmp;
 
        /* create and start a new query as ps_stats[0] */
        if (query_active)
@@ -2485,8 +2495,8 @@ void si_init_screen_texture_functions(struct si_screen *sscreen)
        sscreen->b.check_resource_capability = si_check_resource_capability;
 }
 
-void si_init_context_texture_functions(struct r600_common_context *rctx)
+void si_init_context_texture_functions(struct si_context *sctx)
 {
-       rctx->b.create_surface = r600_create_surface;
-       rctx->b.surface_destroy = r600_surface_destroy;
+       sctx->b.b.create_surface = r600_create_surface;
+       sctx->b.b.surface_destroy = r600_surface_destroy;
 }