radeonsi: enable TC-compatible stencil compression on VI
authorMarek Olšák <marek.olsak@amd.com>
Mon, 5 Jun 2017 17:51:38 +0000 (19:51 +0200)
committerMarek Olšák <marek.olsak@amd.com>
Wed, 7 Jun 2017 17:38:39 +0000 (19:38 +0200)
Most things are in place. Ideally we won't see decompress blits for stencil
anymore.

Reviewed-by: Nicolai Hähnle <nicolai.haehnle@amd.com>
src/gallium/drivers/radeonsi/si_blit.c
src/gallium/drivers/radeonsi/si_descriptors.c
src/gallium/drivers/radeonsi/si_state_draw.c

index f5d9048d8c911242102c403d118fbe9c9d5ea07d..500c5bfcf7cc6132f40030784bb26a6419439829 100644 (file)
@@ -332,6 +332,8 @@ si_flush_depth_texture(struct si_context *sctx,
        }
 
        assert(!tex->tc_compatible_htile || levels_z == 0);
+       assert(!tex->tc_compatible_htile || levels_s == 0 ||
+              !r600_can_sample_zs(tex, true));
 
        /* We may have to allocate the flushed texture here when called from
         * si_decompress_subresource.
index 61eb2f10be2baabaafa68fd7bd4ab4b79e888e40..7a2b71df6b51aef3bc13a4041ec82d6de922c8c5 100644 (file)
@@ -339,8 +339,7 @@ static void si_sampler_view_add_buffer(struct si_context *sctx,
        }
 
        if (rtex->htile_buffer &&
-           rtex->tc_compatible_htile &&
-           !is_stencil_sampler) {
+           rtex->tc_compatible_htile) {
                radeon_add_to_buffer_list_check_mem(&sctx->b, &sctx->b.gfx,
                                                    rtex->htile_buffer, usage,
                                                    RADEON_PRIO_HTILE, check_mem);
@@ -424,7 +423,7 @@ void si_set_mutable_tex_desc_fields(struct si_screen *sscreen,
 
                        if (sscreen->b.chip_class <= VI)
                                meta_va += base_level_info->dcc_offset;
-               } else if (tex->tc_compatible_htile && !is_stencil) {
+               } else if (tex->tc_compatible_htile) {
                        meta_va = tex->htile_buffer->gpu_address;
                }
 
@@ -571,7 +570,8 @@ static bool depth_needs_decompression(struct r600_texture *rtex,
                                      struct si_sampler_view *sview)
 {
        return rtex->db_compatible &&
-              (!rtex->tc_compatible_htile || sview->is_stencil_sampler);
+              (!rtex->tc_compatible_htile ||
+               !r600_can_sample_zs(rtex, sview->is_stencil_sampler));
 }
 
 static void si_update_compressed_tex_shader_mask(struct si_context *sctx,
index 77df64397f9df8567b344f811b6cbdd29cb62603..cd069e31a642150af8836e3f750c0dbb937c6017 100644 (file)
@@ -1398,7 +1398,8 @@ void si_draw_vbo(struct pipe_context *ctx, const struct pipe_draw_info *info)
                        if (!rtex->tc_compatible_htile)
                                rtex->dirty_level_mask |= 1 << surf->u.tex.level;
 
-                       if (rtex->surface.flags & RADEON_SURF_SBUFFER)
+                       if (rtex->surface.flags & RADEON_SURF_SBUFFER &&
+                           (!rtex->tc_compatible_htile || !rtex->can_sample_s))
                                rtex->stencil_dirty_level_mask |= 1 << surf->u.tex.level;
                }
                if (sctx->framebuffer.compressed_cb_mask) {