r600g: Pass conservative depth parameters to hw
author Glenn Kennard <glenn.kennard@gmail.com>
Sat, 17 Oct 2015 14:53:28 +0000 (16:53 +0200)
committer Dave Airlie <airlied@redhat.com>
Tue, 10 Nov 2015 23:06:25 +0000 (09:06 +1000)
Supported on R700 and up.

Signed-off-by: Glenn Kennard <glenn.kennard@gmail.com>
Reviewed-by: Marek Olšák <marek.olsak@amd.com>
Signed-off-by: Dave Airlie <airlied@redhat.com>
src/gallium/drivers/r600/evergreen_state.c
src/gallium/drivers/r600/evergreend.h
src/gallium/drivers/r600/r600_pipe.h
src/gallium/drivers/r600/r600_shader.c
src/gallium/drivers/r600/r600_shader.h
src/gallium/drivers/r600/r600_state.c
src/gallium/drivers/r600/r600d.h

index 60747d1c89b828d31b116e5c0773457b2155cf9f..30e902673d0abe04161c2ab54c6fed79b7ad2f41 100644 (file)
@@ -2951,6 +2951,19 @@ void evergreen_update_ps_state(struct pipe_context *ctx, struct r600_pipe_shader
        db_shader_control |= S_02880C_STENCIL_EXPORT_ENABLE(stencil_export);
        db_shader_control |= S_02880C_MASK_EXPORT_ENABLE(mask_export);
 
+       switch (rshader->ps_conservative_z) {
+       default: /* fall through */
+       case TGSI_FS_DEPTH_LAYOUT_ANY:
+               db_shader_control |= S_02880C_CONSERVATIVE_Z_EXPORT(V_02880C_EXPORT_ANY_Z);
+               break;
+       case TGSI_FS_DEPTH_LAYOUT_GREATER:
+               db_shader_control |= S_02880C_CONSERVATIVE_Z_EXPORT(V_02880C_EXPORT_GREATER_THAN_Z);
+               break;
+       case TGSI_FS_DEPTH_LAYOUT_LESS:
+               db_shader_control |= S_02880C_CONSERVATIVE_Z_EXPORT(V_02880C_EXPORT_LESS_THAN_Z);
+               break;
+       }
+
        exports_ps = 0;
        for (i = 0; i < rshader->noutput; i++) {
                if (rshader->output[i].name == TGSI_SEMANTIC_POSITION ||
index 937ffcbddb90aae74a6df87c3961c6443f75a2ed..a9a65f753054c8f56d8d456d88b2ca862064363c 100644 (file)
 #define     V_02880C_EXPORT_DB_FOUR16                  0x01
 #define     V_02880C_EXPORT_DB_TWO                     0x02
 #define   S_02880C_ALPHA_TO_MASK_DISABLE(x)            (((x) & 0x1) << 12)
+#define   S_02880C_CONSERVATIVE_Z_EXPORT(x)            (((x) & 0x03) << 16)
+#define   G_02880C_CONSERVATIVE_Z_EXPORT(x)            (((x) >> 16) & 0x03)
+#define   C_02880C_CONSERVATIVE_Z_EXPORT               0xFFFCFFFF
+#define     V_02880C_EXPORT_ANY_Z                      0
+#define     V_02880C_EXPORT_LESS_THAN_Z                1
+#define     V_02880C_EXPORT_GREATER_THAN_Z             2
+#define     V_02880C_EXPORT_RESERVED                   3
 
 #define R_028A00_PA_SU_POINT_SIZE                    0x028A00
 #define   S_028A00_HEIGHT(x)                           (((x) & 0xFFFF) << 0)
index 520b03f605da83b17b0ace2b8a6fbfac5940e12c..950bb6be76ceae9c83642b05ec8064553b326e7e 100644 (file)
@@ -116,6 +116,7 @@ struct r600_db_misc_state {
        unsigned                        log_samples;
        unsigned                        db_shader_control;
        bool                            htile_clear;
+       uint8_t                         ps_conservative_z;
 };
 
 struct r600_cb_misc_state {
index fc6335ae8bcbc83556d857f2cafb4fd5a00a3568..560197c82b5497101905d0b85e2c46c6907de0ba 100644 (file)
@@ -2044,6 +2044,7 @@ static int r600_shader_from_tgsi(struct r600_context *rctx,
 
        shader->fs_write_all = ctx.info.properties[TGSI_PROPERTY_FS_COLOR0_WRITES_ALL_CBUFS];
        shader->vs_position_window_space = ctx.info.properties[TGSI_PROPERTY_VS_WINDOW_SPACE_POSITION];
+       shader->ps_conservative_z = (uint8_t)ctx.info.properties[TGSI_PROPERTY_FS_DEPTH_LAYOUT];
 
        if (shader->vs_as_gs_a)
                vs_add_primid_output(&ctx, key.vs.prim_id_out);
index c240e7110c175900fa055a4dcce83b923fa3161f..2040f732bf5e5bfe3f8132bcc3b9ae7b9b7a5afb 100644 (file)
@@ -76,6 +76,8 @@ struct r600_shader {
        boolean                 uses_tex_buffers;
        boolean                 gs_prim_id_input;
 
+       uint8_t                 ps_conservative_z;
+
        /* Size in bytes of a data item in the ring(s) (single vertex data).
           Stages with only one ring items 123 will be set to 0. */
        unsigned                ring_item_sizes[4];
index 1be3e1b4de50d888052a893d58dd76d2f3d2cb5e..1305efa56600b49dec1cd8d52f05870a0d65721f 100644 (file)
@@ -1628,6 +1628,21 @@ static void r600_emit_db_misc_state(struct r600_context *rctx, struct r600_atom
                S_028D10_FORCE_HIS_ENABLE0(V_028D10_FORCE_DISABLE) |
                S_028D10_FORCE_HIS_ENABLE1(V_028D10_FORCE_DISABLE);
 
+       if (rctx->b.chip_class >= R700) {
+               switch (a->ps_conservative_z) {
+               default: /* fall through */
+               case TGSI_FS_DEPTH_LAYOUT_ANY:
+                       db_render_control |= S_028D0C_CONSERVATIVE_Z_EXPORT(V_028D0C_EXPORT_ANY_Z);
+                       break;
+               case TGSI_FS_DEPTH_LAYOUT_GREATER:
+                       db_render_control |= S_028D0C_CONSERVATIVE_Z_EXPORT(V_028D0C_EXPORT_GREATER_THAN_Z);
+                       break;
+               case TGSI_FS_DEPTH_LAYOUT_LESS:
+                       db_render_control |= S_028D0C_CONSERVATIVE_Z_EXPORT(V_028D0C_EXPORT_LESS_THAN_Z);
+                       break;
+               }
+       }
+
        if (a->occlusion_query_enabled) {
                if (rctx->b.chip_class >= R700) {
                        db_render_control |= S_028D0C_R700_PERFECT_ZPASS_COUNTS(1);
@@ -2787,6 +2802,7 @@ void r600_update_db_shader_control(struct r600_context * rctx)
 {
        bool dual_export;
        unsigned db_shader_control;
+       uint8_t ps_conservative_z;
 
        if (!rctx->ps_shader) {
                return;
@@ -2798,6 +2814,8 @@ void r600_update_db_shader_control(struct r600_context * rctx)
        db_shader_control = rctx->ps_shader->current->db_shader_control |
                            S_02880C_DUAL_EXPORT_ENABLE(dual_export);
 
+       ps_conservative_z = rctx->ps_shader->current->shader.ps_conservative_z;
+
        /* When alpha test is enabled we can't trust the hw to make the proper
         * decision on the order in which ztest should be run related to fragment
         * shader execution.
@@ -2811,8 +2829,10 @@ void r600_update_db_shader_control(struct r600_context * rctx)
                db_shader_control |= S_02880C_Z_ORDER(V_02880C_EARLY_Z_THEN_LATE_Z);
        }
 
-       if (db_shader_control != rctx->db_misc_state.db_shader_control) {
+       if (db_shader_control != rctx->db_misc_state.db_shader_control ||
+               ps_conservative_z != rctx->db_misc_state.ps_conservative_z) {
                rctx->db_misc_state.db_shader_control = db_shader_control;
+               rctx->db_misc_state.ps_conservative_z = ps_conservative_z;
                r600_mark_atom_dirty(rctx, &rctx->db_misc_state.atom);
        }
 }
index 6bba88cb57422bbebfd9d83fba165e9b63d42a24..53f5ad6db6a8107a4f651667d4fde3738ec17119 100644 (file)
 #define   S_028D0C_COPY_CENTROID(x)                    (((x) & 0x1) << 7)
 #define   S_028D0C_COPY_SAMPLE(x)                      (((x) & 0x1) << 8)
 #define   S_028D0C_R700_PERFECT_ZPASS_COUNTS(x)        (((x) & 0x1) << 15)
+#define   S_028D0C_CONSERVATIVE_Z_EXPORT(x)            (((x) & 0x03) << 13)
+#define   G_028D0C_CONSERVATIVE_Z_EXPORT(x)            (((x) >> 13) & 0x03)
+#define   C_028D0C_CONSERVATIVE_Z_EXPORT               0xFFFF9FFF
+#define     V_028D0C_EXPORT_ANY_Z                      0
+#define     V_028D0C_EXPORT_LESS_THAN_Z                1
+#define     V_028D0C_EXPORT_GREATER_THAN_Z             2
+#define     V_028D0C_EXPORT_RESERVED                   3
+
 #define R_028D10_DB_RENDER_OVERRIDE                  0x028D10
 #define   V_028D10_FORCE_OFF                         0
 #define   V_028D10_FORCE_ENABLE                      1