radv/gfx10: implement a bug workaround for NGG -> legacy transitions
authorSamuel Pitoiset <samuel.pitoiset@gmail.com>
Wed, 31 Jul 2019 07:39:19 +0000 (09:39 +0200)
committerSamuel Pitoiset <samuel.pitoiset@gmail.com>
Wed, 31 Jul 2019 10:14:29 +0000 (12:14 +0200)
Signed-off-by: Samuel Pitoiset <samuel.pitoiset@gmail.com>
Reviewed-by: Bas Nieuwenhuizen <bas@basnieuwenhuizen.nl>
src/amd/vulkan/radv_cmd_buffer.c
src/amd/vulkan/si_cmd_buffer.c

index bd5d30ad7a28f63fb0ca8b280caf2bbe5dabb6d9..da373d39fdd30c8c6b7ce4cfcb5cbfacdc717dc5 100644 (file)
@@ -3626,6 +3626,20 @@ void radv_CmdBindPipeline(
                /* Prefetch all pipeline shaders at first draw time. */
                cmd_buffer->state.prefetch_L2_mask |= RADV_PREFETCH_SHADERS;
 
+               if ((cmd_buffer->device->physical_device->rad_info.family == CHIP_NAVI10 ||
+                    cmd_buffer->device->physical_device->rad_info.family == CHIP_NAVI12 ||
+                    cmd_buffer->device->physical_device->rad_info.family == CHIP_NAVI14) &&
+                   cmd_buffer->state.emitted_pipeline &&
+                   radv_pipeline_has_ngg(cmd_buffer->state.emitted_pipeline) &&
+                   !radv_pipeline_has_ngg(cmd_buffer->state.pipeline)) {
+                       /* Transitioning from NGG to legacy GS requires
+                        * VGT_FLUSH on Navi10-14.  VGT_FLUSH is also emitted
+                        * at the beginning of IBs when legacy GS ring pointers
+                        * are set.
+                        */
+                       cmd_buffer->state.flush_bits |= RADV_CMD_FLAG_VGT_FLUSH;
+               }
+
                radv_bind_dynamic_state(cmd_buffer, &pipeline->dynamic_state);
                radv_bind_streamout_state(cmd_buffer, pipeline);
 
index 94f759139ee54340a8f49cdb42abf773d182c4c6..18b2236e54b0e9ad648f23c276e3a3f3578a9bfc 100644 (file)
@@ -878,8 +878,7 @@ gfx10_cs_emit_cache_flush(struct radeon_cmdbuf *cs,
        unsigned cb_db_event = 0;
 
        /* We don't need these. */
-       assert(!(flush_bits & (RADV_CMD_FLAG_VGT_FLUSH |
-                              RADV_CMD_FLAG_VGT_STREAMOUT_SYNC)));
+       assert(!(flush_bits & (RADV_CMD_FLAG_VGT_STREAMOUT_SYNC)));
 
        if (flush_bits & RADV_CMD_FLAG_INV_ICACHE)
                gcr_cntl |= S_586_GLI_INV(V_586_GLI_ALL);
@@ -998,6 +997,12 @@ gfx10_cs_emit_cache_flush(struct radeon_cmdbuf *cs,
                                 *flush_cnt, 0xffffffff);
        }
 
+       /* VGT state sync */
+       if (flush_bits & RADV_CMD_FLAG_VGT_FLUSH) {
+               radeon_emit(cs, PKT3(PKT3_EVENT_WRITE, 0, 0));
+               radeon_emit(cs, EVENT_TYPE(V_028A90_VGT_FLUSH) | EVENT_INDEX(0));
+       }
+
        /* Ignore fields that only modify the behavior of other fields. */
        if (gcr_cntl & C_586_GL1_RANGE & C_586_GL2_RANGE & C_586_SEQ) {
                /* Flush caches and wait for the caches to assert idle.