radeonsi: don't use the real barrier instruction in tess ctrl shaders
author Marek Olšák <marek.olsak@amd.com>
Wed, 6 Apr 2016 22:49:32 +0000 (00:49 +0200)
committer Marek Olšák <marek.olsak@amd.com>
Thu, 7 Apr 2016 11:58:01 +0000 (13:58 +0200)
Reviewed-by: Bas Nieuwenhuizen <bas@basnieuwenhuizen.nl>
Reviewed-by: Nicolai Hähnle <nicolai.haehnle@amd.com>
src/gallium/drivers/radeonsi/si_shader.c

index bf3f00867e94fc70e415a89c7b97675349ffec70..08da3e37550e4e583d936069cd08dfc1b43bc0ce 100644 (file)
@@ -4282,6 +4282,14 @@ static void si_llvm_emit_barrier(const struct lp_build_tgsi_action *action,
        struct si_shader_context *ctx = si_shader_context(bld_base);
        struct gallivm_state *gallivm = bld_base->base.gallivm;
 
+       /* The real barrier instruction isn't needed, because an entire patch
+        * always fits into a single wave.
+        */
+       if (ctx->type == TGSI_PROCESSOR_TESS_CTRL) {
+               emit_optimization_barrier(ctx);
+               return;
+       }
+
        lp_build_intrinsic(gallivm->builder,
                           HAVE_LLVM >= 0x0309 ? "llvm.amdgcn.s.barrier"
                                               : "llvm.AMDGPU.barrier.local",