When there's only one hardware thread (i.e. the dispatch width is
greater than or equal to the workgroup size), there's no need to use a
barrier to ensure all the invocations reach the same point in the
shader, because they already run in lock-step.
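For reference, a minimal sketch of what the workgroup_size() helper
used in the diff below is assumed to compute: the total number of
invocations in the workgroup, i.e. the product of the three local
sizes. The exact shape and field names (brw_cs_prog_data::local_size)
are assumptions about the backend, not part of this patch:

    /* Assumed shape of the helper: total invocations per workgroup. */
    unsigned
    fs_visitor::workgroup_size() const
    {
       assert(stage == MESA_SHADER_COMPUTE);
       const struct brw_cs_prog_data *cs = brw_cs_prog_data(prog_data);
       /* e.g. local_size = {8, 2, 1} -> 16 invocations, which fits in
        * a single SIMD16 or SIMD32 hardware thread.
        */
       return cs->local_size[0] * cs->local_size[1] * cs->local_size[2];
    }

With that, the condition workgroup_size() <= dispatch_width is exactly
"the whole workgroup fits in one HW thread".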
Results for SKL running Iris, for the shader-db tests that contain
compute shaders:
total sends in shared programs: 18361 -> 18339 (-0.12%)
sends in affected programs: 904 -> 882 (-2.43%)
helped: 9
HURT: 0
helped stats (abs) min: 1 max: 5 x̄: 2.44 x̃: 2
helped stats (rel) min: 0.84% max: 21.43% x̄: 7.82% x̃: 2.67%
95% mean confidence interval for sends value: -3.31 -1.58
95% mean confidence interval for sends %-change: -14.67% -0.97%
Sends are helped.
Shaders from Aztec Ruins, Car Chase, Manhattan and DeusEx are helped.
Results for ICL and TGL are similar to SKL.
Results for BDW are similar to SKL, except for a DeusEx shader that
has a workgroup size of 16 but picks SIMD8 on BDW; since 16 > 8, the
workgroup still spans more than one hardware thread there, so the
barrier cannot be elided.
Reviewed-by: Francisco Jerez <currojerez@riseup.net>
Tested-by: Marge Bot <https://gitlab.freedesktop.org/mesa/mesa/merge_requests/3226>
Part-of: <https://gitlab.freedesktop.org/mesa/mesa/merge_requests/3226>
switch (instr->intrinsic) {
case nir_intrinsic_control_barrier:
+ /* The whole workgroup fits in a single HW thread, so all the
+ * invocations are already executed in lock-step. Instead of an
+ * actual barrier, just emit a scheduling fence, which will
+ * generate no code.
+ */
+ if (workgroup_size() <= dispatch_width) {
+ bld.exec_all().group(1, 0).emit(FS_OPCODE_SCHEDULING_FENCE);
+ break;
+ }
+
emit_barrier();
cs_prog_data->uses_barrier = true;
break;
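Note on the design choice: FS_OPCODE_SCHEDULING_FENCE is a
compiler-internal pseudo-instruction, so (as the comment above says) it
generates no machine code; presumably its only effect is to keep the
instruction scheduler from reordering memory operations across the
point where the control barrier would have been.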