intel/fs: Remove min_dispatch_width from fs_visitor

author Jason Ekstrand <jason.ekstrand@intel.com>

Tue, 22 Aug 2017 02:16:45 +0000 (19:16 -0700)

committer Jason Ekstrand <jason.ekstrand@intel.com>

Tue, 7 Nov 2017 18:37:52 +0000 (10:37 -0800)
author Jason Ekstrand <jason.ekstrand@intel.com>
Tue, 22 Aug 2017 02:16:45 +0000 (19:16 -0700)
committer Jason Ekstrand <jason.ekstrand@intel.com>
Tue, 7 Nov 2017 18:37:52 +0000 (10:37 -0800)
diff --git a/src/intel/compiler/brw_fs.cpp b/src/intel/compiler/brw_fs.cpp

index 71fd8bf2f0663a0e784b1b6325208ca15bdc7b32..7782b23ff71d4e9983d8f885ae75c0df1083151f 100644 (file)
--- a/src/intel/compiler/brw_fs.cpp
+++ b/src/intel/compiler/brw_fs.cpp
@@ -5912,7 +5912,7 @@ fs_visitor::fixup_3src_null_dest()
  }
  
  void
-fs_visitor::allocate_registers(bool allow_spilling)
+fs_visitor::allocate_registers(unsigned min_dispatch_width, bool allow_spilling)
  {
     bool allocated_without_spills;
  
@@ -6047,7 +6047,7 @@ fs_visitor::run_vs()
     assign_vs_urb_setup();
  
     fixup_3src_null_dest();
-   allocate_registers(true);
+   allocate_registers(8, true);
  
     return !failed;
  }
@@ -6127,7 +6127,7 @@ fs_visitor::run_tcs_single_patch()
     assign_tcs_single_patch_urb_setup();
  
     fixup_3src_null_dest();
-   allocate_registers(true);
+   allocate_registers(8, true);
  
     return !failed;
  }
@@ -6161,7 +6161,7 @@ fs_visitor::run_tes()
     assign_tes_urb_setup();
  
     fixup_3src_null_dest();
-   allocate_registers(true);
+   allocate_registers(8, true);
  
     return !failed;
  }
@@ -6210,7 +6210,7 @@ fs_visitor::run_gs()
     assign_gs_urb_setup();
  
     fixup_3src_null_dest();
-   allocate_registers(true);
+   allocate_registers(8, true);
  
     return !failed;
  }
@@ -6310,7 +6310,7 @@ fs_visitor::run_fs(bool allow_spilling, bool do_rep_send)
        assign_urb_setup();
  
        fixup_3src_null_dest();
-      allocate_registers(allow_spilling);
+      allocate_registers(8, allow_spilling);
  
        if (failed)
           return false;
@@ -6320,9 +6320,10 @@ fs_visitor::run_fs(bool allow_spilling, bool do_rep_send)
  }
  
  bool
-fs_visitor::run_cs()
+fs_visitor::run_cs(unsigned min_dispatch_width)
  {
     assert(stage == MESA_SHADER_COMPUTE);
+   assert(dispatch_width >= min_dispatch_width);
  
     setup_cs_payload();
  
@@ -6353,7 +6354,7 @@ fs_visitor::run_cs()
     assign_curb_setup();
  
     fixup_3src_null_dest();
-   allocate_registers(true);
+   allocate_registers(min_dispatch_width, true);
  
     if (failed)
        return false;
@@ -6841,8 +6842,11 @@ brw_compile_cs(const struct brw_compiler *compiler, void *log_data,
        shader->info.cs.local_size[0] * shader->info.cs.local_size[1] *
        shader->info.cs.local_size[2];
  
-   unsigned max_cs_threads = compiler->devinfo->max_cs_threads;
-   unsigned simd_required = DIV_ROUND_UP(local_workgroup_size, max_cs_threads);
+   unsigned min_dispatch_width =
+      DIV_ROUND_UP(local_workgroup_size, compiler->devinfo->max_cs_threads);
+   min_dispatch_width = MAX2(8, min_dispatch_width);
+   min_dispatch_width = util_next_power_of_two(min_dispatch_width);
+   assert(min_dispatch_width <= 32);
  
     cfg_t *cfg = NULL;
     const char *fail_msg = NULL;
@@ -6852,8 +6856,8 @@ brw_compile_cs(const struct brw_compiler *compiler, void *log_data,
     fs_visitor v8(compiler, log_data, mem_ctx, key, &prog_data->base,
                   NULL, /* Never used in core profile */
                   shader, 8, shader_time_index);
-   if (simd_required <= 8) {
-      if (!v8.run_cs()) {
+   if (min_dispatch_width <= 8) {
+      if (!v8.run_cs(min_dispatch_width)) {
           fail_msg = v8.fail_msg;
        } else {
           cfg = v8.cfg;
@@ -6868,11 +6872,11 @@ brw_compile_cs(const struct brw_compiler *compiler, void *log_data,
                   shader, 16, shader_time_index);
     if (likely(!(INTEL_DEBUG & DEBUG_NO16)) &&
         !fail_msg && v8.max_dispatch_width >= 16 &&
-       simd_required <= 16) {
+       min_dispatch_width <= 16) {
        /* Try a SIMD16 compile */
-      if (simd_required <= 8)
+      if (min_dispatch_width <= 8)
           v16.import_uniforms(&v8);
-      if (!v16.run_cs()) {
+      if (!v16.run_cs(min_dispatch_width)) {
           compiler->shader_perf_log(log_data,
                                     "SIMD16 shader failed to compile: %s",
                                     v16.fail_msg);
@@ -6893,14 +6897,14 @@ brw_compile_cs(const struct brw_compiler *compiler, void *log_data,
                   NULL, /* Never used in core profile */
                   shader, 32, shader_time_index);
     if (!fail_msg && v8.max_dispatch_width >= 32 &&
-       (simd_required > 16 || (INTEL_DEBUG & DEBUG_DO32))) {
+       (min_dispatch_width > 16 || (INTEL_DEBUG & DEBUG_DO32))) {
        /* Try a SIMD32 compile */
-      if (simd_required <= 8)
+      if (min_dispatch_width <= 8)
           v32.import_uniforms(&v8);
-      else if (simd_required <= 16)
+      else if (min_dispatch_width <= 16)
           v32.import_uniforms(&v16);
  
-      if (!v32.run_cs()) {
+      if (!v32.run_cs(min_dispatch_width)) {
           compiler->shader_perf_log(log_data,
                                     "SIMD32 shader failed to compile: %s",
                                     v16.fail_msg);
diff --git a/src/intel/compiler/brw_fs.h b/src/intel/compiler/brw_fs.h

index b070d3888ebf625961fa03163aa1e1e8d10881d0..da3259323ec351a615a23337ce462e7ea65fb32c 100644 (file)
--- a/src/intel/compiler/brw_fs.h
+++ b/src/intel/compiler/brw_fs.h
@@ -99,9 +99,9 @@ public:
     bool run_tcs_single_patch();
     bool run_tes();
     bool run_gs();
-   bool run_cs();
+   bool run_cs(unsigned min_dispatch_width);
     void optimize();
-   void allocate_registers(bool allow_spilling);
+   void allocate_registers(unsigned min_dispatch_width, bool allow_spilling);
     void setup_fs_payload_gen4();
     void setup_fs_payload_gen6();
     void setup_vs_payload();
@@ -364,7 +364,6 @@ public:
     bool spilled_any_registers;
  
     const unsigned dispatch_width; /**< 8, 16 or 32 */
-   unsigned min_dispatch_width;
     unsigned max_dispatch_width;
  
     int shader_time_index;
diff --git a/src/intel/compiler/brw_fs_visitor.cpp b/src/intel/compiler/brw_fs_visitor.cpp

index 32fe0fc054b97233498fea2e52908254ac08b801..9fd4c20837ff6c71038f84ce23ade87dea1d429c 100644 (file)
--- a/src/intel/compiler/brw_fs_visitor.cpp
+++ b/src/intel/compiler/brw_fs_visitor.cpp
@@ -871,17 +871,6 @@ fs_visitor::init()
        unreachable("unhandled shader stage");
     }
  
-   if (stage == MESA_SHADER_COMPUTE) {
-      const struct brw_cs_prog_data *cs_prog_data = brw_cs_prog_data(prog_data);
-      unsigned size = cs_prog_data->local_size[0] *
-                      cs_prog_data->local_size[1] *
-                      cs_prog_data->local_size[2];
-      size = DIV_ROUND_UP(size, devinfo->max_cs_threads);
-      min_dispatch_width = size > 16 ? 32 : (size > 8 ? 16 : 8);
-   } else {
-      min_dispatch_width = 8;
-   }
-
     this->max_dispatch_width = 32;
     this->prog_data = this->stage_prog_data;
author	Jason Ekstrand <jason.ekstrand@intel.com>
	Tue, 22 Aug 2017 02:16:45 +0000 (19:16 -0700)
committer	Jason Ekstrand <jason.ekstrand@intel.com>
	Tue, 7 Nov 2017 18:37:52 +0000 (10:37 -0800)
src/intel/compiler/brw_fs.cpp		patch \| blob \| history
src/intel/compiler/brw_fs.h		patch \| blob \| history
src/intel/compiler/brw_fs_visitor.cpp		patch \| blob \| history