i965/fs: Support pull parameters in SIMD16 mode.
authorKenneth Graunke <kenneth@whitecape.org>
Sat, 8 Mar 2014 00:10:50 +0000 (16:10 -0800)
committerKenneth Graunke <kenneth@whitecape.org>
Tue, 18 Mar 2014 17:11:36 +0000 (10:11 -0700)
This is just a matter of reusing the pull/push constant information set
up by the SIMD8 compile.

This gains us 78 SIMD16 programs in shader-db.

Signed-off-by: Kenneth Graunke <kenneth@whitecape.org>
Reviewed-by: Topi Pohjolainen <topi.pohjolainen@intel.com>
Reviewed-by: Eric Anholt <eric@anholt.net>
src/mesa/drivers/dri/i965/brw_fs.cpp
src/mesa/drivers/dri/i965/brw_fs_visitor.cpp

index 054bed544b6547a6a22d283cc6b6d1b859304966..1f8590143fe03589fa61ba7c0bb4325d3cb308ff 100644 (file)
@@ -886,7 +886,9 @@ fs_visitor::import_uniforms(fs_visitor *v)
                           import_uniforms_callback,
                           variable_ht);
    this->push_constant_loc = v->push_constant_loc;
+   this->pull_constant_loc = v->pull_constant_loc;
    this->uniforms = v->uniforms;
+   this->param_size = v->param_size;
 }
 
 /* Our support for uniforms is piggy-backed on the struct
@@ -1748,6 +1750,9 @@ fs_visitor::compact_virtual_grfs()
 void
 fs_visitor::move_uniform_array_access_to_pull_constants()
 {
+   if (dispatch_width != 8)
+      return;
+
    pull_constant_loc = ralloc_array(mem_ctx, int, uniforms);
 
    for (unsigned int i = 0; i < uniforms; i++) {
@@ -3500,17 +3505,13 @@ brw_wm_fs_emit(struct brw_context *brw, struct brw_wm_compile *c,
    exec_list *simd16_instructions = NULL;
    fs_visitor v2(brw, c, prog, fp, 16);
    if (brw->gen >= 5 && likely(!(INTEL_DEBUG & DEBUG_NO16))) {
-      if (c->prog_data.base.nr_pull_params == 0) {
-         /* Try a SIMD16 compile */
-         v2.import_uniforms(&v);
-         if (!v2.run()) {
-            perf_debug("SIMD16 shader failed to compile, falling back to "
-                       "SIMD8 at a 10-20%% performance cost: %s", v2.fail_msg);
-         } else {
-            simd16_instructions = &v2.instructions;
-         }
+      /* Try a SIMD16 compile */
+      v2.import_uniforms(&v);
+      if (!v2.run()) {
+         perf_debug("SIMD16 shader failed to compile, falling back to "
+                    "SIMD8 at a 10-20%% performance cost: %s", v2.fail_msg);
       } else {
-         perf_debug("Skipping SIMD16 due to pull parameters.\n");
+         simd16_instructions = &v2.instructions;
       }
    }
 
index 7088502340befbe30f3f854450c84f3afa73a3f6..cd90e23202cd2ac59c85f673b96b46f91a867d38 100644 (file)
@@ -2978,7 +2978,8 @@ fs_visitor::fs_visitor(struct brw_context *brw,
 
    this->spilled_any_registers = false;
 
-   this->param_size = rzalloc_array(mem_ctx, int, stage_prog_data->nr_params);
+   if (dispatch_width == 8)
+      this->param_size = rzalloc_array(mem_ctx, int, stage_prog_data->nr_params);
 }
 
 fs_visitor::~fs_visitor()