nir/lower_vec_to_movs: Only coalesce if the vec had an SSA destination

author Jason Ekstrand <jason.ekstrand@intel.com>

Fri, 23 Mar 2018 18:05:04 +0000 (11:05 -0700)

committer Jason Ekstrand <jason.ekstrand@intel.com>

Wed, 4 Apr 2018 05:21:23 +0000 (22:21 -0700)
author Jason Ekstrand <jason.ekstrand@intel.com>
Fri, 23 Mar 2018 18:05:04 +0000 (11:05 -0700)
committer Jason Ekstrand <jason.ekstrand@intel.com>
Wed, 4 Apr 2018 05:21:23 +0000 (22:21 -0700)
diff --git a/src/compiler/nir/nir_lower_vec_to_movs.c b/src/compiler/nir/nir_lower_vec_to_movs.c

index 711ddd38bda8341f4be825c7baa6bc24cffef945..8b24376b0a5befa4982c4b47187fa6f70113fe8f 100644 (file)
--- a/src/compiler/nir/nir_lower_vec_to_movs.c
+++ b/src/compiler/nir/nir_lower_vec_to_movs.c
@@ -230,6 +230,7 @@ lower_vec_to_movs_block(nir_block *block, nir_function_impl *impl)
           continue; /* The loop */
        }
  
+      bool vec_had_ssa_dest = vec->dest.dest.is_ssa;
        if (vec->dest.dest.is_ssa) {
           /* Since we insert multiple MOVs, we have a register destination. */
           nir_register *reg = nir_local_reg_create(impl);
@@ -263,7 +264,11 @@ lower_vec_to_movs_block(nir_block *block, nir_function_impl *impl)
           if (!(vec->dest.write_mask & (1 << i)))
              continue;
  
-         if (!(finished_write_mask & (1 << i)))
+         /* Coalescing moves the register writes from the vec up to the ALU
+          * instruction in the source.  We can only do this if the original
+          * vecN had an SSA destination.
+          */
+         if (vec_had_ssa_dest && !(finished_write_mask & (1 << i)))
              finished_write_mask |= try_coalesce(vec, i);
  
           if (!(finished_write_mask & (1 << i)))
author	Jason Ekstrand <jason.ekstrand@intel.com>
	Fri, 23 Mar 2018 18:05:04 +0000 (11:05 -0700)
committer	Jason Ekstrand <jason.ekstrand@intel.com>
	Wed, 4 Apr 2018 05:21:23 +0000 (22:21 -0700)