nir/algebraic: Eliminate useless fsat() on operand of comparison w/value in (0, 1)

author Ian Romanick <ian.d.romanick@intel.com>

Tue, 5 Mar 2019 22:54:35 +0000 (14:54 -0800)

committer Ian Romanick <ian.d.romanick@intel.com>

Tue, 14 May 2019 18:38:23 +0000 (11:38 -0700)
author Ian Romanick <ian.d.romanick@intel.com>
Tue, 5 Mar 2019 22:54:35 +0000 (14:54 -0800)
committer Ian Romanick <ian.d.romanick@intel.com>
Tue, 14 May 2019 18:38:23 +0000 (11:38 -0700)
diff --git a/src/compiler/nir/nir_opt_algebraic.py b/src/compiler/nir/nir_opt_algebraic.py

index 5fc6fd80de41c90e3af80337f066b7c3934416ef..79058c06b977799ec17a996ae1055f24a4cedf0b 100644 (file)
--- a/src/compiler/nir/nir_opt_algebraic.py
+++ b/src/compiler/nir/nir_opt_algebraic.py
@@ -213,6 +213,18 @@ optimizations = [
     (('fne', ('fneg', a), -1.0), ('fne', 1.0, a)),
     (('feq', -1.0, ('fneg', a)), ('feq', a, 1.0)),
  
+   (('flt', ('fsat(is_used_once)', a), '#b(is_gt_0_and_lt_1)'), ('flt', a, b)),
+   (('flt', '#b(is_gt_0_and_lt_1)', ('fsat(is_used_once)', a)), ('flt', b, a)),
+   (('fge', ('fsat(is_used_once)', a), '#b(is_gt_0_and_lt_1)'), ('fge', a, b)),
+   (('fge', '#b(is_gt_0_and_lt_1)', ('fsat(is_used_once)', a)), ('fge', b, a)),
+   (('feq', ('fsat(is_used_once)', a), '#b(is_gt_0_and_lt_1)'), ('feq', a, b)),
+   (('fne', ('fsat(is_used_once)', a), '#b(is_gt_0_and_lt_1)'), ('fne', a, b)),
+
+   (('fge', ('fsat(is_used_once)', a), 1.0), ('fge', a, 1.0)),
+   (('flt', ('fsat(is_used_once)', a), 1.0), ('flt', a, 1.0)),
+   (('fge', 0.0, ('fsat(is_used_once)', a)), ('fge', 0.0, a)),
+   (('flt', 0.0, ('fsat(is_used_once)', a)), ('flt', 0.0, a)),
+
     # 0.0 >= b2f(a)
     # b2f(a) <= 0.0
     # b2f(a) == 0.0 because b2f(a) can only be 0 or 1
@@ -1136,6 +1148,21 @@ late_optimizations = [
     # optimization loop can prevent other optimizations.
     (('fneg', ('fneg', a)), a),
  
+   # These are duplicated from the main optimizations table.  The late
+   # patterns that rearrange expressions like x - .5 < 0 to x < .5 can create
+   # new patterns like these.  The patterns that compare with zero are removed
+   # because they are unlikely to be created by anything in
+   # late_optimizations.
+   (('flt', ('fsat(is_used_once)', a), '#b(is_gt_0_and_lt_1)'), ('flt', a, b)),
+   (('flt', '#b(is_gt_0_and_lt_1)', ('fsat(is_used_once)', a)), ('flt', b, a)),
+   (('fge', ('fsat(is_used_once)', a), '#b(is_gt_0_and_lt_1)'), ('fge', a, b)),
+   (('fge', '#b(is_gt_0_and_lt_1)', ('fsat(is_used_once)', a)), ('fge', b, a)),
+   (('feq', ('fsat(is_used_once)', a), '#b(is_gt_0_and_lt_1)'), ('feq', a, b)),
+   (('fne', ('fsat(is_used_once)', a), '#b(is_gt_0_and_lt_1)'), ('fne', a, b)),
+
+   (('fge', ('fsat(is_used_once)', a), 1.0), ('fge', a, 1.0)),
+   (('flt', ('fsat(is_used_once)', a), 1.0), ('flt', a, 1.0)),
+
     (('~fge', ('fmin(is_used_once)', ('fadd(is_used_once)', a, b), ('fadd', c, d)), 0.0), ('iand', ('fge', a, ('fneg', b)), ('fge', c, ('fneg', d)))),
  
     (('flt', ('fneg', a), ('fneg', b)), ('flt', b, a)),
diff --git a/src/compiler/nir/nir_search_helpers.h b/src/compiler/nir/nir_search_helpers.h

index dd220dfdffdecb55bbc43a766d81e4d0c0fd5dd1..9e03c610ece26e7c39de293ccf6248591cc071b1 100644 (file)
--- a/src/compiler/nir/nir_search_helpers.h
+++ b/src/compiler/nir/nir_search_helpers.h
@@ -109,6 +109,36 @@ is_zero_to_one(nir_alu_instr *instr, unsigned src, unsigned num_components,
     return true;
  }
  
+/**
+ * Match a constant float source that lies strictly inside (0, 1).
+ *
+ * \c is_zero_to_one accepts the closed range 0 <= src <= 1; this helper
+ * rejects both endpoints and only matches 0 < src < 1.  NaN never matches.
+ *
+ * \param instr           ALU instruction that owns the source under test.
+ * \param src             Index into \c instr->src of the source to examine.
+ * \param num_components  Number of entries of \c swizzle to examine.
+ * \param swizzle         Component of the source to read for each entry.
+ *
+ * \return true only when the source is constant, the opcode declares that
+ *         input as \c nir_type_float, and every examined component is in
+ *         the open interval (0, 1).
+ */
+static inline bool
+is_gt_0_and_lt_1(nir_alu_instr *instr, unsigned src, unsigned num_components,
+                 const uint8_t *swizzle)
+{
+   /* A source that is not a constant can never match. */
+   if (!nir_src_is_const(instr->src[src].src))
+      return false;
+
+   for (unsigned comp = 0; comp < num_components; comp++) {
+      /* Only float-typed inputs are handled; anything else is rejected. */
+      if (nir_op_infos[instr->op].input_types[src] != nir_type_float)
+         return false;
+
+      const double value =
+         nir_src_comp_as_float(instr->src[src].src, swizzle[comp]);
+
+      /* NaN is tested first so it is rejected before any ordered compare. */
+      const bool strictly_inside =
+         !isnan(value) && value > 0.0f && value < 1.0f;
+
+      if (!strictly_inside)
+         return false;
+   }
+
+   return true;
+}
+
  static inline bool
  is_not_const_zero(nir_alu_instr *instr, unsigned src, unsigned num_components,
                    const uint8_t *swizzle)
author	Ian Romanick <ian.d.romanick@intel.com>
	Tue, 5 Mar 2019 22:54:35 +0000 (14:54 -0800)
committer	Ian Romanick <ian.d.romanick@intel.com>
	Tue, 14 May 2019 18:38:23 +0000 (11:38 -0700)
src/compiler/nir/nir_opt_algebraic.py		patch \| blob \| history
src/compiler/nir/nir_search_helpers.h		patch \| blob \| history