nir/algebraic: add patterns for a >> #b << #b

author Rhys Perry <pendingchaos02@gmail.com>

Wed, 9 Oct 2019 14:03:45 +0000 (15:03 +0100)

committer Marge Bot <eric+marge@anholt.net>

Wed, 29 Jan 2020 14:30:33 +0000 (14:30 +0000)
author Rhys Perry <pendingchaos02@gmail.com>
Wed, 9 Oct 2019 14:03:45 +0000 (15:03 +0100)
committer Marge Bot <eric+marge@anholt.net>
Wed, 29 Jan 2020 14:30:33 +0000 (14:30 +0000)
diff --git a/src/compiler/nir/nir_opt_algebraic.py b/src/compiler/nir/nir_opt_algebraic.py

index 7b9a6a8e45d3ee3915f3a97372337d928a2f8c35..fd0007bb54d1bf8bad15cb9a6b2fee32136c7316 100644 (file)
--- a/src/compiler/nir/nir_opt_algebraic.py
+++ b/src/compiler/nir/nir_opt_algebraic.py
@@ -255,6 +255,22 @@ for s in [8, 16, 32, 64]:
          (ishr, a, ('imin', ('iadd', ('iand', b, mask), ('iand', c, mask)), s - 1))),
     ])
  
+# Optimize a pattern of address calculation created by DXVK where the offset is
+# divided by 4 and then multipled by 4. This can be turned into an iand and the
+# additions before can be reassociated to CSE the iand instruction.
+for log2 in range(1, 7): # powers of two from 2 to 64
+   v = 1 << log2
+   mask = 0xffffffff & ~(v - 1)
+   b_is_multiple = '#b(is_unsigned_multiple_of_{})'.format(v)
+
+   optimizations.extend([
+       # 'a >> #b << #b' -> 'a & ~((1 << #b) - 1)'
+       (('ishl@32', ('ushr@32', a, log2), log2), ('iand', a, mask)),
+
+       # Reassociate for improved CSE
+       (('iand@32', ('iadd@32', a, b_is_multiple), mask), ('iadd', ('iand', a, mask), b)),
+   ])
+
  optimizations.extend([
     # This is common for address calculations.  Reassociating may enable the
     # 'a<<c' to be CSE'd.  It also helps architectures that have an ISHLADD
diff --git a/src/compiler/nir/nir_search_helpers.h b/src/compiler/nir/nir_search_helpers.h

index 0c2f631ac39029026a45127801bd907af610cd8b..abfd660ae792597475df99956a411b6a1eab9398 100644 (file)
--- a/src/compiler/nir/nir_search_helpers.h
+++ b/src/compiler/nir/nir_search_helpers.h
@@ -90,6 +90,32 @@ is_neg_power_of_two(UNUSED struct hash_table *ht, nir_alu_instr *instr,
     return true;
  }
  
+#define MULTIPLE(test)                                                  \
+static inline bool                                                      \
+is_unsigned_multiple_of_ ## test(UNUSED struct hash_table *ht, nir_alu_instr *instr, \
+                                 unsigned src, unsigned num_components, \
+                                 const uint8_t *swizzle)                \
+{                                                                       \
+   /* only constant srcs: */                                            \
+   if (!nir_src_is_const(instr->src[src].src))                          \
+      return false;                                                     \
+                                                                        \
+   for (unsigned i = 0; i < num_components; i++) {                      \
+      uint64_t val = nir_src_comp_as_uint(instr->src[src].src, swizzle[i]); \
+      if (val % test != 0)                                              \
+         return false;                                                  \
+   }                                                                    \
+                                                                        \
+   return true;                                                         \
+}
+
+MULTIPLE(2)
+MULTIPLE(4)
+MULTIPLE(8)
+MULTIPLE(16)
+MULTIPLE(32)
+MULTIPLE(64)
+
  static inline bool
  is_zero_to_one(UNUSED struct hash_table *ht, nir_alu_instr *instr, unsigned src,
                 unsigned num_components,
author	Rhys Perry <pendingchaos02@gmail.com>
	Wed, 9 Oct 2019 14:03:45 +0000 (15:03 +0100)
committer	Marge Bot <eric+marge@anholt.net>
	Wed, 29 Jan 2020 14:30:33 +0000 (14:30 +0000)
src/compiler/nir/nir_opt_algebraic.py		patch \| blob \| history
src/compiler/nir/nir_search_helpers.h		patch \| blob \| history