Fold pointer range checks with equal spans

author Richard Sandiford <richard.sandiford@arm.com>

Wed, 1 Aug 2018 15:46:12 +0000 (15:46 +0000)

committer Richard Sandiford <rsandifo@gcc.gnu.org>

Wed, 1 Aug 2018 15:46:12 +0000 (15:46 +0000)
author Richard Sandiford <richard.sandiford@arm.com>
Wed, 1 Aug 2018 15:46:12 +0000 (15:46 +0000)
committer Richard Sandiford <rsandifo@gcc.gnu.org>
Wed, 1 Aug 2018 15:46:12 +0000 (15:46 +0000)
diff --git a/gcc/ChangeLog b/gcc/ChangeLog

index efa46230f7d1e87aaed6c6ac07f72b3dace26e6f..2e4ed90d447fa18768b571575bba78966acd07ba 100644 (file)
--- a/gcc/ChangeLog
+++ b/gcc/ChangeLog
@@ -1,3 +1,7 @@
+2018-08-01  Richard Sandiford  <richard.sandiford@arm.com>
+
+       * match.pd: Optimise pointer range checks.
+
  2018-08-01  Richard Sandiford  <richard.sandiford@arm.com>
  
         PR tree-optimization/86758
diff --git a/gcc/match.pd b/gcc/match.pd

index 0ae1af0ce06873417d3533aad760b9e3a38a4c3d..cb3c93e3e162b262e218dee1d09858095efba371 100644 (file)
--- a/gcc/match.pd
+++ b/gcc/match.pd
@@ -4937,3 +4937,63 @@ DEFINE_INT_AND_FLOAT_ROUND_FN (RINT)
     (if (inverse_conditions_p (@0, @2)
          && element_precision (type) == element_precision (op_type))
      (view_convert (cond_op @2 @3 @4 @5 (view_convert:op_type @1)))))))
+
+/* For pointers @0 and @2 and nonnegative constant offset @1, look for
+   expressions like:
+
+   A: (@0 + @1 < @2) | (@2 + @1 < @0)
+   B: (@0 + @1 <= @2) | (@2 + @1 <= @0)
+
+   If pointers are known not to wrap, B checks whether @1 bytes starting
+   at @0 and @2 do not overlap, while A tests the same thing for @1 + 1
+   bytes.  A is more efficiently tested as:
+
+   A: (sizetype) (@0 + @1 - @2) > @1 * 2
+
+   The equivalent expression for B is given by replacing @1 with @1 - 1:
+
+   B: (sizetype) (@0 + (@1 - 1) - @2) > (@1 - 1) * 2
+
+   @0 and @2 can be swapped in both expressions without changing the result.
+
+   The folds rely on sizetype's being unsigned (which is always true)
+   and on its being the same width as the pointer (which we have to check).
+
+   The fold replaces two pointer_plus expressions, two comparisons and
+   an IOR with a pointer_plus, a pointer_diff, and a comparison, so in
+   the best case it's a saving of two operations.  The A fold retains one
+   of the original pointer_pluses, so is a win even if both pointer_pluses
+   are used elsewhere.  The B fold is a wash if both pointer_pluses are
+   used elsewhere, since all we end up doing is replacing a comparison with
+   a pointer_plus.  We do still apply the fold under those circumstances
+   though, in case applying it to other conditions eventually makes one of the
+   pointer_pluses dead.  */
+(for ior (truth_orif truth_or bit_ior)
+ (for cmp (le lt)
+  (simplify
+   (ior (cmp:cs (pointer_plus@3 @0 INTEGER_CST@1) @2)
+       (cmp:cs (pointer_plus@4 @2 @1) @0))
+   (if (TYPE_OVERFLOW_UNDEFINED (TREE_TYPE (@0))
+       && TYPE_OVERFLOW_WRAPS (sizetype)
+       && TYPE_PRECISION (TREE_TYPE (@0)) == TYPE_PRECISION (sizetype))
+    /* Calculate the rhs constant.  */
+    (with { offset_int off = wi::to_offset (@1) - (cmp == LE_EXPR ? 1 : 0);
+           offset_int rhs = off * 2; }
+     /* Always fails for negative values.  */
+     (if (wi::min_precision (rhs, UNSIGNED) <= TYPE_PRECISION (sizetype))
+      /* Since the order of @0 and @2 doesn't matter, let tree_swap_operands_p
+        pick a canonical order.  This increases the chances of using the
+        same pointer_plus in multiple checks.  */
+      (with { bool swap_p = tree_swap_operands_p (@0, @2);
+             tree rhs_tree = wide_int_to_tree (sizetype, rhs); }
+       (if (cmp == LT_EXPR)
+       (gt (convert:sizetype
+            (pointer_diff:ssizetype { swap_p ? @4 : @3; }
+                                    { swap_p ? @0 : @2; }))
+           { rhs_tree; })
+       (gt (convert:sizetype
+            (pointer_diff:ssizetype
+             (pointer_plus { swap_p ? @2 : @0; }
+                           { wide_int_to_tree (sizetype, off); })
+             { swap_p ? @0 : @2; }))
+           { rhs_tree; })))))))))
diff --git a/gcc/testsuite/ChangeLog b/gcc/testsuite/ChangeLog

index 7f75e108268bb45429899e52a2572e9ebc37cb42..96565bb2d448ee78d3cfc3029b337e42f97d8302 100644 (file)
--- a/gcc/testsuite/ChangeLog
+++ b/gcc/testsuite/ChangeLog
@@ -1,3 +1,8 @@
+2018-08-01  Richard Sandiford  <richard.sandiford@arm.com>
+
+       * gcc.dg/pointer-range-check-1.c: New test.
+       * gcc.dg/pointer-range-check-2.c: Likewise.
+
  2018-08-01  Richard Sandiford  <richard.sandiford@arm.com>
  
         PR tree-optimization/86749
diff --git a/gcc/testsuite/gcc.dg/pointer-range-check-1.c b/gcc/testsuite/gcc.dg/pointer-range-check-1.c

new file mode 100644 (file)

index 0000000..9868658
--- /dev/null
+++ b/gcc/testsuite/gcc.dg/pointer-range-check-1.c
@@ -0,0 +1,37 @@
+/* { dg-do compile { target { ilp32 || lp64 } } } */
+/* { dg-options "-O2 -fno-ipa-icf -fdump-tree-optimized" } */
+
+/* All four functions should be folded to:
+
+   (sizetype) (a + 15 - b) < 30.  */
+
+_Bool
+f1 (char *a, char *b)
+{
+  return (a + 16 <= b) || (b + 16 <= a);
+}
+
+_Bool
+f2 (char *a, char *b)
+{
+  return (a + 15 < b) || (b + 15 < a);
+}
+
+_Bool
+f3 (char *a, char *b)
+{
+  return (a + 16 <= b) | (b + 16 <= a);
+}
+
+_Bool
+f4 (char *a, char *b)
+{
+  return (a + 15 < b) | (b + 15 < a);
+}
+
+/* { dg-final { scan-tree-dump-times { = [^\n]* - [^\n]*;} 4 "optimized" } } */
+/* { dg-final { scan-tree-dump-times { = [^\n]* \+ [^\n]*;} 4 "optimized" } } */
+/* { dg-final { scan-tree-dump-times { = [^\n]*\ > [^\n]*;} 4 "optimized" } } */
+/* { dg-final { scan-tree-dump-not {=[^\n]*\ < [^\n]*;} "optimized" } } */
+/* { dg-final { scan-tree-dump-times { \+ 15} 4 "optimized" } } */
+/* { dg-final { scan-tree-dump-times { > 30} 4 "optimized" } } */
diff --git a/gcc/testsuite/gcc.dg/pointer-range-check-2.c b/gcc/testsuite/gcc.dg/pointer-range-check-2.c

new file mode 100644 (file)

index 0000000..4ccc413
--- /dev/null
+++ b/gcc/testsuite/gcc.dg/pointer-range-check-2.c
@@ -0,0 +1,31 @@
+/* { dg-do compile } */
+/* { dg-options "-O2 -fno-ipa-icf -fwrapv-pointer -fdump-tree-optimized" } */
+
+_Bool
+f1 (char *a, char *b)
+{
+  return (a + 16 <= b) || (b + 16 <= a);
+}
+
+_Bool
+f2 (char *a, char *b)
+{
+  return (a + 15 < b) || (b + 15 < a);
+}
+
+_Bool
+f3 (char *a, char *b)
+{
+  return (a + 16 <= b) | (b + 16 <= a);
+}
+
+_Bool
+f4 (char *a, char *b)
+{
+  return (a + 15 < b) | (b + 15 < a);
+}
+
+/* { dg-final { scan-tree-dump-not { = [^\n]* - [^\n]*;} "optimized" } } */
+/* { dg-final { scan-tree-dump-times { = [^\n]* \+ [^\n]*;} 8 "optimized" } } */
+/* { dg-final { scan-tree-dump-times { \+ 15} 4 "optimized" } } */
+/* { dg-final { scan-tree-dump-times { \+ 16} 4 "optimized" } } */
author	Richard Sandiford <richard.sandiford@arm.com>
	Wed, 1 Aug 2018 15:46:12 +0000 (15:46 +0000)
committer	Richard Sandiford <rsandifo@gcc.gnu.org>
	Wed, 1 Aug 2018 15:46:12 +0000 (15:46 +0000)
gcc/ChangeLog		patch \| blob \| history
gcc/match.pd		patch \| blob \| history
gcc/testsuite/ChangeLog		patch \| blob \| history
gcc/testsuite/gcc.dg/pointer-range-check-1.c	[new file with mode: 0644]	patch \| blob
gcc/testsuite/gcc.dg/pointer-range-check-2.c	[new file with mode: 0644]	patch \| blob