tree-optimization/98291 - allow SLP more vectorization of reductions

author Richard Biener <rguenther@suse.de>

Mon, 4 Jan 2021 08:53:11 +0000 (09:53 +0100)

committer Richard Biener <rguenther@suse.de>

Mon, 4 Jan 2021 09:47:43 +0000 (10:47 +0100)
author Richard Biener <rguenther@suse.de>
Mon, 4 Jan 2021 08:53:11 +0000 (09:53 +0100)
committer Richard Biener <rguenther@suse.de>
Mon, 4 Jan 2021 09:47:43 +0000 (10:47 +0100)
diff --git a/gcc/testsuite/gcc.dg/vect/slp-reduc-11.c b/gcc/testsuite/gcc.dg/vect/slp-reduc-11.c

new file mode 100644 (file)

index 0000000..a2f86fb
--- /dev/null
+++ b/gcc/testsuite/gcc.dg/vect/slp-reduc-11.c
@@ -0,0 +1,20 @@
+/* { dg-do compile } */
+/* { dg-require-effective-target vect_double } */
+
+double dotprod(const double *a, const double *b, unsigned long long n)
+{
+  double d1 = 0.0;
+  double d2 = 0.0;
+
+  for (unsigned long long i = 0; i < n; i += 2) {
+    d1 += a[i] * b[i];
+    d2 += a[i + 1] * b[i + 1];
+  }
+
+  return (d1 + d2);
+}
+
+/* We should use an SLP reduction even without -ffast-math by using a
+   VF of one.  */
+/* { dg-final { scan-tree-dump "vectorizing stmts using SLP" "vect" } } */
+/* { dg-final { scan-tree-dump "vectorized 1 loops" "vect" } } */
diff --git a/gcc/testsuite/gcc.dg/vect/vect-reduc-in-order-4.c b/gcc/testsuite/gcc.dg/vect/vect-reduc-in-order-4.c

index 7706a2dc5b2a45a536c97796b4e8bc1b00479e68..eff3994a3352ba727e79a66ae969ca0c8c89ec7a 100644 (file)
--- a/gcc/testsuite/gcc.dg/vect/vect-reduc-in-order-4.c
+++ b/gcc/testsuite/gcc.dg/vect/vect-reduc-in-order-4.c
@@ -41,6 +41,4 @@ main ()
    return 0;
  }
  
-/* { dg-final { scan-tree-dump {in-order unchained SLP reductions not supported} "vect" } } */
-/* { dg-final { scan-tree-dump-not {vectorizing stmts using SLP} "vect" } } */
  /* { dg-final { scan-tree-dump-times "VECT_PERM_EXPR" 0 "vect" } } */
diff --git a/gcc/tree-vect-loop.c b/gcc/tree-vect-loop.c

index f3b95ae8be37af70c89100ca3e5acd5fad90476a..2985bfe89d6ef5e8205daffea735a808480b2b01 100644 (file)
--- a/gcc/tree-vect-loop.c
+++ b/gcc/tree-vect-loop.c
@@ -6868,8 +6868,14 @@ vectorizable_reduction (loop_vec_info loop_vinfo,
          cases, so we need to check that this is ok.  One exception is when
          vectorizing an outer-loop: the inner-loop is executed sequentially,
          and therefore vectorizing reductions in the inner-loop during
-        outer-loop vectorization is safe.  */
-      if (needs_fold_left_reduction_p (scalar_type, orig_code))
+        outer-loop vectorization is safe.  Likewise, when we are vectorizing
+        a series of reductions using SLP and the VF is one, the reductions
+        are performed in scalar order.  */
+      if (slp_node
+         && !REDUC_GROUP_FIRST_ELEMENT (stmt_info)
+         && known_eq (LOOP_VINFO_VECT_FACTOR (loop_vinfo), 1u))
+       ;
+      else if (needs_fold_left_reduction_p (scalar_type, orig_code))
         {
           /* When vectorizing a reduction chain w/o SLP the reduction PHI
              is not directy used in stmt.  */
author	Richard Biener <rguenther@suse.de>
	Mon, 4 Jan 2021 08:53:11 +0000 (09:53 +0100)
committer	Richard Biener <rguenther@suse.de>
	Mon, 4 Jan 2021 09:47:43 +0000 (10:47 +0100)
gcc/testsuite/gcc.dg/vect/slp-reduc-11.c	[new file with mode: 0644]	patch \| blob
gcc/testsuite/gcc.dg/vect/vect-reduc-in-order-4.c		patch \| blob \| history
gcc/tree-vect-loop.c		patch \| blob \| history