tree-optimization/97482 - fix split_constant_offset of nop-conversions

author Richard Biener <rguenther@suse.de>

Thu, 15 Oct 2020 07:10:40 +0000 (09:10 +0200)

committer Richard Biener <rguenther@suse.de>

Thu, 15 Oct 2020 08:54:24 +0000 (10:54 +0200)
author Richard Biener <rguenther@suse.de>
Thu, 15 Oct 2020 07:10:40 +0000 (09:10 +0200)
committer Richard Biener <rguenther@suse.de>
Thu, 15 Oct 2020 08:54:24 +0000 (10:54 +0200)
diff --git a/gcc/fold-const.c b/gcc/fold-const.c

index 0cc80adf632fa3a5482780a41b682c258ee11afb..ebd32bb2e04584c9e0d9624e01494c7c71ec285c 100644 (file)
--- a/gcc/fold-const.c
+++ b/gcc/fold-const.c
@@ -15489,6 +15489,8 @@ ptr_difference_const (tree e1, tree e2, poly_int64_pod *diff)
  tree
  convert_to_ptrofftype_loc (location_t loc, tree off)
  {
+  if (ptrofftype_p (TREE_TYPE (off)))
+    return off;
    return fold_convert_loc (loc, sizetype, off);
  }
  
diff --git a/gcc/testsuite/gcc.dg/vect/pr97428.c b/gcc/testsuite/gcc.dg/vect/pr97428.c

new file mode 100644 (file)

index 0000000..b5b02dc
--- /dev/null
+++ b/gcc/testsuite/gcc.dg/vect/pr97428.c
@@ -0,0 +1,43 @@
+/* { dg-do compile } */
+
+typedef struct { double re, im; } dcmlx_t;
+typedef struct { double re[4], im[4]; } dcmlx4_t;
+
+void foo_i2(dcmlx4_t dst[], const dcmlx_t src[], int n)
+{
+  for (int i = 0; i < n; ++i) {
+    dcmlx_t s00 = src[i*4+0];
+    dcmlx_t s01 = src[i*4+1];
+    dcmlx_t s02 = src[i*4+2];
+    dcmlx_t s03 = src[i*4+3];
+
+    dcmlx_t s10 = src[i*4+0+n];
+    dcmlx_t s11 = src[i*4+1+n];
+    dcmlx_t s12 = src[i*4+2+n];
+    dcmlx_t s13 = src[i*4+3+n];
+
+    dst[i*2+0].re[0] = s00.re;
+    dst[i*2+0].re[1] = s01.re;
+    dst[i*2+0].re[2] = s02.re;
+    dst[i*2+0].re[3] = s03.re;
+    dst[i*2+0].im[0] = s00.im;
+    dst[i*2+0].im[1] = s01.im;
+    dst[i*2+0].im[2] = s02.im;
+    dst[i*2+0].im[3] = s03.im;
+
+    dst[i*2+1].re[0] = s10.re;
+    dst[i*2+1].re[1] = s11.re;
+    dst[i*2+1].re[2] = s12.re;
+    dst[i*2+1].re[3] = s13.re;
+    dst[i*2+1].im[0] = s10.im;
+    dst[i*2+1].im[1] = s11.im;
+    dst[i*2+1].im[2] = s12.im;
+    dst[i*2+1].im[3] = s13.im;
+  }
+}
+
+/* The first step to produce optimal code is to appropriately detect the
+   load and store groups.  */
+/* { dg-final { scan-tree-dump "Detected interleaving load of size 8" "vect" } } */
+/* { dg-final { scan-tree-dump "Detected interleaving store of size 16" "vect" } } */
+/* { dg-final { scan-tree-dump-not "gap of 6 elements" "vect" } } */
diff --git a/gcc/tree-data-ref.c b/gcc/tree-data-ref.c

index 5505ba46778501b25862c064798e3cecc8212477..3bf460cccfd9d59ab8b563bfd632bc2f61c8e328 100644 (file)
--- a/gcc/tree-data-ref.c
+++ b/gcc/tree-data-ref.c
@@ -754,7 +754,9 @@ split_constant_offset_1 (tree type, tree op0, enum tree_code code, tree op1,
             && TYPE_PRECISION (type) >= TYPE_PRECISION (itype)
             && (POINTER_TYPE_P (type) || INTEGRAL_TYPE_P (type)))
           {
-           if (INTEGRAL_TYPE_P (itype) && TYPE_OVERFLOW_WRAPS (itype))
+           if (INTEGRAL_TYPE_P (itype) && TYPE_OVERFLOW_WRAPS (itype)
+               && (TYPE_PRECISION (type) > TYPE_PRECISION (itype)
+                   || TYPE_UNSIGNED (itype) != TYPE_UNSIGNED (type)))
               {
                 /* Split the unconverted operand and try to prove that
                    wrapping isn't a problem.  */
author	Richard Biener <rguenther@suse.de>
	Thu, 15 Oct 2020 07:10:40 +0000 (09:10 +0200)
committer	Richard Biener <rguenther@suse.de>
	Thu, 15 Oct 2020 08:54:24 +0000 (10:54 +0200)
gcc/fold-const.c		patch | blob | history
gcc/testsuite/gcc.dg/vect/pr97428.c	[new file with mode: 0644]	patch | blob
gcc/tree-data-ref.c		patch | blob | history