[AArch64] Prefer LD1RQ for big-endian SVE

author Richard Sandiford <richard.sandiford@linaro.org>

Thu, 1 Feb 2018 11:04:00 +0000 (11:04 +0000)

committer Richard Sandiford <rsandifo@gcc.gnu.org>

Thu, 1 Feb 2018 11:04:00 +0000 (11:04 +0000)
author Richard Sandiford <richard.sandiford@linaro.org>
Thu, 1 Feb 2018 11:04:00 +0000 (11:04 +0000)
committer Richard Sandiford <rsandifo@gcc.gnu.org>
Thu, 1 Feb 2018 11:04:00 +0000 (11:04 +0000)
diff --git a/gcc/ChangeLog b/gcc/ChangeLog

index 36d3f50ce9e3078abe3c78b9e2e6e38eae49573f..db763a636485adf0895d542a960c5cd6af72e32c 100644 (file)
--- a/gcc/ChangeLog
+++ b/gcc/ChangeLog
@@ -1,3 +1,8 @@
+2018-02-01  Richard Sandiford  <richard.sandiford@linaro.org>
+
+       * config/aarch64/aarch64.c (aarch64_expand_sve_const_vector): Prefer
+       the TImode handling for big-endian targets.
+
  2018-02-01  Richard Sandiford  <richard.sandiford@linaro.org>
  
         * config/aarch64/aarch64-sve.md (sve_ld1rq): Replace with...
diff --git a/gcc/config/aarch64/aarch64.c b/gcc/config/aarch64/aarch64.c

index ae142b45bdf099ba48a2f1e9deb290e46e9ee0e8..6296ffe959f62ac5515a3d32e617a909f829f090 100644 (file)
--- a/gcc/config/aarch64/aarch64.c
+++ b/gcc/config/aarch64/aarch64.c
@@ -2824,10 +2824,18 @@ aarch64_expand_sve_const_vector (rtx dest, rtx src)
        /* The constant is a repeating sequence of at least two elements,
          where the repeating elements occupy no more than 128 bits.
          Get an integer representation of the replicated value.  */
-      unsigned int int_bits = GET_MODE_UNIT_BITSIZE (mode) * npatterns;
-      gcc_assert (int_bits <= 128);
-
-      scalar_int_mode int_mode = int_mode_for_size (int_bits, 0).require ();
+      scalar_int_mode int_mode;
+      if (BYTES_BIG_ENDIAN)
+       /* For now, always use LD1RQ to load the value on big-endian
+          targets, since the handling of smaller integers includes a
+          subreg that is semantically an element reverse.  */
+       int_mode = TImode;
+      else
+       {
+         unsigned int int_bits = GET_MODE_UNIT_BITSIZE (mode) * npatterns;
+         gcc_assert (int_bits <= 128);
+         int_mode = int_mode_for_size (int_bits, 0).require ();
+       }
        rtx int_value = simplify_gen_subreg (int_mode, src, mode, 0);
        if (int_value
           && aarch64_expand_sve_widened_duplicate (dest, int_mode, int_value))
diff --git a/gcc/testsuite/ChangeLog b/gcc/testsuite/ChangeLog

index f440d1e42c8c5be7920fcccbc99c7a93d29f7c3a..522938f61ba92a7f08ea4105f64e84ed7522c832 100644 (file)
--- a/gcc/testsuite/ChangeLog
+++ b/gcc/testsuite/ChangeLog
@@ -1,3 +1,10 @@
+2018-02-01  Richard Sandiford  <richard.sandiford@linaro.org>
+
+       * gcc.target/aarch64/sve/slp_2.c: Expect LD1RQ to be used instead
+       of LD1R[HWD] for multi-element constants on big-endian targets.
+       * gcc.target/aarch64/sve/slp_3.c: Likewise.
+       * gcc.target/aarch64/sve/slp_4.c: Likewise.
+
  2018-02-01  Richard Sandiford  <richard.sandiford@linaro.org>
  
         * gcc.target/aarch64/sve/slp_2.c: Expect LD1RQD rather than LD1RQB.
diff --git a/gcc/testsuite/gcc.target/aarch64/sve/slp_2.c b/gcc/testsuite/gcc.target/aarch64/sve/slp_2.c

index 657abb0e902ee99da281363da64a91a45ba218a5..413532c076fab9fe83db241a7bd97b8db79701d3 100644 (file)
--- a/gcc/testsuite/gcc.target/aarch64/sve/slp_2.c
+++ b/gcc/testsuite/gcc.target/aarch64/sve/slp_2.c
@@ -29,9 +29,12 @@ vec_slp_##TYPE (TYPE *restrict a, int n)                     \
  
  TEST_ALL (VEC_PERM)
  
-/* { dg-final { scan-assembler-times {\tld1rh\tz[0-9]+\.h, } 2 } } */
-/* { dg-final { scan-assembler-times {\tld1rw\tz[0-9]+\.s, } 3 } } */
-/* { dg-final { scan-assembler-times {\tld1rd\tz[0-9]+\.d, } 3 } } */
+/* { dg-final { scan-assembler-times {\tld1rh\tz[0-9]+\.h, } 2 { target aarch64_little_endian } } } */
+/* { dg-final { scan-assembler-times {\tld1rqb\tz[0-9]+\.b, } 2 { target aarch64_big_endian } } } */
+/* { dg-final { scan-assembler-times {\tld1rw\tz[0-9]+\.s, } 3 { target aarch64_little_endian } } } */
+/* { dg-final { scan-assembler-times {\tld1rqh\tz[0-9]+\.h, } 3 { target aarch64_big_endian } } } */
+/* { dg-final { scan-assembler-times {\tld1rd\tz[0-9]+\.d, } 3 { target aarch64_little_endian } } } */
+/* { dg-final { scan-assembler-times {\tld1rqw\tz[0-9]+\.s, } 3 { target aarch64_big_endian } } } */
  /* { dg-final { scan-assembler-times {\tld1rqd\tz[0-9]+\.d, } 3 } } */
  /* { dg-final { scan-assembler-not {\tzip1\t} } } */
  /* { dg-final { scan-assembler-not {\tzip2\t} } } */
diff --git a/gcc/testsuite/gcc.target/aarch64/sve/slp_3.c b/gcc/testsuite/gcc.target/aarch64/sve/slp_3.c

index dd47502134b530a0ccb007758b5290f13783d412..0f9f01a00565b1d6f702b3d784a67a08d570dbaf 100644 (file)
--- a/gcc/testsuite/gcc.target/aarch64/sve/slp_3.c
+++ b/gcc/testsuite/gcc.target/aarch64/sve/slp_3.c
@@ -32,9 +32,12 @@ vec_slp_##TYPE (TYPE *restrict a, int n)                     \
  TEST_ALL (VEC_PERM)
  
  /* 1 for each 8-bit type.  */
-/* { dg-final { scan-assembler-times {\tld1rw\tz[0-9]+\.s, } 2 } } */
+/* { dg-final { scan-assembler-times {\tld1rw\tz[0-9]+\.s, } 2 { target aarch64_little_endian } } } */
+/* { dg-final { scan-assembler-times {\tld1rqb\tz[0-9]+\.b, } 2 { target aarch64_big_endian } } } */
  /* 1 for each 16-bit type and 4 for double.  */
-/* { dg-final { scan-assembler-times {\tld1rd\tz[0-9]+\.d, } 7 } } */
+/* { dg-final { scan-assembler-times {\tld1rd\tz[0-9]+\.d, } 7 { target aarch64_little_endian } } } */
+/* { dg-final { scan-assembler-times {\tld1rqh\tz[0-9]+\.h, } 3 { target aarch64_big_endian } } } */
+/* { dg-final { scan-assembler-times {\tld1rd\tz[0-9]+\.d, } 4 { target aarch64_big_endian } } } */
  /* 1 for each 32-bit type.  */
  /* { dg-final { scan-assembler-times {\tld1rqw\tz[0-9]+\.s, } 3 } } */
  /* { dg-final { scan-assembler-times {\tmov\tz[0-9]+\.d, #41\n} 2 } } */
diff --git a/gcc/testsuite/gcc.target/aarch64/sve/slp_4.c b/gcc/testsuite/gcc.target/aarch64/sve/slp_4.c

index 026fa8c82af0a10589cab5eeffb865cf3dfdba4f..8d9d5ab5887d66729fbc20cb3be31a3ca9302c8c 100644 (file)
--- a/gcc/testsuite/gcc.target/aarch64/sve/slp_4.c
+++ b/gcc/testsuite/gcc.target/aarch64/sve/slp_4.c
@@ -36,7 +36,9 @@ vec_slp_##TYPE (TYPE *restrict a, int n)                      \
  TEST_ALL (VEC_PERM)
  
  /* 1 for each 8-bit type, 4 for each 32-bit type and 8 for double.  */
-/* { dg-final { scan-assembler-times {\tld1rd\tz[0-9]+\.d, } 22 } } */
+/* { dg-final { scan-assembler-times {\tld1rd\tz[0-9]+\.d, } 22 { target aarch64_little_endian } } } */
+/* { dg-final { scan-assembler-times {\tld1rqb\tz[0-9]+\.b, } 2 { target aarch64_big_endian } } } */
+/* { dg-final { scan-assembler-times {\tld1rd\tz[0-9]+\.d, } 20 { target aarch64_big_endian } } } */
  /* 1 for each 16-bit type.  */
  /* { dg-final { scan-assembler-times {\tld1rqh\tz[0-9]\.h, } 3 } } */
  /* { dg-final { scan-assembler-times {\tmov\tz[0-9]+\.d, #99\n} 2 } } */
author	Richard Sandiford <richard.sandiford@linaro.org>
	Thu, 1 Feb 2018 11:04:00 +0000 (11:04 +0000)
committer	Richard Sandiford <rsandifo@gcc.gnu.org>
	Thu, 1 Feb 2018 11:04:00 +0000 (11:04 +0000)
gcc/ChangeLog		patch \| blob \| history
gcc/config/aarch64/aarch64.c		patch \| blob \| history
gcc/testsuite/ChangeLog		patch \| blob \| history
gcc/testsuite/gcc.target/aarch64/sve/slp_2.c		patch \| blob \| history
gcc/testsuite/gcc.target/aarch64/sve/slp_3.c		patch \| blob \| history
gcc/testsuite/gcc.target/aarch64/sve/slp_4.c		patch \| blob \| history