[AArch64] Add STP pattern to store a vec_concat of two 64-bit registers

author Kyrylo Tkachov <kyrylo.tkachov@arm.com>

Wed, 8 Nov 2017 18:32:09 +0000 (18:32 +0000)

committer Kyrylo Tkachov <ktkachov@gcc.gnu.org>

Wed, 8 Nov 2017 18:32:09 +0000 (18:32 +0000)
author Kyrylo Tkachov <kyrylo.tkachov@arm.com>
Wed, 8 Nov 2017 18:32:09 +0000 (18:32 +0000)
committer Kyrylo Tkachov <ktkachov@gcc.gnu.org>
Wed, 8 Nov 2017 18:32:09 +0000 (18:32 +0000)
diff --git a/gcc/ChangeLog b/gcc/ChangeLog

index 37ccb2cbd0e95451ccc2ec04024ca4d79debc9e0..805625f8f3d2794582d343f94dfd0f9b2c24f65c 100644 (file)
--- a/gcc/ChangeLog
+++ b/gcc/ChangeLog
@@ -1,3 +1,11 @@
+2017-11-08  Kyrylo Tkachov  <kyrylo.tkachov@arm.com>
+
+       * config/aarch64/aarch64-simd.md (store_pair_lanes<mode>):
+       New pattern.
+       * config/aarch64/constraints.md (Uml): New constraint.
+       * config/aarch64/predicates.md (aarch64_mem_pair_lanes_operand): New
+       predicate.
+
  2017-11-08  Kyrylo Tkachov  <kyrylo.tkachov@arm.com>
  
         * simplify-rtx.c (simplify_ternary_operation): Simplify vec_merge
diff --git a/gcc/config/aarch64/aarch64-simd.md b/gcc/config/aarch64/aarch64-simd.md

index 1f5c911fc4b773a709571d2d2247695aefaa9c59..9a6da35f6f9154c46464ca47d9c4efa9a69a6b8d 100644 (file)
--- a/gcc/config/aarch64/aarch64-simd.md
+++ b/gcc/config/aarch64/aarch64-simd.md
@@ -2949,6 +2949,18 @@
    [(set_attr "type" "neon_load1_1reg_q")]
  )
  
+(define_insn "store_pair_lanes<mode>"
+  [(set (match_operand:<VDBL> 0 "aarch64_mem_pair_lanes_operand" "=Uml, Uml")
+       (vec_concat:<VDBL>
+          (match_operand:VDC 1 "register_operand" "w, r")
+          (match_operand:VDC 2 "register_operand" "w, r")))]
+  "TARGET_SIMD"
+  "@
+   stp\\t%d1, %d2, %0
+   stp\\t%x1, %x2, %0"
+  [(set_attr "type" "neon_stp, store_16")]
+)
+
  ;; In this insn, operand 1 should be low, and operand 2 the high part of the
  ;; dest vector.
  
diff --git a/gcc/config/aarch64/constraints.md b/gcc/config/aarch64/constraints.md

index 4ef7a50ac1ad11d902e25007b0ef8d4d683d62d4..af4143ef756464afac29d17f124b436520f90451 100644 (file)
--- a/gcc/config/aarch64/constraints.md
+++ b/gcc/config/aarch64/constraints.md
@@ -171,6 +171,15 @@
         (match_test "aarch64_legitimate_address_p (GET_MODE (op), XEXP (op, 0),
                                                   PARALLEL, 1)")))
  
+;; Used for storing two 64-bit values held in separate registers to memory
+;; as a 128-bit vec_concat using a single STP.
+(define_memory_constraint "Uml"
+  "@internal
+  A memory address suitable for a load/store pair operation."
+  (and (match_code "mem")
+       (match_test "aarch64_legitimate_address_p (DFmode, XEXP (op, 0),
+                                                  PARALLEL, 1)")))
+
  (define_memory_constraint "Utv"
    "@internal
     An address valid for loading/storing opaque structure
diff --git a/gcc/config/aarch64/predicates.md b/gcc/config/aarch64/predicates.md

index 84d441a1cf6d3a7a6bf548132195c6105b3bd3a8..2eaf0a7630169c3f4c23632d2a90be9ca15680df 100644 (file)
--- a/gcc/config/aarch64/predicates.md
+++ b/gcc/config/aarch64/predicates.md
@@ -189,6 +189,13 @@
         (match_test "aarch64_legitimate_address_p (mode, XEXP (op, 0), PARALLEL,
                                                0)")))
  
+;; Used for storing two 64-bit values held in separate registers to memory
+;; as a 128-bit vec_concat using a single STP.
+(define_predicate "aarch64_mem_pair_lanes_operand"
+  (and (match_code "mem")
+       (match_test "aarch64_legitimate_address_p (DFmode, XEXP (op, 0),
+                                                  PARALLEL, 1)")))
+
  (define_predicate "aarch64_prefetch_operand"
    (match_test "aarch64_address_valid_for_prefetch_p (op, false)"))
  
diff --git a/gcc/testsuite/ChangeLog b/gcc/testsuite/ChangeLog

index 3d9c337bf404fbac514d363696d8395408c3e1a3..d20cadc232376ffff70cc96a046a5595cd03e04b 100644 (file)
--- a/gcc/testsuite/ChangeLog
+++ b/gcc/testsuite/ChangeLog
@@ -1,3 +1,7 @@
+2017-11-08  Kyrylo Tkachov  <kyrylo.tkachov@arm.com>
+
+       * gcc.target/aarch64/store_v2vec_lanes.c: New test.
+
  2017-11-08  Kyrylo Tkachov  <kyrylo.tkachov@arm.com>
  
         * gcc.target/aarch64/load_v2vec_lanes_1.c: New test.
diff --git a/gcc/testsuite/gcc.target/aarch64/store_v2vec_lanes.c b/gcc/testsuite/gcc.target/aarch64/store_v2vec_lanes.c

new file mode 100644 (file)

index 0000000..6810db3
--- /dev/null
+++ b/gcc/testsuite/gcc.target/aarch64/store_v2vec_lanes.c
@@ -0,0 +1,31 @@
+/* { dg-do compile } */
+/* { dg-options "-O2" } */
+
+typedef long long v2di __attribute__ ((vector_size (16)));
+typedef double v2df __attribute__ ((vector_size (16)));
+
+void
+construct_lane_1 (double *y, v2df *z)
+{
+  double y0 = y[0] + 1;
+  double y1 = y[1] + 2;
+  v2df x = {y0, y1};
+  z[2] = x;
+}
+
+void
+construct_lane_2 (long long *y, v2di *z)
+{
+  long long y0 = y[0] + 1;
+  long long y1 = y[1] + 2;
+  v2di x = {y0, y1};
+  z[2] = x;
+}
+
+/* We can use the store_pair_lanes<mode> pattern to store a vec_concat of
+   two DI/DF values held in registers to consecutive memory by using
+   a single STP of the two registers.  */
+
+/* { dg-final { scan-assembler-times "stp\td\[0-9\]+, d\[0-9\]+" 1 } } */
+/* { dg-final { scan-assembler-times "stp\tx\[0-9\]+, x\[0-9\]+" 1 } } */
+/* { dg-final { scan-assembler-not "ins\t" } } */
author	Kyrylo Tkachov <kyrylo.tkachov@arm.com>
	Wed, 8 Nov 2017 18:32:09 +0000 (18:32 +0000)
committer	Kyrylo Tkachov <ktkachov@gcc.gnu.org>
	Wed, 8 Nov 2017 18:32:09 +0000 (18:32 +0000)
gcc/ChangeLog		patch \| blob \| history
gcc/config/aarch64/aarch64-simd.md		patch \| blob \| history
gcc/config/aarch64/constraints.md		patch \| blob \| history
gcc/config/aarch64/predicates.md		patch \| blob \| history
gcc/testsuite/ChangeLog		patch \| blob \| history
gcc/testsuite/gcc.target/aarch64/store_v2vec_lanes.c	[new file with mode: 0644]	patch \| blob