[AArch64] Support zero-extended move to FP register

author Wilco Dijkstra <wdijkstr@arm.com>

Fri, 12 Oct 2018 10:49:27 +0000 (10:49 +0000)

committer Wilco Dijkstra <wilco@gcc.gnu.org>

Fri, 12 Oct 2018 10:49:27 +0000 (10:49 +0000)
author Wilco Dijkstra <wdijkstr@arm.com>
Fri, 12 Oct 2018 10:49:27 +0000 (10:49 +0000)
committer Wilco Dijkstra <wilco@gcc.gnu.org>
Fri, 12 Oct 2018 10:49:27 +0000 (10:49 +0000)
diff --git a/gcc/ChangeLog b/gcc/ChangeLog

index 67b39211811a1b641b3fd94ed0686d41f31081dc..ecf2b805d70c3fbfa42317ed37a75605b1e88b63 100644 (file)
--- a/gcc/ChangeLog
+++ b/gcc/ChangeLog
@@ -1,3 +1,12 @@
+2018-10-12  Wilco Dijkstra  <wdijkstr@arm.com>
+
+       * config/aarch64/aarch64.md (zero_extendsidi2_aarch64): Add alternatives
+       to zero-extend between int and floating-point registers.
+       (load_pair_zero_extendsidi2_aarch64): Add alternative for zero-extended
+       ldp into floating-point registers.  Add type and arch attributes.
+       (zero_extend<SHORT:mode><GPI:mode>2_aarch64): Add arch attribute.
+       Use f_loads for type attribute.
+
  2018-10-11  Martin Sebor  <msebor@redhat.com>
  
         * doc/extend.texi (attribute packed): Correct typos.
diff --git a/gcc/config/aarch64/aarch64.md b/gcc/config/aarch64/aarch64.md

index b4a4315ff4b3b603299a5718ad5a489a75a8c5c9..58e9962ae249518b3786b295e4690df9ac326bc3 100644 (file)
--- a/gcc/config/aarch64/aarch64.md
+++ b/gcc/config/aarch64/aarch64.md
@@ -1520,26 +1520,34 @@
  )
  
  (define_insn "*zero_extendsidi2_aarch64"
-  [(set (match_operand:DI 0 "register_operand" "=r,r")
-        (zero_extend:DI (match_operand:SI 1 "nonimmediate_operand" "r,m")))]
+  [(set (match_operand:DI 0 "register_operand" "=r,r,w,w,r,w")
+        (zero_extend:DI (match_operand:SI 1 "nonimmediate_operand" "r,m,r,m,w,w")))]
    ""
    "@
     uxtw\t%0, %w1
-   ldr\t%w0, %1"
-  [(set_attr "type" "extend,load_4")]
+   ldr\t%w0, %1
+   fmov\t%s0, %w1
+   ldr\t%s0, %1
+   fmov\t%w0, %s1
+   fmov\t%s0, %s1"
+  [(set_attr "type" "extend,load_4,f_mcr,f_loads,f_mrc,fmov")
+   (set_attr "arch" "*,*,fp,fp,fp,fp")]
  )
  
  (define_insn "*load_pair_zero_extendsidi2_aarch64"
-  [(set (match_operand:DI 0 "register_operand" "=r")
-       (zero_extend:DI (match_operand:SI 1 "aarch64_mem_pair_operand" "Ump")))
-   (set (match_operand:DI 2 "register_operand" "=r")
-       (zero_extend:DI (match_operand:SI 3 "memory_operand" "m")))]
+  [(set (match_operand:DI 0 "register_operand" "=r,w")
+       (zero_extend:DI (match_operand:SI 1 "aarch64_mem_pair_operand" "Ump,Ump")))
+   (set (match_operand:DI 2 "register_operand" "=r,w")
+       (zero_extend:DI (match_operand:SI 3 "memory_operand" "m,m")))]
    "rtx_equal_p (XEXP (operands[3], 0),
                 plus_constant (Pmode,
                                XEXP (operands[1], 0),
                                GET_MODE_SIZE (SImode)))"
-  "ldp\\t%w0, %w2, %1"
-  [(set_attr "type" "load_8")]
+  "@
+   ldp\t%w0, %w2, %1
+   ldp\t%s0, %s2, %1"
+  [(set_attr "type" "load_8,neon_load1_2reg")
+   (set_attr "arch" "*,fp")]
  )
  
  (define_expand "<ANY_EXTEND:optab><SHORT:mode><GPI:mode>2"
@@ -1566,7 +1574,8 @@
     and\t%<GPI:w>0, %<GPI:w>1, <SHORT:short_mask>
     ldr<SHORT:size>\t%w0, %1
     ldr\t%<SHORT:size>0, %1"
-  [(set_attr "type" "logic_imm,load_4,load_4")]
+  [(set_attr "type" "logic_imm,load_4,f_loads")
+   (set_attr "arch" "*,*,fp")]
  )
  
  (define_expand "<optab>qihi2"
diff --git a/gcc/testsuite/ChangeLog b/gcc/testsuite/ChangeLog

index edb680ec4a700972f956989e652467245feffb7e..964f4ea4c11f4177abbf04878f96c30081589c5b 100644 (file)
--- a/gcc/testsuite/ChangeLog
+++ b/gcc/testsuite/ChangeLog
@@ -1,3 +1,8 @@
+2018-10-12  Wilco Dijkstra  <wdijkstr@arm.com>
+
+       * gcc.target/aarch64/popcnt.c: Test zero-extended popcount.
+       * gcc.target/aarch64/vec_zeroextend.c: Test zero-extended vectors.
+
  2018-10-11  Will Schmidt  <will_schmidt@vnet.ibm.com>
  
         * gcc.target/powerpc/fold-vec-insert-char-p8.c: New.
diff --git a/gcc/testsuite/gcc.target/aarch64/popcnt.c b/gcc/testsuite/gcc.target/aarch64/popcnt.c

index 7e957966d8e81b8633a444bb42944d0da82ae5db..2b5e9f3e2c0245438ed7bcc5d0d4e01efe01b1ee 100644 (file)
--- a/gcc/testsuite/gcc.target/aarch64/popcnt.c
+++ b/gcc/testsuite/gcc.target/aarch64/popcnt.c
@@ -19,5 +19,16 @@ foo2 (long long x)
    return __builtin_popcountll (x);
  }
  
-/* { dg-final { scan-assembler-not "popcount" } } */
-/* { dg-final { scan-assembler-times "cnt\t" 3 } } */
+int
+foo3 (int *p)
+{
+  return __builtin_popcount (*p);
+}
+
+/* { dg-final { scan-assembler-not {popcount} } } */
+/* { dg-final { scan-assembler-times {cnt\t} 4 } } */
+/* { dg-final { scan-assembler-times {fmov\ts} 1 {target lp64} } } */
+/* { dg-final { scan-assembler-times {fmov\td} 2 {target lp64} } } */
+/* { dg-final { scan-assembler-times {fmov\ts} 2 {target ilp32} } } */
+/* { dg-final { scan-assembler-times {fmov\td} 1 {target ilp32} } } */
+/* { dg-final { scan-assembler-times {ldr\ts} 1 } } */
diff --git a/gcc/testsuite/gcc.target/aarch64/vec_zeroextend.c b/gcc/testsuite/gcc.target/aarch64/vec_zeroextend.c

new file mode 100644 (file)

index 0000000..9c3971f
--- /dev/null
+++ b/gcc/testsuite/gcc.target/aarch64/vec_zeroextend.c
@@ -0,0 +1,21 @@
+/* { dg-do compile } */
+/* { dg-options "-O2" } */
+
+#define vector __attribute__((vector_size(16) ))
+
+vector unsigned long long
+f1(vector unsigned long long b, vector unsigned int a)
+{
+  b[0] = a[0];
+  return b;
+}
+
+unsigned long long
+f2(vector unsigned int a)
+{
+  return a[0];
+}
+
+/* { dg-final { scan-assembler-times {fmov} 2 } } */
+/* { dg-final { scan-assembler-not {umov} } } */
+/* { dg-final { scan-assembler-not {uxtw} } } */
author	Wilco Dijkstra <wdijkstr@arm.com>
	Fri, 12 Oct 2018 10:49:27 +0000 (10:49 +0000)
committer	Wilco Dijkstra <wilco@gcc.gnu.org>
	Fri, 12 Oct 2018 10:49:27 +0000 (10:49 +0000)
gcc/ChangeLog		patch | blob | history
gcc/config/aarch64/aarch64.md		patch | blob | history
gcc/testsuite/ChangeLog		patch | blob | history
gcc/testsuite/gcc.target/aarch64/popcnt.c		patch | blob | history
gcc/testsuite/gcc.target/aarch64/vec_zeroextend.c	[new file with mode: 0644]	patch | blob