[ARM] Optimize copysign/copysignf for soft-float using BFI
authorJiong Wang <jiong.wang@arm.com>
Fri, 28 Nov 2014 14:07:04 +0000 (14:07 +0000)
committerJiong Wang <jiwang@gcc.gnu.org>
Fri, 28 Nov 2014 14:07:04 +0000 (14:07 +0000)
  gcc/
    * config/arm/arm.md (copysignsf3): New pattern.
    (copysigndf3): Likewise.

  gcc/testsuite/
    * gcc.target/arm/copysign_softfloat_1.c: New copysign/copysignf
    testcase for soft-float.

From-SVN: r218159

gcc/ChangeLog
gcc/config/arm/arm.md
gcc/testsuite/ChangeLog
gcc/testsuite/gcc.target/arm/copysign_softfloat_1.c [new file with mode: 0644]

index 3165e49961984350ba641f65037502032a457030..10fec954f9f5744b4feb95efa520e01e7dccfe56 100644 (file)
@@ -1,3 +1,8 @@
+2014-11-28  Jiong Wang  <jiong.wang@arm.com>
+
+       * config/arm/arm.md (copysignsf3): New pattern.
+       (copysigndf3): Likewise.
+
 2014-11-28  Andrey Turetskiy  <andrey.turetskiy@intel.com>
            Ilya Verbin  <ilya.verbin@intel.com>
 
index c48001c952d758ab680e83487652d4be4cdb8a51..822760bdd34e2e381334fdeecc58d3809c11774f 100644 (file)
   [(set_attr "predicable" "yes")]
 )
 
+(define_expand "copysignsf3"
+  [(match_operand:SF 0 "register_operand")
+   (match_operand:SF 1 "register_operand")
+   (match_operand:SF 2 "register_operand")]
+  "TARGET_SOFT_FLOAT && arm_arch_thumb2"
+  "{
+     emit_move_insn (operands[0], operands[2]);
+     emit_insn (gen_insv_t2 (simplify_gen_subreg (SImode, operands[0], SFmode, 0),
+               GEN_INT (31), GEN_INT (0),
+               simplify_gen_subreg (SImode, operands[1], SFmode, 0)));
+     DONE;
+  }"
+)
+
+(define_expand "copysigndf3"
+  [(match_operand:DF 0 "register_operand")
+   (match_operand:DF 1 "register_operand")
+   (match_operand:DF 2 "register_operand")]
+  "TARGET_SOFT_FLOAT && arm_arch_thumb2"
+  "{
+     rtx op0_low = gen_lowpart (SImode, operands[0]);
+     rtx op0_high = gen_highpart (SImode, operands[0]);
+     rtx op1_low = gen_lowpart (SImode, operands[1]);
+     rtx op1_high = gen_highpart (SImode, operands[1]);
+     rtx op2_high = gen_highpart (SImode, operands[2]);
+
+     rtx scratch1 = gen_reg_rtx (SImode);
+     rtx scratch2 = gen_reg_rtx (SImode);
+     emit_move_insn (scratch1, op2_high);
+     emit_move_insn (scratch2, op1_high);
+
+     emit_insn(gen_rtx_SET(SImode, scratch1,
+                          gen_rtx_LSHIFTRT (SImode, op2_high, GEN_INT(31))));
+     emit_insn(gen_insv_t2(scratch2, GEN_INT(1), GEN_INT(31), scratch1));
+     emit_move_insn (op0_low, op1_low);
+     emit_move_insn (op0_high, scratch2);
+
+     DONE;
+  }"
+)
+
 ;; Vector bits common to IWMMXT and Neon
 (include "vec-common.md")
 ;; Load the Intel Wireless Multimedia Extension patterns
index ca28e66fadd9705fb7e44420173bd169c0ce702f..8d4a7889ff24f78c9ec6c2b33b8a2794a9a95270 100644 (file)
@@ -1,3 +1,8 @@
+2014-11-28  Jiong Wang  <jiong.wang@arm.com>
+
+       * gcc.target/arm/copysign_softfloat_1.c: New copysign/copysignf
+       testcase for soft-float.
+
 2014-11-28  H.J. Lu  <hongjiu.lu@intel.com>
 
        * gcc.target/i386/pr63661.c: Replace -mtune=native with
diff --git a/gcc/testsuite/gcc.target/arm/copysign_softfloat_1.c b/gcc/testsuite/gcc.target/arm/copysign_softfloat_1.c
new file mode 100644 (file)
index 0000000..def3fa0
--- /dev/null
@@ -0,0 +1,61 @@
+/* { dg-do run } */
+/* { dg-require-effective-target arm_thumb2_ok } */
+/* { dg-skip-if "skip override" { *-*-* } { "-mfloat-abi=softfp" "-mfloat-abi=hard" } { "" } } */
+/* { dg-options "-O2 -mfloat-abi=soft --save-temps" } */
+extern void abort (void);
+
+#define N 16
+
+float a_f[N] = {-0.1f, -3.2f, -6.3f, -9.4f,
+               -12.5f, -15.6f, -18.7f, -21.8f,
+               24.9f, 27.1f, 30.2f, 33.3f,
+               36.4f, 39.5f, 42.6f, 45.7f};
+
+float b_f[N] = {-1.2f, 3.4f, -5.6f, 7.8f,
+               -9.0f, 1.0f, -2.0f, 3.0f,
+               -4.0f, -5.0f, 6.0f, 7.0f,
+               -8.0f, -9.0f, 10.0f, 11.0f};
+
+float c_f[N] = {-0.1f, 3.2f, -6.3f, 9.4f,
+               -12.5f, 15.6f, -18.7f, 21.8f,
+               -24.9f, -27.1f, 30.2f, 33.3f,
+               -36.4f, -39.5f, 42.6f, 45.7f};
+
+double a_d[N] = {-0.1, -3.2, -6.3, -9.4,
+                -12.5, -15.6, -18.7, -21.8,
+                24.9, 27.1, 30.2, 33.3,
+                36.4, 39.5, 42.6, 45.7};
+
+double b_d[N] = {-1.2, 3.4, -5.6, 7.8,
+                -9.0, 1.0, -2.0, 3.0,
+                -4.0, -5.0, 6.0, 7.0,
+                -8.0, -9.0, 10.0, 11.0};
+
+double c_d[N] = {-0.1, 3.2, -6.3, 9.4,
+                -12.5, 15.6, -18.7, 21.8,
+                -24.9, -27.1, 30.2, 33.3,
+                -36.4, -39.5, 42.6, 45.7};
+
+int
+main (int argc, char **argv)
+{
+  int index = 0;
+
+/* { dg-final { scan-assembler-times "bfi" 2 } } */
+/* { dg-final { scan-assembler-times "lsr" 1 } } */
+  for (index; index < N; index++)
+    {
+      if (__builtin_copysignf (a_f[index], b_f[index]) != c_f[index])
+       abort();
+    }
+
+  for (index = 0; index < N; index++)
+    {
+      if (__builtin_copysign (a_d[index], b_d[index]) != c_d[index])
+       abort();
+    }
+
+  return 0;
+}
+
+/* { dg-final { cleanup-saved-temps } } */