arm-cores.def: Add support for -mcpu=cortex-m0.small-multiply, cortex-m0plus.small-multiply, cortex-m1.small-multiply.

author Hale Wang <hale.wang@arm.com>

Thu, 6 Nov 2014 07:02:30 +0000 (07:02 +0000)

committer Hale Wang <halewang@gcc.gnu.org>

Thu, 6 Nov 2014 07:02:30 +0000 (07:02 +0000)
author Hale Wang <hale.wang@arm.com>
Thu, 6 Nov 2014 07:02:30 +0000 (07:02 +0000)
committer Hale Wang <halewang@gcc.gnu.org>
Thu, 6 Nov 2014 07:02:30 +0000 (07:02 +0000)
diff --git a/gcc/ChangeLog b/gcc/ChangeLog

index c5ed2a31f382d4bebd312ef793677a1463eed292..0a2748bf9095cc60d86ef7f9d8fead768c9987d5 100644 (file)
--- a/gcc/ChangeLog
+++ b/gcc/ChangeLog
@@ -1,3 +1,27 @@
+2014-11-06  Hale Wang  <Hale.Wang@arm.com>
+
+       * config/arm/arm-cores.def: Add support for
+       -mcpu=cortex-m0.small-multiply,cortex-m0plus.small-multiply,
+       cortex-m1.small-multiply.
+       * config/arm/arm-tables.opt: Regenerate.
+       * config/arm/arm-tune.md: Regenerate.
+       * config/arm/arm.c: Update the rtx-costs for MUL.
+       * config/arm/bpabi.h: Handle
+       -mcpu=cortex-m0.small-multiply,cortex-m0plus.small-multiply,
+       cortex-m1.small-multiply.
+       * doc/invoke.texi: Document
+       -mcpu=cortex-m0.small-multiply,cortex-m0plus.small-multiply,
+       cortex-m1.small-multiply.
+       * testsuite/gcc.target/arm/small-multiply-m0-1.c: New test case.
+       * testsuite/gcc.target/arm/small-multiply-m0-2.c: Likewise.
+       * testsuite/gcc.target/arm/small-multiply-m0-3.c: Likewise.
+       * testsuite/gcc.target/arm/small-multiply-m0plus-1.c: Likewise.
+       * testsuite/gcc.target/arm/small-multiply-m0plus-2.c: Likewise.
+       * testsuite/gcc.target/arm/small-multiply-m0plus-3.c: Likewise.
+       * testsuite/gcc.target/arm/small-multiply-m1-1.c: Likewise.
+       * testsuite/gcc.target/arm/small-multiply-m1-2.c: Likewise.
+       * testsuite/gcc.target/arm/small-multiply-m1-3.c: Likewise.
+
  2014-11-06  Hale Wang  <Hale.Wang@arm.com>
  
         * config/arm/arm.c: Add cortex-m7 tune.
diff --git a/gcc/config/arm/arm-cores.def b/gcc/config/arm/arm-cores.def

index 3b34173e983a688cb24df1e4b9b8b371860b6987..d5067b0e9b9255181a95c116e3131c98c89ff79e 100644 (file)
--- a/gcc/config/arm/arm-cores.def
+++ b/gcc/config/arm/arm-cores.def
@@ -137,6 +137,11 @@ ARM_CORE("cortex-m1",              cortexm1, cortexm1,             6M, FL_LDSCHED, v6m)
  ARM_CORE("cortex-m0",          cortexm0, cortexm0,             6M, FL_LDSCHED, v6m)
  ARM_CORE("cortex-m0plus",      cortexm0plus, cortexm0plus,     6M, FL_LDSCHED, v6m)
  
+/* V6M Architecture Processors for small-multiply implementations.  */
+ARM_CORE("cortex-m1.small-multiply",   cortexm1smallmultiply, cortexm1,        6M, FL_LDSCHED | FL_SMALLMUL, v6m)
+ARM_CORE("cortex-m0.small-multiply",   cortexm0smallmultiply, cortexm0,        6M, FL_LDSCHED | FL_SMALLMUL, v6m)
+ARM_CORE("cortex-m0plus.small-multiply",cortexm0plussmallmultiply, cortexm0plus,6M, FL_LDSCHED | FL_SMALLMUL, v6m)
+
  /* V7 Architecture Processors */
  ARM_CORE("generic-armv7-a",    genericv7a, genericv7a,         7A,  FL_LDSCHED, cortex)
  ARM_CORE("cortex-a5",          cortexa5, cortexa5,             7A,  FL_LDSCHED, cortex_a5)
diff --git a/gcc/config/arm/arm-tables.opt b/gcc/config/arm/arm-tables.opt

index 04191bceefbb1f279f031d18ac11c083ea9d7d15..9c7e944bfcbc7a3f3e5cbfa625b56b0099c842da 100644 (file)
--- a/gcc/config/arm/arm-tables.opt
+++ b/gcc/config/arm/arm-tables.opt
@@ -240,6 +240,15 @@ Enum(processor_type) String(cortex-m0) Value(cortexm0)
  EnumValue
  Enum(processor_type) String(cortex-m0plus) Value(cortexm0plus)
  
+EnumValue
+Enum(processor_type) String(cortex-m1.small-multiply) Value(cortexm1smallmultiply)
+
+EnumValue
+Enum(processor_type) String(cortex-m0.small-multiply) Value(cortexm0smallmultiply)
+
+EnumValue
+Enum(processor_type) String(cortex-m0plus.small-multiply) Value(cortexm0plussmallmultiply)
+
  EnumValue
  Enum(processor_type) String(generic-armv7-a) Value(genericv7a)
  
diff --git a/gcc/config/arm/arm-tune.md b/gcc/config/arm/arm-tune.md

index 4217fbe8b2c8e62c3098fa531ad40600f948944b..84355d69e467652069c4649d26685f2dba20a6e9 100644 (file)
--- a/gcc/config/arm/arm-tune.md
+++ b/gcc/config/arm/arm-tune.md
@@ -25,6 +25,7 @@
         arm1176jzs,arm1176jzfs,mpcorenovfp,
         mpcore,arm1156t2s,arm1156t2fs,
         cortexm1,cortexm0,cortexm0plus,
+       cortexm1smallmultiply,cortexm0smallmultiply,cortexm0plussmallmultiply,
         genericv7a,cortexa5,cortexa7,
         cortexa8,cortexa9,cortexa12,
         cortexa15,cortexr4,cortexr4f,
diff --git a/gcc/config/arm/arm.c b/gcc/config/arm/arm.c

index beeeb970db0a42dc68a128169e3e0dc27a43cf71..9e07d600c94a01f562334e591f35ebeffc573d6c 100644 (file)
--- a/gcc/config/arm/arm.c
+++ b/gcc/config/arm/arm.c
@@ -770,6 +770,8 @@ static int thumb_call_reg_needed;
  #define FL_ARCH8      (1 << 24)       /* Architecture 8.  */
  #define FL_CRC32      (1 << 25)              /* ARMv8 CRC32 instructions.  */
  
+#define FL_SMALLMUL   (1 << 26)       /* Small multiply supported.  */
+
  #define FL_IWMMXT     (1 << 29)              /* XScale v2 or "Intel Wireless MMX technology".  */
  #define FL_IWMMXT2    (1 << 30)       /* "Intel Wireless MMX2 technology".  */
  
@@ -933,6 +935,9 @@ int arm_condexec_masklen = 0;
  /* Nonzero if chip supports the ARMv8 CRC instructions.  */
  int arm_arch_crc = 0;
  
+/* Nonzero if the core has a very small, high-latency, multiply unit.  */
+int arm_m_profile_small_mul = 0;
+
  /* The condition codes of the ARM, and the inverse function.  */
  static const char * const arm_condition_codes[] =
  {
@@ -2824,6 +2829,7 @@ arm_option_override (void)
    arm_arch_arm_hwdiv = (insn_flags & FL_ARM_DIV) != 0;
    arm_tune_cortex_a9 = (arm_tune == cortexa9) != 0;
    arm_arch_crc = (insn_flags & FL_CRC32) != 0;
+  arm_m_profile_small_mul = (insn_flags & FL_SMALLMUL) != 0;
    if (arm_restrict_it == 2)
      arm_restrict_it = arm_arch8 && TARGET_THUMB2;
  
@@ -8960,7 +8966,13 @@ thumb1_size_rtx_costs (rtx x, enum rtx_code code, enum rtx_code outer)
            /* Thumb1 mul instruction can't operate on const. We must Load it
               into a register first.  */
            int const_size = thumb1_size_rtx_costs (XEXP (x, 1), CONST_INT, SET);
-          return COSTS_N_INSNS (1) + const_size;
+         /* For the targets which have a very small and high-latency multiply
+            unit, we prefer to synthesize the mult with up to 5 instructions,
+            giving a good balance between size and performance.  */
+         if (arm_arch6m && arm_m_profile_small_mul)
+           return COSTS_N_INSNS (5);
+         else
+           return COSTS_N_INSNS (1) + const_size;
          }
        return COSTS_N_INSNS (1);
  
@@ -11378,7 +11390,11 @@ arm_9e_rtx_costs (rtx x, enum rtx_code code, enum rtx_code outer_code,
        switch (code)
         {
         case MULT:
-         *total = COSTS_N_INSNS (3);
+         /* Small multiply: 32 cycles for an integer multiply inst.  */
+         if (arm_arch6m && arm_m_profile_small_mul)
+           *total = COSTS_N_INSNS (32);
+         else
+           *total = COSTS_N_INSNS (3);
           return true;
  
         default:
diff --git a/gcc/config/arm/bpabi.h b/gcc/config/arm/bpabi.h

index 9a471c251a8d5aa565f423fbf1e49d0380b80178..f99e1af1e1ad27f0cfbc0cfb9e9daa80ebe49f65 100644 (file)
--- a/gcc/config/arm/bpabi.h
+++ b/gcc/config/arm/bpabi.h
@@ -70,6 +70,9 @@
     |mcpu=cortex-a53                                    \
     |mcpu=cortex-a57                                    \
     |mcpu=cortex-a57.cortex-a53                         \
+   |mcpu=cortex-m1.small-multiply                       \
+   |mcpu=cortex-m0.small-multiply                       \
+   |mcpu=cortex-m0plus.small-multiply                  \
     |mcpu=generic-armv7-a                                \
     |march=armv7ve                                      \
     |march=armv7-m|mcpu=cortex-m3                        \
@@ -87,6 +90,9 @@
     |mcpu=cortex-a53                                    \
     |mcpu=cortex-a57                                    \
     |mcpu=cortex-a57.cortex-a53                         \
+   |mcpu=cortex-m1.small-multiply                       \
+   |mcpu=cortex-m0.small-multiply                       \
+   |mcpu=cortex-m0plus.small-multiply                   \
     |mcpu=marvell-pj4                                   \
     |mcpu=generic-armv7-a                                \
     |march=armv7ve                                      \
diff --git a/gcc/doc/invoke.texi b/gcc/doc/invoke.texi

index a6429333c3cd63ff460cd15bc85333989f0cbfe7..209c8f68bc982782f3a0a9fe3fe1e19d03b05906 100644 (file)
--- a/gcc/doc/invoke.texi
+++ b/gcc/doc/invoke.texi
@@ -12747,6 +12747,9 @@ Permissible names are: @samp{arm2}, @samp{arm250},
  @samp{cortex-m1},
  @samp{cortex-m0},
  @samp{cortex-m0plus},
+@samp{cortex-m1.small-multiply},
+@samp{cortex-m0.small-multiply},
+@samp{cortex-m0plus.small-multiply},
  @samp{marvell-pj4},
  @samp{xscale}, @samp{iwmmxt}, @samp{iwmmxt2}, @samp{ep9312},
  @samp{fa526}, @samp{fa626},
diff --git a/gcc/testsuite/gcc.target/arm/small-multiply-m0-1.c b/gcc/testsuite/gcc.target/arm/small-multiply-m0-1.c

new file mode 100644 (file)

index 0000000..77ec603
--- /dev/null
+++ b/gcc/testsuite/gcc.target/arm/small-multiply-m0-1.c
@@ -0,0 +1,12 @@
+/* { dg-do compile } */
+/* { dg-require-effective-target arm_thumb1_ok } */
+/* { dg-skip-if "Test is specific to cortex-m0.small-multiply" { arm*-*-* } { "-mcpu=*" } { "-mcpu=cortex-m0.small-multiply" } } */
+/* { dg-options "-mcpu=cortex-m0.small-multiply -mthumb -O2" } */
+
+int
+test (int a)
+{
+  return a * 0x123456;
+}
+
+/* { dg-final { scan-assembler-not "\[\\t \]+mul" } } */
diff --git a/gcc/testsuite/gcc.target/arm/small-multiply-m0-2.c b/gcc/testsuite/gcc.target/arm/small-multiply-m0-2.c

new file mode 100644 (file)

index 0000000..c89b3ba
--- /dev/null
+++ b/gcc/testsuite/gcc.target/arm/small-multiply-m0-2.c
@@ -0,0 +1,12 @@
+/* { dg-do compile } */
+/* { dg-require-effective-target arm_thumb1_ok } */
+/* { dg-skip-if "Test is specific to cortex-m0.small-multiply" { arm*-*-* } { "-mcpu=*" } { "-mcpu=cortex-m0.small-multiply" } } */
+/* { dg-options "-mcpu=cortex-m0.small-multiply -mthumb -Os" } */
+
+int
+test (int a)
+{
+  return a * 0x123456;
+}
+
+/* { dg-final { scan-assembler "\[\\t \]+mul" } } */
diff --git a/gcc/testsuite/gcc.target/arm/small-multiply-m0-3.c b/gcc/testsuite/gcc.target/arm/small-multiply-m0-3.c

new file mode 100644 (file)

index 0000000..b2df109
--- /dev/null
+++ b/gcc/testsuite/gcc.target/arm/small-multiply-m0-3.c
@@ -0,0 +1,12 @@
+/* { dg-do compile } */
+/* { dg-require-effective-target arm_thumb1_ok } */
+/* { dg-skip-if "Test is specific to cortex-m0.small-multiply" { arm*-*-* } { "-mcpu=*" } { "-mcpu=cortex-m0.small-multiply" } } */
+/* { dg-options "-mcpu=cortex-m0.small-multiply -mthumb -Os" } */
+
+int
+test (int a)
+{
+  return a * 0x13;
+}
+
+/* { dg-final { scan-assembler-not "\[\\t \]+mul" } } */
diff --git a/gcc/testsuite/gcc.target/arm/small-multiply-m0plus-1.c b/gcc/testsuite/gcc.target/arm/small-multiply-m0plus-1.c

new file mode 100644 (file)

index 0000000..08a450b
--- /dev/null
+++ b/gcc/testsuite/gcc.target/arm/small-multiply-m0plus-1.c
@@ -0,0 +1,12 @@
+/* { dg-do compile } */
+/* { dg-require-effective-target arm_thumb1_ok } */
+/* { dg-skip-if "Test is specific to cortex-m0plus.small-multiply" { arm*-*-* } { "-mcpu=*" } { "-mcpu=cortex-m0plus.small-multiply" } } */
+/* { dg-options "-mcpu=cortex-m0plus.small-multiply -mthumb -O2" } */
+
+int
+test (int a)
+{
+  return a * 0x123456;
+}
+
+/* { dg-final { scan-assembler-not "\[\\t \]+mul" } } */
diff --git a/gcc/testsuite/gcc.target/arm/small-multiply-m0plus-2.c b/gcc/testsuite/gcc.target/arm/small-multiply-m0plus-2.c

new file mode 100644 (file)

index 0000000..17b52d3
--- /dev/null
+++ b/gcc/testsuite/gcc.target/arm/small-multiply-m0plus-2.c
@@ -0,0 +1,12 @@
+/* { dg-do compile } */
+/* { dg-require-effective-target arm_thumb1_ok } */
+/* { dg-skip-if "Test is specific to cortex-m0plus.small-multiply" { arm*-*-* } { "-mcpu=*" } { "-mcpu=cortex-m0plus.small-multiply" } } */
+/* { dg-options "-mcpu=cortex-m0plus.small-multiply -mthumb -Os" } */
+
+int
+test (int a)
+{
+  return a * 0x123456;
+}
+
+/* { dg-final { scan-assembler "\[\\t \]+mul" } } */
diff --git a/gcc/testsuite/gcc.target/arm/small-multiply-m0plus-3.c b/gcc/testsuite/gcc.target/arm/small-multiply-m0plus-3.c

new file mode 100644 (file)

index 0000000..af69c75
--- /dev/null
+++ b/gcc/testsuite/gcc.target/arm/small-multiply-m0plus-3.c
@@ -0,0 +1,12 @@
+/* { dg-do compile } */
+/* { dg-require-effective-target arm_thumb1_ok } */
+/* { dg-skip-if "Test is specific to cortex-m0plus.small-multiply" { arm*-*-* } { "-mcpu=*" } { "-mcpu=cortex-m0plus.small-multiply" } } */
+/* { dg-options "-mcpu=cortex-m0plus.small-multiply -mthumb -Os" } */
+
+int
+test (int a)
+{
+  return a * 0x13;
+}
+
+/* { dg-final { scan-assembler-not "\[\\t \]+mul" } } */
diff --git a/gcc/testsuite/gcc.target/arm/small-multiply-m1-1.c b/gcc/testsuite/gcc.target/arm/small-multiply-m1-1.c

new file mode 100644 (file)

index 0000000..d265aaf
--- /dev/null
+++ b/gcc/testsuite/gcc.target/arm/small-multiply-m1-1.c
@@ -0,0 +1,12 @@
+/* { dg-do compile } */
+/* { dg-require-effective-target arm_thumb1_ok } */
+/* { dg-skip-if "Test is specific to cortex-m1.small-multiply" { arm*-*-* } { "-mcpu=*" } { "-mcpu=cortex-m1.small-multiply" } } */
+/* { dg-options "-mcpu=cortex-m1.small-multiply -mthumb -O2" } */
+
+int
+test (int a)
+{
+  return a * 0x123456;
+}
+
+/* { dg-final { scan-assembler-not "\[\\t \]+mul" } } */
diff --git a/gcc/testsuite/gcc.target/arm/small-multiply-m1-2.c b/gcc/testsuite/gcc.target/arm/small-multiply-m1-2.c

new file mode 100644 (file)

index 0000000..c50891c
--- /dev/null
+++ b/gcc/testsuite/gcc.target/arm/small-multiply-m1-2.c
@@ -0,0 +1,12 @@
+/* { dg-do compile } */
+/* { dg-require-effective-target arm_thumb1_ok } */
+/* { dg-skip-if "Test is specific to cortex-m1.small-multiply" { arm*-*-* } { "-mcpu=*" } { "-mcpu=cortex-m1.small-multiply" } } */
+/* { dg-options "-mcpu=cortex-m1.small-multiply -mthumb -Os" } */
+
+int
+test (int a)
+{
+  return a * 0x123456;
+}
+
+/* { dg-final { scan-assembler "\[\\t \]+mul" } } */
diff --git a/gcc/testsuite/gcc.target/arm/small-multiply-m1-3.c b/gcc/testsuite/gcc.target/arm/small-multiply-m1-3.c

new file mode 100644 (file)

index 0000000..1da21a6
--- /dev/null
+++ b/gcc/testsuite/gcc.target/arm/small-multiply-m1-3.c
@@ -0,0 +1,12 @@
+/* { dg-do compile } */
+/* { dg-require-effective-target arm_thumb1_ok } */
+/* { dg-skip-if "Test is specific to cortex-m1.small-multiply" { arm*-*-* } { "-mcpu=*" } { "-mcpu=cortex-m1.small-multiply" } } */
+/* { dg-options "-mcpu=cortex-m1.small-multiply -mthumb -Os" } */
+
+int
+test (int a)
+{
+  return a * 0x13;
+}
+
+/* { dg-final { scan-assembler-not "\[\\t \]+mul" } } */
author	Hale Wang <hale.wang@arm.com>
	Thu, 6 Nov 2014 07:02:30 +0000 (07:02 +0000)
committer	Hale Wang <halewang@gcc.gnu.org>
	Thu, 6 Nov 2014 07:02:30 +0000 (07:02 +0000)
gcc/ChangeLog		patch | blob | history
gcc/config/arm/arm-cores.def		patch | blob | history
gcc/config/arm/arm-tables.opt		patch | blob | history
gcc/config/arm/arm-tune.md		patch | blob | history
gcc/config/arm/arm.c		patch | blob | history
gcc/config/arm/bpabi.h		patch | blob | history
gcc/doc/invoke.texi		patch | blob | history
gcc/testsuite/gcc.target/arm/small-multiply-m0-1.c	[new file with mode: 0644]	patch | blob
gcc/testsuite/gcc.target/arm/small-multiply-m0-2.c	[new file with mode: 0644]	patch | blob
gcc/testsuite/gcc.target/arm/small-multiply-m0-3.c	[new file with mode: 0644]	patch | blob
gcc/testsuite/gcc.target/arm/small-multiply-m0plus-1.c	[new file with mode: 0644]	patch | blob
gcc/testsuite/gcc.target/arm/small-multiply-m0plus-2.c	[new file with mode: 0644]	patch | blob
gcc/testsuite/gcc.target/arm/small-multiply-m0plus-3.c	[new file with mode: 0644]	patch | blob
gcc/testsuite/gcc.target/arm/small-multiply-m1-1.c	[new file with mode: 0644]	patch | blob
gcc/testsuite/gcc.target/arm/small-multiply-m1-2.c	[new file with mode: 0644]	patch | blob
gcc/testsuite/gcc.target/arm/small-multiply-m1-3.c	[new file with mode: 0644]	patch | blob