[aarch64] Add CPU support for Ampere Computing's eMAG.

author Christoph Muellner <christoph.muellner@theobroma-systems.com>

Fri, 23 Nov 2018 17:52:19 +0000 (17:52 +0000)

committer Philipp Tomsich <ptomsich@gcc.gnu.org>

Fri, 23 Nov 2018 17:52:19 +0000 (17:52 +0000)
author Christoph Muellner <christoph.muellner@theobroma-systems.com>
Fri, 23 Nov 2018 17:52:19 +0000 (17:52 +0000)
committer Philipp Tomsich <ptomsich@gcc.gnu.org>
Fri, 23 Nov 2018 17:52:19 +0000 (17:52 +0000)
diff --git a/gcc/ChangeLog b/gcc/ChangeLog

index 0f3e8edbf70428d9b7b1b8d3dbc9a41649211e58..fb107374807b8633195c3f5ddff0a8904c2df1a6 100644 (file)
--- a/gcc/ChangeLog
+++ b/gcc/ChangeLog
@@ -1,3 +1,10 @@
+2018-11-23  Christoph Muellner  <christoph.muellner@theobroma-systems.com>
+
+        * config/aarch64/aarch64-cores.def: Define emag.
+       * config/aarch64/aarch64-tune.md: Regenerated with emag.
+       * config/aarch64/aarch64.c (emag_tunings): New struct.
+       * doc/invoke.texi: Document mtune value.
+
  2018-11-23  Christoph Muellner  <christoph.muellner@theobroma-systems.com>
             Philipp Tomsich <philipp.tomsich@theobroma-systems.com>
  
diff --git a/gcc/config/aarch64/aarch64-cores.def b/gcc/config/aarch64/aarch64-cores.def

index 1f3ac56e26b62907acab74b91eb1d07e62d9a7c8..74be5dbf25954560c0b78e6da62f64dc0d143486 100644 (file)
--- a/gcc/config/aarch64/aarch64-cores.def
+++ b/gcc/config/aarch64/aarch64-cores.def
@@ -61,6 +61,11 @@ AARCH64_CORE("thunderxt88",   thunderxt88,   thunderx,  8A,  AARCH64_FL_FOR_ARCH
  AARCH64_CORE("thunderxt81",   thunderxt81,   thunderx,  8A,  AARCH64_FL_FOR_ARCH8 | AARCH64_FL_CRC | AARCH64_FL_CRYPTO, thunderx,  0x43, 0x0a2, -1)
  AARCH64_CORE("thunderxt83",   thunderxt83,   thunderx,  8A,  AARCH64_FL_FOR_ARCH8 | AARCH64_FL_CRC | AARCH64_FL_CRYPTO, thunderx,  0x43, 0x0a3, -1)
  
+/* Ampere Computing cores. */
+/* Do not swap around "emag" and "xgene1",
+   this order is required to handle variant correctly. */
+AARCH64_CORE("emag",        emag,      xgene1,    8A,  AARCH64_FL_FOR_ARCH8 | AARCH64_FL_CRC | AARCH64_FL_CRYPTO, emag, 0x50, 0x000, 3)
+
  /* APM ('P') cores. */
  AARCH64_CORE("xgene1",      xgene1,    xgene1,    8A,  AARCH64_FL_FOR_ARCH8, xgene1, 0x50, 0x000, -1)
  
diff --git a/gcc/config/aarch64/aarch64-tune.md b/gcc/config/aarch64/aarch64-tune.md

index fade1d4430ae3614c93e0f6af53e62064a5c5ef5..2fc7f0398e73dd146a15ec1468d2fe94f339616b 100644 (file)
--- a/gcc/config/aarch64/aarch64-tune.md
+++ b/gcc/config/aarch64/aarch64-tune.md
@@ -1,5 +1,5 @@
  ;; -*- buffer-read-only: t -*-
  ;; Generated automatically by gentune.sh from aarch64-cores.def
  (define_attr "tune"
-       "cortexa35,cortexa53,cortexa57,cortexa72,cortexa73,thunderx,thunderxt88p1,thunderxt88,thunderxt81,thunderxt83,xgene1,falkor,qdf24xx,exynosm1,phecda,thunderx2t99p1,vulcan,thunderx2t99,cortexa55,cortexa75,cortexa76,ares,tsv110,saphira,cortexa57cortexa53,cortexa72cortexa53,cortexa73cortexa35,cortexa73cortexa53,cortexa75cortexa55,cortexa76cortexa55"
+       "cortexa35,cortexa53,cortexa57,cortexa72,cortexa73,thunderx,thunderxt88p1,thunderxt88,thunderxt81,thunderxt83,emag,xgene1,falkor,qdf24xx,exynosm1,phecda,thunderx2t99p1,vulcan,thunderx2t99,cortexa55,cortexa75,cortexa76,ares,tsv110,saphira,cortexa57cortexa53,cortexa72cortexa53,cortexa73cortexa35,cortexa73cortexa53,cortexa75cortexa55,cortexa76cortexa55"
         (const (symbol_ref "((enum attr_tune) aarch64_tune)")))
diff --git a/gcc/config/aarch64/aarch64.c b/gcc/config/aarch64/aarch64.c

index 23d1388d52eb0b273e21c4edd8d523a4684c3233..90bbc578f1a001b52b77561c968c717dcd4aac70 100644 (file)
--- a/gcc/config/aarch64/aarch64.c
+++ b/gcc/config/aarch64/aarch64.c
@@ -957,6 +957,31 @@ static const struct tune_params xgene1_tunings =
    &xgene1_prefetch_tune
  };
  
+static const struct tune_params emag_tunings =
+{
+  &xgene1_extra_costs,
+  &xgene1_addrcost_table,
+  &xgene1_regmove_cost,
+  &xgene1_vector_cost,
+  &generic_branch_cost,
+  &xgene1_approx_modes,
+  6, /* memmov_cost  */
+  4, /* issue_rate  */
+  AARCH64_FUSE_NOTHING, /* fusible_ops  */
+  "16",        /* function_align.  */
+  "16",        /* jump_align.  */
+  "16",        /* loop_align.  */
+  2,   /* int_reassoc_width.  */
+  4,   /* fp_reassoc_width.  */
+  1,   /* vec_reassoc_width.  */
+  2,   /* min_div_recip_mul_sf.  */
+  2,   /* min_div_recip_mul_df.  */
+  17,  /* max_case_values.  */
+  tune_params::AUTOPREFETCHER_OFF,     /* autoprefetcher_model.  */
+  (AARCH64_EXTRA_TUNE_NO_LDP_STP_QREGS),       /* tune_flags.  */
+  &xgene1_prefetch_tune
+};
+
  static const struct tune_params qdf24xx_tunings =
  {
    &qdf24xx_extra_costs,
diff --git a/gcc/doc/invoke.texi b/gcc/doc/invoke.texi

index d46ebd02c4e0fee7b1c93a9e96d80113f6af93a7..77bdfaad3ebbdb84c36cfe256d0ab3669a8d1a2c 100644 (file)
--- a/gcc/doc/invoke.texi
+++ b/gcc/doc/invoke.texi
@@ -15565,7 +15565,7 @@ Specify the name of the target processor for which GCC should tune the
  performance of the code.  Permissible values for this option are:
  @samp{generic}, @samp{cortex-a35}, @samp{cortex-a53}, @samp{cortex-a55},
  @samp{cortex-a57}, @samp{cortex-a72}, @samp{cortex-a73}, @samp{cortex-a75},
-@samp{cortex-a76}, @samp{ares}, @samp{exynos-m1}, @samp{falkor},
+@samp{cortex-a76}, @samp{ares}, @samp{exynos-m1}, @samp{emag}, @samp{falkor},
  @samp{qdf24xx}, @samp{saphira}, @samp{phecda}, @samp{xgene1}, @samp{vulcan},
  @samp{thunderx}, @samp{thunderxt88}, @samp{thunderxt88p1}, @samp{thunderxt81},
  @samp{tsv110}, @samp{thunderxt83}, @samp{thunderx2t99},
author	Christoph Muellner <christoph.muellner@theobroma-systems.com>
	Fri, 23 Nov 2018 17:52:19 +0000 (17:52 +0000)
committer	Philipp Tomsich <ptomsich@gcc.gnu.org>
	Fri, 23 Nov 2018 17:52:19 +0000 (17:52 +0000)
gcc/ChangeLog		patch \| blob \| history
gcc/config/aarch64/aarch64-cores.def		patch \| blob \| history
gcc/config/aarch64/aarch64-tune.md		patch \| blob \| history
gcc/config/aarch64/aarch64.c		patch \| blob \| history
gcc/doc/invoke.texi		patch \| blob \| history