2017-07-28 Tamar Christina <tamar.christina@arm.com>

author Tamar Christina <tamar.christina@arm.com>

Fri, 28 Jul 2017 15:11:25 +0000 (15:11 +0000)

committer Tamar Christina <tnfchris@gcc.gnu.org>

Fri, 28 Jul 2017 15:11:25 +0000 (15:11 +0000)
author Tamar Christina <tamar.christina@arm.com>
Fri, 28 Jul 2017 15:11:25 +0000 (15:11 +0000)
committer Tamar Christina <tnfchris@gcc.gnu.org>
Fri, 28 Jul 2017 15:11:25 +0000 (15:11 +0000)
diff --git a/gcc/ChangeLog b/gcc/ChangeLog

index cf3e7e5e602724685d509351183ae45222518cc3..8b62fd56b08053f638ac9239627d101102717e31 100644 (file)
--- a/gcc/ChangeLog
+++ b/gcc/ChangeLog
@@ -1,3 +1,27 @@
+2017-07-28  Tamar Christina  <tamar.christina@arm.com>
+
+       * config/aarch64/aarch64.c
+       (aarch64_simd_container_mode): Add prototype.
+       (aarch64_expand_mov_immediate): Add HI support.
+       (aarch64_reinterpret_float_as_int, aarch64_float_const_rtx_p): New.
+       (aarch64_can_const_movi_rtx_p): New.
+       (aarch64_preferred_reload_class):
+       Remove restrictions of using FP registers for certain SIMD operations.
+       (aarch64_rtx_costs): Add new cost for CONST_DOUBLE moves.
+       (aarch64_valid_floating_const): Add integer move validation.
+       (aarch64_simd_imm_scalar_p): Remove.
+       (aarch64_output_scalar_simd_mov_immediate): Generalize function.
+       (aarch64_legitimate_constant_p): Expand list of supported cases.
+       * config/aarch64/aarch64-protos.h
+       (aarch64_float_const_rtx_p, aarch64_can_const_movi_rtx_p): New.
+       (aarch64_reinterpret_float_as_int): New.
+       (aarch64_simd_imm_scalar_p): Remove.
+       * config/aarch64/constraints.md (Uvi): New.
+       (Dd): Split into Ds and new Dd.
+       * config/aarch64/aarch64.md (*movsi_aarch64):
+       Add SIMD mov case.
+       (*movdi_aarch64): Add SIMD mov case.
+
  2017-07-28  Bin Cheng  <bin.cheng@arm.com>
  
         * tree-predcom.c: (struct chain): Handle store-store chain in which
diff --git a/gcc/config/aarch64/aarch64-protos.h b/gcc/config/aarch64/aarch64-protos.h

index e397ff4afa73cfbc7e192fd5686b1beff9bbbadf..beff28e2272b7c771c5ae5f3e17f10fc5f9711d0 100644 (file)
--- a/gcc/config/aarch64/aarch64-protos.h
+++ b/gcc/config/aarch64/aarch64-protos.h
@@ -319,6 +319,7 @@ unsigned HOST_WIDE_INT aarch64_and_split_imm2 (HOST_WIDE_INT val_in);
  bool aarch64_and_bitmask_imm (unsigned HOST_WIDE_INT val_in, machine_mode mode);
  int aarch64_branch_cost (bool, bool);
  enum aarch64_symbol_type aarch64_classify_symbolic_expression (rtx);
+bool aarch64_can_const_movi_rtx_p (rtx x, machine_mode mode);
  bool aarch64_const_vec_all_same_int_p (rtx, HOST_WIDE_INT);
  bool aarch64_constant_address_p (rtx);
  bool aarch64_emit_approx_div (rtx, rtx, rtx);
@@ -326,6 +327,7 @@ bool aarch64_emit_approx_sqrt (rtx, rtx, bool);
  void aarch64_expand_call (rtx, rtx, bool);
  bool aarch64_expand_movmem (rtx *);
  bool aarch64_float_const_zero_rtx_p (rtx);
+bool aarch64_float_const_rtx_p (rtx);
  bool aarch64_function_arg_regno_p (unsigned);
  bool aarch64_fusion_enabled_p (enum aarch64_fusion_pairs);
  bool aarch64_gen_movmemqi (rtx *);
@@ -351,9 +353,9 @@ bool aarch64_pad_arg_upward (machine_mode, const_tree);
  bool aarch64_pad_reg_upward (machine_mode, const_tree, bool);
  bool aarch64_regno_ok_for_base_p (int, bool);
  bool aarch64_regno_ok_for_index_p (int, bool);
+bool aarch64_reinterpret_float_as_int (rtx value, unsigned HOST_WIDE_INT *fail);
  bool aarch64_simd_check_vect_par_cnst_half (rtx op, machine_mode mode,
                                             bool high);
-bool aarch64_simd_imm_scalar_p (rtx x, machine_mode mode);
  bool aarch64_simd_imm_zero_p (rtx, machine_mode);
  bool aarch64_simd_scalar_immediate_valid_for_move (rtx, machine_mode);
  bool aarch64_simd_shift_imm_p (rtx, machine_mode, bool);
diff --git a/gcc/config/aarch64/aarch64.c b/gcc/config/aarch64/aarch64.c

index 092ef10b7b86158a9d54e2bf723dda25d9e36c7d..af6e6523098138c88f4057f4bc00be5a89fbacea 100644 (file)
--- a/gcc/config/aarch64/aarch64.c
+++ b/gcc/config/aarch64/aarch64.c
@@ -147,6 +147,8 @@ static bool aarch64_builtin_support_vector_misalignment (machine_mode mode,
                                                          const_tree type,
                                                          int misalignment,
                                                          bool is_packed);
+static machine_mode
+aarch64_simd_container_mode (machine_mode mode, unsigned width);
  
  /* Major revision number of the ARM Architecture implemented by the target.  */
  unsigned aarch64_architecture_version;
@@ -4677,6 +4679,69 @@ aarch64_legitimize_address_displacement (rtx *disp, rtx *off, machine_mode mode)
    return true;
  }
  
+/* Return the binary representation of floating point constant VALUE in
+   INTVAL.  If the value cannot be converted, return false without setting
+   INTVAL.  The conversion is done in the mode of VALUE.  */
+bool
+aarch64_reinterpret_float_as_int (rtx value, unsigned HOST_WIDE_INT *intval)
+{
+  /* We make a general exception for 0.  */
+  if (aarch64_float_const_zero_rtx_p (value))
+    {
+      *intval = 0;
+      return true;
+    }
+
+  machine_mode mode = GET_MODE (value);
+  if (GET_CODE (value) != CONST_DOUBLE
+      || !SCALAR_FLOAT_MODE_P (mode)
+      || GET_MODE_BITSIZE (mode) > HOST_BITS_PER_WIDE_INT
+      /* Only support up to DF mode.  */
+      || GET_MODE_BITSIZE (mode) > GET_MODE_BITSIZE (DFmode))
+    return false;
+
+  long res[2];
+  real_to_target (res, CONST_DOUBLE_REAL_VALUE (value),
+                 REAL_MODE_FORMAT (mode));
+
+  /* real_to_target stores the words in target word order, so for DFmode the
+     least significant 32 bits are in res[1] on big-endian targets.  */
+  int low = (GET_MODE_BITSIZE (mode) == GET_MODE_BITSIZE (DFmode)
+            && BYTES_BIG_ENDIAN) ? 1 : 0;
+  unsigned HOST_WIDE_INT ival = zext_hwi (res[low], 32);
+  if (GET_MODE_BITSIZE (mode) == GET_MODE_BITSIZE (DFmode))
+    ival |= (zext_hwi (res[1 - low], 32) << 32);
+
+  *intval = ival;
+  return true;
+}
+
+/* Return TRUE if X is a scalar floating-point constant whose bit pattern
+   can be materialized with a single MOV(+MOVK) and then moved by an FMOV.  */
+bool
+aarch64_float_const_rtx_p (rtx x)
+{
+  machine_mode mode = GET_MODE (x);
+  unsigned HOST_WIDE_INT bits;
+
+  /* Reject anything that cannot be reinterpreted as an integer.  */
+  if (mode == VOIDmode
+      || GET_CODE (x) != CONST_DOUBLE
+      || !SCALAR_FLOAT_MODE_P (mode)
+      || !aarch64_reinterpret_float_as_int (x, &bits))
+    return false;
+
+  /* Count the integer moves needed; HFmode uses SImode.  */
+  machine_mode int_mode;
+  if (mode == HFmode)
+    int_mode = SImode;
+  else
+    int_mode = int_mode_for_mode (mode);
+
+  rtx imm = gen_int_mode (bits, int_mode);
+  return aarch64_internal_mov_immediate (NULL_RTX, imm, false, int_mode) < 3;
+}
+
  /* Return TRUE if rtx X is immediate constant 0.0 */
  bool
  aarch64_float_const_zero_rtx_p (rtx x)
@@ -4689,6 +4754,49 @@ aarch64_float_const_zero_rtx_p (rtx x)
    return real_equal (CONST_DOUBLE_REAL_VALUE (x), &dconst0);
  }
  
+/* Return TRUE if rtx X is an immediate constant that fits in a single
+   MOVI immediate operation when moved in MODE.  */
+bool
+aarch64_can_const_movi_rtx_p (rtx x, machine_mode mode)
+{
+  if (!TARGET_SIMD)
+    return false;
+
+  /* We make a general exception for 0.  */
+  if (aarch64_float_const_zero_rtx_p (x))
+    return true;
+
+  machine_mode int_mode;
+  unsigned HOST_WIDE_INT bits;
+
+  switch (GET_CODE (x))
+    {
+    case CONST_DOUBLE:
+      if (!SCALAR_FLOAT_MODE_P (mode)
+         || !aarch64_reinterpret_float_as_int (x, &bits))
+       return false;
+      int_mode = int_mode_for_mode (mode);
+      break;
+    case CONST_INT:
+      if (!SCALAR_INT_MODE_P (mode))
+       return false;
+      int_mode = mode;
+      bits = INTVAL (x);
+      break;
+    default:
+      return false;
+    }
+
+  /* Use a 64 bit vector mode for everything except for DI/DF mode, where
+     we use a 128 bit vector mode.  */
+  int vec_width = (GET_MODE_BITSIZE (mode) == 64) ? 128 : 64;
+
+  machine_mode vec_mode = aarch64_simd_container_mode (int_mode, vec_width);
+  rtx dup = aarch64_simd_gen_const_vector_dup (vec_mode, bits);
+  return aarch64_simd_valid_immediate (dup, vec_mode, false, NULL);
+}
+
+
  /* Return the fixed registers used for condition codes.  */
  
  static bool
@@ -5883,12 +5991,6 @@ aarch64_preferred_reload_class (rtx x, reg_class_t regclass)
        return NO_REGS;
      }
  
-  /* If it's an integer immediate that MOVI can't handle, then
-     FP_REGS is not an option, so we return NO_REGS instead.  */
-  if (CONST_INT_P (x) && reg_class_subset_p (regclass, FP_REGS)
-      && !aarch64_simd_imm_scalar_p (x, GET_MODE (x)))
-    return NO_REGS;
-
    /* Register eliminiation can result in a request for
       SP+constant->FP_REGS.  We cannot support such operations which
       use SP as source and an FP_REG as destination, so reject out
@@ -6838,6 +6940,25 @@ aarch64_rtx_costs (rtx x, machine_mode mode, int outer ATTRIBUTE_UNUSED,
        return true;
  
      case CONST_DOUBLE:
+
+      /* First determine number of instructions to do the move
+         as an integer constant.  */
+      if (!aarch64_float_const_representable_p (x)
+          && !aarch64_can_const_movi_rtx_p (x, mode)
+          && aarch64_float_const_rtx_p (x))
+       {
+         unsigned HOST_WIDE_INT ival;
+         bool succeed = aarch64_reinterpret_float_as_int (x, &ival);
+         gcc_assert (succeed);
+
+         machine_mode imode = mode == HFmode ? SImode
+                                             : int_mode_for_mode (mode);
+         int ncost = aarch64_internal_mov_immediate
+               (NULL_RTX, gen_int_mode (ival, imode), false, imode);
+         *cost += COSTS_N_INSNS (ncost);
+         return true;
+       }
+
        if (speed)
         {
           /* mov[df,sf]_aarch64.  */
@@ -10182,18 +10303,16 @@ aarch64_legitimate_pic_operand_p (rtx x)
  /* Return true if X holds either a quarter-precision or
       floating-point +0.0 constant.  */
  static bool
-aarch64_valid_floating_const (machine_mode mode, rtx x)
+aarch64_valid_floating_const (rtx x)
  {
    if (!CONST_DOUBLE_P (x))
      return false;
  
-  if (aarch64_float_const_zero_rtx_p (x))
+  /* This call determines which constants can be used in mov<mode>
+     as integer moves instead of constant loads.  */
+  if (aarch64_float_const_rtx_p (x))
      return true;
  
-  /* We only handle moving 0.0 to a TFmode register.  */
-  if (!(mode == SFmode || mode == DFmode))
-    return false;
-
    return aarch64_float_const_representable_p (x);
  }
  
@@ -10205,11 +10324,15 @@ aarch64_legitimate_constant_p (machine_mode mode, rtx x)
    if (TARGET_SIMD && aarch64_vect_struct_mode_p (mode))
      return false;
  
-  /* This could probably go away because
-     we now decompose CONST_INTs according to expand_mov_immediate.  */
+  /* For these cases we never want to use a literal load.
+     As such we have to prevent the compiler from forcing these
+     to memory.  */
    if ((GET_CODE (x) == CONST_VECTOR
         && aarch64_simd_valid_immediate (x, mode, false, NULL))
-      || CONST_INT_P (x) || aarch64_valid_floating_const (mode, x))
+      || CONST_INT_P (x)
+      || aarch64_valid_floating_const (x)
+      || aarch64_can_const_movi_rtx_p (x, mode)
+      || aarch64_float_const_rtx_p (x))
         return !targetm.cannot_force_const_mem (mode, x);
  
    if (GET_CODE (x) == HIGH
@@ -11491,23 +11614,6 @@ aarch64_mask_from_zextract_ops (rtx width, rtx pos)
    return GEN_INT (mask << UINTVAL (pos));
  }
  
-bool
-aarch64_simd_imm_scalar_p (rtx x, machine_mode mode ATTRIBUTE_UNUSED)
-{
-  HOST_WIDE_INT imm = INTVAL (x);
-  int i;
-
-  for (i = 0; i < 8; i++)
-    {
-      unsigned int byte = imm & 0xff;
-      if (byte != 0xff && byte != 0)
-       return false;
-      imm >>= 8;
-    }
-
-  return true;
-}
-
  bool
  aarch64_mov_operand_p (rtx x, machine_mode mode)
  {
@@ -12899,15 +13005,28 @@ aarch64_output_simd_mov_immediate (rtx const_vector,
  }
  
  char*
-aarch64_output_scalar_simd_mov_immediate (rtx immediate,
-                                         machine_mode mode)
+aarch64_output_scalar_simd_mov_immediate (rtx immediate,  machine_mode mode)
  {
+
+  /* If a floating point number was passed and we desire to use it in an
+     integer mode do the conversion to integer.  */
+  if (CONST_DOUBLE_P (immediate) && GET_MODE_CLASS (mode) == MODE_INT)
+    {
+      unsigned HOST_WIDE_INT ival;
+      if (!aarch64_reinterpret_float_as_int (immediate, &ival))
+         gcc_unreachable ();
+      immediate = gen_int_mode (ival, mode);
+    }
+
    machine_mode vmode;
+  /* Use a 64 bit mode for everything except for DI/DF mode, where we use
+     a 128 bit vector mode.  */
+  int width = GET_MODE_BITSIZE (mode) == 64 ? 128 : 64;
  
    gcc_assert (!VECTOR_MODE_P (mode));
-  vmode = aarch64_simd_container_mode (mode, 64);
+  vmode = aarch64_simd_container_mode (mode, width);
    rtx v_op = aarch64_simd_gen_const_vector_dup (vmode, INTVAL (immediate));
-  return aarch64_output_simd_mov_immediate (v_op, vmode, 64);
+  return aarch64_output_simd_mov_immediate (v_op, vmode, width);
  }
  
  /* Split operands into moves from op[1] + op[2] into op[0].  */
diff --git a/gcc/config/aarch64/aarch64.md b/gcc/config/aarch64/aarch64.md

index d3e66db1f712c6b51a4122629fba027077086e3f..43876beb4d00f808964b6c673105c0deef99444d 100644 (file)
--- a/gcc/config/aarch64/aarch64.md
+++ b/gcc/config/aarch64/aarch64.md
@@ -920,8 +920,8 @@
  )
  
  (define_insn_and_split "*movsi_aarch64"
-  [(set (match_operand:SI 0 "nonimmediate_operand" "=r,k,r,r,r,r,*w,m,  m,r,r  ,*w,r,*w")
-       (match_operand:SI 1 "aarch64_mov_operand"  " r,r,k,M,n,m, m,rZ,*w,Usa,Ush,rZ,w,*w"))]
+  [(set (match_operand:SI 0 "nonimmediate_operand" "=r,k,r,r,r,r,*w,m,  m,r,r  ,*w, r,*w,w")
+       (match_operand:SI 1 "aarch64_mov_operand"  " r,r,k,M,n,m, m,rZ,*w,Usa,Ush,rZ,w,*w,Ds"))]
    "(register_operand (operands[0], SImode)
      || aarch64_reg_or_zero (operands[1], SImode))"
    "@
@@ -938,8 +938,9 @@
     adrp\\t%x0, %A1
     fmov\\t%s0, %w1
     fmov\\t%w0, %s1
-   fmov\\t%s0, %s1"
-   "CONST_INT_P (operands[1]) && !aarch64_move_imm (INTVAL (operands[1]), SImode)
+   fmov\\t%s0, %s1
+   * return aarch64_output_scalar_simd_mov_immediate (operands[1], SImode);"
+  "CONST_INT_P (operands[1]) && !aarch64_move_imm (INTVAL (operands[1]), SImode)
      && REG_P (operands[0]) && GP_REGNUM_P (REGNO (operands[0]))"
     [(const_int 0)]
     "{
@@ -947,8 +948,9 @@
         DONE;
      }"
    [(set_attr "type" "mov_reg,mov_reg,mov_reg,mov_imm,mov_imm,load1,load1,store1,store1,\
-                     adr,adr,f_mcr,f_mrc,fmov")
-   (set_attr "fp" "*,*,*,*,*,*,yes,*,yes,*,*,yes,yes,yes")]
+                   adr,adr,f_mcr,f_mrc,fmov,neon_move")
+   (set_attr "fp" "*,*,*,*,*,*,yes,*,yes,*,*,yes,yes,yes,*")
+   (set_attr "simd" "*,*,*,*,*,*,*,*,*,*,*,*,*,*,yes")]
  )
  
  (define_insn_and_split "*movdi_aarch64"
@@ -971,7 +973,7 @@
     fmov\\t%d0, %x1
     fmov\\t%x0, %d1
     fmov\\t%d0, %d1
-   movi\\t%d0, %1"
+   * return aarch64_output_scalar_simd_mov_immediate (operands[1], DImode);"
     "(CONST_INT_P (operands[1]) && !aarch64_move_imm (INTVAL (operands[1]), DImode))
      && REG_P (operands[0]) && GP_REGNUM_P (REGNO (operands[0]))"
     [(const_int 0)]
diff --git a/gcc/config/aarch64/constraints.md b/gcc/config/aarch64/constraints.md

index 88e840f2898d2da3e51e753578ee59bce4f462fa..9ce3d4efaf31a301dfb7c1772a6b685fb2cbd2ee 100644 (file)
--- a/gcc/config/aarch64/constraints.md
+++ b/gcc/config/aarch64/constraints.md
@@ -176,6 +176,12 @@
    (and (match_code "const_double")
         (match_test "aarch64_float_const_representable_p (op)")))
  
+(define_constraint "Uvi"
+  "A floating point constant which can be used with a\
+   MOVI immediate operation."
+  (and (match_code "const_double")
+       (match_test "aarch64_can_const_movi_rtx_p (op, GET_MODE (op))")))
+
  (define_constraint "Dn"
    "@internal
   A constraint that matches vector of immediates."
@@ -220,9 +226,17 @@
  
  (define_constraint "Dd"
    "@internal
- A constraint that matches an immediate operand valid for AdvSIMD scalar."
+ A constraint that matches an integer immediate operand valid\
+ for AdvSIMD scalar operations in DImode."
+ (and (match_code "const_int")
+      (match_test "aarch64_can_const_movi_rtx_p (op, DImode)")))
+
+(define_constraint "Ds"
+  "@internal
+ A constraint that matches an integer immediate operand valid\
+ for AdvSIMD scalar operations in SImode."
   (and (match_code "const_int")
-      (match_test "aarch64_simd_imm_scalar_p (op, GET_MODE (op))")))
+      (match_test "aarch64_can_const_movi_rtx_p (op, SImode)")))
  
  (define_address_constraint "Dp"
    "@internal
author	Tamar Christina <tamar.christina@arm.com>
	Fri, 28 Jul 2017 15:11:25 +0000 (15:11 +0000)
committer	Tamar Christina <tnfchris@gcc.gnu.org>
	Fri, 28 Jul 2017 15:11:25 +0000 (15:11 +0000)
gcc/ChangeLog		patch \| blob \| history
gcc/config/aarch64/aarch64-protos.h		patch \| blob \| history
gcc/config/aarch64/aarch64.c		patch \| blob \| history
gcc/config/aarch64/aarch64.md		patch \| blob \| history
gcc/config/aarch64/constraints.md		patch \| blob \| history