re PR target/65697 (__atomic memory barriers not strong enough for __sync builtins)

[gcc.git] / gcc / haifa-sched.c
diff --git a/gcc/haifa-sched.c b/gcc/haifa-sched.c

index 64c8c9c1f70bb7a685098f64249848d933c22482..fd6e3e929e65a6c0a5bafa369f1362abe3758950 100644 (file)
--- a/gcc/haifa-sched.c
+++ b/gcc/haifa-sched.c
@@ -131,11 +131,6 @@ along with GCC; see the file COPYING3.  If not see
  #include "rtl.h"
  #include "tm_p.h"
  #include "regs.h"
-#include "hashtab.h"
-#include "hash-set.h"
-#include "vec.h"
-#include "machmode.h"
-#include "input.h"
  #include "function.h"
  #include "flags.h"
  #include "insn-config.h"
@@ -156,7 +151,6 @@ along with GCC; see the file COPYING3.  If not see
  #include "cfgloop.h"
  #include "ira.h"
  #include "emit-rtl.h"  /* FIXME: Can go away once crtl is moved to rtl.h.  */
-#include "hash-table.h"
  #include "dumpfile.h"
  
  #ifdef INSN_SCHEDULING
@@ -619,18 +613,17 @@ struct delay_pair
  
  /* Helpers for delay hashing.  */
  
-struct delay_i1_hasher : typed_noop_remove <delay_pair>
+struct delay_i1_hasher : nofree_ptr_hash <delay_pair>
  {
-  typedef delay_pair value_type;
-  typedef void compare_type;
-  static inline hashval_t hash (const value_type *);
-  static inline bool equal (const value_type *, const compare_type *);
+  typedef void *compare_type;
+  static inline hashval_t hash (const delay_pair *);
+  static inline bool equal (const delay_pair *, const void *);
  };
  
  /* Returns a hash value for X, based on hashing just I1.  */
  
  inline hashval_t
-delay_i1_hasher::hash (const value_type *x)
+delay_i1_hasher::hash (const delay_pair *x)
  {
    return htab_hash_pointer (x->i1);
  }
@@ -638,23 +631,22 @@ delay_i1_hasher::hash (const value_type *x)
  /* Return true if I1 of pair X is the same as that of pair Y.  */
  
  inline bool
-delay_i1_hasher::equal (const value_type *x, const compare_type *y)
+delay_i1_hasher::equal (const delay_pair *x, const void *y)
  {
    return x->i1 == y;
  }
  
-struct delay_i2_hasher : typed_free_remove <delay_pair>
+struct delay_i2_hasher : free_ptr_hash <delay_pair>
  {
-  typedef delay_pair value_type;
-  typedef void compare_type;
-  static inline hashval_t hash (const value_type *);
-  static inline bool equal (const value_type *, const compare_type *);
+  typedef void *compare_type;
+  static inline hashval_t hash (const delay_pair *);
+  static inline bool equal (const delay_pair *, const void *);
  };
  
  /* Returns a hash value for X, based on hashing just I2.  */
  
  inline hashval_t
-delay_i2_hasher::hash (const value_type *x)
+delay_i2_hasher::hash (const delay_pair *x)
  {
    return htab_hash_pointer (x->i2);
  }
@@ -662,7 +654,7 @@ delay_i2_hasher::hash (const value_type *x)
  /* Return true if I2 of pair X is the same as that of pair Y.  */
  
  inline bool
-delay_i2_hasher::equal (const value_type *x, const compare_type *y)
+delay_i2_hasher::equal (const delay_pair *x, const void *y)
  {
    return x->i2 == y;
  }
@@ -881,7 +873,7 @@ static int early_queue_to_ready (state_t, struct ready_list *);
  /* The following functions are used to implement multi-pass scheduling
     on the first cycle.  */
  static rtx_insn *ready_remove (struct ready_list *, int);
-static void ready_remove_insn (rtx);
+static void ready_remove_insn (rtx_insn *);
  
  static void fix_inter_tick (rtx_insn *, rtx_insn *);
  static int fix_tick_ready (rtx_insn *);
@@ -894,7 +886,7 @@ static void extend_h_i_d (void);
  static void init_h_i_d (rtx_insn *);
  static int haifa_speculate_insn (rtx_insn *, ds_t, rtx *);
  static void generate_recovery_code (rtx_insn *);
-static void process_insn_forw_deps_be_in_spec (rtx, rtx_insn *, ds_t);
+static void process_insn_forw_deps_be_in_spec (rtx_insn *, rtx_insn *, ds_t);
  static void begin_speculative_block (rtx_insn *);
  static void add_to_speculative_block (rtx_insn *);
  static void init_before_recovery (basic_block *);
@@ -1032,18 +1024,13 @@ initiate_reg_pressure_info (bitmap live)
  static void
  setup_ref_regs (rtx x)
  {
-  int i, j, regno;
+  int i, j;
    const RTX_CODE code = GET_CODE (x);
    const char *fmt;
  
    if (REG_P (x))
      {
-      regno = REGNO (x);
-      if (HARD_REGISTER_NUM_P (regno))
-       bitmap_set_range (region_ref_regs, regno,
-                         hard_regno_nregs[regno][GET_MODE (x)]);
-      else
-       bitmap_set_bit (region_ref_regs, REGNO (x));
+      bitmap_set_range (region_ref_regs, REGNO (x), REG_NREGS (x));
        return;
      }
    fmt = GET_RTX_FORMAT (code);
@@ -1070,7 +1057,6 @@ initiate_bb_reg_pressure_info (basic_block bb)
        if (NONDEBUG_INSN_P (insn))
         setup_ref_regs (PATTERN (insn));
    initiate_reg_pressure_info (df_get_live_in (bb));
-#ifdef EH_RETURN_DATA_REGNO
    if (bb_has_eh_pred (bb))
      for (i = 0; ; ++i)
        {
@@ -1082,7 +1068,6 @@ initiate_bb_reg_pressure_info (basic_block bb)
           mark_regno_birth_or_death (curr_reg_live, curr_reg_pressure,
                                      regno, true);
        }
-#endif
  }
  
  /* Save current register pressure related info.  */
@@ -1233,6 +1218,11 @@ recompute_todo_spec (rtx_insn *next, bool for_backtrack)
    if (!sd_lists_empty_p (next, SD_LIST_HARD_BACK))
      return HARD_DEP;
  
+  /* If NEXT is intended to sit adjacent to this instruction, we don't
+     want to try to break any dependencies.  Treat it as a HARD_DEP.  */
+  if (SCHED_GROUP_P (next))
+    return HARD_DEP;
+
    /* Now we've got NEXT with speculative deps only.
       1. Look at the deps to see what we have to do.
       2. Check if we can do 'todo'.  */
@@ -1387,7 +1377,7 @@ static rtx_insn *last_scheduled_insn;
     block, or the prev_head of the scheduling block.  Used by
     rank_for_schedule, so that insns independent of the last scheduled
     insn will be preferred over dependent instructions.  */
-static rtx last_nondebug_scheduled_insn;
+static rtx_insn *last_nondebug_scheduled_insn;
  
  /* Pointer that iterates through the list of unscheduled insns if we
     have a dbg_cnt enabled.  It always points at an insn prior to the
@@ -1595,7 +1585,7 @@ contributes_to_priority_p (dep_t dep)
  /* Compute the number of nondebug deps in list LIST for INSN.  */
  
  static int
-dep_list_size (rtx insn, sd_list_types_def list)
+dep_list_size (rtx_insn *insn, sd_list_types_def list)
  {
    sd_iterator_def sd_it;
    dep_t dep;
@@ -2568,7 +2558,7 @@ model_set_excess_costs (rtx_insn **insns, int count)
  
  /* Enum of rank_for_schedule heuristic decisions.  */
  enum rfs_decision {
-  RFS_DEBUG, RFS_LIVE_RANGE_SHRINK1, RFS_LIVE_RANGE_SHRINK2,
+  RFS_LIVE_RANGE_SHRINK1, RFS_LIVE_RANGE_SHRINK2,
    RFS_SCHED_GROUP, RFS_PRESSURE_DELAY, RFS_PRESSURE_TICK,
    RFS_FEEDS_BACKTRACK_INSN, RFS_PRIORITY, RFS_SPECULATION,
    RFS_SCHED_RANK, RFS_LAST_INSN, RFS_PRESSURE_INDEX,
@@ -2576,7 +2566,7 @@ enum rfs_decision {
  
  /* Corresponding strings for print outs.  */
  static const char *rfs_str[RFS_N] = {
-  "RFS_DEBUG", "RFS_LIVE_RANGE_SHRINK1", "RFS_LIVE_RANGE_SHRINK2",
+  "RFS_LIVE_RANGE_SHRINK1", "RFS_LIVE_RANGE_SHRINK2",
    "RFS_SCHED_GROUP", "RFS_PRESSURE_DELAY", "RFS_PRESSURE_TICK",
    "RFS_FEEDS_BACKTRACK_INSN", "RFS_PRIORITY", "RFS_SPECULATION",
    "RFS_SCHED_RANK", "RFS_LAST_INSN", "RFS_PRESSURE_INDEX",
@@ -2612,12 +2602,11 @@ rank_for_schedule_debug (const void *x, const void *y)
  
    /* Schedule debug insns as early as possible.  */
    if (DEBUG_INSN_P (tmp) && !DEBUG_INSN_P (tmp2))
-    return rfs_result (RFS_DEBUG, -1, tmp, tmp2);
+    return -1;
    else if (!DEBUG_INSN_P (tmp) && DEBUG_INSN_P (tmp2))
-    return rfs_result (RFS_DEBUG, 1, tmp, tmp2);
+    return 1;
    else if (DEBUG_INSN_P (tmp) && DEBUG_INSN_P (tmp2))
-    return rfs_result (RFS_DEBUG, INSN_LUID (tmp) - INSN_LUID (tmp2),
-                      tmp, tmp2);
+    return INSN_LUID (tmp) - INSN_LUID (tmp2);
    else
      return INSN_RFS_DEBUG_ORIG_ORDER (tmp2) - INSN_RFS_DEBUG_ORIG_ORDER (tmp);
  }
@@ -2785,7 +2774,7 @@ rank_for_schedule (const void *x, const void *y)
      {
        dep_t dep1;
        dep_t dep2;
-      rtx last = last_nondebug_scheduled_insn;
+      rtx_insn *last = last_nondebug_scheduled_insn;
  
        /* Classify the instructions into three classes:
           1) Data dependent on last schedule insn.
@@ -3030,7 +3019,7 @@ ready_remove (struct ready_list *ready, int index)
  
  /* Remove INSN from the ready list.  */
  static void
-ready_remove_insn (rtx insn)
+ready_remove_insn (rtx_insn *insn)
  {
    int i;
  
@@ -3080,48 +3069,45 @@ print_rank_for_schedule_stats (const char *prefix,
        }
  }
  
-/* Sort the ready list READY by ascending priority, using the SCHED_SORT
-   macro.  */
-
-void
-ready_sort (struct ready_list *ready)
+/* Separate DEBUG_INSNs from normal insns.  DEBUG_INSNs go to the end
+   of the array.  */
+static void
+ready_sort_debug (struct ready_list *ready)
  {
    int i;
    rtx_insn **first = ready_lastpos (ready);
-  int n_ready_non_debug = ready->n_ready;
  
    for (i = 0; i < ready->n_ready; ++i)
-    {
-      if (DEBUG_INSN_P (first[i]))
-       --n_ready_non_debug;
-      else
-       {
-         INSN_RFS_DEBUG_ORIG_ORDER (first[i]) = i;
+    if (!DEBUG_INSN_P (first[i]))
+      INSN_RFS_DEBUG_ORIG_ORDER (first[i]) = i;
  
-         if (sched_pressure == SCHED_PRESSURE_WEIGHTED)
-           setup_insn_reg_pressure_info (first[i]);
-       }
-    }
+  qsort (first, ready->n_ready, sizeof (rtx), rank_for_schedule_debug);
+}
  
-  if (sched_pressure == SCHED_PRESSURE_MODEL
-      && model_curr_point < model_num_insns)
-    model_set_excess_costs (first, ready->n_ready);
+/* Sort non-debug insns in the ready list READY by ascending priority.
+   Assumes that all debug insns are separated from the real insns.  */
+static void
+ready_sort_real (struct ready_list *ready)
+{
+  int i;
+  rtx_insn **first = ready_lastpos (ready);
+  int n_ready_real = ready->n_ready - ready->n_debug;
+
+  if (sched_pressure == SCHED_PRESSURE_WEIGHTED)
+    for (i = 0; i < n_ready_real; ++i)
+      setup_insn_reg_pressure_info (first[i]);
+  else if (sched_pressure == SCHED_PRESSURE_MODEL
+          && model_curr_point < model_num_insns)
+    model_set_excess_costs (first, n_ready_real);
  
    rank_for_schedule_stats_t stats1;
    if (sched_verbose >= 4)
      stats1 = rank_for_schedule_stats;
  
-  if (n_ready_non_debug < ready->n_ready)
-    /* Separate DEBUG_INSNS from normal insns.  DEBUG_INSNs go to the end
-       of array.  */
-    qsort (first, ready->n_ready, sizeof (rtx), rank_for_schedule_debug);
-  else
-    {
-      if (n_ready_non_debug == 2)
-       swap_sort (first, n_ready_non_debug);
-      else if (n_ready_non_debug > 2)
-       qsort (first, n_ready_non_debug, sizeof (rtx), rank_for_schedule);
-    }
+  if (n_ready_real == 2)
+    swap_sort (first, n_ready_real);
+  else if (n_ready_real > 2)
+    qsort (first, n_ready_real, sizeof (rtx), rank_for_schedule);
  
    if (sched_verbose >= 4)
      {
@@ -3130,6 +3116,16 @@ ready_sort (struct ready_list *ready)
      }
  }
  
+/* Sort READY: separate any debug insns, else sort real insns by priority.  */
+static void
+ready_sort (struct ready_list *ready)
+{
+  if (ready->n_debug > 0)
+    ready_sort_debug (ready);
+  else
+    ready_sort_real (ready);
+}
+
  /* PREV is an insn that is ready to execute.  Adjust its priority if that
     will help shorten or lengthen register lifetimes as appropriate.  Also
     provide a hook for the target to tweak itself.  */
@@ -3278,7 +3274,7 @@ sched_setup_bb_reg_pressure_info (basic_block bb, rtx_insn *after)
     only be scheduled once their control dependency is resolved.  */
  
  static void
-check_clobbered_conditions (rtx insn)
+check_clobbered_conditions (rtx_insn *insn)
  {
    HARD_REG_SET t;
    int i;
@@ -4300,7 +4296,7 @@ struct haifa_saved_data
    state_t curr_state;
  
    rtx_insn *last_scheduled_insn;
-  rtx last_nondebug_scheduled_insn;
+  rtx_insn *last_nondebug_scheduled_insn;
    rtx_insn *nonscheduled_insns_begin;
    int cycle_issued_insns;
  
@@ -4330,7 +4326,7 @@ static struct haifa_saved_data *backtrack_queue;
  /* For every dependency of INSN, set the FEEDS_BACKTRACK_INSN bit according
     to SET_P.  */
  static void
-mark_backtrack_feeds (rtx insn, int set_p)
+mark_backtrack_feeds (rtx_insn *insn, int set_p)
  {
    sd_iterator_def sd_it;
    dep_t dep;
@@ -4476,7 +4472,7 @@ undo_replacements_for_backtrack (struct haifa_saved_data *save)
     queued nowhere.  */
  
  static void
-unschedule_insns_until (rtx insn)
+unschedule_insns_until (rtx_insn *insn)
  {
    auto_vec<rtx_insn *> recompute_vec;
  
@@ -5124,7 +5120,7 @@ queue_to_ready (struct ready_list *ready)
  {
    rtx_insn *insn;
    rtx_insn_list *link;
-  rtx skip_insn;
+  rtx_insn *skip_insn;
  
    q_ptr = NEXT_Q (q_ptr);
  
@@ -5133,7 +5129,7 @@ queue_to_ready (struct ready_list *ready)
         nonscheduled insn.  */
      skip_insn = first_nonscheduled_insn ();
    else
-    skip_insn = NULL_RTX;
+    skip_insn = NULL;
  
    /* Add all pending insns that can be scheduled without stalls to the
       ready list.  */
@@ -5228,11 +5224,10 @@ queue_to_ready (struct ready_list *ready)
     addition) depending on user flags and target hooks.  */
  
  static bool
-ok_for_early_queue_removal (rtx insn)
+ok_for_early_queue_removal (rtx_insn *insn)
  {
    if (targetm.sched.is_costly_dependence)
      {
-      rtx prev_insn;
        int n_cycles;
        int i = scheduled_insns.length ();
        for (n_cycles = flag_sched_stalled_insns_dep; n_cycles; n_cycles--)
@@ -5241,7 +5236,7 @@ ok_for_early_queue_removal (rtx insn)
             {
               int cost;
  
-             prev_insn = scheduled_insns[i];
+             rtx_insn *prev_insn = scheduled_insns[i];
  
               if (!NOTE_P (prev_insn))
                 {
@@ -6459,7 +6454,7 @@ schedule_block (basic_block *target_bb, state_t init_state)
  
    /* We start inserting insns after PREV_HEAD.  */
    last_scheduled_insn = prev_head;
-  last_nondebug_scheduled_insn = NULL_RTX;
+  last_nondebug_scheduled_insn = NULL;
    nonscheduled_insns_begin = NULL;
  
    gcc_assert ((NOTE_P (last_scheduled_insn)
@@ -6490,7 +6485,8 @@ schedule_block (basic_block *target_bb, state_t init_state)
    if (!reload_completed
        && ready.n_ready - ready.n_debug > MAX_SCHED_READY_INSNS)
      {
-      ready_sort (&ready);
+      ready_sort_debug (&ready);
+      ready_sort_real (&ready);
  
        /* Find first free-standing insn past MAX_SCHED_READY_INSNS.
           If there are debug insns, we know they're first.  */
@@ -6501,7 +6497,8 @@ schedule_block (basic_block *target_bb, state_t init_state)
        if (sched_verbose >= 2)
         {
           fprintf (sched_dump,
-                  ";;\t\tReady list on entry: %d insns\n", ready.n_ready);
+                  ";;\t\tReady list on entry: %d insns:  ", ready.n_ready);
+         debug_ready_list (&ready);
           fprintf (sched_dump,
                    ";;\t\t before reload => truncated to %d insns\n", i);
         }
@@ -7173,9 +7170,8 @@ void
  sched_init (void)
  {
    /* Disable speculative loads in their presence if cc0 defined.  */
-#ifdef HAVE_cc0
+  if (HAVE_cc0)
    flag_schedule_speculative_load = 0;
-#endif
  
    if (targetm.sched.dispatch (NULL, IS_DISPATCH_ON))
      targetm.sched.dispatch_do (NULL, DISPATCH_INIT);
@@ -7790,7 +7786,7 @@ generate_recovery_code (rtx_insn *insn)
     Tries to add speculative dependencies of type FS between instructions
     in deps_list L and TWIN.  */
  static void
-process_insn_forw_deps_be_in_spec (rtx insn, rtx_insn *twin, ds_t fs)
+process_insn_forw_deps_be_in_spec (rtx_insn *insn, rtx_insn *twin, ds_t fs)
  {
    sd_iterator_def sd_it;
    dep_t dep;
@@ -8093,8 +8089,6 @@ init_before_recovery (basic_block *before_recovery_ptr)
           Between these two blocks recovery blocks will be emitted.  */
  
        basic_block single, empty;
-      rtx_insn *x;
-      rtx label;
  
        /* If the fallthrough edge to exit we've found is from the block we've
          created before, don't do anything more.  */
@@ -8125,8 +8119,9 @@ init_before_recovery (basic_block *before_recovery_ptr)
        make_single_succ_edge (empty, EXIT_BLOCK_PTR_FOR_FN (cfun),
                              EDGE_FALLTHRU);
  
-      label = block_label (empty);
-      x = emit_jump_insn_after (gen_jump (label), BB_END (single));
+      rtx_code_label *label = block_label (empty);
+      rtx_jump_insn *x = emit_jump_insn_after (gen_jump (label),
+                                              BB_END (single));
        JUMP_LABEL (x) = label;
        LABEL_NUSES (label)++;
        haifa_init_insn (x);
@@ -8157,7 +8152,6 @@ init_before_recovery (basic_block *before_recovery_ptr)
  basic_block
  sched_create_recovery_block (basic_block *before_recovery_ptr)
  {
-  rtx label;
    rtx_insn *barrier;
    basic_block rec;
  
@@ -8169,7 +8163,7 @@ sched_create_recovery_block (basic_block *before_recovery_ptr)
    barrier = get_last_bb_insn (before_recovery);
    gcc_assert (BARRIER_P (barrier));
  
-  label = emit_label_after (gen_label_rtx (), barrier);
+  rtx_insn *label = emit_label_after (gen_label_rtx (), barrier);
  
    rec = create_basic_block (label, label, before_recovery);
  
@@ -8192,8 +8186,6 @@ void
  sched_create_recovery_edges (basic_block first_bb, basic_block rec,
                              basic_block second_bb)
  {
-  rtx label;
-  rtx jump;
    int edge_flags;
  
    /* This is fixing of incoming edge.  */
@@ -8205,8 +8197,8 @@ sched_create_recovery_edges (basic_block first_bb, basic_block rec,
      edge_flags = 0;
  
    make_edge (first_bb, rec, edge_flags);
-  label = block_label (second_bb);
-  jump = emit_jump_insn_after (gen_jump (label), BB_END (rec));
+  rtx_code_label *label = block_label (second_bb);
+  rtx_jump_insn *jump = emit_jump_insn_after (gen_jump (label), BB_END (rec));
    JUMP_LABEL (jump) = label;
    LABEL_NUSES (label)++;