gcc/loop.c

   1 /* Perform various loop optimizations, including strength reduction.
   2    Copyright (C) 1987, 1988, 1989, 1991, 1992, 1993, 1994, 1995, 1996, 1997,
   3    1998, 1999, 2000, 2001, 2002, 2003 Free Software Foundation, Inc.
   4
   5 This file is part of GCC.
   6
   7 GCC is free software; you can redistribute it and/or modify it under
   8 the terms of the GNU General Public License as published by the Free
   9 Software Foundation; either version 2, or (at your option) any later
  10 version.
  11
  12 GCC is distributed in the hope that it will be useful, but WITHOUT ANY
  13 WARRANTY; without even the implied warranty of MERCHANTABILITY or
  14 FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
  15 for more details.
  16
  17 You should have received a copy of the GNU General Public License
  18 along with GCC; see the file COPYING.  If not, write to the Free
  19 Software Foundation, 59 Temple Place - Suite 330, Boston, MA
  20 02111-1307, USA.  */
  21
  22 /* This is the loop optimization pass of the compiler.
  23    It finds invariant computations within loops and moves them
  24    to the beginning of the loop.  Then it identifies basic and
  25    general induction variables.  Strength reduction is applied to the general
  26    induction variables, and induction variable elimination is applied to
  27    the basic induction variables.
  28
  29    It also finds cases where
  30    a register is set within the loop by zero-extending a narrower value
  31    and changes these to zero the entire register once before the loop
  32    and merely copy the low part within the loop.
  33
  34    Most of the complexity is in heuristics to decide when it is worth
  35    while to do these things.  */
  36
  37 #include "config.h"
  38 #include "system.h"
  39 #include "coretypes.h"
  40 #include "tm.h"
  41 #include "rtl.h"
  42 #include "tm_p.h"
  43 #include "function.h"
  44 #include "expr.h"
  45 #include "hard-reg-set.h"
  46 #include "basic-block.h"
  47 #include "insn-config.h"
  48 #include "regs.h"
  49 #include "recog.h"
  50 #include "flags.h"
  51 #include "real.h"
  52 #include "loop.h"
  53 #include "cselib.h"
  54 #include "except.h"
  55 #include "toplev.h"
  56 #include "predict.h"
  57 #include "insn-flags.h"
  58 #include "optabs.h"
  59 #include "cfgloop.h"
  60
  61 /* Not really meaningful values, but at least something.  */
  62 #ifndef SIMULTANEOUS_PREFETCHES
  63 #define SIMULTANEOUS_PREFETCHES 3
  64 #endif
  65 #ifndef PREFETCH_BLOCK
  66 #define PREFETCH_BLOCK 32
  67 #endif
  68 #ifndef HAVE_prefetch
  69 #define HAVE_prefetch 0
  70 #define CODE_FOR_prefetch 0
  71 #define gen_prefetch(a,b,c) (abort(), NULL_RTX)
  72 #endif
  73
  74 /* Give up the prefetch optimizations once we exceed a given threshhold.
  75    It is unlikely that we would be able to optimize something in a loop
  76    with so many detected prefetches.  */
  77 #define MAX_PREFETCHES 100
  78 /* The number of prefetch blocks that are beneficial to fetch at once before
  79    a loop with a known (and low) iteration count.  */
  80 #define PREFETCH_BLOCKS_BEFORE_LOOP_MAX  6
  81 /* For very tiny loops it is not worthwhile to prefetch even before the loop,
  82    since it is likely that the data are already in the cache.  */
  83 #define PREFETCH_BLOCKS_BEFORE_LOOP_MIN  2
  84
  85 /* Parameterize some prefetch heuristics so they can be turned on and off
  86    easily for performance testing on new architectures.  These can be
  87    defined in target-dependent files.  */
  88
  89 /* Prefetch is worthwhile only when loads/stores are dense.  */
  90 #ifndef PREFETCH_ONLY_DENSE_MEM
  91 #define PREFETCH_ONLY_DENSE_MEM 1
  92 #endif
  93
  94 /* Define what we mean by "dense" loads and stores; This value divided by 256
  95    is the minimum percentage of memory references that worth prefetching.  */
  96 #ifndef PREFETCH_DENSE_MEM
  97 #define PREFETCH_DENSE_MEM 220
  98 #endif
  99
 100 /* Do not prefetch for a loop whose iteration count is known to be low.  */
 101 #ifndef PREFETCH_NO_LOW_LOOPCNT
 102 #define PREFETCH_NO_LOW_LOOPCNT 1
 103 #endif
 104
 105 /* Define what we mean by a "low" iteration count.  */
 106 #ifndef PREFETCH_LOW_LOOPCNT
 107 #define PREFETCH_LOW_LOOPCNT 32
 108 #endif
 109
 110 /* Do not prefetch for a loop that contains a function call; such a loop is
 111    probably not an internal loop.  */
 112 #ifndef PREFETCH_NO_CALL
 113 #define PREFETCH_NO_CALL 1
 114 #endif
 115
 116 /* Do not prefetch accesses with an extreme stride.  */
 117 #ifndef PREFETCH_NO_EXTREME_STRIDE
 118 #define PREFETCH_NO_EXTREME_STRIDE 1
 119 #endif
 120
 121 /* Define what we mean by an "extreme" stride.  */
 122 #ifndef PREFETCH_EXTREME_STRIDE
 123 #define PREFETCH_EXTREME_STRIDE 4096
 124 #endif
 125
 126 /* Define a limit to how far apart indices can be and still be merged
 127    into a single prefetch.  */
 128 #ifndef PREFETCH_EXTREME_DIFFERENCE
 129 #define PREFETCH_EXTREME_DIFFERENCE 4096
 130 #endif
 131
 132 /* Issue prefetch instructions before the loop to fetch data to be used
 133    in the first few loop iterations.  */
 134 #ifndef PREFETCH_BEFORE_LOOP
 135 #define PREFETCH_BEFORE_LOOP 1
 136 #endif
 137
 138 /* Do not handle reversed order prefetches (negative stride).  */
 139 #ifndef PREFETCH_NO_REVERSE_ORDER
 140 #define PREFETCH_NO_REVERSE_ORDER 1
 141 #endif
 142
 143 /* Prefetch even if the GIV is in conditional code.  */
 144 #ifndef PREFETCH_CONDITIONAL
 145 #define PREFETCH_CONDITIONAL 1
 146 #endif
 147
 148 #define LOOP_REG_LIFETIME(LOOP, REGNO) \
 149 ((REGNO_LAST_LUID (REGNO) - REGNO_FIRST_LUID (REGNO)))
 150
 151 #define LOOP_REG_GLOBAL_P(LOOP, REGNO) \
 152 ((REGNO_LAST_LUID (REGNO) > INSN_LUID ((LOOP)->end) \
 153  || REGNO_FIRST_LUID (REGNO) < INSN_LUID ((LOOP)->start)))
 154
 155 #define LOOP_REGNO_NREGS(REGNO, SET_DEST) \
 156 ((REGNO) < FIRST_PSEUDO_REGISTER \
 157  ? (int) HARD_REGNO_NREGS ((REGNO), GET_MODE (SET_DEST)) : 1)
 158
 159
 160 /* Vector mapping INSN_UIDs to luids.
 161    The luids are like uids but increase monotonically always.
 162    We use them to see whether a jump comes from outside a given loop.  */
 163
 164 int *uid_luid;
 165
 166 /* Indexed by INSN_UID, contains the ordinal giving the (innermost) loop
 167    number the insn is contained in.  */
 168
 169 struct loop **uid_loop;
 170
 171 /* 1 + largest uid of any insn.  */
 172
 173 int max_uid_for_loop;
 174
 175 /* Number of loops detected in current function.  Used as index to the
 176    next few tables.  */
 177
 178 static int max_loop_num;
 179
 180 /* Bound on pseudo register number before loop optimization.
 181    A pseudo has valid regscan info if its number is < max_reg_before_loop.  */
 182 unsigned int max_reg_before_loop;
 183
 184 /* The value to pass to the next call of reg_scan_update.  */
 185 static int loop_max_reg;
 186 \f
 187 /* During the analysis of a loop, a chain of `struct movable's
 188    is made to record all the movable insns found.
 189    Then the entire chain can be scanned to decide which to move.  */
 190
 191 struct movable
 192 {
 193   rtx insn;                     /* A movable insn */
 194   rtx set_src;                  /* The expression this reg is set from.  */
 195   rtx set_dest;                 /* The destination of this SET.  */
 196   rtx dependencies;             /* When INSN is libcall, this is an EXPR_LIST
 197                                    of any registers used within the LIBCALL.  */
 198   int consec;                   /* Number of consecutive following insns
 199                                    that must be moved with this one.  */
 200   unsigned int regno;           /* The register it sets */
 201   short lifetime;               /* lifetime of that register;
 202                                    may be adjusted when matching movables
 203                                    that load the same value are found.  */
 204   short savings;                /* Number of insns we can move for this reg,
 205                                    including other movables that force this
 206                                    or match this one.  */
 207   ENUM_BITFIELD(machine_mode) savemode : 8;   /* Nonzero means it is a mode for
 208                                    a low part that we should avoid changing when
 209                                    clearing the rest of the reg.  */
 210   unsigned int cond : 1;        /* 1 if only conditionally movable */
 211   unsigned int force : 1;       /* 1 means MUST move this insn */
 212   unsigned int global : 1;      /* 1 means reg is live outside this loop */
 213                 /* If PARTIAL is 1, GLOBAL means something different:
 214                    that the reg is live outside the range from where it is set
 215                    to the following label.  */
 216   unsigned int done : 1;        /* 1 inhibits further processing of this */
 217
 218   unsigned int partial : 1;     /* 1 means this reg is used for zero-extending.
 219                                    In particular, moving it does not make it
 220                                    invariant.  */
 221   unsigned int move_insn : 1;   /* 1 means that we call emit_move_insn to
 222                                    load SRC, rather than copying INSN.  */
 223   unsigned int move_insn_first:1;/* Same as above, if this is necessary for the
 224                                     first insn of a consecutive sets group.  */
 225   unsigned int is_equiv : 1;    /* 1 means a REG_EQUIV is present on INSN.  */
 226   unsigned int insert_temp : 1;  /* 1 means we copy to a new pseudo and replace
 227                                     the original insn with a copy from that
 228                                     pseudo, rather than deleting it.  */
 229   struct movable *match;        /* First entry for same value */
 230   struct movable *forces;       /* An insn that must be moved if this is */
 231   struct movable *next;
 232 };
 233
 234
 235 FILE *loop_dump_stream;
 236
 237 /* Forward declarations.  */
 238
 239 static void invalidate_loops_containing_label PARAMS ((rtx));
 240 static void find_and_verify_loops PARAMS ((rtx, struct loops *));
 241 static void mark_loop_jump PARAMS ((rtx, struct loop *));
 242 static void prescan_loop PARAMS ((struct loop *));
 243 static int reg_in_basic_block_p PARAMS ((rtx, rtx));
 244 static int consec_sets_invariant_p PARAMS ((const struct loop *,
 245                                             rtx, int, rtx));
 246 static int labels_in_range_p PARAMS ((rtx, int));
 247 static void count_one_set PARAMS ((struct loop_regs *, rtx, rtx, rtx *));
 248 static void note_addr_stored PARAMS ((rtx, rtx, void *));
 249 static void note_set_pseudo_multiple_uses PARAMS ((rtx, rtx, void *));
 250 static int loop_reg_used_before_p PARAMS ((const struct loop *, rtx, rtx));
 251 static void scan_loop PARAMS ((struct loop*, int));
 252 #if 0
 253 static void replace_call_address PARAMS ((rtx, rtx, rtx));
 254 #endif
 255 static rtx skip_consec_insns PARAMS ((rtx, int));
 256 static int libcall_benefit PARAMS ((rtx));
 257 static void ignore_some_movables PARAMS ((struct loop_movables *));
 258 static void force_movables PARAMS ((struct loop_movables *));
 259 static void combine_movables PARAMS ((struct loop_movables *,
 260                                       struct loop_regs *));
 261 static int num_unmoved_movables PARAMS ((const struct loop *));
 262 static int regs_match_p PARAMS ((rtx, rtx, struct loop_movables *));
 263 static int rtx_equal_for_loop_p PARAMS ((rtx, rtx, struct loop_movables *,
 264                                          struct loop_regs *));
 265 static void add_label_notes PARAMS ((rtx, rtx));
 266 static void move_movables PARAMS ((struct loop *loop, struct loop_movables *,
 267                                    int, int));
 268 static void loop_movables_add PARAMS((struct loop_movables *,
 269                                       struct movable *));
 270 static void loop_movables_free PARAMS((struct loop_movables *));
 271 static int count_nonfixed_reads PARAMS ((const struct loop *, rtx));
 272 static void loop_bivs_find PARAMS((struct loop *));
 273 static void loop_bivs_init_find PARAMS((struct loop *));
 274 static void loop_bivs_check PARAMS((struct loop *));
 275 static void loop_givs_find PARAMS((struct loop *));
 276 static void loop_givs_check PARAMS((struct loop *));
 277 static int loop_biv_eliminable_p PARAMS((struct loop *, struct iv_class *,
 278                                          int, int));
 279 static int loop_giv_reduce_benefit PARAMS((struct loop *, struct iv_class *,
 280                                            struct induction *, rtx));
 281 static void loop_givs_dead_check PARAMS((struct loop *, struct iv_class *));
 282 static void loop_givs_reduce PARAMS((struct loop *, struct iv_class *));
 283 static void loop_givs_rescan PARAMS((struct loop *, struct iv_class *,
 284                                      rtx *));
 285 static void loop_ivs_free PARAMS((struct loop *));
 286 static void strength_reduce PARAMS ((struct loop *, int));
 287 static void find_single_use_in_loop PARAMS ((struct loop_regs *, rtx, rtx));
 288 static int valid_initial_value_p PARAMS ((rtx, rtx, int, rtx));
 289 static void find_mem_givs PARAMS ((const struct loop *, rtx, rtx, int, int));
 290 static void record_biv PARAMS ((struct loop *, struct induction *,
 291                                 rtx, rtx, rtx, rtx, rtx *,
 292                                 int, int));
 293 static void check_final_value PARAMS ((const struct loop *,
 294                                        struct induction *));
 295 static void loop_ivs_dump PARAMS((const struct loop *, FILE *, int));
 296 static void loop_iv_class_dump PARAMS((const struct iv_class *, FILE *, int));
 297 static void loop_biv_dump PARAMS((const struct induction *, FILE *, int));
 298 static void loop_giv_dump PARAMS((const struct induction *, FILE *, int));
 299 static void record_giv PARAMS ((const struct loop *, struct induction *,
 300                                 rtx, rtx, rtx, rtx, rtx, rtx, int,
 301                                 enum g_types, int, int, rtx *));
 302 static void update_giv_derive PARAMS ((const struct loop *, rtx));
 303 static void check_ext_dependent_givs PARAMS ((struct iv_class *,
 304                                               struct loop_info *));
 305 static int basic_induction_var PARAMS ((const struct loop *, rtx,
 306                                         enum machine_mode, rtx, rtx,
 307                                         rtx *, rtx *, rtx **));
 308 static rtx simplify_giv_expr PARAMS ((const struct loop *, rtx, rtx *, int *));
 309 static int general_induction_var PARAMS ((const struct loop *loop, rtx, rtx *,
 310                                           rtx *, rtx *, rtx *, int, int *,
 311                                           enum machine_mode));
 312 static int consec_sets_giv PARAMS ((const struct loop *, int, rtx,
 313                                     rtx, rtx, rtx *, rtx *, rtx *, rtx *));
 314 static int check_dbra_loop PARAMS ((struct loop *, int));
 315 static rtx express_from_1 PARAMS ((rtx, rtx, rtx));
 316 static rtx combine_givs_p PARAMS ((struct induction *, struct induction *));
 317 static int cmp_combine_givs_stats PARAMS ((const PTR, const PTR));
 318 static void combine_givs PARAMS ((struct loop_regs *, struct iv_class *));
 319 static int product_cheap_p PARAMS ((rtx, rtx));
 320 static int maybe_eliminate_biv PARAMS ((const struct loop *, struct iv_class *,
 321                                         int, int, int));
 322 static int maybe_eliminate_biv_1 PARAMS ((const struct loop *, rtx, rtx,
 323                                           struct iv_class *, int,
 324                                           basic_block, rtx));
 325 static int last_use_this_basic_block PARAMS ((rtx, rtx));
 326 static void record_initial PARAMS ((rtx, rtx, void *));
 327 static void update_reg_last_use PARAMS ((rtx, rtx));
 328 static rtx next_insn_in_loop PARAMS ((const struct loop *, rtx));
 329 static void loop_regs_scan PARAMS ((const struct loop *, int));
 330 static int count_insns_in_loop PARAMS ((const struct loop *));
 331 static void load_mems PARAMS ((const struct loop *));
 332 static int insert_loop_mem PARAMS ((rtx *, void *));
 333 static int replace_loop_mem PARAMS ((rtx *, void *));
 334 static void replace_loop_mems PARAMS ((rtx, rtx, rtx));
 335 static int replace_loop_reg PARAMS ((rtx *, void *));
 336 static void replace_loop_regs PARAMS ((rtx insn, rtx, rtx));
 337 static void note_reg_stored PARAMS ((rtx, rtx, void *));
 338 static void try_copy_prop PARAMS ((const struct loop *, rtx, unsigned int));
 339 static void try_swap_copy_prop PARAMS ((const struct loop *, rtx,
 340                                          unsigned int));
 341 static rtx check_insn_for_givs PARAMS((struct loop *, rtx, int, int));
 342 static rtx check_insn_for_bivs PARAMS((struct loop *, rtx, int, int));
 343 static rtx gen_add_mult PARAMS ((rtx, rtx, rtx, rtx));
 344 static void loop_regs_update PARAMS ((const struct loop *, rtx));
 345 static int iv_add_mult_cost PARAMS ((rtx, rtx, rtx, rtx));
 346
 347 static rtx loop_insn_emit_after PARAMS((const struct loop *, basic_block,
 348                                         rtx, rtx));
 349 static rtx loop_call_insn_emit_before PARAMS((const struct loop *,
 350                                               basic_block, rtx, rtx));
 351 static rtx loop_call_insn_hoist PARAMS((const struct loop *, rtx));
 352 static rtx loop_insn_sink_or_swim PARAMS((const struct loop *, rtx));
 353
 354 static void loop_dump_aux PARAMS ((const struct loop *, FILE *, int));
 355 static void loop_delete_insns PARAMS ((rtx, rtx));
 356 static HOST_WIDE_INT remove_constant_addition PARAMS ((rtx *));
 357 static rtx gen_load_of_final_value PARAMS ((rtx, rtx));
 358 void debug_ivs PARAMS ((const struct loop *));
 359 void debug_iv_class PARAMS ((const struct iv_class *));
 360 void debug_biv PARAMS ((const struct induction *));
 361 void debug_giv PARAMS ((const struct induction *));
 362 void debug_loop PARAMS ((const struct loop *));
 363 void debug_loops PARAMS ((const struct loops *));
 364
 365 typedef struct loop_replace_args
 366 {
 367   rtx match;
 368   rtx replacement;
 369   rtx insn;
 370 } loop_replace_args;
 371
 372 /* Nonzero iff INSN is between START and END, inclusive.  */
 373 #define INSN_IN_RANGE_P(INSN, START, END)       \
 374   (INSN_UID (INSN) < max_uid_for_loop           \
 375    && INSN_LUID (INSN) >= INSN_LUID (START)     \
 376    && INSN_LUID (INSN) <= INSN_LUID (END))
 377
 378 /* Indirect_jump_in_function is computed once per function.  */
 379 static int indirect_jump_in_function;
 380 static int indirect_jump_in_function_p PARAMS ((rtx));
 381
 382 static int compute_luids PARAMS ((rtx, rtx, int));
 383
 384 static int biv_elimination_giv_has_0_offset PARAMS ((struct induction *,
 385                                                      struct induction *,
 386                                                      rtx));
 387 \f
 388 /* Benefit penalty, if a giv is not replaceable, i.e. must emit an insn to
 389    copy the value of the strength reduced giv to its original register.  */
 390 static int copy_cost;
 391
 392 /* Cost of using a register, to normalize the benefits of a giv.  */
 393 static int reg_address_cost;
 394
 395 void
 396 init_loop ()
 397 {
 398   rtx reg = gen_rtx_REG (word_mode, LAST_VIRTUAL_REGISTER + 1);
 399
 400   reg_address_cost = address_cost (reg, SImode);
 401
 402   copy_cost = COSTS_N_INSNS (1);
 403 }
 404 \f
 405 /* Compute the mapping from uids to luids.
 406    LUIDs are numbers assigned to insns, like uids,
 407    except that luids increase monotonically through the code.
 408    Start at insn START and stop just before END.  Assign LUIDs
 409    starting with PREV_LUID + 1.  Return the last assigned LUID + 1.  */
 410 static int
 411 compute_luids (start, end, prev_luid)
 412      rtx start, end;
 413      int prev_luid;
 414 {
 415   int i;
 416   rtx insn;
 417
 418   for (insn = start, i = prev_luid; insn != end; insn = NEXT_INSN (insn))
 419     {
 420       if (INSN_UID (insn) >= max_uid_for_loop)
 421         continue;
 422       /* Don't assign luids to line-number NOTEs, so that the distance in
 423          luids between two insns is not affected by -g.  */
 424       if (GET_CODE (insn) != NOTE
 425           || NOTE_LINE_NUMBER (insn) <= 0)
 426         uid_luid[INSN_UID (insn)] = ++i;
 427       else
 428         /* Give a line number note the same luid as preceding insn.  */
 429         uid_luid[INSN_UID (insn)] = i;
 430     }
 431   return i + 1;
 432 }
 433 \f
 434 /* Entry point of this file.  Perform loop optimization
 435    on the current function.  F is the first insn of the function
 436    and DUMPFILE is a stream for output of a trace of actions taken
 437    (or 0 if none should be output).  */
 438
 439 void
 440 loop_optimize (f, dumpfile, flags)
 441      /* f is the first instruction of a chain of insns for one function */
 442      rtx f;
 443      FILE *dumpfile;
 444      int flags;
 445 {
 446   rtx insn;
 447   int i;
 448   struct loops loops_data;
 449   struct loops *loops = &loops_data;
 450   struct loop_info *loops_info;
 451
 452   loop_dump_stream = dumpfile;
 453
 454   init_recog_no_volatile ();
 455
 456   max_reg_before_loop = max_reg_num ();
 457   loop_max_reg = max_reg_before_loop;
 458
 459   regs_may_share = 0;
 460
 461   /* Count the number of loops.  */
 462
 463   max_loop_num = 0;
 464   for (insn = f; insn; insn = NEXT_INSN (insn))
 465     {
 466       if (GET_CODE (insn) == NOTE
 467           && NOTE_LINE_NUMBER (insn) == NOTE_INSN_LOOP_BEG)
 468         max_loop_num++;
 469     }
 470
 471   /* Don't waste time if no loops.  */
 472   if (max_loop_num == 0)
 473     return;
 474
 475   loops->num = max_loop_num;
 476
 477   /* Get size to use for tables indexed by uids.
 478      Leave some space for labels allocated by find_and_verify_loops.  */
 479   max_uid_for_loop = get_max_uid () + 1 + max_loop_num * 32;
 480
 481   uid_luid = (int *) xcalloc (max_uid_for_loop, sizeof (int));
 482   uid_loop = (struct loop **) xcalloc (max_uid_for_loop,
 483                                        sizeof (struct loop *));
 484
 485   /* Allocate storage for array of loops.  */
 486   loops->array = (struct loop *)
 487     xcalloc (loops->num, sizeof (struct loop));
 488
 489   /* Find and process each loop.
 490      First, find them, and record them in order of their beginnings.  */
 491   find_and_verify_loops (f, loops);
 492
 493   /* Allocate and initialize auxiliary loop information.  */
 494   loops_info = xcalloc (loops->num, sizeof (struct loop_info));
 495   for (i = 0; i < (int) loops->num; i++)
 496     loops->array[i].aux = loops_info + i;
 497
 498   /* Now find all register lifetimes.  This must be done after
 499      find_and_verify_loops, because it might reorder the insns in the
 500      function.  */
 501   reg_scan (f, max_reg_before_loop, 1);
 502
 503   /* This must occur after reg_scan so that registers created by gcse
 504      will have entries in the register tables.
 505
 506      We could have added a call to reg_scan after gcse_main in toplev.c,
 507      but moving this call to init_alias_analysis is more efficient.  */
 508   init_alias_analysis ();
 509
 510   /* See if we went too far.  Note that get_max_uid already returns
 511      one more that the maximum uid of all insn.  */
 512   if (get_max_uid () > max_uid_for_loop)
 513     abort ();
 514   /* Now reset it to the actual size we need.  See above.  */
 515   max_uid_for_loop = get_max_uid ();
 516
 517   /* find_and_verify_loops has already called compute_luids, but it
 518      might have rearranged code afterwards, so we need to recompute
 519      the luids now.  */
 520   compute_luids (f, NULL_RTX, 0);
 521
 522   /* Don't leave gaps in uid_luid for insns that have been
 523      deleted.  It is possible that the first or last insn
 524      using some register has been deleted by cross-jumping.
 525      Make sure that uid_luid for that former insn's uid
 526      points to the general area where that insn used to be.  */
 527   for (i = 0; i < max_uid_for_loop; i++)
 528     {
 529       uid_luid[0] = uid_luid[i];
 530       if (uid_luid[0] != 0)
 531         break;
 532     }
 533   for (i = 0; i < max_uid_for_loop; i++)
 534     if (uid_luid[i] == 0)
 535       uid_luid[i] = uid_luid[i - 1];
 536
 537   /* Determine if the function has indirect jump.  On some systems
 538      this prevents low overhead loop instructions from being used.  */
 539   indirect_jump_in_function = indirect_jump_in_function_p (f);
 540
 541   /* Now scan the loops, last ones first, since this means inner ones are done
 542      before outer ones.  */
 543   for (i = max_loop_num - 1; i >= 0; i--)
 544     {
 545       struct loop *loop = &loops->array[i];
 546
 547       if (! loop->invalid && loop->end)
 548         scan_loop (loop, flags);
 549     }
 550
 551   end_alias_analysis ();
 552
 553   /* Clean up.  */
 554   free (uid_luid);
 555   free (uid_loop);
 556   free (loops_info);
 557   free (loops->array);
 558 }
 559 \f
 560 /* Returns the next insn, in execution order, after INSN.  START and
 561    END are the NOTE_INSN_LOOP_BEG and NOTE_INSN_LOOP_END for the loop,
 562    respectively.  LOOP->TOP, if non-NULL, is the top of the loop in the
 563    insn-stream; it is used with loops that are entered near the
 564    bottom.  */
 565
 566 static rtx
 567 next_insn_in_loop (loop, insn)
 568      const struct loop *loop;
 569      rtx insn;
 570 {
 571   insn = NEXT_INSN (insn);
 572
 573   if (insn == loop->end)
 574     {
 575       if (loop->top)
 576         /* Go to the top of the loop, and continue there.  */
 577         insn = loop->top;
 578       else
 579         /* We're done.  */
 580         insn = NULL_RTX;
 581     }
 582
 583   if (insn == loop->scan_start)
 584     /* We're done.  */
 585     insn = NULL_RTX;
 586
 587   return insn;
 588 }
 589
 590 /* Optimize one loop described by LOOP.  */
 591
 592 /* ??? Could also move memory writes out of loops if the destination address
 593    is invariant, the source is invariant, the memory write is not volatile,
 594    and if we can prove that no read inside the loop can read this address
 595    before the write occurs.  If there is a read of this address after the
 596    write, then we can also mark the memory read as invariant.  */
 597
 598 static void
 599 scan_loop (loop, flags)
 600      struct loop *loop;
 601      int flags;
 602 {
 603   struct loop_info *loop_info = LOOP_INFO (loop);
 604   struct loop_regs *regs = LOOP_REGS (loop);
 605   int i;
 606   rtx loop_start = loop->start;
 607   rtx loop_end = loop->end;
 608   rtx p;
 609   /* 1 if we are scanning insns that could be executed zero times.  */
 610   int maybe_never = 0;
 611   /* 1 if we are scanning insns that might never be executed
 612      due to a subroutine call which might exit before they are reached.  */
 613   int call_passed = 0;
 614   /* Number of insns in the loop.  */
 615   int insn_count;
 616   int tem;
 617   rtx temp, update_start, update_end;
 618   /* The SET from an insn, if it is the only SET in the insn.  */
 619   rtx set, set1;
 620   /* Chain describing insns movable in current loop.  */
 621   struct loop_movables *movables = LOOP_MOVABLES (loop);
 622   /* Ratio of extra register life span we can justify
 623      for saving an instruction.  More if loop doesn't call subroutines
 624      since in that case saving an insn makes more difference
 625      and more registers are available.  */
 626   int threshold;
 627   /* Nonzero if we are scanning instructions in a sub-loop.  */
 628   int loop_depth = 0;
 629   int in_libcall;
 630
 631   loop->top = 0;
 632
 633   movables->head = 0;
 634   movables->last = 0;
 635
 636   /* Determine whether this loop starts with a jump down to a test at
 637      the end.  This will occur for a small number of loops with a test
 638      that is too complex to duplicate in front of the loop.
 639
 640      We search for the first insn or label in the loop, skipping NOTEs.
 641      However, we must be careful not to skip past a NOTE_INSN_LOOP_BEG
 642      (because we might have a loop executed only once that contains a
 643      loop which starts with a jump to its exit test) or a NOTE_INSN_LOOP_END
 644      (in case we have a degenerate loop).
 645
 646      Note that if we mistakenly think that a loop is entered at the top
 647      when, in fact, it is entered at the exit test, the only effect will be
 648      slightly poorer optimization.  Making the opposite error can generate
 649      incorrect code.  Since very few loops now start with a jump to the
 650      exit test, the code here to detect that case is very conservative.  */
 651
 652   for (p = NEXT_INSN (loop_start);
 653        p != loop_end
 654          && GET_CODE (p) != CODE_LABEL && ! INSN_P (p)
 655          && (GET_CODE (p) != NOTE
 656              || (NOTE_LINE_NUMBER (p) != NOTE_INSN_LOOP_BEG
 657                  && NOTE_LINE_NUMBER (p) != NOTE_INSN_LOOP_END));
 658        p = NEXT_INSN (p))
 659     ;
 660
 661   loop->scan_start = p;
 662
 663   /* If loop end is the end of the current function, then emit a
 664      NOTE_INSN_DELETED after loop_end and set loop->sink to the dummy
 665      note insn.  This is the position we use when sinking insns out of
 666      the loop.  */
 667   if (NEXT_INSN (loop->end) != 0)
 668     loop->sink = NEXT_INSN (loop->end);
 669   else
 670     loop->sink = emit_note_after (NOTE_INSN_DELETED, loop->end);
 671
 672   /* Set up variables describing this loop.  */
 673   prescan_loop (loop);
 674   threshold = (loop_info->has_call ? 1 : 2) * (1 + n_non_fixed_regs);
 675
 676   /* If loop has a jump before the first label,
 677      the true entry is the target of that jump.
 678      Start scan from there.
 679      But record in LOOP->TOP the place where the end-test jumps
 680      back to so we can scan that after the end of the loop.  */
 681   if (GET_CODE (p) == JUMP_INSN
 682       /* Loop entry must be unconditional jump (and not a RETURN)  */
 683       && any_uncondjump_p (p)
 684       && JUMP_LABEL (p) != 0
 685       /* Check to see whether the jump actually
 686          jumps out of the loop (meaning it's no loop).
 687          This case can happen for things like
 688          do {..} while (0).  If this label was generated previously
 689          by loop, we can't tell anything about it and have to reject
 690          the loop.  */
 691       && INSN_IN_RANGE_P (JUMP_LABEL (p), loop_start, loop_end))
 692     {
 693       loop->top = next_label (loop->scan_start);
 694       loop->scan_start = JUMP_LABEL (p);
 695     }
 696
 697   /* If LOOP->SCAN_START was an insn created by loop, we don't know its luid
 698      as required by loop_reg_used_before_p.  So skip such loops.  (This
 699      test may never be true, but it's best to play it safe.)
 700
 701      Also, skip loops where we do not start scanning at a label.  This
 702      test also rejects loops starting with a JUMP_INSN that failed the
 703      test above.  */
 704
 705   if (INSN_UID (loop->scan_start) >= max_uid_for_loop
 706       || GET_CODE (loop->scan_start) != CODE_LABEL)
 707     {
 708       if (loop_dump_stream)
 709         fprintf (loop_dump_stream, "\nLoop from %d to %d is phony.\n\n",
 710                  INSN_UID (loop_start), INSN_UID (loop_end));
 711       return;
 712     }
 713
 714   /* Allocate extra space for REGs that might be created by load_mems.
 715      We allocate a little extra slop as well, in the hopes that we
 716      won't have to reallocate the regs array.  */
 717   loop_regs_scan (loop, loop_info->mems_idx + 16);
 718   insn_count = count_insns_in_loop (loop);
 719
 720   if (loop_dump_stream)
 721     {
 722       fprintf (loop_dump_stream, "\nLoop from %d to %d: %d real insns.\n",
 723                INSN_UID (loop_start), INSN_UID (loop_end), insn_count);
 724       if (loop->cont)
 725         fprintf (loop_dump_stream, "Continue at insn %d.\n",
 726                  INSN_UID (loop->cont));
 727     }
 728
 729   /* Scan through the loop finding insns that are safe to move.
 730      Set REGS->ARRAY[I].SET_IN_LOOP negative for the reg I being set, so that
 731      this reg will be considered invariant for subsequent insns.
 732      We consider whether subsequent insns use the reg
 733      in deciding whether it is worth actually moving.
 734
 735      MAYBE_NEVER is nonzero if we have passed a conditional jump insn
 736      and therefore it is possible that the insns we are scanning
 737      would never be executed.  At such times, we must make sure
 738      that it is safe to execute the insn once instead of zero times.
 739      When MAYBE_NEVER is 0, all insns will be executed at least once
 740      so that is not a problem.  */
 741
 742   for (in_libcall = 0, p = next_insn_in_loop (loop, loop->scan_start);
 743        p != NULL_RTX;
 744        p = next_insn_in_loop (loop, p))
 745     {
 746       if (in_libcall && INSN_P (p) && find_reg_note (p, REG_RETVAL, NULL_RTX))
 747         in_libcall--;
 748       if (GET_CODE (p) == INSN)
 749         {
 750           temp = find_reg_note (p, REG_LIBCALL, NULL_RTX);
 751           if (temp)
 752             in_libcall++;
 753           if (! in_libcall
 754               && (set = single_set (p))
 755               && GET_CODE (SET_DEST (set)) == REG
 756 #ifdef PIC_OFFSET_TABLE_REG_CALL_CLOBBERED
 757               && SET_DEST (set) != pic_offset_table_rtx
 758 #endif
 759               && ! regs->array[REGNO (SET_DEST (set))].may_not_optimize)
 760             {
 761               int tem1 = 0;
 762               int tem2 = 0;
 763               int move_insn = 0;
 764               int insert_temp = 0;
 765               rtx src = SET_SRC (set);
 766               rtx dependencies = 0;
 767
 768               /* Figure out what to use as a source of this insn.  If a
 769                  REG_EQUIV note is given or if a REG_EQUAL note with a
 770                  constant operand is specified, use it as the source and
 771                  mark that we should move this insn by calling
 772                  emit_move_insn rather that duplicating the insn.
 773
 774                  Otherwise, only use the REG_EQUAL contents if a REG_RETVAL
 775                  note is present.  */
 776               temp = find_reg_note (p, REG_EQUIV, NULL_RTX);
 777               if (temp)
 778                 src = XEXP (temp, 0), move_insn = 1;
 779               else
 780                 {
 781                   temp = find_reg_note (p, REG_EQUAL, NULL_RTX);
 782                   if (temp && CONSTANT_P (XEXP (temp, 0)))
 783                     src = XEXP (temp, 0), move_insn = 1;
 784                   if (temp && find_reg_note (p, REG_RETVAL, NULL_RTX))
 785                     {
 786                       src = XEXP (temp, 0);
 787                       /* A libcall block can use regs that don't appear in
 788                          the equivalent expression.  To move the libcall,
 789                          we must move those regs too.  */
 790                       dependencies = libcall_other_reg (p, src);
 791                     }
 792                 }
 793
 794               /* For parallels, add any possible uses to the dependencies, as
 795                  we can't move the insn without resolving them first.  */
 796               if (GET_CODE (PATTERN (p)) == PARALLEL)
 797                 {
 798                   for (i = 0; i < XVECLEN (PATTERN (p), 0); i++)
 799                     {
 800                       rtx x = XVECEXP (PATTERN (p), 0, i);
 801                       if (GET_CODE (x) == USE)
 802                         dependencies
 803                           = gen_rtx_EXPR_LIST (VOIDmode, XEXP (x, 0),
 804                                                dependencies);
 805                     }
 806                 }
 807
 808               if (/* The register is used in basic blocks other
 809                       than the one where it is set (meaning that
 810                       something after this point in the loop might
 811                       depend on its value before the set).  */
 812                    ! reg_in_basic_block_p (p, SET_DEST (set))
 813                    /* And the set is not guaranteed to be executed once
 814                       the loop starts, or the value before the set is
 815                       needed before the set occurs...
 816
 817                       ??? Note we have quadratic behavior here, mitigated
 818                       by the fact that the previous test will often fail for
 819                       large loops.  Rather than re-scanning the entire loop
 820                       each time for register usage, we should build tables
 821                       of the register usage and use them here instead.  */
 822                    && (maybe_never
 823                        || loop_reg_used_before_p (loop, set, p)))
 824                 /* It is unsafe to move the set.  However, it may be OK to
 825                    move the source into a new psuedo, and subsitute a
 826                    reg-to-reg copy for the original insn.
 827
 828                    This code used to consider it OK to move a set of a variable
 829                    which was not created by the user and not used in an exit
 830                    test.
 831                    That behavior is incorrect and was removed.  */
 832                 insert_temp = 1;
 833
 834               /* Don't try to optimize a register that was made
 835                  by loop-optimization for an inner loop.
 836                  We don't know its life-span, so we can't compute
 837                  the benefit.  */
 838               if (REGNO (SET_DEST (set)) >= max_reg_before_loop)
 839                 ;
 840               /* Don't move the source and add a reg-to-reg copy with -Os
 841                  (this certainly increases size) or if the source is
 842                  already a reg (the motion will gain nothing).  */
 843               else if (insert_temp
 844                        && (optimize_size || GET_CODE (SET_SRC (set)) == REG
 845                            || (CONSTANT_P (SET_SRC (set))
 846                                && LEGITIMATE_CONSTANT_P (SET_SRC (set)))))
 847                 ;
 848               else if ((tem = loop_invariant_p (loop, src))
 849                        && (dependencies == 0
 850                            || (tem2
 851                                = loop_invariant_p (loop, dependencies)) != 0)
 852                        && (regs->array[REGNO (SET_DEST (set))].set_in_loop == 1
 853                            || (tem1
 854                                = consec_sets_invariant_p
 855                                (loop, SET_DEST (set),
 856                                 regs->array[REGNO (SET_DEST (set))].set_in_loop,
 857                                 p)))
 858                        /* If the insn can cause a trap (such as divide by zero),
 859                           can't move it unless it's guaranteed to be executed
 860                           once loop is entered.  Even a function call might
 861                           prevent the trap insn from being reached
 862                           (since it might exit!)  */
 863                        && ! ((maybe_never || call_passed)
 864                              && may_trap_p (src)))
 865                 {
 866                   struct movable *m;
 867                   int regno = REGNO (SET_DEST (set));
 868
 869                   /* A potential lossage is where we have a case where two insns
 870                      can be combined as long as they are both in the loop, but
 871                      we move one of them outside the loop.  For large loops,
 872                      this can lose.  The most common case of this is the address
 873                      of a function being called.
 874
 875                      Therefore, if this register is marked as being used
 876                      exactly once if we are in a loop with calls
 877                      (a "large loop"), see if we can replace the usage of
 878                      this register with the source of this SET.  If we can,
 879                      delete this insn.
 880
 881                      Don't do this if P has a REG_RETVAL note or if we have
 882                      SMALL_REGISTER_CLASSES and SET_SRC is a hard register.  */
 883
 884                   if (loop_info->has_call
 885                       && regs->array[regno].single_usage != 0
 886                       && regs->array[regno].single_usage != const0_rtx
 887                       && REGNO_FIRST_UID (regno) == INSN_UID (p)
 888                       && (REGNO_LAST_UID (regno)
 889                           == INSN_UID (regs->array[regno].single_usage))
 890                       && regs->array[regno].set_in_loop == 1
 891                       && GET_CODE (SET_SRC (set)) != ASM_OPERANDS
 892                       && ! side_effects_p (SET_SRC (set))
 893                       && ! find_reg_note (p, REG_RETVAL, NULL_RTX)
 894                       && (! SMALL_REGISTER_CLASSES
 895                           || (! (GET_CODE (SET_SRC (set)) == REG
 896                                  && (REGNO (SET_SRC (set))
 897                                      < FIRST_PSEUDO_REGISTER))))
 898                       /* This test is not redundant; SET_SRC (set) might be
 899                          a call-clobbered register and the life of REGNO
 900                          might span a call.  */
 901                       && ! modified_between_p (SET_SRC (set), p,
 902                                                regs->array[regno].single_usage)
 903                       && no_labels_between_p (p,
 904                                               regs->array[regno].single_usage)
 905                       && validate_replace_rtx (SET_DEST (set), SET_SRC (set),
 906                                                regs->array[regno].single_usage))
 907                     {
 908                       /* Replace any usage in a REG_EQUAL note.  Must copy
 909                          the new source, so that we don't get rtx sharing
 910                          between the SET_SOURCE and REG_NOTES of insn p.  */
 911                       REG_NOTES (regs->array[regno].single_usage)
 912                         = (replace_rtx
 913                            (REG_NOTES (regs->array[regno].single_usage),
 914                             SET_DEST (set), copy_rtx (SET_SRC (set))));
 915
 916                       delete_insn (p);
 917                       for (i = 0; i < LOOP_REGNO_NREGS (regno, SET_DEST (set));
 918                            i++)
 919                         regs->array[regno+i].set_in_loop = 0;
 920                       continue;
 921                     }
 922
 923                   m = (struct movable *) xmalloc (sizeof (struct movable));
 924                   m->next = 0;
 925                   m->insn = p;
 926                   m->set_src = src;
 927                   m->dependencies = dependencies;
 928                   m->set_dest = SET_DEST (set);
 929                   m->force = 0;
 930                   m->consec
 931                     = regs->array[REGNO (SET_DEST (set))].set_in_loop - 1;
 932                   m->done = 0;
 933                   m->forces = 0;
 934                   m->partial = 0;
 935                   m->move_insn = move_insn;
 936                   m->move_insn_first = 0;
 937                   m->insert_temp = insert_temp;
 938                   m->is_equiv = (find_reg_note (p, REG_EQUIV, NULL_RTX) != 0);
 939                   m->savemode = VOIDmode;
 940                   m->regno = regno;
 941                   /* Set M->cond if either loop_invariant_p
 942                      or consec_sets_invariant_p returned 2
 943                      (only conditionally invariant).  */
 944                   m->cond = ((tem | tem1 | tem2) > 1);
 945                   m->global =  LOOP_REG_GLOBAL_P (loop, regno);
 946                   m->match = 0;
 947                   m->lifetime = LOOP_REG_LIFETIME (loop, regno);
 948                   m->savings = regs->array[regno].n_times_set;
 949                   if (find_reg_note (p, REG_RETVAL, NULL_RTX))
 950                     m->savings += libcall_benefit (p);
 951                   for (i = 0; i < LOOP_REGNO_NREGS (regno, SET_DEST (set)); i++)
 952                     regs->array[regno+i].set_in_loop = move_insn ? -2 : -1;
 953                   /* Add M to the end of the chain MOVABLES.  */
 954                   loop_movables_add (movables, m);
 955
 956                   if (m->consec > 0)
 957                     {
 958                       /* It is possible for the first instruction to have a
 959                          REG_EQUAL note but a non-invariant SET_SRC, so we must
 960                          remember the status of the first instruction in case
 961                          the last instruction doesn't have a REG_EQUAL note.  */
 962                       m->move_insn_first = m->move_insn;
 963
 964                       /* Skip this insn, not checking REG_LIBCALL notes.  */
 965                       p = next_nonnote_insn (p);
 966                       /* Skip the consecutive insns, if there are any.  */
 967                       p = skip_consec_insns (p, m->consec);
 968                       /* Back up to the last insn of the consecutive group.  */
 969                       p = prev_nonnote_insn (p);
 970
 971                       /* We must now reset m->move_insn, m->is_equiv, and
 972                          possibly m->set_src to correspond to the effects of
 973                          all the insns.  */
 974                       temp = find_reg_note (p, REG_EQUIV, NULL_RTX);
 975                       if (temp)
 976                         m->set_src = XEXP (temp, 0), m->move_insn = 1;
 977                       else
 978                         {
 979                           temp = find_reg_note (p, REG_EQUAL, NULL_RTX);
 980                           if (temp && CONSTANT_P (XEXP (temp, 0)))
 981                             m->set_src = XEXP (temp, 0), m->move_insn = 1;
 982                           else
 983                             m->move_insn = 0;
 984
 985                         }
 986                       m->is_equiv
 987                         = (find_reg_note (p, REG_EQUIV, NULL_RTX) != 0);
 988                     }
 989                 }
 990               /* If this register is always set within a STRICT_LOW_PART
 991                  or set to zero, then its high bytes are constant.
 992                  So clear them outside the loop and within the loop
 993                  just load the low bytes.
 994                  We must check that the machine has an instruction to do so.
 995                  Also, if the value loaded into the register
 996                  depends on the same register, this cannot be done.  */
 997               else if (SET_SRC (set) == const0_rtx
 998                        && GET_CODE (NEXT_INSN (p)) == INSN
 999                        && (set1 = single_set (NEXT_INSN (p)))
1000                        && GET_CODE (set1) == SET
1001                        && (GET_CODE (SET_DEST (set1)) == STRICT_LOW_PART)
1002                        && (GET_CODE (XEXP (SET_DEST (set1), 0)) == SUBREG)
1003                        && (SUBREG_REG (XEXP (SET_DEST (set1), 0))
1004                            == SET_DEST (set))
1005                        && !reg_mentioned_p (SET_DEST (set), SET_SRC (set1)))
1006                 {
1007                   int regno = REGNO (SET_DEST (set));
1008                   if (regs->array[regno].set_in_loop == 2)
1009                     {
1010                       struct movable *m;
1011                       m = (struct movable *) xmalloc (sizeof (struct movable));
1012                       m->next = 0;
1013                       m->insn = p;
1014                       m->set_dest = SET_DEST (set);
1015                       m->dependencies = 0;
1016                       m->force = 0;
1017                       m->consec = 0;
1018                       m->done = 0;
1019                       m->forces = 0;
1020                       m->move_insn = 0;
1021                       m->move_insn_first = 0;
1022                       m->insert_temp = insert_temp;
1023                       m->partial = 1;
1024                       /* If the insn may not be executed on some cycles,
1025                          we can't clear the whole reg; clear just high part.
1026                          Not even if the reg is used only within this loop.
1027                          Consider this:
1028                          while (1)
1029                            while (s != t) {
1030                              if (foo ()) x = *s;
1031                              use (x);
1032                            }
1033                          Clearing x before the inner loop could clobber a value
1034                          being saved from the last time around the outer loop.
1035                          However, if the reg is not used outside this loop
1036                          and all uses of the register are in the same
1037                          basic block as the store, there is no problem.
1038
1039                          If this insn was made by loop, we don't know its
1040                          INSN_LUID and hence must make a conservative
1041                          assumption.  */
1042                       m->global = (INSN_UID (p) >= max_uid_for_loop
1043                                    || LOOP_REG_GLOBAL_P (loop, regno)
1044                                    || (labels_in_range_p
1045                                        (p, REGNO_FIRST_LUID (regno))));
1046                       if (maybe_never && m->global)
1047                         m->savemode = GET_MODE (SET_SRC (set1));
1048                       else
1049                         m->savemode = VOIDmode;
1050                       m->regno = regno;
1051                       m->cond = 0;
1052                       m->match = 0;
1053                       m->lifetime = LOOP_REG_LIFETIME (loop, regno);
1054                       m->savings = 1;
1055                       for (i = 0;
1056                            i < LOOP_REGNO_NREGS (regno, SET_DEST (set));
1057                            i++)
1058                         regs->array[regno+i].set_in_loop = -1;
1059                       /* Add M to the end of the chain MOVABLES.  */
1060                       loop_movables_add (movables, m);
1061                     }
1062                 }
1063             }
1064         }
1065       /* Past a call insn, we get to insns which might not be executed
1066          because the call might exit.  This matters for insns that trap.
1067          Constant and pure call insns always return, so they don't count.  */
1068       else if (GET_CODE (p) == CALL_INSN && ! CONST_OR_PURE_CALL_P (p))
1069         call_passed = 1;
1070       /* Past a label or a jump, we get to insns for which we
1071          can't count on whether or how many times they will be
1072          executed during each iteration.  Therefore, we can
1073          only move out sets of trivial variables
1074          (those not used after the loop).  */
1075       /* Similar code appears twice in strength_reduce.  */
1076       else if ((GET_CODE (p) == CODE_LABEL || GET_CODE (p) == JUMP_INSN)
1077                /* If we enter the loop in the middle, and scan around to the
1078                   beginning, don't set maybe_never for that.  This must be an
1079                   unconditional jump, otherwise the code at the top of the
1080                   loop might never be executed.  Unconditional jumps are
1081                   followed by a barrier then the loop_end.  */
1082                && ! (GET_CODE (p) == JUMP_INSN && JUMP_LABEL (p) == loop->top
1083                      && NEXT_INSN (NEXT_INSN (p)) == loop_end
1084                      && any_uncondjump_p (p)))
1085         maybe_never = 1;
1086       else if (GET_CODE (p) == NOTE)
1087         {
1088           /* At the virtual top of a converted loop, insns are again known to
1089              be executed: logically, the loop begins here even though the exit
1090              code has been duplicated.  */
1091           if (NOTE_LINE_NUMBER (p) == NOTE_INSN_LOOP_VTOP && loop_depth == 0)
1092             maybe_never = call_passed = 0;
1093           else if (NOTE_LINE_NUMBER (p) == NOTE_INSN_LOOP_BEG)
1094             loop_depth++;
1095           else if (NOTE_LINE_NUMBER (p) == NOTE_INSN_LOOP_END)
1096             loop_depth--;
1097         }
1098     }
1099
1100   /* If one movable subsumes another, ignore that other.  */
1101
1102   ignore_some_movables (movables);
1103
1104   /* For each movable insn, see if the reg that it loads
1105      leads when it dies right into another conditionally movable insn.
1106      If so, record that the second insn "forces" the first one,
1107      since the second can be moved only if the first is.  */
1108
1109   force_movables (movables);
1110
1111   /* See if there are multiple movable insns that load the same value.
1112      If there are, make all but the first point at the first one
1113      through the `match' field, and add the priorities of them
1114      all together as the priority of the first.  */
1115
1116   combine_movables (movables, regs);
1117
1118   /* Now consider each movable insn to decide whether it is worth moving.
1119      Store 0 in regs->array[I].set_in_loop for each reg I that is moved.
1120
1121      For machines with few registers this increases code size, so do not
1122      move moveables when optimizing for code size on such machines.
1123      (The 18 below is the value for i386.)  */
1124
1125   if (!optimize_size
1126       || (reg_class_size[GENERAL_REGS] > 18 && !loop_info->has_call))
1127     {
1128       move_movables (loop, movables, threshold, insn_count);
1129
1130       /* Recalculate regs->array if move_movables has created new
1131          registers.  */
1132       if (max_reg_num () > regs->num)
1133         {
1134           loop_regs_scan (loop, 0);
1135           for (update_start = loop_start;
1136                PREV_INSN (update_start)
1137                && GET_CODE (PREV_INSN (update_start)) != CODE_LABEL;
1138                update_start = PREV_INSN (update_start))
1139             ;
1140           update_end = NEXT_INSN (loop_end);
1141
1142           reg_scan_update (update_start, update_end, loop_max_reg);
1143           loop_max_reg = max_reg_num ();
1144         }
1145     }
1146
1147   /* Now candidates that still are negative are those not moved.
1148      Change regs->array[I].set_in_loop to indicate that those are not actually
1149      invariant.  */
1150   for (i = 0; i < regs->num; i++)
1151     if (regs->array[i].set_in_loop < 0)
1152       regs->array[i].set_in_loop = regs->array[i].n_times_set;
1153
1154   /* Now that we've moved some things out of the loop, we might be able to
1155      hoist even more memory references.  */
1156   load_mems (loop);
1157
1158   /* Recalculate regs->array if load_mems has created new registers.  */
1159   if (max_reg_num () > regs->num)
1160     loop_regs_scan (loop, 0);
1161
1162   for (update_start = loop_start;
1163        PREV_INSN (update_start)
1164          && GET_CODE (PREV_INSN (update_start)) != CODE_LABEL;
1165        update_start = PREV_INSN (update_start))
1166     ;
1167   update_end = NEXT_INSN (loop_end);
1168
1169   reg_scan_update (update_start, update_end, loop_max_reg);
1170   loop_max_reg = max_reg_num ();
1171
1172   if (flag_strength_reduce)
1173     {
1174       if (update_end && GET_CODE (update_end) == CODE_LABEL)
1175         /* Ensure our label doesn't go away.  */
1176         LABEL_NUSES (update_end)++;
1177
1178       strength_reduce (loop, flags);
1179
1180       reg_scan_update (update_start, update_end, loop_max_reg);
1181       loop_max_reg = max_reg_num ();
1182
1183       if (update_end && GET_CODE (update_end) == CODE_LABEL
1184           && --LABEL_NUSES (update_end) == 0)
1185         delete_related_insns (update_end);
1186     }
1187
1188
1189   /* The movable information is required for strength reduction.  */
1190   loop_movables_free (movables);
1191
1192   free (regs->array);
1193   regs->array = 0;
1194   regs->num = 0;
1195 }
1196 \f
1197 /* Add elements to *OUTPUT to record all the pseudo-regs
1198    mentioned in IN_THIS but not mentioned in NOT_IN_THIS.  */
1199
1200 void
1201 record_excess_regs (in_this, not_in_this, output)
1202      rtx in_this, not_in_this;
1203      rtx *output;
1204 {
1205   enum rtx_code code;
1206   const char *fmt;
1207   int i;
1208
1209   code = GET_CODE (in_this);
1210
1211   switch (code)
1212     {
1213     case PC:
1214     case CC0:
1215     case CONST_INT:
1216     case CONST_DOUBLE:
1217     case CONST:
1218     case SYMBOL_REF:
1219     case LABEL_REF:
1220       return;
1221
1222     case REG:
1223       if (REGNO (in_this) >= FIRST_PSEUDO_REGISTER
1224           && ! reg_mentioned_p (in_this, not_in_this))
1225         *output = gen_rtx_EXPR_LIST (VOIDmode, in_this, *output);
1226       return;
1227
1228     default:
1229       break;
1230     }
1231
1232   fmt = GET_RTX_FORMAT (code);
1233   for (i = GET_RTX_LENGTH (code) - 1; i >= 0; i--)
1234     {
1235       int j;
1236
1237       switch (fmt[i])
1238         {
1239         case 'E':
1240           for (j = 0; j < XVECLEN (in_this, i); j++)
1241             record_excess_regs (XVECEXP (in_this, i, j), not_in_this, output);
1242           break;
1243
1244         case 'e':
1245           record_excess_regs (XEXP (in_this, i), not_in_this, output);
1246           break;
1247         }
1248     }
1249 }
1250 \f
1251 /* Check what regs are referred to in the libcall block ending with INSN,
1252    aside from those mentioned in the equivalent value.
1253    If there are none, return 0.
1254    If there are one or more, return an EXPR_LIST containing all of them.  */
1255
1256 rtx
1257 libcall_other_reg (insn, equiv)
1258      rtx insn, equiv;
1259 {
1260   rtx note = find_reg_note (insn, REG_RETVAL, NULL_RTX);
1261   rtx p = XEXP (note, 0);
1262   rtx output = 0;
1263
1264   /* First, find all the regs used in the libcall block
1265      that are not mentioned as inputs to the result.  */
1266
1267   while (p != insn)
1268     {
1269       if (GET_CODE (p) == INSN || GET_CODE (p) == JUMP_INSN
1270           || GET_CODE (p) == CALL_INSN)
1271         record_excess_regs (PATTERN (p), equiv, &output);
1272       p = NEXT_INSN (p);
1273     }
1274
1275   return output;
1276 }
1277 \f
1278 /* Return 1 if all uses of REG
1279    are between INSN and the end of the basic block.  */
1280
1281 static int
1282 reg_in_basic_block_p (insn, reg)
1283      rtx insn, reg;
1284 {
1285   int regno = REGNO (reg);
1286   rtx p;
1287
1288   if (REGNO_FIRST_UID (regno) != INSN_UID (insn))
1289     return 0;
1290
1291   /* Search this basic block for the already recorded last use of the reg.  */
1292   for (p = insn; p; p = NEXT_INSN (p))
1293     {
1294       switch (GET_CODE (p))
1295         {
1296         case NOTE:
1297           break;
1298
1299         case INSN:
1300         case CALL_INSN:
1301           /* Ordinary insn: if this is the last use, we win.  */
1302           if (REGNO_LAST_UID (regno) == INSN_UID (p))
1303             return 1;
1304           break;
1305
1306         case JUMP_INSN:
1307           /* Jump insn: if this is the last use, we win.  */
1308           if (REGNO_LAST_UID (regno) == INSN_UID (p))
1309             return 1;
1310           /* Otherwise, it's the end of the basic block, so we lose.  */
1311           return 0;
1312
1313         case CODE_LABEL:
1314         case BARRIER:
1315           /* It's the end of the basic block, so we lose.  */
1316           return 0;
1317
1318         default:
1319           break;
1320         }
1321     }
1322
1323   /* The "last use" that was recorded can't be found after the first
1324      use.  This can happen when the last use was deleted while
1325      processing an inner loop, this inner loop was then completely
1326      unrolled, and the outer loop is always exited after the inner loop,
1327      so that everything after the first use becomes a single basic block.  */
1328   return 1;
1329 }
1330 \f
1331 /* Compute the benefit of eliminating the insns in the block whose
1332    last insn is LAST.  This may be a group of insns used to compute a
1333    value directly or can contain a library call.  */
1334
1335 static int
1336 libcall_benefit (last)
1337      rtx last;
1338 {
1339   rtx insn;
1340   int benefit = 0;
1341
1342   for (insn = XEXP (find_reg_note (last, REG_RETVAL, NULL_RTX), 0);
1343        insn != last; insn = NEXT_INSN (insn))
1344     {
1345       if (GET_CODE (insn) == CALL_INSN)
1346         benefit += 10;          /* Assume at least this many insns in a library
1347                                    routine.  */
1348       else if (GET_CODE (insn) == INSN
1349                && GET_CODE (PATTERN (insn)) != USE
1350                && GET_CODE (PATTERN (insn)) != CLOBBER)
1351         benefit++;
1352     }
1353
1354   return benefit;
1355 }
1356 \f
1357 /* Skip COUNT insns from INSN, counting library calls as 1 insn.  */
1358
1359 static rtx
1360 skip_consec_insns (insn, count)
1361      rtx insn;
1362      int count;
1363 {
1364   for (; count > 0; count--)
1365     {
1366       rtx temp;
1367
1368       /* If first insn of libcall sequence, skip to end.  */
1369       /* Do this at start of loop, since INSN is guaranteed to
1370          be an insn here.  */
1371       if (GET_CODE (insn) != NOTE
1372           && (temp = find_reg_note (insn, REG_LIBCALL, NULL_RTX)))
1373         insn = XEXP (temp, 0);
1374
1375       do
1376         insn = NEXT_INSN (insn);
1377       while (GET_CODE (insn) == NOTE);
1378     }
1379
1380   return insn;
1381 }
1382
1383 /* Ignore any movable whose insn falls within a libcall
1384    which is part of another movable.
1385    We make use of the fact that the movable for the libcall value
1386    was made later and so appears later on the chain.  */
1387
1388 static void
1389 ignore_some_movables (movables)
1390      struct loop_movables *movables;
1391 {
1392   struct movable *m, *m1;
1393
1394   for (m = movables->head; m; m = m->next)
1395     {
1396       /* Is this a movable for the value of a libcall?  */
1397       rtx note = find_reg_note (m->insn, REG_RETVAL, NULL_RTX);
1398       if (note)
1399         {
1400           rtx insn;
1401           /* Check for earlier movables inside that range,
1402              and mark them invalid.  We cannot use LUIDs here because
1403              insns created by loop.c for prior loops don't have LUIDs.
1404              Rather than reject all such insns from movables, we just
1405              explicitly check each insn in the libcall (since invariant
1406              libcalls aren't that common).  */
1407           for (insn = XEXP (note, 0); insn != m->insn; insn = NEXT_INSN (insn))
1408             for (m1 = movables->head; m1 != m; m1 = m1->next)
1409               if (m1->insn == insn)
1410                 m1->done = 1;
1411         }
1412     }
1413 }
1414
1415 /* For each movable insn, see if the reg that it loads
1416    leads when it dies right into another conditionally movable insn.
1417    If so, record that the second insn "forces" the first one,
1418    since the second can be moved only if the first is.  */
1419
1420 static void
1421 force_movables (movables)
1422      struct loop_movables *movables;
1423 {
1424   struct movable *m, *m1;
1425
1426   for (m1 = movables->head; m1; m1 = m1->next)
1427     /* Omit this if moving just the (SET (REG) 0) of a zero-extend.  */
1428     if (!m1->partial && !m1->done)
1429       {
1430         int regno = m1->regno;
1431         for (m = m1->next; m; m = m->next)
1432           /* ??? Could this be a bug?  What if CSE caused the
1433              register of M1 to be used after this insn?
1434              Since CSE does not update regno_last_uid,
1435              this insn M->insn might not be where it dies.
1436              But very likely this doesn't matter; what matters is
1437              that M's reg is computed from M1's reg.  */
1438           if (INSN_UID (m->insn) == REGNO_LAST_UID (regno)
1439               && !m->done)
1440             break;
1441         if (m != 0 && m->set_src == m1->set_dest
1442             /* If m->consec, m->set_src isn't valid.  */
1443             && m->consec == 0)
1444           m = 0;
1445
1446         /* Increase the priority of the moving the first insn
1447            since it permits the second to be moved as well.  */
1448         if (m != 0)
1449           {
1450             m->forces = m1;
1451             m1->lifetime += m->lifetime;
1452             m1->savings += m->savings;
1453           }
1454       }
1455 }
1456 \f
1457 /* Find invariant expressions that are equal and can be combined into
1458    one register.  */
1459
1460 static void
1461 combine_movables (movables, regs)
1462      struct loop_movables *movables;
1463      struct loop_regs *regs;
1464 {
1465   struct movable *m;
1466   char *matched_regs = (char *) xmalloc (regs->num);
1467   enum machine_mode mode;
1468
1469   /* Regs that are set more than once are not allowed to match
1470      or be matched.  I'm no longer sure why not.  */
1471   /* Only pseudo registers are allowed to match or be matched,
1472      since move_movables does not validate the change.  */
1473   /* Perhaps testing m->consec_sets would be more appropriate here?  */
1474
1475   for (m = movables->head; m; m = m->next)
1476     if (m->match == 0 && regs->array[m->regno].n_times_set == 1
1477         && m->regno >= FIRST_PSEUDO_REGISTER
1478         && !m->insert_temp
1479         && !m->partial)
1480       {
1481         struct movable *m1;
1482         int regno = m->regno;
1483
1484         memset (matched_regs, 0, regs->num);
1485         matched_regs[regno] = 1;
1486
1487         /* We want later insns to match the first one.  Don't make the first
1488            one match any later ones.  So start this loop at m->next.  */
1489         for (m1 = m->next; m1; m1 = m1->next)
1490           if (m != m1 && m1->match == 0
1491               && !m1->insert_temp
1492               && regs->array[m1->regno].n_times_set == 1
1493               && m1->regno >= FIRST_PSEUDO_REGISTER
1494               /* A reg used outside the loop mustn't be eliminated.  */
1495               && !m1->global
1496               /* A reg used for zero-extending mustn't be eliminated.  */
1497               && !m1->partial
1498               && (matched_regs[m1->regno]
1499                   ||
1500                   (
1501                    /* Can combine regs with different modes loaded from the
1502                       same constant only if the modes are the same or
1503                       if both are integer modes with M wider or the same
1504                       width as M1.  The check for integer is redundant, but
1505                       safe, since the only case of differing destination
1506                       modes with equal sources is when both sources are
1507                       VOIDmode, i.e., CONST_INT.  */
1508                    (GET_MODE (m->set_dest) == GET_MODE (m1->set_dest)
1509                     || (GET_MODE_CLASS (GET_MODE (m->set_dest)) == MODE_INT
1510                         && GET_MODE_CLASS (GET_MODE (m1->set_dest)) == MODE_INT
1511                         && (GET_MODE_BITSIZE (GET_MODE (m->set_dest))
1512                             >= GET_MODE_BITSIZE (GET_MODE (m1->set_dest)))))
1513                    /* See if the source of M1 says it matches M.  */
1514                    && ((GET_CODE (m1->set_src) == REG
1515                         && matched_regs[REGNO (m1->set_src)])
1516                        || rtx_equal_for_loop_p (m->set_src, m1->set_src,
1517                                                 movables, regs))))
1518               && ((m->dependencies == m1->dependencies)
1519                   || rtx_equal_p (m->dependencies, m1->dependencies)))
1520             {
1521               m->lifetime += m1->lifetime;
1522               m->savings += m1->savings;
1523               m1->done = 1;
1524               m1->match = m;
1525               matched_regs[m1->regno] = 1;
1526             }
1527       }
1528
1529   /* Now combine the regs used for zero-extension.
1530      This can be done for those not marked `global'
1531      provided their lives don't overlap.  */
1532
1533   for (mode = GET_CLASS_NARROWEST_MODE (MODE_INT); mode != VOIDmode;
1534        mode = GET_MODE_WIDER_MODE (mode))
1535     {
1536       struct movable *m0 = 0;
1537
1538       /* Combine all the registers for extension from mode MODE.
1539          Don't combine any that are used outside this loop.  */
1540       for (m = movables->head; m; m = m->next)
1541         if (m->partial && ! m->global
1542             && mode == GET_MODE (SET_SRC (PATTERN (NEXT_INSN (m->insn)))))
1543           {
1544             struct movable *m1;
1545
1546             int first = REGNO_FIRST_LUID (m->regno);
1547             int last = REGNO_LAST_LUID (m->regno);
1548
1549             if (m0 == 0)
1550               {
1551                 /* First one: don't check for overlap, just record it.  */
1552                 m0 = m;
1553                 continue;
1554               }
1555
1556             /* Make sure they extend to the same mode.
1557                (Almost always true.)  */
1558             if (GET_MODE (m->set_dest) != GET_MODE (m0->set_dest))
1559               continue;
1560
1561             /* We already have one: check for overlap with those
1562                already combined together.  */
1563             for (m1 = movables->head; m1 != m; m1 = m1->next)
1564               if (m1 == m0 || (m1->partial && m1->match == m0))
1565                 if (! (REGNO_FIRST_LUID (m1->regno) > last
1566                        || REGNO_LAST_LUID (m1->regno) < first))
1567                   goto overlap;
1568
1569             /* No overlap: we can combine this with the others.  */
1570             m0->lifetime += m->lifetime;
1571             m0->savings += m->savings;
1572             m->done = 1;
1573             m->match = m0;
1574
1575           overlap:
1576             ;
1577           }
1578     }
1579
1580   /* Clean up.  */
1581   free (matched_regs);
1582 }
1583
1584 /* Returns the number of movable instructions in LOOP that were not
1585    moved outside the loop.  */
1586
1587 static int
1588 num_unmoved_movables (loop)
1589      const struct loop *loop;
1590 {
1591   int num = 0;
1592   struct movable *m;
1593
1594   for (m = LOOP_MOVABLES (loop)->head; m; m = m->next)
1595     if (!m->done)
1596       ++num;
1597
1598   return num;
1599 }
1600
1601 \f
1602 /* Return 1 if regs X and Y will become the same if moved.  */
1603
1604 static int
1605 regs_match_p (x, y, movables)
1606      rtx x, y;
1607      struct loop_movables *movables;
1608 {
1609   unsigned int xn = REGNO (x);
1610   unsigned int yn = REGNO (y);
1611   struct movable *mx, *my;
1612
1613   for (mx = movables->head; mx; mx = mx->next)
1614     if (mx->regno == xn)
1615       break;
1616
1617   for (my = movables->head; my; my = my->next)
1618     if (my->regno == yn)
1619       break;
1620
1621   return (mx && my
1622           && ((mx->match == my->match && mx->match != 0)
1623               || mx->match == my
1624               || mx == my->match));
1625 }
1626
1627 /* Return 1 if X and Y are identical-looking rtx's.
1628    This is the Lisp function EQUAL for rtx arguments.
1629
1630    If two registers are matching movables or a movable register and an
1631    equivalent constant, consider them equal.  */
1632
1633 static int
1634 rtx_equal_for_loop_p (x, y, movables, regs)
1635      rtx x, y;
1636      struct loop_movables *movables;
1637      struct loop_regs *regs;
1638 {
1639   int i;
1640   int j;
1641   struct movable *m;
1642   enum rtx_code code;
1643   const char *fmt;
1644
1645   if (x == y)
1646     return 1;
1647   if (x == 0 || y == 0)
1648     return 0;
1649
1650   code = GET_CODE (x);
1651
1652   /* If we have a register and a constant, they may sometimes be
1653      equal.  */
1654   if (GET_CODE (x) == REG && regs->array[REGNO (x)].set_in_loop == -2
1655       && CONSTANT_P (y))
1656     {
1657       for (m = movables->head; m; m = m->next)
1658         if (m->move_insn && m->regno == REGNO (x)
1659             && rtx_equal_p (m->set_src, y))
1660           return 1;
1661     }
1662   else if (GET_CODE (y) == REG && regs->array[REGNO (y)].set_in_loop == -2
1663            && CONSTANT_P (x))
1664     {
1665       for (m = movables->head; m; m = m->next)
1666         if (m->move_insn && m->regno == REGNO (y)
1667             && rtx_equal_p (m->set_src, x))
1668           return 1;
1669     }
1670
1671   /* Otherwise, rtx's of different codes cannot be equal.  */
1672   if (code != GET_CODE (y))
1673     return 0;
1674
1675   /* (MULT:SI x y) and (MULT:HI x y) are NOT equivalent.
1676      (REG:SI x) and (REG:HI x) are NOT equivalent.  */
1677
1678   if (GET_MODE (x) != GET_MODE (y))
1679     return 0;
1680
1681   /* These three types of rtx's can be compared nonrecursively.  */
1682   if (code == REG)
1683     return (REGNO (x) == REGNO (y) || regs_match_p (x, y, movables));
1684
1685   if (code == LABEL_REF)
1686     return XEXP (x, 0) == XEXP (y, 0);
1687   if (code == SYMBOL_REF)
1688     return XSTR (x, 0) == XSTR (y, 0);
1689
1690   /* Compare the elements.  If any pair of corresponding elements
1691      fail to match, return 0 for the whole things.  */
1692
1693   fmt = GET_RTX_FORMAT (code);
1694   for (i = GET_RTX_LENGTH (code) - 1; i >= 0; i--)
1695     {
1696       switch (fmt[i])
1697         {
1698         case 'w':
1699           if (XWINT (x, i) != XWINT (y, i))
1700             return 0;
1701           break;
1702
1703         case 'i':
1704           if (XINT (x, i) != XINT (y, i))
1705             return 0;
1706           break;
1707
1708         case 'E':
1709           /* Two vectors must have the same length.  */
1710           if (XVECLEN (x, i) != XVECLEN (y, i))
1711             return 0;
1712
1713           /* And the corresponding elements must match.  */
1714           for (j = 0; j < XVECLEN (x, i); j++)
1715             if (rtx_equal_for_loop_p (XVECEXP (x, i, j), XVECEXP (y, i, j),
1716                                       movables, regs) == 0)
1717               return 0;
1718           break;
1719
1720         case 'e':
1721           if (rtx_equal_for_loop_p (XEXP (x, i), XEXP (y, i), movables, regs)
1722               == 0)
1723             return 0;
1724           break;
1725
1726         case 's':
1727           if (strcmp (XSTR (x, i), XSTR (y, i)))
1728             return 0;
1729           break;
1730
1731         case 'u':
1732           /* These are just backpointers, so they don't matter.  */
1733           break;
1734
1735         case '0':
1736           break;
1737
1738           /* It is believed that rtx's at this level will never
1739              contain anything but integers and other rtx's,
1740              except for within LABEL_REFs and SYMBOL_REFs.  */
1741         default:
1742           abort ();
1743         }
1744     }
1745   return 1;
1746 }
1747 \f
1748 /* If X contains any LABEL_REF's, add REG_LABEL notes for them to all
1749    insns in INSNS which use the reference.  LABEL_NUSES for CODE_LABEL
1750    references is incremented once for each added note.  */
1751
1752 static void
1753 add_label_notes (x, insns)
1754      rtx x;
1755      rtx insns;
1756 {
1757   enum rtx_code code = GET_CODE (x);
1758   int i, j;
1759   const char *fmt;
1760   rtx insn;
1761
1762   if (code == LABEL_REF && !LABEL_REF_NONLOCAL_P (x))
1763     {
1764       /* This code used to ignore labels that referred to dispatch tables to
1765          avoid flow generating (slighly) worse code.
1766
1767          We no longer ignore such label references (see LABEL_REF handling in
1768          mark_jump_label for additional information).  */
1769       for (insn = insns; insn; insn = NEXT_INSN (insn))
1770         if (reg_mentioned_p (XEXP (x, 0), insn))
1771           {
1772             REG_NOTES (insn) = gen_rtx_INSN_LIST (REG_LABEL, XEXP (x, 0),
1773                                                   REG_NOTES (insn));
1774             if (LABEL_P (XEXP (x, 0)))
1775               LABEL_NUSES (XEXP (x, 0))++;
1776           }
1777     }
1778
1779   fmt = GET_RTX_FORMAT (code);
1780   for (i = GET_RTX_LENGTH (code) - 1; i >= 0; i--)
1781     {
1782       if (fmt[i] == 'e')
1783         add_label_notes (XEXP (x, i), insns);
1784       else if (fmt[i] == 'E')
1785         for (j = XVECLEN (x, i) - 1; j >= 0; j--)
1786           add_label_notes (XVECEXP (x, i, j), insns);
1787     }
1788 }
1789 \f
1790 /* Scan MOVABLES, and move the insns that deserve to be moved.
1791    If two matching movables are combined, replace one reg with the
1792    other throughout.  */
1793
1794 static void
1795 move_movables (loop, movables, threshold, insn_count)
1796      struct loop *loop;
1797      struct loop_movables *movables;
1798      int threshold;
1799      int insn_count;
1800 {
1801   struct loop_regs *regs = LOOP_REGS (loop);
1802   int nregs = regs->num;
1803   rtx new_start = 0;
1804   struct movable *m;
1805   rtx p;
1806   rtx loop_start = loop->start;
1807   rtx loop_end = loop->end;
1808   /* Map of pseudo-register replacements to handle combining
1809      when we move several insns that load the same value
1810      into different pseudo-registers.  */
1811   rtx *reg_map = (rtx *) xcalloc (nregs, sizeof (rtx));
1812   char *already_moved = (char *) xcalloc (nregs, sizeof (char));
1813
1814   for (m = movables->head; m; m = m->next)
1815     {
1816       /* Describe this movable insn.  */
1817
1818       if (loop_dump_stream)
1819         {
1820           fprintf (loop_dump_stream, "Insn %d: regno %d (life %d), ",
1821                    INSN_UID (m->insn), m->regno, m->lifetime);
1822           if (m->consec > 0)
1823             fprintf (loop_dump_stream, "consec %d, ", m->consec);
1824           if (m->cond)
1825             fprintf (loop_dump_stream, "cond ");
1826           if (m->force)
1827             fprintf (loop_dump_stream, "force ");
1828           if (m->global)
1829             fprintf (loop_dump_stream, "global ");
1830           if (m->done)
1831             fprintf (loop_dump_stream, "done ");
1832           if (m->move_insn)
1833             fprintf (loop_dump_stream, "move-insn ");
1834           if (m->match)
1835             fprintf (loop_dump_stream, "matches %d ",
1836                      INSN_UID (m->match->insn));
1837           if (m->forces)
1838             fprintf (loop_dump_stream, "forces %d ",
1839                      INSN_UID (m->forces->insn));
1840         }
1841
1842       /* Ignore the insn if it's already done (it matched something else).
1843          Otherwise, see if it is now safe to move.  */
1844
1845       if (!m->done
1846           && (! m->cond
1847               || (1 == loop_invariant_p (loop, m->set_src)
1848                   && (m->dependencies == 0
1849                       || 1 == loop_invariant_p (loop, m->dependencies))
1850                   && (m->consec == 0
1851                       || 1 == consec_sets_invariant_p (loop, m->set_dest,
1852                                                        m->consec + 1,
1853                                                        m->insn))))
1854           && (! m->forces || m->forces->done))
1855         {
1856           int regno;
1857           rtx p;
1858           int savings = m->savings;
1859
1860           /* We have an insn that is safe to move.
1861              Compute its desirability.  */
1862
1863           p = m->insn;
1864           regno = m->regno;
1865
1866           if (loop_dump_stream)
1867             fprintf (loop_dump_stream, "savings %d ", savings);
1868
1869           if (regs->array[regno].moved_once && loop_dump_stream)
1870             fprintf (loop_dump_stream, "halved since already moved ");
1871
1872           /* An insn MUST be moved if we already moved something else
1873              which is safe only if this one is moved too: that is,
1874              if already_moved[REGNO] is nonzero.  */
1875
1876           /* An insn is desirable to move if the new lifetime of the
1877              register is no more than THRESHOLD times the old lifetime.
1878              If it's not desirable, it means the loop is so big
1879              that moving won't speed things up much,
1880              and it is liable to make register usage worse.  */
1881
1882           /* It is also desirable to move if it can be moved at no
1883              extra cost because something else was already moved.  */
1884
1885           if (already_moved[regno]
1886               || flag_move_all_movables
1887               || (threshold * savings * m->lifetime) >=
1888                  (regs->array[regno].moved_once ? insn_count * 2 : insn_count)
1889               || (m->forces && m->forces->done
1890                   && regs->array[m->forces->regno].n_times_set == 1))
1891             {
1892               int count;
1893               struct movable *m1;
1894               rtx first = NULL_RTX;
1895               rtx newreg = NULL_RTX;
1896
1897               if (m->insert_temp)
1898                 newreg = gen_reg_rtx (GET_MODE (m->set_dest));
1899
1900               /* Now move the insns that set the reg.  */
1901
1902               if (m->partial && m->match)
1903                 {
1904                   rtx newpat, i1;
1905                   rtx r1, r2;
1906                   /* Find the end of this chain of matching regs.
1907                      Thus, we load each reg in the chain from that one reg.
1908                      And that reg is loaded with 0 directly,
1909                      since it has ->match == 0.  */
1910                   for (m1 = m; m1->match; m1 = m1->match);
1911                   newpat = gen_move_insn (SET_DEST (PATTERN (m->insn)),
1912                                           SET_DEST (PATTERN (m1->insn)));
1913                   i1 = loop_insn_hoist (loop, newpat);
1914
1915                   /* Mark the moved, invariant reg as being allowed to
1916                      share a hard reg with the other matching invariant.  */
1917                   REG_NOTES (i1) = REG_NOTES (m->insn);
1918                   r1 = SET_DEST (PATTERN (m->insn));
1919                   r2 = SET_DEST (PATTERN (m1->insn));
1920                   regs_may_share
1921                     = gen_rtx_EXPR_LIST (VOIDmode, r1,
1922                                          gen_rtx_EXPR_LIST (VOIDmode, r2,
1923                                                             regs_may_share));
1924                   delete_insn (m->insn);
1925
1926                   if (new_start == 0)
1927                     new_start = i1;
1928
1929                   if (loop_dump_stream)
1930                     fprintf (loop_dump_stream, " moved to %d", INSN_UID (i1));
1931                 }
1932               /* If we are to re-generate the item being moved with a
1933                  new move insn, first delete what we have and then emit
1934                  the move insn before the loop.  */
1935               else if (m->move_insn)
1936                 {
1937                   rtx i1, temp, seq;
1938
1939                   for (count = m->consec; count >= 0; count--)
1940                     {
1941                       /* If this is the first insn of a library call sequence,
1942                          something is very wrong.  */
1943                       if (GET_CODE (p) != NOTE
1944                           && (temp = find_reg_note (p, REG_LIBCALL, NULL_RTX)))
1945                         abort ();
1946
1947                       /* If this is the last insn of a libcall sequence, then
1948                          delete every insn in the sequence except the last.
1949                          The last insn is handled in the normal manner.  */
1950                       if (GET_CODE (p) != NOTE
1951                           && (temp = find_reg_note (p, REG_RETVAL, NULL_RTX)))
1952                         {
1953                           temp = XEXP (temp, 0);
1954                           while (temp != p)
1955                             temp = delete_insn (temp);
1956                         }
1957
1958                       temp = p;
1959                       p = delete_insn (p);
1960
1961                       /* simplify_giv_expr expects that it can walk the insns
1962                          at m->insn forwards and see this old sequence we are
1963                          tossing here.  delete_insn does preserve the next
1964                          pointers, but when we skip over a NOTE we must fix
1965                          it up.  Otherwise that code walks into the non-deleted
1966                          insn stream.  */
1967                       while (p && GET_CODE (p) == NOTE)
1968                         p = NEXT_INSN (temp) = NEXT_INSN (p);
1969
1970                       if (m->insert_temp)
1971                         {
1972                           /* Replace the original insn with a move from
1973                              our newly created temp.  */
1974                           start_sequence ();
1975                           emit_move_insn (m->set_dest, newreg);
1976                           seq = get_insns ();
1977                           end_sequence ();
1978                           emit_insn_before (seq, p);
1979                         }
1980                     }
1981
1982                   start_sequence ();
1983                   emit_move_insn (m->insert_temp ? newreg : m->set_dest,
1984                                   m->set_src);
1985                   seq = get_insns ();
1986                   end_sequence ();
1987
1988                   add_label_notes (m->set_src, seq);
1989
1990                   i1 = loop_insn_hoist (loop, seq);
1991                   if (! find_reg_note (i1, REG_EQUAL, NULL_RTX))
1992                     set_unique_reg_note (i1,
1993                                          m->is_equiv ? REG_EQUIV : REG_EQUAL,
1994                                          m->set_src);
1995
1996                   if (loop_dump_stream)
1997                     fprintf (loop_dump_stream, " moved to %d", INSN_UID (i1));
1998
1999                   /* The more regs we move, the less we like moving them.  */
2000                   threshold -= 3;
2001                 }
2002               else
2003                 {
2004                   for (count = m->consec; count >= 0; count--)
2005                     {
2006                       rtx i1, temp;
2007
2008                       /* If first insn of libcall sequence, skip to end.  */
2009                       /* Do this at start of loop, since p is guaranteed to
2010                          be an insn here.  */
2011                       if (GET_CODE (p) != NOTE
2012                           && (temp = find_reg_note (p, REG_LIBCALL, NULL_RTX)))
2013                         p = XEXP (temp, 0);
2014
2015                       /* If last insn of libcall sequence, move all
2016                          insns except the last before the loop.  The last
2017                          insn is handled in the normal manner.  */
2018                       if (GET_CODE (p) != NOTE
2019                           && (temp = find_reg_note (p, REG_RETVAL, NULL_RTX)))
2020                         {
2021                           rtx fn_address = 0;
2022                           rtx fn_reg = 0;
2023                           rtx fn_address_insn = 0;
2024
2025                           first = 0;
2026                           for (temp = XEXP (temp, 0); temp != p;
2027                                temp = NEXT_INSN (temp))
2028                             {
2029                               rtx body;
2030                               rtx n;
2031                               rtx next;
2032
2033                               if (GET_CODE (temp) == NOTE)
2034                                 continue;
2035
2036                               body = PATTERN (temp);
2037
2038                               /* Find the next insn after TEMP,
2039                                  not counting USE or NOTE insns.  */
2040                               for (next = NEXT_INSN (temp); next != p;
2041                                    next = NEXT_INSN (next))
2042                                 if (! (GET_CODE (next) == INSN
2043                                        && GET_CODE (PATTERN (next)) == USE)
2044                                     && GET_CODE (next) != NOTE)
2045                                   break;
2046
2047                               /* If that is the call, this may be the insn
2048                                  that loads the function address.
2049
2050                                  Extract the function address from the insn
2051                                  that loads it into a register.
2052                                  If this insn was cse'd, we get incorrect code.
2053
2054                                  So emit a new move insn that copies the
2055                                  function address into the register that the
2056                                  call insn will use.  flow.c will delete any
2057                                  redundant stores that we have created.  */
2058                               if (GET_CODE (next) == CALL_INSN
2059                                   && GET_CODE (body) == SET
2060                                   && GET_CODE (SET_DEST (body)) == REG
2061                                   && (n = find_reg_note (temp, REG_EQUAL,
2062                                                          NULL_RTX)))
2063                                 {
2064                                   fn_reg = SET_SRC (body);
2065                                   if (GET_CODE (fn_reg) != REG)
2066                                     fn_reg = SET_DEST (body);
2067                                   fn_address = XEXP (n, 0);
2068                                   fn_address_insn = temp;
2069                                 }
2070                               /* We have the call insn.
2071                                  If it uses the register we suspect it might,
2072                                  load it with the correct address directly.  */
2073                               if (GET_CODE (temp) == CALL_INSN
2074                                   && fn_address != 0
2075                                   && reg_referenced_p (fn_reg, body))
2076                                 loop_insn_emit_after (loop, 0, fn_address_insn,
2077                                                       gen_move_insn
2078                                                       (fn_reg, fn_address));
2079
2080                               if (GET_CODE (temp) == CALL_INSN)
2081                                 {
2082                                   i1 = loop_call_insn_hoist (loop, body);
2083                                   /* Because the USAGE information potentially
2084                                      contains objects other than hard registers
2085                                      we need to copy it.  */
2086                                   if (CALL_INSN_FUNCTION_USAGE (temp))
2087                                     CALL_INSN_FUNCTION_USAGE (i1)
2088                                       = copy_rtx (CALL_INSN_FUNCTION_USAGE (temp));
2089                                 }
2090                               else
2091                                 i1 = loop_insn_hoist (loop, body);
2092                               if (first == 0)
2093                                 first = i1;
2094                               if (temp == fn_address_insn)
2095                                 fn_address_insn = i1;
2096                               REG_NOTES (i1) = REG_NOTES (temp);
2097                               REG_NOTES (temp) = NULL;
2098                               delete_insn (temp);
2099                             }
2100                           if (new_start == 0)
2101                             new_start = first;
2102                         }
2103                       if (m->savemode != VOIDmode)
2104                         {
2105                           /* P sets REG to zero; but we should clear only
2106                              the bits that are not covered by the mode
2107                              m->savemode.  */
2108                           rtx reg = m->set_dest;
2109                           rtx sequence;
2110                           rtx tem;
2111
2112                           start_sequence ();
2113                           tem = expand_simple_binop
2114                             (GET_MODE (reg), AND, reg,
2115                              GEN_INT ((((HOST_WIDE_INT) 1
2116                                         << GET_MODE_BITSIZE (m->savemode)))
2117                                       - 1),
2118                              reg, 1, OPTAB_LIB_WIDEN);
2119                           if (tem == 0)
2120                             abort ();
2121                           if (tem != reg)
2122                             emit_move_insn (reg, tem);
2123                           sequence = get_insns ();
2124                           end_sequence ();
2125                           i1 = loop_insn_hoist (loop, sequence);
2126                         }
2127                       else if (GET_CODE (p) == CALL_INSN)
2128                         {
2129                           i1 = loop_call_insn_hoist (loop, PATTERN (p));
2130                           /* Because the USAGE information potentially
2131                              contains objects other than hard registers
2132                              we need to copy it.  */
2133                           if (CALL_INSN_FUNCTION_USAGE (p))
2134                             CALL_INSN_FUNCTION_USAGE (i1)
2135                               = copy_rtx (CALL_INSN_FUNCTION_USAGE (p));
2136                         }
2137                       else if (count == m->consec && m->move_insn_first)
2138                         {
2139                           rtx seq;
2140                           /* The SET_SRC might not be invariant, so we must
2141                              use the REG_EQUAL note.  */
2142                           start_sequence ();
2143                           emit_move_insn (m->set_dest, m->set_src);
2144                           seq = get_insns ();
2145                           end_sequence ();
2146
2147                           add_label_notes (m->set_src, seq);
2148
2149                           i1 = loop_insn_hoist (loop, seq);
2150                           if (! find_reg_note (i1, REG_EQUAL, NULL_RTX))
2151                             set_unique_reg_note (i1, m->is_equiv ? REG_EQUIV
2152                                                      : REG_EQUAL, m->set_src);
2153                         }
2154                       else if (m->insert_temp)
2155                         {
2156                           rtx *reg_map2 = (rtx *) xcalloc (REGNO (newreg),
2157                                 sizeof(rtx));
2158                           reg_map2 [m->regno] = newreg;
2159
2160                           i1 = loop_insn_hoist (loop, copy_rtx (PATTERN (p)));
2161                           replace_regs (i1, reg_map2, REGNO (newreg), 1);
2162                           free (reg_map2);
2163                         }
2164                       else
2165                         i1 = loop_insn_hoist (loop, PATTERN (p));
2166
2167                       if (REG_NOTES (i1) == 0)
2168                         {
2169                           REG_NOTES (i1) = REG_NOTES (p);
2170                           REG_NOTES (p) = NULL;
2171
2172                           /* If there is a REG_EQUAL note present whose value
2173                              is not loop invariant, then delete it, since it
2174                              may cause problems with later optimization passes.
2175                              It is possible for cse to create such notes
2176                              like this as a result of record_jump_cond.  */
2177
2178                           if ((temp = find_reg_note (i1, REG_EQUAL, NULL_RTX))
2179                               && ! loop_invariant_p (loop, XEXP (temp, 0)))
2180                             remove_note (i1, temp);
2181                         }
2182
2183                       if (new_start == 0)
2184                         new_start = i1;
2185
2186                       if (loop_dump_stream)
2187                         fprintf (loop_dump_stream, " moved to %d",
2188                                  INSN_UID (i1));
2189
2190                       /* If library call, now fix the REG_NOTES that contain
2191                          insn pointers, namely REG_LIBCALL on FIRST
2192                          and REG_RETVAL on I1.  */
2193                       if ((temp = find_reg_note (i1, REG_RETVAL, NULL_RTX)))
2194                         {
2195                           XEXP (temp, 0) = first;
2196                           temp = find_reg_note (first, REG_LIBCALL, NULL_RTX);
2197                           XEXP (temp, 0) = i1;
2198                         }
2199
2200                       temp = p;
2201                       delete_insn (p);
2202                       p = NEXT_INSN (p);
2203
2204                       /* simplify_giv_expr expects that it can walk the insns
2205                          at m->insn forwards and see this old sequence we are
2206                          tossing here.  delete_insn does preserve the next
2207                          pointers, but when we skip over a NOTE we must fix
2208                          it up.  Otherwise that code walks into the non-deleted
2209                          insn stream.  */
2210                       while (p && GET_CODE (p) == NOTE)
2211                         p = NEXT_INSN (temp) = NEXT_INSN (p);
2212
2213                       if (m->insert_temp)
2214                         {
2215                           rtx seq;
2216                           /* Replace the original insn with a move from
2217                              our newly created temp.  */
2218                           start_sequence ();
2219                           emit_move_insn (m->set_dest, newreg);
2220                           seq = get_insns ();
2221                           end_sequence ();
2222                           emit_insn_before (seq, p);
2223                         }
2224                     }
2225
2226                   /* The more regs we move, the less we like moving them.  */
2227                   threshold -= 3;
2228                 }
2229
2230               m->done = 1;
2231
2232               if (!m->insert_temp)
2233                 {
2234                   /* Any other movable that loads the same register
2235                      MUST be moved.  */
2236                   already_moved[regno] = 1;
2237
2238                   /* This reg has been moved out of one loop.  */
2239                   regs->array[regno].moved_once = 1;
2240
2241                   /* The reg set here is now invariant.  */
2242                   if (! m->partial)
2243                     {
2244                       int i;
2245                       for (i = 0; i < LOOP_REGNO_NREGS (regno, m->set_dest); i++)
2246                         regs->array[regno+i].set_in_loop = 0;
2247                     }
2248
2249                   /* Change the length-of-life info for the register
2250                      to say it lives at least the full length of this loop.
2251                      This will help guide optimizations in outer loops.  */
2252
2253                   if (REGNO_FIRST_LUID (regno) > INSN_LUID (loop_start))
2254                     /* This is the old insn before all the moved insns.
2255                        We can't use the moved insn because it is out of range
2256                        in uid_luid.  Only the old insns have luids.  */
2257                     REGNO_FIRST_UID (regno) = INSN_UID (loop_start);
2258                   if (REGNO_LAST_LUID (regno) < INSN_LUID (loop_end))
2259                     REGNO_LAST_UID (regno) = INSN_UID (loop_end);
2260                 }
2261
2262               /* Combine with this moved insn any other matching movables.  */
2263
2264               if (! m->partial)
2265                 for (m1 = movables->head; m1; m1 = m1->next)
2266                   if (m1->match == m)
2267                     {
2268                       rtx temp;
2269
2270                       /* Schedule the reg loaded by M1
2271                          for replacement so that shares the reg of M.
2272                          If the modes differ (only possible in restricted
2273                          circumstances, make a SUBREG.
2274
2275                          Note this assumes that the target dependent files
2276                          treat REG and SUBREG equally, including within
2277                          GO_IF_LEGITIMATE_ADDRESS and in all the
2278                          predicates since we never verify that replacing the
2279                          original register with a SUBREG results in a
2280                          recognizable insn.  */
2281                       if (GET_MODE (m->set_dest) == GET_MODE (m1->set_dest))
2282                         reg_map[m1->regno] = m->set_dest;
2283                       else
2284                         reg_map[m1->regno]
2285                           = gen_lowpart_common (GET_MODE (m1->set_dest),
2286                                                 m->set_dest);
2287
2288                       /* Get rid of the matching insn
2289                          and prevent further processing of it.  */
2290                       m1->done = 1;
2291
2292                       /* if library call, delete all insns.  */
2293                       if ((temp = find_reg_note (m1->insn, REG_RETVAL,
2294                                                  NULL_RTX)))
2295                         delete_insn_chain (XEXP (temp, 0), m1->insn);
2296                       else
2297                         delete_insn (m1->insn);
2298
2299                       /* Any other movable that loads the same register
2300                          MUST be moved.  */
2301                       already_moved[m1->regno] = 1;
2302
2303                       /* The reg merged here is now invariant,
2304                          if the reg it matches is invariant.  */
2305                       if (! m->partial)
2306                         {
2307                           int i;
2308                           for (i = 0;
2309                                i < LOOP_REGNO_NREGS (regno, m1->set_dest);
2310                                i++)
2311                             regs->array[m1->regno+i].set_in_loop = 0;
2312                         }
2313                     }
2314             }
2315           else if (loop_dump_stream)
2316             fprintf (loop_dump_stream, "not desirable");
2317         }
2318       else if (loop_dump_stream && !m->match)
2319         fprintf (loop_dump_stream, "not safe");
2320
2321       if (loop_dump_stream)
2322         fprintf (loop_dump_stream, "\n");
2323     }
2324
2325   if (new_start == 0)
2326     new_start = loop_start;
2327
2328   /* Go through all the instructions in the loop, making
2329      all the register substitutions scheduled in REG_MAP.  */
2330   for (p = new_start; p != loop_end; p = NEXT_INSN (p))
2331     if (GET_CODE (p) == INSN || GET_CODE (p) == JUMP_INSN
2332         || GET_CODE (p) == CALL_INSN)
2333       {
2334         replace_regs (PATTERN (p), reg_map, nregs, 0);
2335         replace_regs (REG_NOTES (p), reg_map, nregs, 0);
2336         INSN_CODE (p) = -1;
2337       }
2338
2339   /* Clean up.  */
2340   free (reg_map);
2341   free (already_moved);
2342 }
2343
2344
2345 static void
2346 loop_movables_add (movables, m)
2347      struct loop_movables *movables;
2348      struct movable *m;
2349 {
2350   if (movables->head == 0)
2351     movables->head = m;
2352   else
2353     movables->last->next = m;
2354   movables->last = m;
2355 }
2356
2357
2358 static void
2359 loop_movables_free (movables)
2360      struct loop_movables *movables;
2361 {
2362   struct movable *m;
2363   struct movable *m_next;
2364
2365   for (m = movables->head; m; m = m_next)
2366     {
2367       m_next = m->next;
2368       free (m);
2369     }
2370 }
2371 \f
2372 #if 0
2373 /* Scan X and replace the address of any MEM in it with ADDR.
2374    REG is the address that MEM should have before the replacement.  */
2375
2376 static void
2377 replace_call_address (x, reg, addr)
2378      rtx x, reg, addr;
2379 {
2380   enum rtx_code code;
2381   int i;
2382   const char *fmt;
2383
2384   if (x == 0)
2385     return;
2386   code = GET_CODE (x);
2387   switch (code)
2388     {
2389     case PC:
2390     case CC0:
2391     case CONST_INT:
2392     case CONST_DOUBLE:
2393     case CONST:
2394     case SYMBOL_REF:
2395     case LABEL_REF:
2396     case REG:
2397       return;
2398
2399     case SET:
2400       /* Short cut for very common case.  */
2401       replace_call_address (XEXP (x, 1), reg, addr);
2402       return;
2403
2404     case CALL:
2405       /* Short cut for very common case.  */
2406       replace_call_address (XEXP (x, 0), reg, addr);
2407       return;
2408
2409     case MEM:
2410       /* If this MEM uses a reg other than the one we expected,
2411          something is wrong.  */
2412       if (XEXP (x, 0) != reg)
2413         abort ();
2414       XEXP (x, 0) = addr;
2415       return;
2416
2417     default:
2418       break;
2419     }
2420
2421   fmt = GET_RTX_FORMAT (code);
2422   for (i = GET_RTX_LENGTH (code) - 1; i >= 0; i--)
2423     {
2424       if (fmt[i] == 'e')
2425         replace_call_address (XEXP (x, i), reg, addr);
2426       else if (fmt[i] == 'E')
2427         {
2428           int j;
2429           for (j = 0; j < XVECLEN (x, i); j++)
2430             replace_call_address (XVECEXP (x, i, j), reg, addr);
2431         }
2432     }
2433 }
2434 #endif
2435 \f
2436 /* Return the number of memory refs to addresses that vary
2437    in the rtx X.  */
2438
2439 static int
2440 count_nonfixed_reads (loop, x)
2441      const struct loop *loop;
2442      rtx x;
2443 {
2444   enum rtx_code code;
2445   int i;
2446   const char *fmt;
2447   int value;
2448
2449   if (x == 0)
2450     return 0;
2451
2452   code = GET_CODE (x);
2453   switch (code)
2454     {
2455     case PC:
2456     case CC0:
2457     case CONST_INT:
2458     case CONST_DOUBLE:
2459     case CONST:
2460     case SYMBOL_REF:
2461     case LABEL_REF:
2462     case REG:
2463       return 0;
2464
2465     case MEM:
2466       return ((loop_invariant_p (loop, XEXP (x, 0)) != 1)
2467               + count_nonfixed_reads (loop, XEXP (x, 0)));
2468
2469     default:
2470       break;
2471     }
2472
2473   value = 0;
2474   fmt = GET_RTX_FORMAT (code);
2475   for (i = GET_RTX_LENGTH (code) - 1; i >= 0; i--)
2476     {
2477       if (fmt[i] == 'e')
2478         value += count_nonfixed_reads (loop, XEXP (x, i));
2479       if (fmt[i] == 'E')
2480         {
2481           int j;
2482           for (j = 0; j < XVECLEN (x, i); j++)
2483             value += count_nonfixed_reads (loop, XVECEXP (x, i, j));
2484         }
2485     }
2486   return value;
2487 }
2488 \f
2489 /* Scan a loop setting the elements `cont', `vtop', `loops_enclosed',
2490    `has_call', `has_nonconst_call', `has_volatile', `has_tablejump',
2491    `unknown_address_altered', `unknown_constant_address_altered', and
2492    `num_mem_sets' in LOOP.  Also, fill in the array `mems' and the
2493    list `store_mems' in LOOP.  */
2494
2495 static void
2496 prescan_loop (loop)
2497      struct loop *loop;
2498 {
2499   int level = 1;
2500   rtx insn;
2501   struct loop_info *loop_info = LOOP_INFO (loop);
2502   rtx start = loop->start;
2503   rtx end = loop->end;
2504   /* The label after END.  Jumping here is just like falling off the
2505      end of the loop.  We use next_nonnote_insn instead of next_label
2506      as a hedge against the (pathological) case where some actual insn
2507      might end up between the two.  */
2508   rtx exit_target = next_nonnote_insn (end);
2509
2510   loop_info->has_indirect_jump = indirect_jump_in_function;
2511   loop_info->pre_header_has_call = 0;
2512   loop_info->has_call = 0;
2513   loop_info->has_nonconst_call = 0;
2514   loop_info->has_prefetch = 0;
2515   loop_info->has_volatile = 0;
2516   loop_info->has_tablejump = 0;
2517   loop_info->has_multiple_exit_targets = 0;
2518   loop->level = 1;
2519
2520   loop_info->unknown_address_altered = 0;
2521   loop_info->unknown_constant_address_altered = 0;
2522   loop_info->store_mems = NULL_RTX;
2523   loop_info->first_loop_store_insn = NULL_RTX;
2524   loop_info->mems_idx = 0;
2525   loop_info->num_mem_sets = 0;
2526   /* If loop opts run twice, this was set on 1st pass for 2nd.  */
2527   loop_info->preconditioned = NOTE_PRECONDITIONED (end);
2528
2529   for (insn = start; insn && GET_CODE (insn) != CODE_LABEL;
2530        insn = PREV_INSN (insn))
2531     {
2532       if (GET_CODE (insn) == CALL_INSN)
2533         {
2534           loop_info->pre_header_has_call = 1;
2535           break;
2536         }
2537     }
2538
2539   for (insn = NEXT_INSN (start); insn != NEXT_INSN (end);
2540        insn = NEXT_INSN (insn))
2541     {
2542       switch (GET_CODE (insn))
2543         {
2544         case NOTE:
2545           if (NOTE_LINE_NUMBER (insn) == NOTE_INSN_LOOP_BEG)
2546             {
2547               ++level;
2548               /* Count number of loops contained in this one.  */
2549               loop->level++;
2550             }
2551           else if (NOTE_LINE_NUMBER (insn) == NOTE_INSN_LOOP_END)
2552             --level;
2553           break;
2554
2555         case CALL_INSN:
2556           if (! CONST_OR_PURE_CALL_P (insn))
2557             {
2558               loop_info->unknown_address_altered = 1;
2559               loop_info->has_nonconst_call = 1;
2560             }
2561           else if (pure_call_p (insn))
2562             loop_info->has_nonconst_call = 1;
2563           loop_info->has_call = 1;
2564           if (can_throw_internal (insn))
2565             loop_info->has_multiple_exit_targets = 1;
2566           break;
2567
2568         case JUMP_INSN:
2569           if (! loop_info->has_multiple_exit_targets)
2570             {
2571               rtx set = pc_set (insn);
2572
2573               if (set)
2574                 {
2575                   rtx src = SET_SRC (set);
2576                   rtx label1, label2;
2577
2578                   if (GET_CODE (src) == IF_THEN_ELSE)
2579                     {
2580                       label1 = XEXP (src, 1);
2581                       label2 = XEXP (src, 2);
2582                     }
2583                   else
2584                     {
2585                       label1 = src;
2586                       label2 = NULL_RTX;
2587                     }
2588
2589                   do
2590                     {
2591                       if (label1 && label1 != pc_rtx)
2592                         {
2593                           if (GET_CODE (label1) != LABEL_REF)
2594                             {
2595                               /* Something tricky.  */
2596                               loop_info->has_multiple_exit_targets = 1;
2597                               break;
2598                             }
2599                           else if (XEXP (label1, 0) != exit_target
2600                                    && LABEL_OUTSIDE_LOOP_P (label1))
2601                             {
2602                               /* A jump outside the current loop.  */
2603                               loop_info->has_multiple_exit_targets = 1;
2604                               break;
2605                             }
2606                         }
2607
2608                       label1 = label2;
2609                       label2 = NULL_RTX;
2610                     }
2611                   while (label1);
2612                 }
2613               else
2614                 {
2615                   /* A return, or something tricky.  */
2616                   loop_info->has_multiple_exit_targets = 1;
2617                 }
2618             }
2619           /* FALLTHRU */
2620
2621         case INSN:
2622           if (volatile_refs_p (PATTERN (insn)))
2623             loop_info->has_volatile = 1;
2624
2625           if (GET_CODE (insn) == JUMP_INSN
2626               && (GET_CODE (PATTERN (insn)) == ADDR_DIFF_VEC
2627                   || GET_CODE (PATTERN (insn)) == ADDR_VEC))
2628             loop_info->has_tablejump = 1;
2629
2630           note_stores (PATTERN (insn), note_addr_stored, loop_info);
2631           if (! loop_info->first_loop_store_insn && loop_info->store_mems)
2632             loop_info->first_loop_store_insn = insn;
2633
2634           if (flag_non_call_exceptions && can_throw_internal (insn))
2635             loop_info->has_multiple_exit_targets = 1;
2636           break;
2637
2638         default:
2639           break;
2640         }
2641     }
2642
2643   /* Now, rescan the loop, setting up the LOOP_MEMS array.  */
2644   if (/* An exception thrown by a called function might land us
2645          anywhere.  */
2646       ! loop_info->has_nonconst_call
2647       /* We don't want loads for MEMs moved to a location before the
2648          one at which their stack memory becomes allocated.  (Note
2649          that this is not a problem for malloc, etc., since those
2650          require actual function calls.  */
2651       && ! current_function_calls_alloca
2652       /* There are ways to leave the loop other than falling off the
2653          end.  */
2654       && ! loop_info->has_multiple_exit_targets)
2655     for (insn = NEXT_INSN (start); insn != NEXT_INSN (end);
2656          insn = NEXT_INSN (insn))
2657       for_each_rtx (&insn, insert_loop_mem, loop_info);
2658
2659   /* BLKmode MEMs are added to LOOP_STORE_MEM as necessary so
2660      that loop_invariant_p and load_mems can use true_dependence
2661      to determine what is really clobbered.  */
2662   if (loop_info->unknown_address_altered)
2663     {
2664       rtx mem = gen_rtx_MEM (BLKmode, const0_rtx);
2665
2666       loop_info->store_mems
2667         = gen_rtx_EXPR_LIST (VOIDmode, mem, loop_info->store_mems);
2668     }
2669   if (loop_info->unknown_constant_address_altered)
2670     {
2671       rtx mem = gen_rtx_MEM (BLKmode, const0_rtx);
2672
2673       RTX_UNCHANGING_P (mem) = 1;
2674       loop_info->store_mems
2675         = gen_rtx_EXPR_LIST (VOIDmode, mem, loop_info->store_mems);
2676     }
2677 }
2678 \f
2679 /* Invalidate all loops containing LABEL.  */
2680
2681 static void
2682 invalidate_loops_containing_label (label)
2683      rtx label;
2684 {
2685   struct loop *loop;
2686   for (loop = uid_loop[INSN_UID (label)]; loop; loop = loop->outer)
2687     loop->invalid = 1;
2688 }
2689
2690 /* Scan the function looking for loops.  Record the start and end of each loop.
2691    Also mark as invalid loops any loops that contain a setjmp or are branched
2692    to from outside the loop.  */
2693
2694 static void
2695 find_and_verify_loops (f, loops)
2696      rtx f;
2697      struct loops *loops;
2698 {
2699   rtx insn;
2700   rtx label;
2701   int num_loops;
2702   struct loop *current_loop;
2703   struct loop *next_loop;
2704   struct loop *loop;
2705
2706   num_loops = loops->num;
2707
2708   compute_luids (f, NULL_RTX, 0);
2709
2710   /* If there are jumps to undefined labels,
2711      treat them as jumps out of any/all loops.
2712      This also avoids writing past end of tables when there are no loops.  */
2713   uid_loop[0] = NULL;
2714
2715   /* Find boundaries of loops, mark which loops are contained within
2716      loops, and invalidate loops that have setjmp.  */
2717
2718   num_loops = 0;
2719   current_loop = NULL;
2720   for (insn = f; insn; insn = NEXT_INSN (insn))
2721     {
2722       if (GET_CODE (insn) == NOTE)
2723         switch (NOTE_LINE_NUMBER (insn))
2724           {
2725           case NOTE_INSN_LOOP_BEG:
2726             next_loop = loops->array + num_loops;
2727             next_loop->num = num_loops;
2728             num_loops++;
2729             next_loop->start = insn;
2730             next_loop->outer = current_loop;
2731             current_loop = next_loop;
2732             break;
2733
2734           case NOTE_INSN_LOOP_CONT:
2735             current_loop->cont = insn;
2736             break;
2737
2738           case NOTE_INSN_LOOP_VTOP:
2739             current_loop->vtop = insn;
2740             break;
2741
2742           case NOTE_INSN_LOOP_END:
2743             if (! current_loop)
2744               abort ();
2745
2746             current_loop->end = insn;
2747             current_loop = current_loop->outer;
2748             break;
2749
2750           default:
2751             break;
2752           }
2753
2754       if (GET_CODE (insn) == CALL_INSN
2755           && find_reg_note (insn, REG_SETJMP, NULL))
2756         {
2757           /* In this case, we must invalidate our current loop and any
2758              enclosing loop.  */
2759           for (loop = current_loop; loop; loop = loop->outer)
2760             {
2761               loop->invalid = 1;
2762               if (loop_dump_stream)
2763                 fprintf (loop_dump_stream,
2764                          "\nLoop at %d ignored due to setjmp.\n",
2765                          INSN_UID (loop->start));
2766             }
2767         }
2768
2769       /* Note that this will mark the NOTE_INSN_LOOP_END note as being in the
2770          enclosing loop, but this doesn't matter.  */
2771       uid_loop[INSN_UID (insn)] = current_loop;
2772     }
2773
2774   /* Any loop containing a label used in an initializer must be invalidated,
2775      because it can be jumped into from anywhere.  */
2776   for (label = forced_labels; label; label = XEXP (label, 1))
2777     invalidate_loops_containing_label (XEXP (label, 0));
2778
2779   /* Any loop containing a label used for an exception handler must be
2780      invalidated, because it can be jumped into from anywhere.  */
2781   for_each_eh_label (invalidate_loops_containing_label);
2782
2783   /* Now scan all insn's in the function.  If any JUMP_INSN branches into a
2784      loop that it is not contained within, that loop is marked invalid.
2785      If any INSN or CALL_INSN uses a label's address, then the loop containing
2786      that label is marked invalid, because it could be jumped into from
2787      anywhere.
2788
2789      Also look for blocks of code ending in an unconditional branch that
2790      exits the loop.  If such a block is surrounded by a conditional
2791      branch around the block, move the block elsewhere (see below) and
2792      invert the jump to point to the code block.  This may eliminate a
2793      label in our loop and will simplify processing by both us and a
2794      possible second cse pass.  */
2795
2796   for (insn = f; insn; insn = NEXT_INSN (insn))
2797     if (INSN_P (insn))
2798       {
2799         struct loop *this_loop = uid_loop[INSN_UID (insn)];
2800
2801         if (GET_CODE (insn) == INSN || GET_CODE (insn) == CALL_INSN)
2802           {
2803             rtx note = find_reg_note (insn, REG_LABEL, NULL_RTX);
2804             if (note)
2805               invalidate_loops_containing_label (XEXP (note, 0));
2806           }
2807
2808         if (GET_CODE (insn) != JUMP_INSN)
2809           continue;
2810
2811         mark_loop_jump (PATTERN (insn), this_loop);
2812
2813         /* See if this is an unconditional branch outside the loop.  */
2814         if (this_loop
2815             && (GET_CODE (PATTERN (insn)) == RETURN
2816                 || (any_uncondjump_p (insn)
2817                     && onlyjump_p (insn)
2818                     && (uid_loop[INSN_UID (JUMP_LABEL (insn))]
2819                         != this_loop)))
2820             && get_max_uid () < max_uid_for_loop)
2821           {
2822             rtx p;
2823             rtx our_next = next_real_insn (insn);
2824             rtx last_insn_to_move = NEXT_INSN (insn);
2825             struct loop *dest_loop;
2826             struct loop *outer_loop = NULL;
2827
2828             /* Go backwards until we reach the start of the loop, a label,
2829                or a JUMP_INSN.  */
2830             for (p = PREV_INSN (insn);
2831                  GET_CODE (p) != CODE_LABEL
2832                  && ! (GET_CODE (p) == NOTE
2833                        && NOTE_LINE_NUMBER (p) == NOTE_INSN_LOOP_BEG)
2834                  && GET_CODE (p) != JUMP_INSN;
2835                  p = PREV_INSN (p))
2836               ;
2837
2838             /* Check for the case where we have a jump to an inner nested
2839                loop, and do not perform the optimization in that case.  */
2840
2841             if (JUMP_LABEL (insn))
2842               {
2843                 dest_loop = uid_loop[INSN_UID (JUMP_LABEL (insn))];
2844                 if (dest_loop)
2845                   {
2846                     for (outer_loop = dest_loop; outer_loop;
2847                          outer_loop = outer_loop->outer)
2848                       if (outer_loop == this_loop)
2849                         break;
2850                   }
2851               }
2852
2853             /* Make sure that the target of P is within the current loop.  */
2854
2855             if (GET_CODE (p) == JUMP_INSN && JUMP_LABEL (p)
2856                 && uid_loop[INSN_UID (JUMP_LABEL (p))] != this_loop)
2857               outer_loop = this_loop;
2858
2859             /* If we stopped on a JUMP_INSN to the next insn after INSN,
2860                we have a block of code to try to move.
2861
2862                We look backward and then forward from the target of INSN
2863                to find a BARRIER at the same loop depth as the target.
2864                If we find such a BARRIER, we make a new label for the start
2865                of the block, invert the jump in P and point it to that label,
2866                and move the block of code to the spot we found.  */
2867
2868             if (! outer_loop
2869                 && GET_CODE (p) == JUMP_INSN
2870                 && JUMP_LABEL (p) != 0
2871                 /* Just ignore jumps to labels that were never emitted.
2872                    These always indicate compilation errors.  */
2873                 && INSN_UID (JUMP_LABEL (p)) != 0
2874                 && any_condjump_p (p) && onlyjump_p (p)
2875                 && next_real_insn (JUMP_LABEL (p)) == our_next
2876                 /* If it's not safe to move the sequence, then we
2877                    mustn't try.  */
2878                 && insns_safe_to_move_p (p, NEXT_INSN (insn),
2879                                          &last_insn_to_move))
2880               {
2881                 rtx target
2882                   = JUMP_LABEL (insn) ? JUMP_LABEL (insn) : get_last_insn ();
2883                 struct loop *target_loop = uid_loop[INSN_UID (target)];
2884                 rtx loc, loc2;
2885                 rtx tmp;
2886
2887                 /* Search for possible garbage past the conditional jumps
2888                    and look for the last barrier.  */
2889                 for (tmp = last_insn_to_move;
2890                      tmp && GET_CODE (tmp) != CODE_LABEL; tmp = NEXT_INSN (tmp))
2891                   if (GET_CODE (tmp) == BARRIER)
2892                     last_insn_to_move = tmp;
2893
2894                 for (loc = target; loc; loc = PREV_INSN (loc))
2895                   if (GET_CODE (loc) == BARRIER
2896                       /* Don't move things inside a tablejump.  */
2897                       && ((loc2 = next_nonnote_insn (loc)) == 0
2898                           || GET_CODE (loc2) != CODE_LABEL
2899                           || (loc2 = next_nonnote_insn (loc2)) == 0
2900                           || GET_CODE (loc2) != JUMP_INSN
2901                           || (GET_CODE (PATTERN (loc2)) != ADDR_VEC
2902                               && GET_CODE (PATTERN (loc2)) != ADDR_DIFF_VEC))
2903                       && uid_loop[INSN_UID (loc)] == target_loop)
2904                     break;
2905
2906                 if (loc == 0)
2907                   for (loc = target; loc; loc = NEXT_INSN (loc))
2908                     if (GET_CODE (loc) == BARRIER
2909                         /* Don't move things inside a tablejump.  */
2910                         && ((loc2 = next_nonnote_insn (loc)) == 0
2911                             || GET_CODE (loc2) != CODE_LABEL
2912                             || (loc2 = next_nonnote_insn (loc2)) == 0
2913                             || GET_CODE (loc2) != JUMP_INSN
2914                             || (GET_CODE (PATTERN (loc2)) != ADDR_VEC
2915                                 && GET_CODE (PATTERN (loc2)) != ADDR_DIFF_VEC))
2916                         && uid_loop[INSN_UID (loc)] == target_loop)
2917                       break;
2918
2919                 if (loc)
2920                   {
2921                     rtx cond_label = JUMP_LABEL (p);
2922                     rtx new_label = get_label_after (p);
2923
2924                     /* Ensure our label doesn't go away.  */
2925                     LABEL_NUSES (cond_label)++;
2926
2927                     /* Verify that uid_loop is large enough and that
2928                        we can invert P.  */
2929                     if (invert_jump (p, new_label, 1))
2930                       {
2931                         rtx q, r;
2932
2933                         /* If no suitable BARRIER was found, create a suitable
2934                            one before TARGET.  Since TARGET is a fall through
2935                            path, we'll need to insert a jump around our block
2936                            and add a BARRIER before TARGET.
2937
2938                            This creates an extra unconditional jump outside
2939                            the loop.  However, the benefits of removing rarely
2940                            executed instructions from inside the loop usually
2941                            outweighs the cost of the extra unconditional jump
2942                            outside the loop.  */
2943                         if (loc == 0)
2944                           {
2945                             rtx temp;
2946
2947                             temp = gen_jump (JUMP_LABEL (insn));
2948                             temp = emit_jump_insn_before (temp, target);
2949                             JUMP_LABEL (temp) = JUMP_LABEL (insn);
2950                             LABEL_NUSES (JUMP_LABEL (insn))++;
2951                             loc = emit_barrier_before (target);
2952                           }
2953
2954                         /* Include the BARRIER after INSN and copy the
2955                            block after LOC.  */
2956                         if (squeeze_notes (&new_label, &last_insn_to_move))
2957                           abort ();
2958                         reorder_insns (new_label, last_insn_to_move, loc);
2959
2960                         /* All those insns are now in TARGET_LOOP.  */
2961                         for (q = new_label;
2962                              q != NEXT_INSN (last_insn_to_move);
2963                              q = NEXT_INSN (q))
2964                           uid_loop[INSN_UID (q)] = target_loop;
2965
2966                         /* The label jumped to by INSN is no longer a loop
2967                            exit.  Unless INSN does not have a label (e.g.,
2968                            it is a RETURN insn), search loop->exit_labels
2969                            to find its label_ref, and remove it.  Also turn
2970                            off LABEL_OUTSIDE_LOOP_P bit.  */
2971                         if (JUMP_LABEL (insn))
2972                           {
2973                             for (q = 0, r = this_loop->exit_labels;
2974                                  r;
2975                                  q = r, r = LABEL_NEXTREF (r))
2976                               if (XEXP (r, 0) == JUMP_LABEL (insn))
2977                                 {
2978                                   LABEL_OUTSIDE_LOOP_P (r) = 0;
2979                                   if (q)
2980                                     LABEL_NEXTREF (q) = LABEL_NEXTREF (r);
2981                                   else
2982                                     this_loop->exit_labels = LABEL_NEXTREF (r);
2983                                   break;
2984                                 }
2985
2986                             for (loop = this_loop; loop && loop != target_loop;
2987                                  loop = loop->outer)
2988                               loop->exit_count--;
2989
2990                             /* If we didn't find it, then something is
2991                                wrong.  */
2992                             if (! r)
2993                               abort ();
2994                           }
2995
2996                         /* P is now a jump outside the loop, so it must be put
2997                            in loop->exit_labels, and marked as such.
2998                            The easiest way to do this is to just call
2999                            mark_loop_jump again for P.  */
3000                         mark_loop_jump (PATTERN (p), this_loop);
3001
3002                         /* If INSN now jumps to the insn after it,
3003                            delete INSN.  */
3004                         if (JUMP_LABEL (insn) != 0
3005                             && (next_real_insn (JUMP_LABEL (insn))
3006                                 == next_real_insn (insn)))
3007                           delete_related_insns (insn);
3008                       }
3009
3010                     /* Continue the loop after where the conditional
3011                        branch used to jump, since the only branch insn
3012                        in the block (if it still remains) is an inter-loop
3013                        branch and hence needs no processing.  */
3014                     insn = NEXT_INSN (cond_label);
3015
3016                     if (--LABEL_NUSES (cond_label) == 0)
3017                       delete_related_insns (cond_label);
3018
3019                     /* This loop will be continued with NEXT_INSN (insn).  */
3020                     insn = PREV_INSN (insn);
3021                   }
3022               }
3023           }
3024       }
3025 }
3026
3027 /* If any label in X jumps to a loop different from LOOP_NUM and any of the
3028    loops it is contained in, mark the target loop invalid.
3029
3030    For speed, we assume that X is part of a pattern of a JUMP_INSN.  */
3031
3032 static void
3033 mark_loop_jump (x, loop)
3034      rtx x;
3035      struct loop *loop;
3036 {
3037   struct loop *dest_loop;
3038   struct loop *outer_loop;
3039   int i;
3040
3041   switch (GET_CODE (x))
3042     {
3043     case PC:
3044     case USE:
3045     case CLOBBER:
3046     case REG:
3047     case MEM:
3048     case CONST_INT:
3049     case CONST_DOUBLE:
3050     case RETURN:
3051       return;
3052
3053     case CONST:
3054       /* There could be a label reference in here.  */
3055       mark_loop_jump (XEXP (x, 0), loop);
3056       return;
3057
3058     case PLUS:
3059     case MINUS:
3060     case MULT:
3061       mark_loop_jump (XEXP (x, 0), loop);
3062       mark_loop_jump (XEXP (x, 1), loop);
3063       return;
3064
3065     case LO_SUM:
3066       /* This may refer to a LABEL_REF or SYMBOL_REF.  */
3067       mark_loop_jump (XEXP (x, 1), loop);
3068       return;
3069
3070     case SIGN_EXTEND:
3071     case ZERO_EXTEND:
3072       mark_loop_jump (XEXP (x, 0), loop);
3073       return;
3074
3075     case LABEL_REF:
3076       dest_loop = uid_loop[INSN_UID (XEXP (x, 0))];
3077
3078       /* Link together all labels that branch outside the loop.  This
3079          is used by final_[bg]iv_value and the loop unrolling code.  Also
3080          mark this LABEL_REF so we know that this branch should predict
3081          false.  */
3082
3083       /* A check to make sure the label is not in an inner nested loop,
3084          since this does not count as a loop exit.  */
3085       if (dest_loop)
3086         {
3087           for (outer_loop = dest_loop; outer_loop;
3088                outer_loop = outer_loop->outer)
3089             if (outer_loop == loop)
3090               break;
3091         }
3092       else
3093         outer_loop = NULL;
3094
3095       if (loop && ! outer_loop)
3096         {
3097           LABEL_OUTSIDE_LOOP_P (x) = 1;
3098           LABEL_NEXTREF (x) = loop->exit_labels;
3099           loop->exit_labels = x;
3100
3101           for (outer_loop = loop;
3102                outer_loop && outer_loop != dest_loop;
3103                outer_loop = outer_loop->outer)
3104             outer_loop->exit_count++;
3105         }
3106
3107       /* If this is inside a loop, but not in the current loop or one enclosed
3108          by it, it invalidates at least one loop.  */
3109
3110       if (! dest_loop)
3111         return;
3112
3113       /* We must invalidate every nested loop containing the target of this
3114          label, except those that also contain the jump insn.  */
3115
3116       for (; dest_loop; dest_loop = dest_loop->outer)
3117         {
3118           /* Stop when we reach a loop that also contains the jump insn.  */
3119           for (outer_loop = loop; outer_loop; outer_loop = outer_loop->outer)
3120             if (dest_loop == outer_loop)
3121               return;
3122
3123           /* If we get here, we know we need to invalidate a loop.  */
3124           if (loop_dump_stream && ! dest_loop->invalid)
3125             fprintf (loop_dump_stream,
3126                      "\nLoop at %d ignored due to multiple entry points.\n",
3127                      INSN_UID (dest_loop->start));
3128
3129           dest_loop->invalid = 1;
3130         }
3131       return;
3132
3133     case SET:
3134       /* If this is not setting pc, ignore.  */
3135       if (SET_DEST (x) == pc_rtx)
3136         mark_loop_jump (SET_SRC (x), loop);
3137       return;
3138
3139     case IF_THEN_ELSE:
3140       mark_loop_jump (XEXP (x, 1), loop);
3141       mark_loop_jump (XEXP (x, 2), loop);
3142       return;
3143
3144     case PARALLEL:
3145     case ADDR_VEC:
3146       for (i = 0; i < XVECLEN (x, 0); i++)
3147         mark_loop_jump (XVECEXP (x, 0, i), loop);
3148       return;
3149
3150     case ADDR_DIFF_VEC:
3151       for (i = 0; i < XVECLEN (x, 1); i++)
3152         mark_loop_jump (XVECEXP (x, 1, i), loop);
3153       return;
3154
3155     default:
3156       /* Strictly speaking this is not a jump into the loop, only a possible
3157          jump out of the loop.  However, we have no way to link the destination
3158          of this jump onto the list of exit labels.  To be safe we mark this
3159          loop and any containing loops as invalid.  */
3160       if (loop)
3161         {
3162           for (outer_loop = loop; outer_loop; outer_loop = outer_loop->outer)
3163             {
3164               if (loop_dump_stream && ! outer_loop->invalid)
3165                 fprintf (loop_dump_stream,
3166                          "\nLoop at %d ignored due to unknown exit jump.\n",
3167                          INSN_UID (outer_loop->start));
3168               outer_loop->invalid = 1;
3169             }
3170         }
3171       return;
3172     }
3173 }
3174 \f
3175 /* Return nonzero if there is a label in the range from
3176    insn INSN to and including the insn whose luid is END
3177    INSN must have an assigned luid (i.e., it must not have
3178    been previously created by loop.c).  */
3179
3180 static int
3181 labels_in_range_p (insn, end)
3182      rtx insn;
3183      int end;
3184 {
3185   while (insn && INSN_LUID (insn) <= end)
3186     {
3187       if (GET_CODE (insn) == CODE_LABEL)
3188         return 1;
3189       insn = NEXT_INSN (insn);
3190     }
3191
3192   return 0;
3193 }
3194
3195 /* Record that a memory reference X is being set.  */
3196
3197 static void
3198 note_addr_stored (x, y, data)
3199      rtx x;
3200      rtx y ATTRIBUTE_UNUSED;
3201      void *data ATTRIBUTE_UNUSED;
3202 {
3203   struct loop_info *loop_info = data;
3204
3205   if (x == 0 || GET_CODE (x) != MEM)
3206     return;
3207
3208   /* Count number of memory writes.
3209      This affects heuristics in strength_reduce.  */
3210   loop_info->num_mem_sets++;
3211
3212   /* BLKmode MEM means all memory is clobbered.  */
3213   if (GET_MODE (x) == BLKmode)
3214     {
3215       if (RTX_UNCHANGING_P (x))
3216         loop_info->unknown_constant_address_altered = 1;
3217       else
3218         loop_info->unknown_address_altered = 1;
3219
3220       return;
3221     }
3222
3223   loop_info->store_mems = gen_rtx_EXPR_LIST (VOIDmode, x,
3224                                              loop_info->store_mems);
3225 }
3226
3227 /* X is a value modified by an INSN that references a biv inside a loop
3228    exit test (ie, X is somehow related to the value of the biv).  If X
3229    is a pseudo that is used more than once, then the biv is (effectively)
3230    used more than once.  DATA is a pointer to a loop_regs structure.  */
3231
3232 static void
3233 note_set_pseudo_multiple_uses (x, y, data)
3234      rtx x;
3235      rtx y ATTRIBUTE_UNUSED;
3236      void *data;
3237 {
3238   struct loop_regs *regs = (struct loop_regs *) data;
3239
3240   if (x == 0)
3241     return;
3242
3243   while (GET_CODE (x) == STRICT_LOW_PART
3244          || GET_CODE (x) == SIGN_EXTRACT
3245          || GET_CODE (x) == ZERO_EXTRACT
3246          || GET_CODE (x) == SUBREG)
3247     x = XEXP (x, 0);
3248
3249   if (GET_CODE (x) != REG || REGNO (x) < FIRST_PSEUDO_REGISTER)
3250     return;
3251
3252   /* If we do not have usage information, or if we know the register
3253      is used more than once, note that fact for check_dbra_loop.  */
3254   if (REGNO (x) >= max_reg_before_loop
3255       || ! regs->array[REGNO (x)].single_usage
3256       || regs->array[REGNO (x)].single_usage == const0_rtx)
3257     regs->multiple_uses = 1;
3258 }
3259 \f
3260 /* Return nonzero if the rtx X is invariant over the current loop.
3261
3262    The value is 2 if we refer to something only conditionally invariant.
3263
3264    A memory ref is invariant if it is not volatile and does not conflict
3265    with anything stored in `loop_info->store_mems'.  */
3266
3267 int
3268 loop_invariant_p (loop, x)
3269      const struct loop *loop;
3270      rtx x;
3271 {
3272   struct loop_info *loop_info = LOOP_INFO (loop);
3273   struct loop_regs *regs = LOOP_REGS (loop);
3274   int i;
3275   enum rtx_code code;
3276   const char *fmt;
3277   int conditional = 0;
3278   rtx mem_list_entry;
3279
3280   if (x == 0)
3281     return 1;
3282   code = GET_CODE (x);
3283   switch (code)
3284     {
3285     case CONST_INT:
3286     case CONST_DOUBLE:
3287     case SYMBOL_REF:
3288     case CONST:
3289       return 1;
3290
3291     case LABEL_REF:
3292       /* A LABEL_REF is normally invariant, however, if we are unrolling
3293          loops, and this label is inside the loop, then it isn't invariant.
3294          This is because each unrolled copy of the loop body will have
3295          a copy of this label.  If this was invariant, then an insn loading
3296          the address of this label into a register might get moved outside
3297          the loop, and then each loop body would end up using the same label.
3298
3299          We don't know the loop bounds here though, so just fail for all
3300          labels.  */
3301       if (flag_old_unroll_loops)
3302         return 0;
3303       else
3304         return 1;
3305
3306     case PC:
3307     case CC0:
3308     case UNSPEC_VOLATILE:
3309       return 0;
3310
3311     case REG:
3312       /* We used to check RTX_UNCHANGING_P (x) here, but that is invalid
3313          since the reg might be set by initialization within the loop.  */
3314
3315       if ((x == frame_pointer_rtx || x == hard_frame_pointer_rtx
3316            || x == arg_pointer_rtx || x == pic_offset_table_rtx)
3317           && ! current_function_has_nonlocal_goto)
3318         return 1;
3319
3320       if (LOOP_INFO (loop)->has_call
3321           && REGNO (x) < FIRST_PSEUDO_REGISTER && call_used_regs[REGNO (x)])
3322         return 0;
3323
3324       /* Out-of-range regs can occur when we are called from unrolling.
3325          These have always been created by the unroller and are set in
3326          the loop, hence are never invariant.  */
3327
3328       if (REGNO (x) >= (unsigned) regs->num)
3329         return 0;
3330
3331       if (regs->array[REGNO (x)].set_in_loop < 0)
3332         return 2;
3333
3334       return regs->array[REGNO (x)].set_in_loop == 0;
3335
3336     case MEM:
3337       /* Volatile memory references must be rejected.  Do this before
3338          checking for read-only items, so that volatile read-only items
3339          will be rejected also.  */
3340       if (MEM_VOLATILE_P (x))
3341         return 0;
3342
3343       /* See if there is any dependence between a store and this load.  */
3344       mem_list_entry = loop_info->store_mems;
3345       while (mem_list_entry)
3346         {
3347           if (true_dependence (XEXP (mem_list_entry, 0), VOIDmode,
3348                                x, rtx_varies_p))
3349             return 0;
3350
3351           mem_list_entry = XEXP (mem_list_entry, 1);
3352         }
3353
3354       /* It's not invalidated by a store in memory
3355          but we must still verify the address is invariant.  */
3356       break;
3357
3358     case ASM_OPERANDS:
3359       /* Don't mess with insns declared volatile.  */
3360       if (MEM_VOLATILE_P (x))
3361         return 0;
3362       break;
3363
3364     default:
3365       break;
3366     }
3367
3368   fmt = GET_RTX_FORMAT (code);
3369   for (i = GET_RTX_LENGTH (code) - 1; i >= 0; i--)
3370     {
3371       if (fmt[i] == 'e')
3372         {
3373           int tem = loop_invariant_p (loop, XEXP (x, i));
3374           if (tem == 0)
3375             return 0;
3376           if (tem == 2)
3377             conditional = 1;
3378         }
3379       else if (fmt[i] == 'E')
3380         {
3381           int j;
3382           for (j = 0; j < XVECLEN (x, i); j++)
3383             {
3384               int tem = loop_invariant_p (loop, XVECEXP (x, i, j));
3385               if (tem == 0)
3386                 return 0;
3387               if (tem == 2)
3388                 conditional = 1;
3389             }
3390
3391         }
3392     }
3393
3394   return 1 + conditional;
3395 }
3396 \f
3397 /* Return nonzero if all the insns in the loop that set REG
3398    are INSN and the immediately following insns,
3399    and if each of those insns sets REG in an invariant way
3400    (not counting uses of REG in them).
3401
3402    The value is 2 if some of these insns are only conditionally invariant.
3403
3404    We assume that INSN itself is the first set of REG
3405    and that its source is invariant.  */
3406
3407 static int
3408 consec_sets_invariant_p (loop, reg, n_sets, insn)
3409      const struct loop *loop;
3410      int n_sets;
3411      rtx reg, insn;
3412 {
3413   struct loop_regs *regs = LOOP_REGS (loop);
3414   rtx p = insn;
3415   unsigned int regno = REGNO (reg);
3416   rtx temp;
3417   /* Number of sets we have to insist on finding after INSN.  */
3418   int count = n_sets - 1;
3419   int old = regs->array[regno].set_in_loop;
3420   int value = 0;
3421   int this;
3422
3423   /* If N_SETS hit the limit, we can't rely on its value.  */
3424   if (n_sets == 127)
3425     return 0;
3426
3427   regs->array[regno].set_in_loop = 0;
3428
3429   while (count > 0)
3430     {
3431       enum rtx_code code;
3432       rtx set;
3433
3434       p = NEXT_INSN (p);
3435       code = GET_CODE (p);
3436
3437       /* If library call, skip to end of it.  */
3438       if (code == INSN && (temp = find_reg_note (p, REG_LIBCALL, NULL_RTX)))
3439         p = XEXP (temp, 0);
3440
3441       this = 0;
3442       if (code == INSN
3443           && (set = single_set (p))
3444           && GET_CODE (SET_DEST (set)) == REG
3445           && REGNO (SET_DEST (set)) == regno)
3446         {
3447           this = loop_invariant_p (loop, SET_SRC (set));
3448           if (this != 0)
3449             value |= this;
3450           else if ((temp = find_reg_note (p, REG_EQUAL, NULL_RTX)))
3451             {
3452               /* If this is a libcall, then any invariant REG_EQUAL note is OK.
3453                  If this is an ordinary insn, then only CONSTANT_P REG_EQUAL
3454                  notes are OK.  */
3455               this = (CONSTANT_P (XEXP (temp, 0))
3456                       || (find_reg_note (p, REG_RETVAL, NULL_RTX)
3457                           && loop_invariant_p (loop, XEXP (temp, 0))));
3458               if (this != 0)
3459                 value |= this;
3460             }
3461         }
3462       if (this != 0)
3463         count--;
3464       else if (code != NOTE)
3465         {
3466           regs->array[regno].set_in_loop = old;
3467           return 0;
3468         }
3469     }
3470
3471   regs->array[regno].set_in_loop = old;
3472   /* If loop_invariant_p ever returned 2, we return 2.  */
3473   return 1 + (value & 2);
3474 }
3475
3476 #if 0
3477 /* I don't think this condition is sufficient to allow INSN
3478    to be moved, so we no longer test it.  */
3479
3480 /* Return 1 if all insns in the basic block of INSN and following INSN
3481    that set REG are invariant according to TABLE.  */
3482
3483 static int
3484 all_sets_invariant_p (reg, insn, table)
3485      rtx reg, insn;
3486      short *table;
3487 {
3488   rtx p = insn;
3489   int regno = REGNO (reg);
3490
3491   while (1)
3492     {
3493       enum rtx_code code;
3494       p = NEXT_INSN (p);
3495       code = GET_CODE (p);
3496       if (code == CODE_LABEL || code == JUMP_INSN)
3497         return 1;
3498       if (code == INSN && GET_CODE (PATTERN (p)) == SET
3499           && GET_CODE (SET_DEST (PATTERN (p))) == REG
3500           && REGNO (SET_DEST (PATTERN (p))) == regno)
3501         {
3502           if (! loop_invariant_p (loop, SET_SRC (PATTERN (p)), table))
3503             return 0;
3504         }
3505     }
3506 }
3507 #endif /* 0 */
3508 \f
3509 /* Look at all uses (not sets) of registers in X.  For each, if it is
3510    the single use, set USAGE[REGNO] to INSN; if there was a previous use in
3511    a different insn, set USAGE[REGNO] to const0_rtx.  */
3512
3513 static void
3514 find_single_use_in_loop (regs, insn, x)
3515      struct loop_regs *regs;
3516      rtx insn;
3517      rtx x;
3518 {
3519   enum rtx_code code = GET_CODE (x);
3520   const char *fmt = GET_RTX_FORMAT (code);
3521   int i, j;
3522
3523   if (code == REG)
3524     regs->array[REGNO (x)].single_usage
3525       = (regs->array[REGNO (x)].single_usage != 0
3526          && regs->array[REGNO (x)].single_usage != insn)
3527         ? const0_rtx : insn;
3528
3529   else if (code == SET)
3530     {
3531       /* Don't count SET_DEST if it is a REG; otherwise count things
3532          in SET_DEST because if a register is partially modified, it won't
3533          show up as a potential movable so we don't care how USAGE is set
3534          for it.  */
3535       if (GET_CODE (SET_DEST (x)) != REG)
3536         find_single_use_in_loop (regs, insn, SET_DEST (x));
3537       find_single_use_in_loop (regs, insn, SET_SRC (x));
3538     }
3539   else
3540     for (i = GET_RTX_LENGTH (code) - 1; i >= 0; i--)
3541       {
3542         if (fmt[i] == 'e' && XEXP (x, i) != 0)
3543           find_single_use_in_loop (regs, insn, XEXP (x, i));
3544         else if (fmt[i] == 'E')
3545           for (j = XVECLEN (x, i) - 1; j >= 0; j--)
3546             find_single_use_in_loop (regs, insn, XVECEXP (x, i, j));
3547       }
3548 }
3549 \f
3550 /* Count and record any set in X which is contained in INSN.  Update
3551    REGS->array[I].MAY_NOT_OPTIMIZE and LAST_SET for any register I set
3552    in X.  */
3553
3554 static void
3555 count_one_set (regs, insn, x, last_set)
3556      struct loop_regs *regs;
3557      rtx insn, x;
3558      rtx *last_set;
3559 {
3560   if (GET_CODE (x) == CLOBBER && GET_CODE (XEXP (x, 0)) == REG)
3561     /* Don't move a reg that has an explicit clobber.
3562        It's not worth the pain to try to do it correctly.  */
3563     regs->array[REGNO (XEXP (x, 0))].may_not_optimize = 1;
3564
3565   if (GET_CODE (x) == SET || GET_CODE (x) == CLOBBER)
3566     {
3567       rtx dest = SET_DEST (x);
3568       while (GET_CODE (dest) == SUBREG
3569              || GET_CODE (dest) == ZERO_EXTRACT
3570              || GET_CODE (dest) == SIGN_EXTRACT
3571              || GET_CODE (dest) == STRICT_LOW_PART)
3572         dest = XEXP (dest, 0);
3573       if (GET_CODE (dest) == REG)
3574         {
3575           int i;
3576           int regno = REGNO (dest);
3577           for (i = 0; i < LOOP_REGNO_NREGS (regno, dest); i++)
3578             {
3579               /* If this is the first setting of this reg
3580                  in current basic block, and it was set before,
3581                  it must be set in two basic blocks, so it cannot
3582                  be moved out of the loop.  */
3583               if (regs->array[regno].set_in_loop > 0
3584                   && last_set == 0)
3585                 regs->array[regno+i].may_not_optimize = 1;
3586               /* If this is not first setting in current basic block,
3587                  see if reg was used in between previous one and this.
3588                  If so, neither one can be moved.  */
3589               if (last_set[regno] != 0
3590                   && reg_used_between_p (dest, last_set[regno], insn))
3591                 regs->array[regno+i].may_not_optimize = 1;
3592               if (regs->array[regno+i].set_in_loop < 127)
3593                 ++regs->array[regno+i].set_in_loop;
3594               last_set[regno+i] = insn;
3595             }
3596         }
3597     }
3598 }
3599 \f
3600 /* Given a loop that is bounded by LOOP->START and LOOP->END and that
3601    is entered at LOOP->SCAN_START, return 1 if the register set in SET
3602    contained in insn INSN is used by any insn that precedes INSN in
3603    cyclic order starting from the loop entry point.
3604
3605    We don't want to use INSN_LUID here because if we restrict INSN to those
3606    that have a valid INSN_LUID, it means we cannot move an invariant out
3607    from an inner loop past two loops.  */
3608
3609 static int
3610 loop_reg_used_before_p (loop, set, insn)
3611      const struct loop *loop;
3612      rtx set, insn;
3613 {
3614   rtx reg = SET_DEST (set);
3615   rtx p;
3616
3617   /* Scan forward checking for register usage.  If we hit INSN, we
3618      are done.  Otherwise, if we hit LOOP->END, wrap around to LOOP->START.  */
3619   for (p = loop->scan_start; p != insn; p = NEXT_INSN (p))
3620     {
3621       if (INSN_P (p) && reg_overlap_mentioned_p (reg, PATTERN (p)))
3622         return 1;
3623
3624       if (p == loop->end)
3625         p = loop->start;
3626     }
3627
3628   return 0;
3629 }
3630 \f
3631
3632 /* Information we collect about arrays that we might want to prefetch.  */
3633 struct prefetch_info
3634 {
3635   struct iv_class *class;       /* Class this prefetch is based on.  */
3636   struct induction *giv;        /* GIV this prefetch is based on.  */
3637   rtx base_address;             /* Start prefetching from this address plus
3638                                    index.  */
3639   HOST_WIDE_INT index;
3640   HOST_WIDE_INT stride;         /* Prefetch stride in bytes in each
3641                                    iteration.  */
3642   unsigned int bytes_accessed;  /* Sum of sizes of all accesses to this
3643                                    prefetch area in one iteration.  */
3644   unsigned int total_bytes;     /* Total bytes loop will access in this block.
3645                                    This is set only for loops with known
3646                                    iteration counts and is 0xffffffff
3647                                    otherwise.  */
3648   int prefetch_in_loop;         /* Number of prefetch insns in loop.  */
3649   int prefetch_before_loop;     /* Number of prefetch insns before loop.  */
3650   unsigned int write : 1;       /* 1 for read/write prefetches.  */
3651 };
3652
3653 /* Data used by check_store function.  */
3654 struct check_store_data
3655 {
3656   rtx mem_address;
3657   int mem_write;
3658 };
3659
3660 static void check_store PARAMS ((rtx, rtx, void *));
3661 static void emit_prefetch_instructions PARAMS ((struct loop *));
3662 static int rtx_equal_for_prefetch_p PARAMS ((rtx, rtx));
3663
3664 /* Set mem_write when mem_address is found.  Used as callback to
3665    note_stores.  */
3666 static void
3667 check_store (x, pat, data)
3668      rtx x, pat ATTRIBUTE_UNUSED;
3669      void *data;
3670 {
3671   struct check_store_data *d = (struct check_store_data *) data;
3672
3673   if ((GET_CODE (x) == MEM) && rtx_equal_p (d->mem_address, XEXP (x, 0)))
3674     d->mem_write = 1;
3675 }
3676 \f
3677 /* Like rtx_equal_p, but attempts to swap commutative operands.  This is
3678    important to get some addresses combined.  Later more sophisticated
3679    transformations can be added when necessary.
3680
3681    ??? Same trick with swapping operand is done at several other places.
3682    It can be nice to develop some common way to handle this.  */
3683
3684 static int
3685 rtx_equal_for_prefetch_p (x, y)
3686      rtx x, y;
3687 {
3688   int i;
3689   int j;
3690   enum rtx_code code = GET_CODE (x);
3691   const char *fmt;
3692
3693   if (x == y)
3694     return 1;
3695   if (code != GET_CODE (y))
3696     return 0;
3697
3698   code = GET_CODE (x);
3699
3700   if (GET_RTX_CLASS (code) == 'c')
3701     {
3702       return ((rtx_equal_for_prefetch_p (XEXP (x, 0), XEXP (y, 0))
3703                && rtx_equal_for_prefetch_p (XEXP (x, 1), XEXP (y, 1)))
3704               || (rtx_equal_for_prefetch_p (XEXP (x, 0), XEXP (y, 1))
3705                   && rtx_equal_for_prefetch_p (XEXP (x, 1), XEXP (y, 0))));
3706     }
3707   /* Compare the elements.  If any pair of corresponding elements fails to
3708      match, return 0 for the whole thing.  */
3709
3710   fmt = GET_RTX_FORMAT (code);
3711   for (i = GET_RTX_LENGTH (code) - 1; i >= 0; i--)
3712     {
3713       switch (fmt[i])
3714         {
3715         case 'w':
3716           if (XWINT (x, i) != XWINT (y, i))
3717             return 0;
3718           break;
3719
3720         case 'i':
3721           if (XINT (x, i) != XINT (y, i))
3722             return 0;
3723           break;
3724
3725         case 'E':
3726           /* Two vectors must have the same length.  */
3727           if (XVECLEN (x, i) != XVECLEN (y, i))
3728             return 0;
3729
3730           /* And the corresponding elements must match.  */
3731           for (j = 0; j < XVECLEN (x, i); j++)
3732             if (rtx_equal_for_prefetch_p (XVECEXP (x, i, j),
3733                                           XVECEXP (y, i, j)) == 0)
3734               return 0;
3735           break;
3736
3737         case 'e':
3738           if (rtx_equal_for_prefetch_p (XEXP (x, i), XEXP (y, i)) == 0)
3739             return 0;
3740           break;
3741
3742         case 's':
3743           if (strcmp (XSTR (x, i), XSTR (y, i)))
3744             return 0;
3745           break;
3746
3747         case 'u':
3748           /* These are just backpointers, so they don't matter.  */
3749           break;
3750
3751         case '0':
3752           break;
3753
3754           /* It is believed that rtx's at this level will never
3755              contain anything but integers and other rtx's,
3756              except for within LABEL_REFs and SYMBOL_REFs.  */
3757         default:
3758           abort ();
3759         }
3760     }
3761   return 1;
3762 }
3763 \f
3764 /* Remove constant addition value from the expression X (when present)
3765    and return it.  */
3766
3767 static HOST_WIDE_INT
3768 remove_constant_addition (x)
3769      rtx *x;
3770 {
3771   HOST_WIDE_INT addval = 0;
3772   rtx exp = *x;
3773
3774   /* Avoid clobbering a shared CONST expression.  */
3775   if (GET_CODE (exp) == CONST)
3776     {
3777       if (GET_CODE (XEXP (exp, 0)) == PLUS
3778           && GET_CODE (XEXP (XEXP (exp, 0), 0)) == SYMBOL_REF
3779           && GET_CODE (XEXP (XEXP (exp, 0), 1)) == CONST_INT)
3780         {
3781           *x = XEXP (XEXP (exp, 0), 0);
3782           return INTVAL (XEXP (XEXP (exp, 0), 1));
3783         }
3784       return 0;
3785     }
3786
3787   if (GET_CODE (exp) == CONST_INT)
3788     {
3789       addval = INTVAL (exp);
3790       *x = const0_rtx;
3791     }
3792
3793   /* For plus expression recurse on ourself.  */
3794   else if (GET_CODE (exp) == PLUS)
3795     {
3796       addval += remove_constant_addition (&XEXP (exp, 0));
3797       addval += remove_constant_addition (&XEXP (exp, 1));
3798
3799       /* In case our parameter was constant, remove extra zero from the
3800          expression.  */
3801       if (XEXP (exp, 0) == const0_rtx)
3802         *x = XEXP (exp, 1);
3803       else if (XEXP (exp, 1) == const0_rtx)
3804         *x = XEXP (exp, 0);
3805     }
3806
3807   return addval;
3808 }
3809
3810 /* Attempt to identify accesses to arrays that are most likely to cause cache
3811    misses, and emit prefetch instructions a few prefetch blocks forward.
3812
3813    To detect the arrays we use the GIV information that was collected by the
3814    strength reduction pass.
3815
3816    The prefetch instructions are generated after the GIV information is done
3817    and before the strength reduction process. The new GIVs are injected into
3818    the strength reduction tables, so the prefetch addresses are optimized as
3819    well.
3820
3821    GIVs are split into base address, stride, and constant addition values.
3822    GIVs with the same address, stride and close addition values are combined
3823    into a single prefetch.  Also writes to GIVs are detected, so that prefetch
3824    for write instructions can be used for the block we write to, on machines
3825    that support write prefetches.
3826
3827    Several heuristics are used to determine when to prefetch.  They are
3828    controlled by defined symbols that can be overridden for each target.  */
3829
3830 static void
3831 emit_prefetch_instructions (loop)
3832      struct loop *loop;
3833 {
3834   int num_prefetches = 0;
3835   int num_real_prefetches = 0;
3836   int num_real_write_prefetches = 0;
3837   int num_prefetches_before = 0;
3838   int num_write_prefetches_before = 0;
3839   int ahead = 0;
3840   int i;
3841   struct iv_class *bl;
3842   struct induction *iv;
3843   struct prefetch_info info[MAX_PREFETCHES];
3844   struct loop_ivs *ivs = LOOP_IVS (loop);
3845
3846   if (!HAVE_prefetch)
3847     return;
3848
3849   /* Consider only loops w/o calls.  When a call is done, the loop is probably
3850      slow enough to read the memory.  */
3851   if (PREFETCH_NO_CALL && LOOP_INFO (loop)->has_call)
3852     {
3853       if (loop_dump_stream)
3854         fprintf (loop_dump_stream, "Prefetch: ignoring loop: has call.\n");
3855
3856       return;
3857     }
3858
3859   /* Don't prefetch in loops known to have few iterations.  */
3860   if (PREFETCH_NO_LOW_LOOPCNT
3861       && LOOP_INFO (loop)->n_iterations
3862       && LOOP_INFO (loop)->n_iterations <= PREFETCH_LOW_LOOPCNT)
3863     {
3864       if (loop_dump_stream)
3865         fprintf (loop_dump_stream,
3866                  "Prefetch: ignoring loop: not enough iterations.\n");
3867       return;
3868     }
3869
3870   /* Search all induction variables and pick those interesting for the prefetch
3871      machinery.  */
3872   for (bl = ivs->list; bl; bl = bl->next)
3873     {
3874       struct induction *biv = bl->biv, *biv1;
3875       int basestride = 0;
3876
3877       biv1 = biv;
3878
3879       /* Expect all BIVs to be executed in each iteration.  This makes our
3880          analysis more conservative.  */
3881       while (biv1)
3882         {
3883           /* Discard non-constant additions that we can't handle well yet, and
3884              BIVs that are executed multiple times; such BIVs ought to be
3885              handled in the nested loop.  We accept not_every_iteration BIVs,
3886              since these only result in larger strides and make our
3887              heuristics more conservative.  */
3888           if (GET_CODE (biv->add_val) != CONST_INT)
3889             {
3890               if (loop_dump_stream)
3891                 {
3892                   fprintf (loop_dump_stream,
3893                     "Prefetch: ignoring biv %d: non-constant addition at insn %d:",
3894                            REGNO (biv->src_reg), INSN_UID (biv->insn));
3895                   print_rtl (loop_dump_stream, biv->add_val);
3896                   fprintf (loop_dump_stream, "\n");
3897                 }
3898               break;
3899             }
3900
3901           if (biv->maybe_multiple)
3902             {
3903               if (loop_dump_stream)
3904                 {
3905                   fprintf (loop_dump_stream,
3906                            "Prefetch: ignoring biv %d: maybe_multiple at insn %i:",
3907                            REGNO (biv->src_reg), INSN_UID (biv->insn));
3908                   print_rtl (loop_dump_stream, biv->add_val);
3909                   fprintf (loop_dump_stream, "\n");
3910                 }
3911               break;
3912             }
3913
3914           basestride += INTVAL (biv1->add_val);
3915           biv1 = biv1->next_iv;
3916         }
3917
3918       if (biv1 || !basestride)
3919         continue;
3920
3921       for (iv = bl->giv; iv; iv = iv->next_iv)
3922         {
3923           rtx address;
3924           rtx temp;
3925           HOST_WIDE_INT index = 0;
3926           int add = 1;
3927           HOST_WIDE_INT stride = 0;
3928           int stride_sign = 1;
3929           struct check_store_data d;
3930           const char *ignore_reason = NULL;
3931           int size = GET_MODE_SIZE (GET_MODE (iv));
3932
3933           /* See whether an induction variable is interesting to us and if
3934              not, report the reason.  */
3935           if (iv->giv_type != DEST_ADDR)
3936             ignore_reason = "giv is not a destination address";
3937
3938           /* We are interested only in constant stride memory references
3939              in order to be able to compute density easily.  */
3940           else if (GET_CODE (iv->mult_val) != CONST_INT)
3941             ignore_reason = "stride is not constant";
3942
3943           else
3944             {
3945               stride = INTVAL (iv->mult_val) * basestride;
3946               if (stride < 0)
3947                 {
3948                   stride = -stride;
3949                   stride_sign = -1;
3950                 }
3951
3952               /* On some targets, reversed order prefetches are not
3953                  worthwhile.  */
3954               if (PREFETCH_NO_REVERSE_ORDER && stride_sign < 0)
3955                 ignore_reason = "reversed order stride";
3956
3957               /* Prefetch of accesses with an extreme stride might not be
3958                  worthwhile, either.  */
3959               else if (PREFETCH_NO_EXTREME_STRIDE
3960                        && stride > PREFETCH_EXTREME_STRIDE)
3961                 ignore_reason = "extreme stride";
3962
3963               /* Ignore GIVs with varying add values; we can't predict the
3964                  value for the next iteration.  */
3965               else if (!loop_invariant_p (loop, iv->add_val))
3966                 ignore_reason = "giv has varying add value";
3967
3968               /* Ignore GIVs in the nested loops; they ought to have been
3969                  handled already.  */
3970               else if (iv->maybe_multiple)
3971                 ignore_reason = "giv is in nested loop";
3972             }
3973
3974           if (ignore_reason != NULL)
3975             {
3976               if (loop_dump_stream)
3977                 fprintf (loop_dump_stream,
3978                          "Prefetch: ignoring giv at %d: %s.\n",
3979                          INSN_UID (iv->insn), ignore_reason);
3980               continue;
3981             }
3982
3983           /* Determine the pointer to the basic array we are examining.  It is
3984              the sum of the BIV's initial value and the GIV's add_val.  */
3985           address = copy_rtx (iv->add_val);
3986           temp = copy_rtx (bl->initial_value);
3987
3988           address = simplify_gen_binary (PLUS, Pmode, temp, address);
3989           index = remove_constant_addition (&address);
3990
3991           d.mem_write = 0;
3992           d.mem_address = *iv->location;
3993
3994           /* When the GIV is not always executed, we might be better off by
3995              not dirtying the cache pages.  */
3996           if (PREFETCH_CONDITIONAL || iv->always_executed)
3997             note_stores (PATTERN (iv->insn), check_store, &d);
3998           else
3999             {
4000               if (loop_dump_stream)
4001                 fprintf (loop_dump_stream, "Prefetch: Ignoring giv at %d: %s\n",
4002                          INSN_UID (iv->insn), "in conditional code.");
4003               continue;
4004             }
4005
4006           /* Attempt to find another prefetch to the same array and see if we
4007              can merge this one.  */
4008           for (i = 0; i < num_prefetches; i++)
4009             if (rtx_equal_for_prefetch_p (address, info[i].base_address)
4010                 && stride == info[i].stride)
4011               {
4012                 /* In case both access same array (same location
4013                    just with small difference in constant indexes), merge
4014                    the prefetches.  Just do the later and the earlier will
4015                    get prefetched from previous iteration.
4016                    The artificial threshold should not be too small,
4017                    but also not bigger than small portion of memory usually
4018                    traversed by single loop.  */
4019                 if (index >= info[i].index
4020                     && index - info[i].index < PREFETCH_EXTREME_DIFFERENCE)
4021                   {
4022                     info[i].write |= d.mem_write;
4023                     info[i].bytes_accessed += size;
4024                     info[i].index = index;
4025                     info[i].giv = iv;
4026                     info[i].class = bl;
4027                     info[num_prefetches].base_address = address;
4028                     add = 0;
4029                     break;
4030                   }
4031
4032                 if (index < info[i].index
4033                     && info[i].index - index < PREFETCH_EXTREME_DIFFERENCE)
4034                   {
4035                     info[i].write |= d.mem_write;
4036                     info[i].bytes_accessed += size;
4037                     add = 0;
4038                     break;
4039                   }
4040               }
4041
4042           /* Merging failed.  */
4043           if (add)
4044             {
4045               info[num_prefetches].giv = iv;
4046               info[num_prefetches].class = bl;
4047               info[num_prefetches].index = index;
4048               info[num_prefetches].stride = stride;
4049               info[num_prefetches].base_address = address;
4050               info[num_prefetches].write = d.mem_write;
4051               info[num_prefetches].bytes_accessed = size;
4052               num_prefetches++;
4053               if (num_prefetches >= MAX_PREFETCHES)
4054                 {
4055                   if (loop_dump_stream)
4056                     fprintf (loop_dump_stream,
4057                              "Maximal number of prefetches exceeded.\n");
4058                   return;
4059                 }
4060             }
4061         }
4062     }
4063
4064   for (i = 0; i < num_prefetches; i++)
4065     {
4066       int density;
4067
4068       /* Attempt to calculate the total number of bytes fetched by all
4069          iterations of the loop.  Avoid overflow.  */
4070       if (LOOP_INFO (loop)->n_iterations
4071           && ((unsigned HOST_WIDE_INT) (0xffffffff / info[i].stride)
4072               >= LOOP_INFO (loop)->n_iterations))
4073         info[i].total_bytes = info[i].stride * LOOP_INFO (loop)->n_iterations;
4074       else
4075         info[i].total_bytes = 0xffffffff;
4076
4077       density = info[i].bytes_accessed * 100 / info[i].stride;
4078
4079       /* Prefetch might be worthwhile only when the loads/stores are dense.  */
4080       if (PREFETCH_ONLY_DENSE_MEM)
4081         if (density * 256 > PREFETCH_DENSE_MEM * 100
4082             && (info[i].total_bytes / PREFETCH_BLOCK
4083                 >= PREFETCH_BLOCKS_BEFORE_LOOP_MIN))
4084           {
4085             info[i].prefetch_before_loop = 1;
4086             info[i].prefetch_in_loop
4087               = (info[i].total_bytes / PREFETCH_BLOCK
4088                  > PREFETCH_BLOCKS_BEFORE_LOOP_MAX);
4089           }
4090         else
4091           {
4092             info[i].prefetch_in_loop = 0, info[i].prefetch_before_loop = 0;
4093             if (loop_dump_stream)
4094               fprintf (loop_dump_stream,
4095                   "Prefetch: ignoring giv at %d: %d%% density is too low.\n",
4096                        INSN_UID (info[i].giv->insn), density);
4097           }
4098       else
4099         info[i].prefetch_in_loop = 1, info[i].prefetch_before_loop = 1;
4100
4101       /* Find how many prefetch instructions we'll use within the loop.  */
4102       if (info[i].prefetch_in_loop != 0)
4103         {
4104           info[i].prefetch_in_loop = ((info[i].stride + PREFETCH_BLOCK - 1)
4105                                   / PREFETCH_BLOCK);
4106           num_real_prefetches += info[i].prefetch_in_loop;
4107           if (info[i].write)
4108             num_real_write_prefetches += info[i].prefetch_in_loop;
4109         }
4110     }
4111
4112   /* Determine how many iterations ahead to prefetch within the loop, based
4113      on how many prefetches we currently expect to do within the loop.  */
4114   if (num_real_prefetches != 0)
4115     {
4116       if ((ahead = SIMULTANEOUS_PREFETCHES / num_real_prefetches) == 0)
4117         {
4118           if (loop_dump_stream)
4119             fprintf (loop_dump_stream,
4120                      "Prefetch: ignoring prefetches within loop: ahead is zero; %d < %d\n",
4121                      SIMULTANEOUS_PREFETCHES, num_real_prefetches);
4122           num_real_prefetches = 0, num_real_write_prefetches = 0;
4123         }
4124     }
4125   /* We'll also use AHEAD to determine how many prefetch instructions to
4126      emit before a loop, so don't leave it zero.  */
4127   if (ahead == 0)
4128     ahead = PREFETCH_BLOCKS_BEFORE_LOOP_MAX;
4129
4130   for (i = 0; i < num_prefetches; i++)
4131     {
4132       /* Update if we've decided not to prefetch anything within the loop.  */
4133       if (num_real_prefetches == 0)
4134         info[i].prefetch_in_loop = 0;
4135
4136       /* Find how many prefetch instructions we'll use before the loop.  */
4137       if (info[i].prefetch_before_loop != 0)
4138         {
4139           int n = info[i].total_bytes / PREFETCH_BLOCK;
4140           if (n > ahead)
4141             n = ahead;
4142           info[i].prefetch_before_loop = n;
4143           num_prefetches_before += n;
4144           if (info[i].write)
4145             num_write_prefetches_before += n;
4146         }
4147
4148       if (loop_dump_stream)
4149         {
4150           if (info[i].prefetch_in_loop == 0
4151               && info[i].prefetch_before_loop == 0)
4152             continue;
4153           fprintf (loop_dump_stream, "Prefetch insn: %d",
4154                    INSN_UID (info[i].giv->insn));
4155           fprintf (loop_dump_stream,
4156                    "; in loop: %d; before: %d; %s\n",
4157                    info[i].prefetch_in_loop,
4158                    info[i].prefetch_before_loop,
4159                    info[i].write ? "read/write" : "read only");
4160           fprintf (loop_dump_stream,
4161                    " density: %d%%; bytes_accessed: %u; total_bytes: %u\n",
4162                    (int) (info[i].bytes_accessed * 100 / info[i].stride),
4163                    info[i].bytes_accessed, info[i].total_bytes);
4164           fprintf (loop_dump_stream, " index: ");
4165           fprintf (loop_dump_stream, HOST_WIDE_INT_PRINT_DEC, info[i].index);
4166           fprintf (loop_dump_stream, "; stride: ");
4167           fprintf (loop_dump_stream, HOST_WIDE_INT_PRINT_DEC, info[i].stride);
4168           fprintf (loop_dump_stream, "; address: ");
4169           print_rtl (loop_dump_stream, info[i].base_address);
4170           fprintf (loop_dump_stream, "\n");
4171         }
4172     }
4173
4174   if (num_real_prefetches + num_prefetches_before > 0)
4175     {
4176       /* Record that this loop uses prefetch instructions.  */
4177       LOOP_INFO (loop)->has_prefetch = 1;
4178
4179       if (loop_dump_stream)
4180         {
4181           fprintf (loop_dump_stream, "Real prefetches needed within loop: %d (write: %d)\n",
4182                    num_real_prefetches, num_real_write_prefetches);
4183           fprintf (loop_dump_stream, "Real prefetches needed before loop: %d (write: %d)\n",
4184                    num_prefetches_before, num_write_prefetches_before);
4185         }
4186     }
4187
4188   for (i = 0; i < num_prefetches; i++)
4189     {
4190       int y;
4191
4192       for (y = 0; y < info[i].prefetch_in_loop; y++)
4193         {
4194           rtx loc = copy_rtx (*info[i].giv->location);
4195           rtx insn;
4196           int bytes_ahead = PREFETCH_BLOCK * (ahead + y);
4197           rtx before_insn = info[i].giv->insn;
4198           rtx prev_insn = PREV_INSN (info[i].giv->insn);
4199           rtx seq;
4200
4201           /* We can save some effort by offsetting the address on
4202              architectures with offsettable memory references.  */
4203           if (offsettable_address_p (0, VOIDmode, loc))
4204             loc = plus_constant (loc, bytes_ahead);
4205           else
4206             {
4207               rtx reg = gen_reg_rtx (Pmode);
4208               loop_iv_add_mult_emit_before (loop, loc, const1_rtx,
4209                                             GEN_INT (bytes_ahead), reg,
4210                                             0, before_insn);
4211               loc = reg;
4212             }
4213
4214           start_sequence ();
4215           /* Make sure the address operand is valid for prefetch.  */
4216           if (! (*insn_data[(int)CODE_FOR_prefetch].operand[0].predicate)
4217                   (loc, insn_data[(int)CODE_FOR_prefetch].operand[0].mode))
4218             loc = force_reg (Pmode, loc);
4219           emit_insn (gen_prefetch (loc, GEN_INT (info[i].write),
4220                                    GEN_INT (3)));
4221           seq = get_insns ();
4222           end_sequence ();
4223           emit_insn_before (seq, before_insn);
4224
4225           /* Check all insns emitted and record the new GIV
4226              information.  */
4227           insn = NEXT_INSN (prev_insn);
4228           while (insn != before_insn)
4229             {
4230               insn = check_insn_for_givs (loop, insn,
4231                                           info[i].giv->always_executed,
4232                                           info[i].giv->maybe_multiple);
4233               insn = NEXT_INSN (insn);
4234             }
4235         }
4236
4237       if (PREFETCH_BEFORE_LOOP)
4238         {
4239           /* Emit insns before the loop to fetch the first cache lines or,
4240              if we're not prefetching within the loop, everything we expect
4241              to need.  */
4242           for (y = 0; y < info[i].prefetch_before_loop; y++)
4243             {
4244               rtx reg = gen_reg_rtx (Pmode);
4245               rtx loop_start = loop->start;
4246               rtx init_val = info[i].class->initial_value;
4247               rtx add_val = simplify_gen_binary (PLUS, Pmode,
4248                                                  info[i].giv->add_val,
4249                                                  GEN_INT (y * PREFETCH_BLOCK));
4250
4251               /* Functions called by LOOP_IV_ADD_EMIT_BEFORE expect a
4252                  non-constant INIT_VAL to have the same mode as REG, which
4253                  in this case we know to be Pmode.  */
4254               if (GET_MODE (init_val) != Pmode && !CONSTANT_P (init_val))
4255                 {
4256                   rtx seq;
4257
4258                   start_sequence ();
4259                   init_val = convert_to_mode (Pmode, init_val, 0);
4260                   seq = get_insns ();
4261                   end_sequence ();
4262                   loop_insn_emit_before (loop, 0, loop_start, seq);
4263                 }
4264               loop_iv_add_mult_emit_before (loop, init_val,
4265                                             info[i].giv->mult_val,
4266                                             add_val, reg, 0, loop_start);
4267               emit_insn_before (gen_prefetch (reg, GEN_INT (info[i].write),
4268                                               GEN_INT (3)),
4269                                 loop_start);
4270             }
4271         }
4272     }
4273
4274   return;
4275 }
4276 \f
4277 /* A "basic induction variable" or biv is a pseudo reg that is set
4278    (within this loop) only by incrementing or decrementing it.  */
4279 /* A "general induction variable" or giv is a pseudo reg whose
4280    value is a linear function of a biv.  */
4281
4282 /* Bivs are recognized by `basic_induction_var';
4283    Givs by `general_induction_var'.  */
4284
4285 /* Communication with routines called via `note_stores'.  */
4286
4287 static rtx note_insn;
4288
4289 /* Dummy register to have nonzero DEST_REG for DEST_ADDR type givs.  */
4290
4291 static rtx addr_placeholder;
4292
4293 /* ??? Unfinished optimizations, and possible future optimizations,
4294    for the strength reduction code.  */
4295
4296 /* ??? The interaction of biv elimination, and recognition of 'constant'
4297    bivs, may cause problems.  */
4298
4299 /* ??? Add heuristics so that DEST_ADDR strength reduction does not cause
4300    performance problems.
4301
4302    Perhaps don't eliminate things that can be combined with an addressing
4303    mode.  Find all givs that have the same biv, mult_val, and add_val;
4304    then for each giv, check to see if its only use dies in a following
4305    memory address.  If so, generate a new memory address and check to see
4306    if it is valid.   If it is valid, then store the modified memory address,
4307    otherwise, mark the giv as not done so that it will get its own iv.  */
4308
4309 /* ??? Could try to optimize branches when it is known that a biv is always
4310    positive.  */
4311
4312 /* ??? When replace a biv in a compare insn, we should replace with closest
4313    giv so that an optimized branch can still be recognized by the combiner,
4314    e.g. the VAX acb insn.  */
4315
4316 /* ??? Many of the checks involving uid_luid could be simplified if regscan
4317    was rerun in loop_optimize whenever a register was added or moved.
4318    Also, some of the optimizations could be a little less conservative.  */
4319 \f
4320 /* Scan the loop body and call FNCALL for each insn.  In the addition to the
4321    LOOP and INSN parameters pass MAYBE_MULTIPLE and NOT_EVERY_ITERATION to the
4322    callback.
4323
4324    NOT_EVERY_ITERATION is 1 if current insn is not known to be executed at
4325    least once for every loop iteration except for the last one.
4326
4327    MAYBE_MULTIPLE is 1 if current insn may be executed more than once for every
4328    loop iteration.
4329  */
4330 void
4331 for_each_insn_in_loop (loop, fncall)
4332      struct loop *loop;
4333      loop_insn_callback fncall;
4334 {
4335   int not_every_iteration = 0;
4336   int maybe_multiple = 0;
4337   int past_loop_latch = 0;
4338   int loop_depth = 0;
4339   rtx p;
4340
4341   /* If loop_scan_start points to the loop exit test, we have to be wary of
4342      subversive use of gotos inside expression statements.  */
4343   if (prev_nonnote_insn (loop->scan_start) != prev_nonnote_insn (loop->start))
4344     maybe_multiple = back_branch_in_range_p (loop, loop->scan_start);
4345
4346   /* Scan through loop and update NOT_EVERY_ITERATION and MAYBE_MULTIPLE.  */
4347   for (p = next_insn_in_loop (loop, loop->scan_start);
4348        p != NULL_RTX;
4349        p = next_insn_in_loop (loop, p))
4350     {
4351       p = fncall (loop, p, not_every_iteration, maybe_multiple);
4352
4353       /* Past CODE_LABEL, we get to insns that may be executed multiple
4354          times.  The only way we can be sure that they can't is if every
4355          jump insn between here and the end of the loop either
4356          returns, exits the loop, is a jump to a location that is still
4357          behind the label, or is a jump to the loop start.  */
4358
4359       if (GET_CODE (p) == CODE_LABEL)
4360         {
4361           rtx insn = p;
4362
4363           maybe_multiple = 0;
4364
4365           while (1)
4366             {
4367               insn = NEXT_INSN (insn);
4368               if (insn == loop->scan_start)
4369                 break;
4370               if (insn == loop->end)
4371                 {
4372                   if (loop->top != 0)
4373                     insn = loop->top;
4374                   else
4375                     break;
4376                   if (insn == loop->scan_start)
4377                     break;
4378                 }
4379
4380               if (GET_CODE (insn) == JUMP_INSN
4381                   && GET_CODE (PATTERN (insn)) != RETURN
4382                   && (!any_condjump_p (insn)
4383                       || (JUMP_LABEL (insn) != 0
4384                           && JUMP_LABEL (insn) != loop->scan_start
4385                           && !loop_insn_first_p (p, JUMP_LABEL (insn)))))
4386                 {
4387                   maybe_multiple = 1;
4388                   break;
4389                 }
4390             }
4391         }
4392
4393       /* Past a jump, we get to insns for which we can't count
4394          on whether they will be executed during each iteration.  */
4395       /* This code appears twice in strength_reduce.  There is also similar
4396          code in scan_loop.  */
4397       if (GET_CODE (p) == JUMP_INSN
4398       /* If we enter the loop in the middle, and scan around to the
4399          beginning, don't set not_every_iteration for that.
4400          This can be any kind of jump, since we want to know if insns
4401          will be executed if the loop is executed.  */
4402           && !(JUMP_LABEL (p) == loop->top
4403                && ((NEXT_INSN (NEXT_INSN (p)) == loop->end
4404                     && any_uncondjump_p (p))
4405                    || (NEXT_INSN (p) == loop->end && any_condjump_p (p)))))
4406         {
4407           rtx label = 0;
4408
4409           /* If this is a jump outside the loop, then it also doesn't
4410              matter.  Check to see if the target of this branch is on the
4411              loop->exits_labels list.  */
4412
4413           for (label = loop->exit_labels; label; label = LABEL_NEXTREF (label))
4414             if (XEXP (label, 0) == JUMP_LABEL (p))
4415               break;
4416
4417           if (!label)
4418             not_every_iteration = 1;
4419         }
4420
4421       else if (GET_CODE (p) == NOTE)
4422         {
4423           /* At the virtual top of a converted loop, insns are again known to
4424              be executed each iteration: logically, the loop begins here
4425              even though the exit code has been duplicated.
4426
4427              Insns are also again known to be executed each iteration at
4428              the LOOP_CONT note.  */
4429           if ((NOTE_LINE_NUMBER (p) == NOTE_INSN_LOOP_VTOP
4430                || NOTE_LINE_NUMBER (p) == NOTE_INSN_LOOP_CONT)
4431               && loop_depth == 0)
4432             not_every_iteration = 0;
4433           else if (NOTE_LINE_NUMBER (p) == NOTE_INSN_LOOP_BEG)
4434             loop_depth++;
4435           else if (NOTE_LINE_NUMBER (p) == NOTE_INSN_LOOP_END)
4436             loop_depth--;
4437         }
4438
4439       /* Note if we pass a loop latch.  If we do, then we can not clear
4440          NOT_EVERY_ITERATION below when we pass the last CODE_LABEL in
4441          a loop since a jump before the last CODE_LABEL may have started
4442          a new loop iteration.
4443
4444          Note that LOOP_TOP is only set for rotated loops and we need
4445          this check for all loops, so compare against the CODE_LABEL
4446          which immediately follows LOOP_START.  */
4447       if (GET_CODE (p) == JUMP_INSN
4448           && JUMP_LABEL (p) == NEXT_INSN (loop->start))
4449         past_loop_latch = 1;
4450
4451       /* Unlike in the code motion pass where MAYBE_NEVER indicates that
4452          an insn may never be executed, NOT_EVERY_ITERATION indicates whether
4453          or not an insn is known to be executed each iteration of the
4454          loop, whether or not any iterations are known to occur.
4455
4456          Therefore, if we have just passed a label and have no more labels
4457          between here and the test insn of the loop, and we have not passed
4458          a jump to the top of the loop, then we know these insns will be
4459          executed each iteration.  */
4460
4461       if (not_every_iteration
4462           && !past_loop_latch
4463           && GET_CODE (p) == CODE_LABEL
4464           && no_labels_between_p (p, loop->end)
4465           && loop_insn_first_p (p, loop->cont))
4466         not_every_iteration = 0;
4467     }
4468 }
4469 \f
4470 static void
4471 loop_bivs_find (loop)
4472      struct loop *loop;
4473 {
4474   struct loop_regs *regs = LOOP_REGS (loop);
4475   struct loop_ivs *ivs = LOOP_IVS (loop);
4476   /* Temporary list pointers for traversing ivs->list.  */
4477   struct iv_class *bl, **backbl;
4478
4479   ivs->list = 0;
4480
4481   for_each_insn_in_loop (loop, check_insn_for_bivs);
4482
4483   /* Scan ivs->list to remove all regs that proved not to be bivs.
4484      Make a sanity check against regs->n_times_set.  */
4485   for (backbl = &ivs->list, bl = *backbl; bl; bl = bl->next)
4486     {
4487       if (REG_IV_TYPE (ivs, bl->regno) != BASIC_INDUCT
4488           /* Above happens if register modified by subreg, etc.  */
4489           /* Make sure it is not recognized as a basic induction var: */
4490           || regs->array[bl->regno].n_times_set != bl->biv_count
4491           /* If never incremented, it is invariant that we decided not to
4492              move.  So leave it alone.  */
4493           || ! bl->incremented)
4494         {
4495           if (loop_dump_stream)
4496             fprintf (loop_dump_stream, "Biv %d: discarded, %s\n",
4497                      bl->regno,
4498                      (REG_IV_TYPE (ivs, bl->regno) != BASIC_INDUCT
4499                       ? "not induction variable"
4500                       : (! bl->incremented ? "never incremented"
4501                          : "count error")));
4502
4503           REG_IV_TYPE (ivs, bl->regno) = NOT_BASIC_INDUCT;
4504           *backbl = bl->next;
4505         }
4506       else
4507         {
4508           backbl = &bl->next;
4509
4510           if (loop_dump_stream)
4511             fprintf (loop_dump_stream, "Biv %d: verified\n", bl->regno);
4512         }
4513     }
4514 }
4515
4516
4517 /* Determine how BIVS are initialized by looking through pre-header
4518    extended basic block.  */
4519 static void
4520 loop_bivs_init_find (loop)
4521      struct loop *loop;
4522 {
4523   struct loop_ivs *ivs = LOOP_IVS (loop);
4524   /* Temporary list pointers for traversing ivs->list.  */
4525   struct iv_class *bl;
4526   int call_seen;
4527   rtx p;
4528
4529   /* Find initial value for each biv by searching backwards from loop_start,
4530      halting at first label.  Also record any test condition.  */
4531
4532   call_seen = 0;
4533   for (p = loop->start; p && GET_CODE (p) != CODE_LABEL; p = PREV_INSN (p))
4534     {
4535       rtx test;
4536
4537       note_insn = p;
4538
4539       if (GET_CODE (p) == CALL_INSN)
4540         call_seen = 1;
4541
4542       if (INSN_P (p))
4543         note_stores (PATTERN (p), record_initial, ivs);
4544
4545       /* Record any test of a biv that branches around the loop if no store
4546          between it and the start of loop.  We only care about tests with
4547          constants and registers and only certain of those.  */
4548       if (GET_CODE (p) == JUMP_INSN
4549           && JUMP_LABEL (p) != 0
4550           && next_real_insn (JUMP_LABEL (p)) == next_real_insn (loop->end)
4551           && (test = get_condition_for_loop (loop, p)) != 0
4552           && GET_CODE (XEXP (test, 0)) == REG
4553           && REGNO (XEXP (test, 0)) < max_reg_before_loop
4554           && (bl = REG_IV_CLASS (ivs, REGNO (XEXP (test, 0)))) != 0
4555           && valid_initial_value_p (XEXP (test, 1), p, call_seen, loop->start)
4556           && bl->init_insn == 0)
4557         {
4558           /* If an NE test, we have an initial value!  */
4559           if (GET_CODE (test) == NE)
4560             {
4561               bl->init_insn = p;
4562               bl->init_set = gen_rtx_SET (VOIDmode,
4563                                           XEXP (test, 0), XEXP (test, 1));
4564             }
4565           else
4566             bl->initial_test = test;
4567         }
4568     }
4569 }
4570
4571
4572 /* Look at the each biv and see if we can say anything better about its
4573    initial value from any initializing insns set up above.  (This is done
4574    in two passes to avoid missing SETs in a PARALLEL.)  */
4575 static void
4576 loop_bivs_check (loop)
4577      struct loop *loop;
4578 {
4579   struct loop_ivs *ivs = LOOP_IVS (loop);
4580   /* Temporary list pointers for traversing ivs->list.  */
4581   struct iv_class *bl;
4582   struct iv_class **backbl;
4583
4584   for (backbl = &ivs->list; (bl = *backbl); backbl = &bl->next)
4585     {
4586       rtx src;
4587       rtx note;
4588
4589       if (! bl->init_insn)
4590         continue;
4591
4592       /* IF INIT_INSN has a REG_EQUAL or REG_EQUIV note and the value
4593          is a constant, use the value of that.  */
4594       if (((note = find_reg_note (bl->init_insn, REG_EQUAL, 0)) != NULL
4595            && CONSTANT_P (XEXP (note, 0)))
4596           || ((note = find_reg_note (bl->init_insn, REG_EQUIV, 0)) != NULL
4597               && CONSTANT_P (XEXP (note, 0))))
4598         src = XEXP (note, 0);
4599       else
4600         src = SET_SRC (bl->init_set);
4601
4602       if (loop_dump_stream)
4603         fprintf (loop_dump_stream,
4604                  "Biv %d: initialized at insn %d: initial value ",
4605                  bl->regno, INSN_UID (bl->init_insn));
4606
4607       if ((GET_MODE (src) == GET_MODE (regno_reg_rtx[bl->regno])
4608            || GET_MODE (src) == VOIDmode)
4609           && valid_initial_value_p (src, bl->init_insn,
4610                                     LOOP_INFO (loop)->pre_header_has_call,
4611                                     loop->start))
4612         {
4613           bl->initial_value = src;
4614
4615           if (loop_dump_stream)
4616             {
4617               print_simple_rtl (loop_dump_stream, src);
4618               fputc ('\n', loop_dump_stream);
4619             }
4620         }
4621       /* If we can't make it a giv,
4622          let biv keep initial value of "itself".  */
4623       else if (loop_dump_stream)
4624         fprintf (loop_dump_stream, "is complex\n");
4625     }
4626 }
4627
4628
4629 /* Search the loop for general induction variables.  */
4630
4631 static void
4632 loop_givs_find (loop)
4633      struct loop* loop;
4634 {
4635   for_each_insn_in_loop (loop, check_insn_for_givs);
4636 }
4637
4638
4639 /* For each giv for which we still don't know whether or not it is
4640    replaceable, check to see if it is replaceable because its final value
4641    can be calculated.  */
4642
4643 static void
4644 loop_givs_check (loop)
4645      struct loop *loop;
4646 {
4647   struct loop_ivs *ivs = LOOP_IVS (loop);
4648   struct iv_class *bl;
4649
4650   for (bl = ivs->list; bl; bl = bl->next)
4651     {
4652       struct induction *v;
4653
4654       for (v = bl->giv; v; v = v->next_iv)
4655         if (! v->replaceable && ! v->not_replaceable)
4656           check_final_value (loop, v);
4657     }
4658 }
4659
4660
4661 /* Return nonzero if it is possible to eliminate the biv BL provided
4662    all givs are reduced.  This is possible if either the reg is not
4663    used outside the loop, or we can compute what its final value will
4664    be.  */
4665
4666 static int
4667 loop_biv_eliminable_p (loop, bl, threshold, insn_count)
4668      struct loop *loop;
4669      struct iv_class *bl;
4670      int threshold;
4671      int insn_count;
4672 {
4673   /* For architectures with a decrement_and_branch_until_zero insn,
4674      don't do this if we put a REG_NONNEG note on the endtest for this
4675      biv.  */
4676
4677 #ifdef HAVE_decrement_and_branch_until_zero
4678   if (bl->nonneg)
4679     {
4680       if (loop_dump_stream)
4681         fprintf (loop_dump_stream,
4682                  "Cannot eliminate nonneg biv %d.\n", bl->regno);
4683       return 0;
4684     }
4685 #endif
4686
4687   /* Check that biv is used outside loop or if it has a final value.
4688      Compare against bl->init_insn rather than loop->start.  We aren't
4689      concerned with any uses of the biv between init_insn and
4690      loop->start since these won't be affected by the value of the biv
4691      elsewhere in the function, so long as init_insn doesn't use the
4692      biv itself.  */
4693
4694   if ((REGNO_LAST_LUID (bl->regno) < INSN_LUID (loop->end)
4695        && bl->init_insn
4696        && INSN_UID (bl->init_insn) < max_uid_for_loop
4697        && REGNO_FIRST_LUID (bl->regno) >= INSN_LUID (bl->init_insn)
4698        && ! reg_mentioned_p (bl->biv->dest_reg, SET_SRC (bl->init_set)))
4699       || (bl->final_value = final_biv_value (loop, bl)))
4700     return maybe_eliminate_biv (loop, bl, 0, threshold, insn_count);
4701
4702   if (loop_dump_stream)
4703     {
4704       fprintf (loop_dump_stream,
4705                "Cannot eliminate biv %d.\n",
4706                bl->regno);
4707       fprintf (loop_dump_stream,
4708                "First use: insn %d, last use: insn %d.\n",
4709                REGNO_FIRST_UID (bl->regno),
4710                REGNO_LAST_UID (bl->regno));
4711     }
4712   return 0;
4713 }
4714
4715
4716 /* Reduce each giv of BL that we have decided to reduce.  */
4717
4718 static void
4719 loop_givs_reduce (loop, bl)
4720      struct loop *loop;
4721      struct iv_class *bl;
4722 {
4723   struct induction *v;
4724
4725   for (v = bl->giv; v; v = v->next_iv)
4726     {
4727       struct induction *tv;
4728       if (! v->ignore && v->same == 0)
4729         {
4730           int auto_inc_opt = 0;
4731
4732           /* If the code for derived givs immediately below has already
4733              allocated a new_reg, we must keep it.  */
4734           if (! v->new_reg)
4735             v->new_reg = gen_reg_rtx (v->mode);
4736
4737 #ifdef AUTO_INC_DEC
4738           /* If the target has auto-increment addressing modes, and
4739              this is an address giv, then try to put the increment
4740              immediately after its use, so that flow can create an
4741              auto-increment addressing mode.  */
4742           if (v->giv_type == DEST_ADDR && bl->biv_count == 1
4743               && bl->biv->always_executed && ! bl->biv->maybe_multiple
4744               /* We don't handle reversed biv's because bl->biv->insn
4745                  does not have a valid INSN_LUID.  */
4746               && ! bl->reversed
4747               && v->always_executed && ! v->maybe_multiple
4748               && INSN_UID (v->insn) < max_uid_for_loop)
4749             {
4750               /* If other giv's have been combined with this one, then
4751                  this will work only if all uses of the other giv's occur
4752                  before this giv's insn.  This is difficult to check.
4753
4754                  We simplify this by looking for the common case where
4755                  there is one DEST_REG giv, and this giv's insn is the
4756                  last use of the dest_reg of that DEST_REG giv.  If the
4757                  increment occurs after the address giv, then we can
4758                  perform the optimization.  (Otherwise, the increment
4759                  would have to go before other_giv, and we would not be
4760                  able to combine it with the address giv to get an
4761                  auto-inc address.)  */
4762               if (v->combined_with)
4763                 {
4764                   struct induction *other_giv = 0;
4765
4766                   for (tv = bl->giv; tv; tv = tv->next_iv)
4767                     if (tv->same == v)
4768                       {
4769                         if (other_giv)
4770                           break;
4771                         else
4772                           other_giv = tv;
4773                       }
4774                   if (! tv && other_giv
4775                       && REGNO (other_giv->dest_reg) < max_reg_before_loop
4776                       && (REGNO_LAST_UID (REGNO (other_giv->dest_reg))
4777                           == INSN_UID (v->insn))
4778                       && INSN_LUID (v->insn) < INSN_LUID (bl->biv->insn))
4779                     auto_inc_opt = 1;
4780                 }
4781               /* Check for case where increment is before the address
4782                  giv.  Do this test in "loop order".  */
4783               else if ((INSN_LUID (v->insn) > INSN_LUID (bl->biv->insn)
4784                         && (INSN_LUID (v->insn) < INSN_LUID (loop->scan_start)
4785                             || (INSN_LUID (bl->biv->insn)
4786                                 > INSN_LUID (loop->scan_start))))
4787                        || (INSN_LUID (v->insn) < INSN_LUID (loop->scan_start)
4788                            && (INSN_LUID (loop->scan_start)
4789                                < INSN_LUID (bl->biv->insn))))
4790                 auto_inc_opt = -1;
4791               else
4792                 auto_inc_opt = 1;
4793
4794 #ifdef HAVE_cc0
4795               {
4796                 rtx prev;
4797
4798                 /* We can't put an insn immediately after one setting
4799                    cc0, or immediately before one using cc0.  */
4800                 if ((auto_inc_opt == 1 && sets_cc0_p (PATTERN (v->insn)))
4801                     || (auto_inc_opt == -1
4802                         && (prev = prev_nonnote_insn (v->insn)) != 0
4803                         && INSN_P (prev)
4804                         && sets_cc0_p (PATTERN (prev))))
4805                   auto_inc_opt = 0;
4806               }
4807 #endif
4808
4809               if (auto_inc_opt)
4810                 v->auto_inc_opt = 1;
4811             }
4812 #endif
4813
4814           /* For each place where the biv is incremented, add an insn
4815              to increment the new, reduced reg for the giv.  */
4816           for (tv = bl->biv; tv; tv = tv->next_iv)
4817             {
4818               rtx insert_before;
4819
4820               /* Skip if location is the same as a previous one.  */
4821               if (tv->same)
4822                 continue;
4823               if (! auto_inc_opt)
4824                 insert_before = NEXT_INSN (tv->insn);
4825               else if (auto_inc_opt == 1)
4826                 insert_before = NEXT_INSN (v->insn);
4827               else
4828                 insert_before = v->insn;
4829
4830               if (tv->mult_val == const1_rtx)
4831                 loop_iv_add_mult_emit_before (loop, tv->add_val, v->mult_val,
4832                                               v->new_reg, v->new_reg,
4833                                               0, insert_before);
4834               else /* tv->mult_val == const0_rtx */
4835                 /* A multiply is acceptable here
4836                    since this is presumed to be seldom executed.  */
4837                 loop_iv_add_mult_emit_before (loop, tv->add_val, v->mult_val,
4838                                               v->add_val, v->new_reg,
4839                                               0, insert_before);
4840             }
4841
4842           /* Add code at loop start to initialize giv's reduced reg.  */
4843
4844           loop_iv_add_mult_hoist (loop,
4845                                   extend_value_for_giv (v, bl->initial_value),
4846                                   v->mult_val, v->add_val, v->new_reg);
4847         }
4848     }
4849 }
4850
4851
4852 /* Check for givs whose first use is their definition and whose
4853    last use is the definition of another giv.  If so, it is likely
4854    dead and should not be used to derive another giv nor to
4855    eliminate a biv.  */
4856
4857 static void
4858 loop_givs_dead_check (loop, bl)
4859      struct loop *loop ATTRIBUTE_UNUSED;
4860      struct iv_class *bl;
4861 {
4862   struct induction *v;
4863
4864   for (v = bl->giv; v; v = v->next_iv)
4865     {
4866       if (v->ignore
4867           || (v->same && v->same->ignore))
4868         continue;
4869
4870       if (v->giv_type == DEST_REG
4871           && REGNO_FIRST_UID (REGNO (v->dest_reg)) == INSN_UID (v->insn))
4872         {
4873           struct induction *v1;
4874
4875           for (v1 = bl->giv; v1; v1 = v1->next_iv)
4876             if (REGNO_LAST_UID (REGNO (v->dest_reg)) == INSN_UID (v1->insn))
4877               v->maybe_dead = 1;
4878         }
4879     }
4880 }
4881
4882
4883 static void
4884 loop_givs_rescan (loop, bl, reg_map)
4885      struct loop *loop;
4886      struct iv_class *bl;
4887      rtx *reg_map;
4888 {
4889   struct induction *v;
4890
4891   for (v = bl->giv; v; v = v->next_iv)
4892     {
4893       if (v->same && v->same->ignore)
4894         v->ignore = 1;
4895
4896       if (v->ignore)
4897         continue;
4898
4899       /* Update expression if this was combined, in case other giv was
4900          replaced.  */
4901       if (v->same)
4902         v->new_reg = replace_rtx (v->new_reg,
4903                                   v->same->dest_reg, v->same->new_reg);
4904
4905       /* See if this register is known to be a pointer to something.  If
4906          so, see if we can find the alignment.  First see if there is a
4907          destination register that is a pointer.  If so, this shares the
4908          alignment too.  Next see if we can deduce anything from the
4909          computational information.  If not, and this is a DEST_ADDR
4910          giv, at least we know that it's a pointer, though we don't know
4911          the alignment.  */
4912       if (GET_CODE (v->new_reg) == REG
4913           && v->giv_type == DEST_REG
4914           && REG_POINTER (v->dest_reg))
4915         mark_reg_pointer (v->new_reg,
4916                           REGNO_POINTER_ALIGN (REGNO (v->dest_reg)));
4917       else if (GET_CODE (v->new_reg) == REG
4918                && REG_POINTER (v->src_reg))
4919         {
4920           unsigned int align = REGNO_POINTER_ALIGN (REGNO (v->src_reg));
4921
4922           if (align == 0
4923               || GET_CODE (v->add_val) != CONST_INT
4924               || INTVAL (v->add_val) % (align / BITS_PER_UNIT) != 0)
4925             align = 0;
4926
4927           mark_reg_pointer (v->new_reg, align);
4928         }
4929       else if (GET_CODE (v->new_reg) == REG
4930                && GET_CODE (v->add_val) == REG
4931                && REG_POINTER (v->add_val))
4932         {
4933           unsigned int align = REGNO_POINTER_ALIGN (REGNO (v->add_val));
4934
4935           if (align == 0 || GET_CODE (v->mult_val) != CONST_INT
4936               || INTVAL (v->mult_val) % (align / BITS_PER_UNIT) != 0)
4937             align = 0;
4938
4939           mark_reg_pointer (v->new_reg, align);
4940         }
4941       else if (GET_CODE (v->new_reg) == REG && v->giv_type == DEST_ADDR)
4942         mark_reg_pointer (v->new_reg, 0);
4943
4944       if (v->giv_type == DEST_ADDR)
4945         /* Store reduced reg as the address in the memref where we found
4946            this giv.  */
4947         validate_change (v->insn, v->location, v->new_reg, 0);
4948       else if (v->replaceable)
4949         {
4950           reg_map[REGNO (v->dest_reg)] = v->new_reg;
4951         }
4952       else
4953         {
4954           rtx original_insn = v->insn;
4955           rtx note;
4956
4957           /* Not replaceable; emit an insn to set the original giv reg from
4958              the reduced giv, same as above.  */
4959           v->insn = loop_insn_emit_after (loop, 0, original_insn,
4960                                           gen_move_insn (v->dest_reg,
4961                                                          v->new_reg));
4962
4963           /* The original insn may have a REG_EQUAL note.  This note is
4964              now incorrect and may result in invalid substitutions later.
4965              The original insn is dead, but may be part of a libcall
4966              sequence, which doesn't seem worth the bother of handling.  */
4967           note = find_reg_note (original_insn, REG_EQUAL, NULL_RTX);
4968           if (note)
4969             remove_note (original_insn, note);
4970         }
4971
4972       /* When a loop is reversed, givs which depend on the reversed
4973          biv, and which are live outside the loop, must be set to their
4974          correct final value.  This insn is only needed if the giv is
4975          not replaceable.  The correct final value is the same as the
4976          value that the giv starts the reversed loop with.  */
4977       if (bl->reversed && ! v->replaceable)
4978         loop_iv_add_mult_sink (loop,
4979                                extend_value_for_giv (v, bl->initial_value),
4980                                v->mult_val, v->add_val, v->dest_reg);
4981       else if (v->final_value)
4982         loop_insn_sink_or_swim (loop,
4983                                 gen_load_of_final_value (v->dest_reg,
4984                                                          v->final_value));
4985
4986       if (loop_dump_stream)
4987         {
4988           fprintf (loop_dump_stream, "giv at %d reduced to ",
4989                    INSN_UID (v->insn));
4990           print_simple_rtl (loop_dump_stream, v->new_reg);
4991           fprintf (loop_dump_stream, "\n");
4992         }
4993     }
4994 }
4995
4996
4997 static int
4998 loop_giv_reduce_benefit (loop, bl, v, test_reg)
4999      struct loop *loop ATTRIBUTE_UNUSED;
5000      struct iv_class *bl;
5001      struct induction *v;
5002      rtx test_reg;
5003 {
5004   int add_cost;
5005   int benefit;
5006
5007   benefit = v->benefit;
5008   PUT_MODE (test_reg, v->mode);
5009   add_cost = iv_add_mult_cost (bl->biv->add_val, v->mult_val,
5010                                test_reg, test_reg);
5011
5012   /* Reduce benefit if not replaceable, since we will insert a
5013      move-insn to replace the insn that calculates this giv.  Don't do
5014      this unless the giv is a user variable, since it will often be
5015      marked non-replaceable because of the duplication of the exit
5016      code outside the loop.  In such a case, the copies we insert are
5017      dead and will be deleted.  So they don't have a cost.  Similar
5018      situations exist.  */
5019   /* ??? The new final_[bg]iv_value code does a much better job of
5020      finding replaceable giv's, and hence this code may no longer be
5021      necessary.  */
5022   if (! v->replaceable && ! bl->eliminable
5023       && REG_USERVAR_P (v->dest_reg))
5024     benefit -= copy_cost;
5025
5026   /* Decrease the benefit to count the add-insns that we will insert
5027      to increment the reduced reg for the giv.  ??? This can
5028      overestimate the run-time cost of the additional insns, e.g. if
5029      there are multiple basic blocks that increment the biv, but only
5030      one of these blocks is executed during each iteration.  There is
5031      no good way to detect cases like this with the current structure
5032      of the loop optimizer.  This code is more accurate for
5033      determining code size than run-time benefits.  */
5034   benefit -= add_cost * bl->biv_count;
5035
5036   /* Decide whether to strength-reduce this giv or to leave the code
5037      unchanged (recompute it from the biv each time it is used).  This
5038      decision can be made independently for each giv.  */
5039
5040 #ifdef AUTO_INC_DEC
5041   /* Attempt to guess whether autoincrement will handle some of the
5042      new add insns; if so, increase BENEFIT (undo the subtraction of
5043      add_cost that was done above).  */
5044   if (v->giv_type == DEST_ADDR
5045       /* Increasing the benefit is risky, since this is only a guess.
5046          Avoid increasing register pressure in cases where there would
5047          be no other benefit from reducing this giv.  */
5048       && benefit > 0
5049       && GET_CODE (v->mult_val) == CONST_INT)
5050     {
5051       int size = GET_MODE_SIZE (GET_MODE (v->mem));
5052
5053       if (HAVE_POST_INCREMENT
5054           && INTVAL (v->mult_val) == size)
5055         benefit += add_cost * bl->biv_count;
5056       else if (HAVE_PRE_INCREMENT
5057                && INTVAL (v->mult_val) == size)
5058         benefit += add_cost * bl->biv_count;
5059       else if (HAVE_POST_DECREMENT
5060                && -INTVAL (v->mult_val) == size)
5061         benefit += add_cost * bl->biv_count;
5062       else if (HAVE_PRE_DECREMENT
5063                && -INTVAL (v->mult_val) == size)
5064         benefit += add_cost * bl->biv_count;
5065     }
5066 #endif
5067
5068   return benefit;
5069 }
5070
5071
5072 /* Free IV structures for LOOP.  */
5073
5074 static void
5075 loop_ivs_free (loop)
5076      struct loop *loop;
5077 {
5078   struct loop_ivs *ivs = LOOP_IVS (loop);
5079   struct iv_class *iv = ivs->list;
5080
5081   free (ivs->regs);
5082
5083   while (iv)
5084     {
5085       struct iv_class *next = iv->next;
5086       struct induction *induction;
5087       struct induction *next_induction;
5088
5089       for (induction = iv->biv; induction; induction = next_induction)
5090         {
5091           next_induction = induction->next_iv;
5092           free (induction);
5093         }
5094       for (induction = iv->giv; induction; induction = next_induction)
5095         {
5096           next_induction = induction->next_iv;
5097           free (induction);
5098         }
5099
5100       free (iv);
5101       iv = next;
5102     }
5103 }
5104
5105
5106 /* Perform strength reduction and induction variable elimination.
5107
5108    Pseudo registers created during this function will be beyond the
5109    last valid index in several tables including
5110    REGS->ARRAY[I].N_TIMES_SET and REGNO_LAST_UID.  This does not cause a
5111    problem here, because the added registers cannot be givs outside of
5112    their loop, and hence will never be reconsidered.  But scan_loop
5113    must check regnos to make sure they are in bounds.  */
5114
5115 static void
5116 strength_reduce (loop, flags)
5117      struct loop *loop;
5118      int flags;
5119 {
5120   struct loop_info *loop_info = LOOP_INFO (loop);
5121   struct loop_regs *regs = LOOP_REGS (loop);
5122   struct loop_ivs *ivs = LOOP_IVS (loop);
5123   rtx p;
5124   /* Temporary list pointer for traversing ivs->list.  */
5125   struct iv_class *bl;
5126   /* Ratio of extra register life span we can justify
5127      for saving an instruction.  More if loop doesn't call subroutines
5128      since in that case saving an insn makes more difference
5129      and more registers are available.  */
5130   /* ??? could set this to last value of threshold in move_movables */
5131   int threshold = (loop_info->has_call ? 1 : 2) * (3 + n_non_fixed_regs);
5132   /* Map of pseudo-register replacements.  */
5133   rtx *reg_map = NULL;
5134   int reg_map_size;
5135   int unrolled_insn_copies = 0;
5136   rtx test_reg = gen_rtx_REG (word_mode, LAST_VIRTUAL_REGISTER + 1);
5137   int insn_count = count_insns_in_loop (loop);
5138
5139   addr_placeholder = gen_reg_rtx (Pmode);
5140
5141   ivs->n_regs = max_reg_before_loop;
5142   ivs->regs = (struct iv *) xcalloc (ivs->n_regs, sizeof (struct iv));
5143
5144   /* Find all BIVs in loop.  */
5145   loop_bivs_find (loop);
5146
5147   /* Exit if there are no bivs.  */
5148   if (! ivs->list)
5149     {
5150       /* Can still unroll the loop anyways, but indicate that there is no
5151          strength reduction info available.  */
5152       if (flags & LOOP_UNROLL)
5153         unroll_loop (loop, insn_count, 0);
5154
5155       loop_ivs_free (loop);
5156       return;
5157     }
5158
5159   /* Determine how BIVS are initialized by looking through pre-header
5160      extended basic block.  */
5161   loop_bivs_init_find (loop);
5162
5163   /* Look at the each biv and see if we can say anything better about its
5164      initial value from any initializing insns set up above.  */
5165   loop_bivs_check (loop);
5166
5167   /* Search the loop for general induction variables.  */
5168   loop_givs_find (loop);
5169
5170   /* Try to calculate and save the number of loop iterations.  This is
5171      set to zero if the actual number can not be calculated.  This must
5172      be called after all giv's have been identified, since otherwise it may
5173      fail if the iteration variable is a giv.  */
5174   loop_iterations (loop);
5175
5176 #ifdef HAVE_prefetch
5177   if (flags & LOOP_PREFETCH)
5178     emit_prefetch_instructions (loop);
5179 #endif
5180
5181   /* Now for each giv for which we still don't know whether or not it is
5182      replaceable, check to see if it is replaceable because its final value
5183      can be calculated.  This must be done after loop_iterations is called,
5184      so that final_giv_value will work correctly.  */
5185   loop_givs_check (loop);
5186
5187   /* Try to prove that the loop counter variable (if any) is always
5188      nonnegative; if so, record that fact with a REG_NONNEG note
5189      so that "decrement and branch until zero" insn can be used.  */
5190   check_dbra_loop (loop, insn_count);
5191
5192   /* Create reg_map to hold substitutions for replaceable giv regs.
5193      Some givs might have been made from biv increments, so look at
5194      ivs->reg_iv_type for a suitable size.  */
5195   reg_map_size = ivs->n_regs;
5196   reg_map = (rtx *) xcalloc (reg_map_size, sizeof (rtx));
5197
5198   /* Examine each iv class for feasibility of strength reduction/induction
5199      variable elimination.  */
5200
5201   for (bl = ivs->list; bl; bl = bl->next)
5202     {
5203       struct induction *v;
5204       int benefit;
5205
5206       /* Test whether it will be possible to eliminate this biv
5207          provided all givs are reduced.  */
5208       bl->eliminable = loop_biv_eliminable_p (loop, bl, threshold, insn_count);
5209
5210       /* This will be true at the end, if all givs which depend on this
5211          biv have been strength reduced.
5212          We can't (currently) eliminate the biv unless this is so.  */
5213       bl->all_reduced = 1;
5214
5215       /* Check each extension dependent giv in this class to see if its
5216          root biv is safe from wrapping in the interior mode.  */
5217       check_ext_dependent_givs (bl, loop_info);
5218
5219       /* Combine all giv's for this iv_class.  */
5220       combine_givs (regs, bl);
5221
5222       for (v = bl->giv; v; v = v->next_iv)
5223         {
5224           struct induction *tv;
5225
5226           if (v->ignore || v->same)
5227             continue;
5228
5229           benefit = loop_giv_reduce_benefit (loop, bl, v, test_reg);
5230
5231           /* If an insn is not to be strength reduced, then set its ignore
5232              flag, and clear bl->all_reduced.  */
5233
5234           /* A giv that depends on a reversed biv must be reduced if it is
5235              used after the loop exit, otherwise, it would have the wrong
5236              value after the loop exit.  To make it simple, just reduce all
5237              of such giv's whether or not we know they are used after the loop
5238              exit.  */
5239
5240           if (! flag_reduce_all_givs
5241               && v->lifetime * threshold * benefit < insn_count
5242               && ! bl->reversed)
5243             {
5244               if (loop_dump_stream)
5245                 fprintf (loop_dump_stream,
5246                          "giv of insn %d not worth while, %d vs %d.\n",
5247                          INSN_UID (v->insn),
5248                          v->lifetime * threshold * benefit, insn_count);
5249               v->ignore = 1;
5250               bl->all_reduced = 0;
5251             }
5252           else
5253             {
5254               /* Check that we can increment the reduced giv without a
5255                  multiply insn.  If not, reject it.  */
5256
5257               for (tv = bl->biv; tv; tv = tv->next_iv)
5258                 if (tv->mult_val == const1_rtx
5259                     && ! product_cheap_p (tv->add_val, v->mult_val))
5260                   {
5261                     if (loop_dump_stream)
5262                       fprintf (loop_dump_stream,
5263                                "giv of insn %d: would need a multiply.\n",
5264                                INSN_UID (v->insn));
5265                     v->ignore = 1;
5266                     bl->all_reduced = 0;
5267                     break;
5268                   }
5269             }
5270         }
5271
5272       /* Check for givs whose first use is their definition and whose
5273          last use is the definition of another giv.  If so, it is likely
5274          dead and should not be used to derive another giv nor to
5275          eliminate a biv.  */
5276       loop_givs_dead_check (loop, bl);
5277
5278       /* Reduce each giv that we decided to reduce.  */
5279       loop_givs_reduce (loop, bl);
5280
5281       /* Rescan all givs.  If a giv is the same as a giv not reduced, mark it
5282          as not reduced.
5283
5284          For each giv register that can be reduced now: if replaceable,
5285          substitute reduced reg wherever the old giv occurs;
5286          else add new move insn "giv_reg = reduced_reg".  */
5287       loop_givs_rescan (loop, bl, reg_map);
5288
5289       /* All the givs based on the biv bl have been reduced if they
5290          merit it.  */
5291
5292       /* For each giv not marked as maybe dead that has been combined with a
5293          second giv, clear any "maybe dead" mark on that second giv.
5294          v->new_reg will either be or refer to the register of the giv it
5295          combined with.
5296
5297          Doing this clearing avoids problems in biv elimination where
5298          a giv's new_reg is a complex value that can't be put in the
5299          insn but the giv combined with (with a reg as new_reg) is
5300          marked maybe_dead.  Since the register will be used in either
5301          case, we'd prefer it be used from the simpler giv.  */
5302
5303       for (v = bl->giv; v; v = v->next_iv)
5304         if (! v->maybe_dead && v->same)
5305           v->same->maybe_dead = 0;
5306
5307       /* Try to eliminate the biv, if it is a candidate.
5308          This won't work if ! bl->all_reduced,
5309          since the givs we planned to use might not have been reduced.
5310
5311          We have to be careful that we didn't initially think we could
5312          eliminate this biv because of a giv that we now think may be
5313          dead and shouldn't be used as a biv replacement.
5314
5315          Also, there is the possibility that we may have a giv that looks
5316          like it can be used to eliminate a biv, but the resulting insn
5317          isn't valid.  This can happen, for example, on the 88k, where a
5318          JUMP_INSN can compare a register only with zero.  Attempts to
5319          replace it with a compare with a constant will fail.
5320
5321          Note that in cases where this call fails, we may have replaced some
5322          of the occurrences of the biv with a giv, but no harm was done in
5323          doing so in the rare cases where it can occur.  */
5324
5325       if (bl->all_reduced == 1 && bl->eliminable
5326           && maybe_eliminate_biv (loop, bl, 1, threshold, insn_count))
5327         {
5328           /* ?? If we created a new test to bypass the loop entirely,
5329              or otherwise drop straight in, based on this test, then
5330              we might want to rewrite it also.  This way some later
5331              pass has more hope of removing the initialization of this
5332              biv entirely.  */
5333
5334           /* If final_value != 0, then the biv may be used after loop end
5335              and we must emit an insn to set it just in case.
5336
5337              Reversed bivs already have an insn after the loop setting their
5338              value, so we don't need another one.  We can't calculate the
5339              proper final value for such a biv here anyways.  */
5340           if (bl->final_value && ! bl->reversed)
5341               loop_insn_sink_or_swim (loop,
5342                                       gen_load_of_final_value (bl->biv->dest_reg,
5343                                                                bl->final_value));
5344
5345           if (loop_dump_stream)
5346             fprintf (loop_dump_stream, "Reg %d: biv eliminated\n",
5347                      bl->regno);
5348         }
5349       /* See above note wrt final_value.  But since we couldn't eliminate
5350          the biv, we must set the value after the loop instead of before.  */
5351       else if (bl->final_value && ! bl->reversed)
5352         loop_insn_sink (loop, gen_load_of_final_value (bl->biv->dest_reg,
5353                                                        bl->final_value));
5354     }
5355
5356   /* Go through all the instructions in the loop, making all the
5357      register substitutions scheduled in REG_MAP.  */
5358
5359   for (p = loop->start; p != loop->end; p = NEXT_INSN (p))
5360     if (GET_CODE (p) == INSN || GET_CODE (p) == JUMP_INSN
5361         || GET_CODE (p) == CALL_INSN)
5362       {
5363         replace_regs (PATTERN (p), reg_map, reg_map_size, 0);
5364         replace_regs (REG_NOTES (p), reg_map, reg_map_size, 0);
5365         INSN_CODE (p) = -1;
5366       }
5367
5368   if (loop_info->n_iterations > 0)
5369     {
5370       /* When we completely unroll a loop we will likely not need the increment
5371          of the loop BIV and we will not need the conditional branch at the
5372          end of the loop.  */
5373       unrolled_insn_copies = insn_count - 2;
5374
5375 #ifdef HAVE_cc0
5376       /* When we completely unroll a loop on a HAVE_cc0 machine we will not
5377          need the comparison before the conditional branch at the end of the
5378          loop.  */
5379       unrolled_insn_copies -= 1;
5380 #endif
5381
5382       /* We'll need one copy for each loop iteration.  */
5383       unrolled_insn_copies *= loop_info->n_iterations;
5384
5385       /* A little slop to account for the ability to remove initialization
5386          code, better CSE, and other secondary benefits of completely
5387          unrolling some loops.  */
5388       unrolled_insn_copies -= 1;
5389
5390       /* Clamp the value.  */
5391       if (unrolled_insn_copies < 0)
5392         unrolled_insn_copies = 0;
5393     }
5394
5395   /* Unroll loops from within strength reduction so that we can use the
5396      induction variable information that strength_reduce has already
5397      collected.  Always unroll loops that would be as small or smaller
5398      unrolled than when rolled.  */
5399   if ((flags & LOOP_UNROLL)
5400       || ((flags & LOOP_AUTO_UNROLL)
5401           && loop_info->n_iterations > 0
5402           && unrolled_insn_copies <= insn_count))
5403     unroll_loop (loop, insn_count, 1);
5404
5405 #ifdef HAVE_doloop_end
5406   if (HAVE_doloop_end && (flags & LOOP_BCT) && flag_branch_on_count_reg)
5407     doloop_optimize (loop);
5408 #endif  /* HAVE_doloop_end  */
5409
5410   /* In case number of iterations is known, drop branch prediction note
5411      in the branch.  Do that only in second loop pass, as loop unrolling
5412      may change the number of iterations performed.  */
5413   if (flags & LOOP_BCT)
5414     {
5415       unsigned HOST_WIDE_INT n
5416         = loop_info->n_iterations / loop_info->unroll_number;
5417       if (n > 1)
5418         predict_insn (prev_nonnote_insn (loop->end), PRED_LOOP_ITERATIONS,
5419                       REG_BR_PROB_BASE - REG_BR_PROB_BASE / n);
5420     }
5421
5422   if (loop_dump_stream)
5423     fprintf (loop_dump_stream, "\n");
5424
5425   loop_ivs_free (loop);
5426   if (reg_map)
5427     free (reg_map);
5428 }
5429 \f
5430 /*Record all basic induction variables calculated in the insn.  */
5431 static rtx
5432 check_insn_for_bivs (loop, p, not_every_iteration, maybe_multiple)
5433      struct loop *loop;
5434      rtx p;
5435      int not_every_iteration;
5436      int maybe_multiple;
5437 {
5438   struct loop_ivs *ivs = LOOP_IVS (loop);
5439   rtx set;
5440   rtx dest_reg;
5441   rtx inc_val;
5442   rtx mult_val;
5443   rtx *location;
5444
5445   if (GET_CODE (p) == INSN
5446       && (set = single_set (p))
5447       && GET_CODE (SET_DEST (set)) == REG)
5448     {
5449       dest_reg = SET_DEST (set);
5450       if (REGNO (dest_reg) < max_reg_before_loop
5451           && REGNO (dest_reg) >= FIRST_PSEUDO_REGISTER
5452           && REG_IV_TYPE (ivs, REGNO (dest_reg)) != NOT_BASIC_INDUCT)
5453         {
5454           if (basic_induction_var (loop, SET_SRC (set),
5455                                    GET_MODE (SET_SRC (set)),
5456                                    dest_reg, p, &inc_val, &mult_val,
5457                                    &location))
5458             {
5459               /* It is a possible basic induction variable.
5460                  Create and initialize an induction structure for it.  */
5461
5462               struct induction *v
5463                 = (struct induction *) xmalloc (sizeof (struct induction));
5464
5465               record_biv (loop, v, p, dest_reg, inc_val, mult_val, location,
5466                           not_every_iteration, maybe_multiple);
5467               REG_IV_TYPE (ivs, REGNO (dest_reg)) = BASIC_INDUCT;
5468             }
5469           else if (REGNO (dest_reg) < ivs->n_regs)
5470             REG_IV_TYPE (ivs, REGNO (dest_reg)) = NOT_BASIC_INDUCT;
5471         }
5472     }
5473   return p;
5474 }
5475 \f
5476 /* Record all givs calculated in the insn.
5477    A register is a giv if: it is only set once, it is a function of a
5478    biv and a constant (or invariant), and it is not a biv.  */
5479 static rtx
5480 check_insn_for_givs (loop, p, not_every_iteration, maybe_multiple)
5481      struct loop *loop;
5482      rtx p;
5483      int not_every_iteration;
5484      int maybe_multiple;
5485 {
5486   struct loop_regs *regs = LOOP_REGS (loop);
5487
5488   rtx set;
5489   /* Look for a general induction variable in a register.  */
5490   if (GET_CODE (p) == INSN
5491       && (set = single_set (p))
5492       && GET_CODE (SET_DEST (set)) == REG
5493       && ! regs->array[REGNO (SET_DEST (set))].may_not_optimize)
5494     {
5495       rtx src_reg;
5496       rtx dest_reg;
5497       rtx add_val;
5498       rtx mult_val;
5499       rtx ext_val;
5500       int benefit;
5501       rtx regnote = 0;
5502       rtx last_consec_insn;
5503
5504       dest_reg = SET_DEST (set);
5505       if (REGNO (dest_reg) < FIRST_PSEUDO_REGISTER)
5506         return p;
5507
5508       if (/* SET_SRC is a giv.  */
5509           (general_induction_var (loop, SET_SRC (set), &src_reg, &add_val,
5510                                   &mult_val, &ext_val, 0, &benefit, VOIDmode)
5511            /* Equivalent expression is a giv.  */
5512            || ((regnote = find_reg_note (p, REG_EQUAL, NULL_RTX))
5513                && general_induction_var (loop, XEXP (regnote, 0), &src_reg,
5514                                          &add_val, &mult_val, &ext_val, 0,
5515                                          &benefit, VOIDmode)))
5516           /* Don't try to handle any regs made by loop optimization.
5517              We have nothing on them in regno_first_uid, etc.  */
5518           && REGNO (dest_reg) < max_reg_before_loop
5519           /* Don't recognize a BASIC_INDUCT_VAR here.  */
5520           && dest_reg != src_reg
5521           /* This must be the only place where the register is set.  */
5522           && (regs->array[REGNO (dest_reg)].n_times_set == 1
5523               /* or all sets must be consecutive and make a giv.  */
5524               || (benefit = consec_sets_giv (loop, benefit, p,
5525                                              src_reg, dest_reg,
5526                                              &add_val, &mult_val, &ext_val,
5527                                              &last_consec_insn))))
5528         {
5529           struct induction *v
5530             = (struct induction *) xmalloc (sizeof (struct induction));
5531
5532           /* If this is a library call, increase benefit.  */
5533           if (find_reg_note (p, REG_RETVAL, NULL_RTX))
5534             benefit += libcall_benefit (p);
5535
5536           /* Skip the consecutive insns, if there are any.  */
5537           if (regs->array[REGNO (dest_reg)].n_times_set != 1)
5538             p = last_consec_insn;
5539
5540           record_giv (loop, v, p, src_reg, dest_reg, mult_val, add_val,
5541                       ext_val, benefit, DEST_REG, not_every_iteration,
5542                       maybe_multiple, (rtx*) 0);
5543
5544         }
5545     }
5546
5547 #ifndef DONT_REDUCE_ADDR
5548   /* Look for givs which are memory addresses.  */
5549   /* This resulted in worse code on a VAX 8600.  I wonder if it
5550      still does.  */
5551   if (GET_CODE (p) == INSN)
5552     find_mem_givs (loop, PATTERN (p), p, not_every_iteration,
5553                    maybe_multiple);
5554 #endif
5555
5556   /* Update the status of whether giv can derive other givs.  This can
5557      change when we pass a label or an insn that updates a biv.  */
5558   if (GET_CODE (p) == INSN || GET_CODE (p) == JUMP_INSN
5559       || GET_CODE (p) == CODE_LABEL)
5560     update_giv_derive (loop, p);
5561   return p;
5562 }
5563 \f
5564 /* Return 1 if X is a valid source for an initial value (or as value being
5565    compared against in an initial test).
5566
5567    X must be either a register or constant and must not be clobbered between
5568    the current insn and the start of the loop.
5569
5570    INSN is the insn containing X.  */
5571
5572 static int
5573 valid_initial_value_p (x, insn, call_seen, loop_start)
5574      rtx x;
5575      rtx insn;
5576      int call_seen;
5577      rtx loop_start;
5578 {
5579   if (CONSTANT_P (x))
5580     return 1;
5581
5582   /* Only consider pseudos we know about initialized in insns whose luids
5583      we know.  */
5584   if (GET_CODE (x) != REG
5585       || REGNO (x) >= max_reg_before_loop)
5586     return 0;
5587
5588   /* Don't use call-clobbered registers across a call which clobbers it.  On
5589      some machines, don't use any hard registers at all.  */
5590   if (REGNO (x) < FIRST_PSEUDO_REGISTER
5591       && (SMALL_REGISTER_CLASSES
5592           || (call_used_regs[REGNO (x)] && call_seen)))
5593     return 0;
5594
5595   /* Don't use registers that have been clobbered before the start of the
5596      loop.  */
5597   if (reg_set_between_p (x, insn, loop_start))
5598     return 0;
5599
5600   return 1;
5601 }
5602 \f
5603 /* Scan X for memory refs and check each memory address
5604    as a possible giv.  INSN is the insn whose pattern X comes from.
5605    NOT_EVERY_ITERATION is 1 if the insn might not be executed during
5606    every loop iteration.  MAYBE_MULTIPLE is 1 if the insn might be executed
5607    more than once in each loop iteration.  */
5608
5609 static void
5610 find_mem_givs (loop, x, insn, not_every_iteration, maybe_multiple)
5611      const struct loop *loop;
5612      rtx x;
5613      rtx insn;
5614      int not_every_iteration, maybe_multiple;
5615 {
5616   int i, j;
5617   enum rtx_code code;
5618   const char *fmt;
5619
5620   if (x == 0)
5621     return;
5622
5623   code = GET_CODE (x);
5624   switch (code)
5625     {
5626     case REG:
5627     case CONST_INT:
5628     case CONST:
5629     case CONST_DOUBLE:
5630     case SYMBOL_REF:
5631     case LABEL_REF:
5632     case PC:
5633     case CC0:
5634     case ADDR_VEC:
5635     case ADDR_DIFF_VEC:
5636     case USE:
5637     case CLOBBER:
5638       return;
5639
5640     case MEM:
5641       {
5642         rtx src_reg;
5643         rtx add_val;
5644         rtx mult_val;
5645         rtx ext_val;
5646         int benefit;
5647
5648         /* This code used to disable creating GIVs with mult_val == 1 and
5649            add_val == 0.  However, this leads to lost optimizations when
5650            it comes time to combine a set of related DEST_ADDR GIVs, since
5651            this one would not be seen.  */
5652
5653         if (general_induction_var (loop, XEXP (x, 0), &src_reg, &add_val,
5654                                    &mult_val, &ext_val, 1, &benefit,
5655                                    GET_MODE (x)))
5656           {
5657             /* Found one; record it.  */
5658             struct induction *v
5659               = (struct induction *) xmalloc (sizeof (struct induction));
5660
5661             record_giv (loop, v, insn, src_reg, addr_placeholder, mult_val,
5662                         add_val, ext_val, benefit, DEST_ADDR,
5663                         not_every_iteration, maybe_multiple, &XEXP (x, 0));
5664
5665             v->mem = x;
5666           }
5667       }
5668       return;
5669
5670     default:
5671       break;
5672     }
5673
5674   /* Recursively scan the subexpressions for other mem refs.  */
5675
5676   fmt = GET_RTX_FORMAT (code);
5677   for (i = GET_RTX_LENGTH (code) - 1; i >= 0; i--)
5678     if (fmt[i] == 'e')
5679       find_mem_givs (loop, XEXP (x, i), insn, not_every_iteration,
5680                      maybe_multiple);
5681     else if (fmt[i] == 'E')
5682       for (j = 0; j < XVECLEN (x, i); j++)
5683         find_mem_givs (loop, XVECEXP (x, i, j), insn, not_every_iteration,
5684                        maybe_multiple);
5685 }
5686 \f
5687 /* Fill in the data about one biv update.
5688    V is the `struct induction' in which we record the biv.  (It is
5689    allocated by the caller, with alloca.)
5690    INSN is the insn that sets it.
5691    DEST_REG is the biv's reg.
5692
5693    MULT_VAL is const1_rtx if the biv is being incremented here, in which case
5694    INC_VAL is the increment.  Otherwise, MULT_VAL is const0_rtx and the biv is
5695    being set to INC_VAL.
5696
5697    NOT_EVERY_ITERATION is nonzero if this biv update is not know to be
5698    executed every iteration; MAYBE_MULTIPLE is nonzero if this biv update
5699    can be executed more than once per iteration.  If MAYBE_MULTIPLE
5700    and NOT_EVERY_ITERATION are both zero, we know that the biv update is
5701    executed exactly once per iteration.  */
5702
5703 static void
5704 record_biv (loop, v, insn, dest_reg, inc_val, mult_val, location,
5705             not_every_iteration, maybe_multiple)
5706      struct loop *loop;
5707      struct induction *v;
5708      rtx insn;
5709      rtx dest_reg;
5710      rtx inc_val;
5711      rtx mult_val;
5712      rtx *location;
5713      int not_every_iteration;
5714      int maybe_multiple;
5715 {
5716   struct loop_ivs *ivs = LOOP_IVS (loop);
5717   struct iv_class *bl;
5718
5719   v->insn = insn;
5720   v->src_reg = dest_reg;
5721   v->dest_reg = dest_reg;
5722   v->mult_val = mult_val;
5723   v->add_val = inc_val;
5724   v->ext_dependent = NULL_RTX;
5725   v->location = location;
5726   v->mode = GET_MODE (dest_reg);
5727   v->always_computable = ! not_every_iteration;
5728   v->always_executed = ! not_every_iteration;
5729   v->maybe_multiple = maybe_multiple;
5730   v->same = 0;
5731
5732   /* Add this to the reg's iv_class, creating a class
5733      if this is the first incrementation of the reg.  */
5734
5735   bl = REG_IV_CLASS (ivs, REGNO (dest_reg));
5736   if (bl == 0)
5737     {
5738       /* Create and initialize new iv_class.  */
5739
5740       bl = (struct iv_class *) xmalloc (sizeof (struct iv_class));
5741
5742       bl->regno = REGNO (dest_reg);
5743       bl->biv = 0;
5744       bl->giv = 0;
5745       bl->biv_count = 0;
5746       bl->giv_count = 0;
5747
5748       /* Set initial value to the reg itself.  */
5749       bl->initial_value = dest_reg;
5750       bl->final_value = 0;
5751       /* We haven't seen the initializing insn yet */
5752       bl->init_insn = 0;
5753       bl->init_set = 0;
5754       bl->initial_test = 0;
5755       bl->incremented = 0;
5756       bl->eliminable = 0;
5757       bl->nonneg = 0;
5758       bl->reversed = 0;
5759       bl->total_benefit = 0;
5760
5761       /* Add this class to ivs->list.  */
5762       bl->next = ivs->list;
5763       ivs->list = bl;
5764
5765       /* Put it in the array of biv register classes.  */
5766       REG_IV_CLASS (ivs, REGNO (dest_reg)) = bl;
5767     }
5768   else
5769     {
5770       /* Check if location is the same as a previous one.  */
5771       struct induction *induction;
5772       for (induction = bl->biv; induction; induction = induction->next_iv)
5773         if (location == induction->location)
5774           {
5775             v->same = induction;
5776             break;
5777           }
5778     }
5779
5780   /* Update IV_CLASS entry for this biv.  */
5781   v->next_iv = bl->biv;
5782   bl->biv = v;
5783   bl->biv_count++;
5784   if (mult_val == const1_rtx)
5785     bl->incremented = 1;
5786
5787   if (loop_dump_stream)
5788     loop_biv_dump (v, loop_dump_stream, 0);
5789 }
5790 \f
5791 /* Fill in the data about one giv.
5792    V is the `struct induction' in which we record the giv.  (It is
5793    allocated by the caller, with alloca.)
5794    INSN is the insn that sets it.
5795    BENEFIT estimates the savings from deleting this insn.
5796    TYPE is DEST_REG or DEST_ADDR; it says whether the giv is computed
5797    into a register or is used as a memory address.
5798
5799    SRC_REG is the biv reg which the giv is computed from.
5800    DEST_REG is the giv's reg (if the giv is stored in a reg).
5801    MULT_VAL and ADD_VAL are the coefficients used to compute the giv.
5802    LOCATION points to the place where this giv's value appears in INSN.  */
5803
5804 static void
5805 record_giv (loop, v, insn, src_reg, dest_reg, mult_val, add_val, ext_val,
5806             benefit, type, not_every_iteration, maybe_multiple, location)
5807      const struct loop *loop;
5808      struct induction *v;
5809      rtx insn;
5810      rtx src_reg;
5811      rtx dest_reg;
5812      rtx mult_val, add_val, ext_val;
5813      int benefit;
5814      enum g_types type;
5815      int not_every_iteration, maybe_multiple;
5816      rtx *location;
5817 {
5818   struct loop_ivs *ivs = LOOP_IVS (loop);
5819   struct induction *b;
5820   struct iv_class *bl;
5821   rtx set = single_set (insn);
5822   rtx temp;
5823
5824   /* Attempt to prove constantness of the values.  Don't let simplify_rtx
5825      undo the MULT canonicalization that we performed earlier.  */
5826   temp = simplify_rtx (add_val);
5827   if (temp
5828       && ! (GET_CODE (add_val) == MULT
5829             && GET_CODE (temp) == ASHIFT))
5830     add_val = temp;
5831
5832   v->insn = insn;
5833   v->src_reg = src_reg;
5834   v->giv_type = type;
5835   v->dest_reg = dest_reg;
5836   v->mult_val = mult_val;
5837   v->add_val = add_val;
5838   v->ext_dependent = ext_val;
5839   v->benefit = benefit;
5840   v->location = location;
5841   v->cant_derive = 0;
5842   v->combined_with = 0;
5843   v->maybe_multiple = maybe_multiple;
5844   v->maybe_dead = 0;
5845   v->derive_adjustment = 0;
5846   v->same = 0;
5847   v->ignore = 0;
5848   v->new_reg = 0;
5849   v->final_value = 0;
5850   v->same_insn = 0;
5851   v->auto_inc_opt = 0;
5852   v->unrolled = 0;
5853   v->shared = 0;
5854
5855   /* The v->always_computable field is used in update_giv_derive, to
5856      determine whether a giv can be used to derive another giv.  For a
5857      DEST_REG giv, INSN computes a new value for the giv, so its value
5858      isn't computable if INSN insn't executed every iteration.
5859      However, for a DEST_ADDR giv, INSN merely uses the value of the giv;
5860      it does not compute a new value.  Hence the value is always computable
5861      regardless of whether INSN is executed each iteration.  */
5862
5863   if (type == DEST_ADDR)
5864     v->always_computable = 1;
5865   else
5866     v->always_computable = ! not_every_iteration;
5867
5868   v->always_executed = ! not_every_iteration;
5869
5870   if (type == DEST_ADDR)
5871     {
5872       v->mode = GET_MODE (*location);
5873       v->lifetime = 1;
5874     }
5875   else /* type == DEST_REG */
5876     {
5877       v->mode = GET_MODE (SET_DEST (set));
5878
5879       v->lifetime = LOOP_REG_LIFETIME (loop, REGNO (dest_reg));
5880
5881       /* If the lifetime is zero, it means that this register is
5882          really a dead store.  So mark this as a giv that can be
5883          ignored.  This will not prevent the biv from being eliminated.  */
5884       if (v->lifetime == 0)
5885         v->ignore = 1;
5886
5887       REG_IV_TYPE (ivs, REGNO (dest_reg)) = GENERAL_INDUCT;
5888       REG_IV_INFO (ivs, REGNO (dest_reg)) = v;
5889     }
5890
5891   /* Add the giv to the class of givs computed from one biv.  */
5892
5893   bl = REG_IV_CLASS (ivs, REGNO (src_reg));
5894   if (bl)
5895     {
5896       v->next_iv = bl->giv;
5897       bl->giv = v;
5898       /* Don't count DEST_ADDR.  This is supposed to count the number of
5899          insns that calculate givs.  */
5900       if (type == DEST_REG)
5901         bl->giv_count++;
5902       bl->total_benefit += benefit;
5903     }
5904   else
5905     /* Fatal error, biv missing for this giv?  */
5906     abort ();
5907
5908   if (type == DEST_ADDR)
5909     {
5910       v->replaceable = 1;
5911       v->not_replaceable = 0;
5912     }
5913   else
5914     {
5915       /* The giv can be replaced outright by the reduced register only if all
5916          of the following conditions are true:
5917          - the insn that sets the giv is always executed on any iteration
5918            on which the giv is used at all
5919            (there are two ways to deduce this:
5920             either the insn is executed on every iteration,
5921             or all uses follow that insn in the same basic block),
5922          - the giv is not used outside the loop
5923          - no assignments to the biv occur during the giv's lifetime.  */
5924
5925       if (REGNO_FIRST_UID (REGNO (dest_reg)) == INSN_UID (insn)
5926           /* Previous line always fails if INSN was moved by loop opt.  */
5927           && REGNO_LAST_LUID (REGNO (dest_reg))
5928           < INSN_LUID (loop->end)
5929           && (! not_every_iteration
5930               || last_use_this_basic_block (dest_reg, insn)))
5931         {
5932           /* Now check that there are no assignments to the biv within the
5933              giv's lifetime.  This requires two separate checks.  */
5934
5935           /* Check each biv update, and fail if any are between the first
5936              and last use of the giv.
5937
5938              If this loop contains an inner loop that was unrolled, then
5939              the insn modifying the biv may have been emitted by the loop
5940              unrolling code, and hence does not have a valid luid.  Just
5941              mark the biv as not replaceable in this case.  It is not very
5942              useful as a biv, because it is used in two different loops.
5943              It is very unlikely that we would be able to optimize the giv
5944              using this biv anyways.  */
5945
5946           v->replaceable = 1;
5947           v->not_replaceable = 0;
5948           for (b = bl->biv; b; b = b->next_iv)
5949             {
5950               if (INSN_UID (b->insn) >= max_uid_for_loop
5951                   || ((INSN_LUID (b->insn)
5952                        >= REGNO_FIRST_LUID (REGNO (dest_reg)))
5953                       && (INSN_LUID (b->insn)
5954                           <= REGNO_LAST_LUID (REGNO (dest_reg)))))
5955                 {
5956                   v->replaceable = 0;
5957                   v->not_replaceable = 1;
5958                   break;
5959                 }
5960             }
5961
5962           /* If there are any backwards branches that go from after the
5963              biv update to before it, then this giv is not replaceable.  */
5964           if (v->replaceable)
5965             for (b = bl->biv; b; b = b->next_iv)
5966               if (back_branch_in_range_p (loop, b->insn))
5967                 {
5968                   v->replaceable = 0;
5969                   v->not_replaceable = 1;
5970                   break;
5971                 }
5972         }
5973       else
5974         {
5975           /* May still be replaceable, we don't have enough info here to
5976              decide.  */
5977           v->replaceable = 0;
5978           v->not_replaceable = 0;
5979         }
5980     }
5981
5982   /* Record whether the add_val contains a const_int, for later use by
5983      combine_givs.  */
5984   {
5985     rtx tem = add_val;
5986
5987     v->no_const_addval = 1;
5988     if (tem == const0_rtx)
5989       ;
5990     else if (CONSTANT_P (add_val))
5991       v->no_const_addval = 0;
5992     if (GET_CODE (tem) == PLUS)
5993       {
5994         while (1)
5995           {
5996             if (GET_CODE (XEXP (tem, 0)) == PLUS)
5997               tem = XEXP (tem, 0);
5998             else if (GET_CODE (XEXP (tem, 1)) == PLUS)
5999               tem = XEXP (tem, 1);
6000             else
6001               break;
6002           }
6003         if (CONSTANT_P (XEXP (tem, 1)))
6004           v->no_const_addval = 0;
6005       }
6006   }
6007
6008   if (loop_dump_stream)
6009     loop_giv_dump (v, loop_dump_stream, 0);
6010 }
6011
6012 /* All this does is determine whether a giv can be made replaceable because
6013    its final value can be calculated.  This code can not be part of record_giv
6014    above, because final_giv_value requires that the number of loop iterations
6015    be known, and that can not be accurately calculated until after all givs
6016    have been identified.  */
6017
6018 static void
6019 check_final_value (loop, v)
6020      const struct loop *loop;
6021      struct induction *v;
6022 {
6023   rtx final_value = 0;
6024
6025   /* DEST_ADDR givs will never reach here, because they are always marked
6026      replaceable above in record_giv.  */
6027
6028   /* The giv can be replaced outright by the reduced register only if all
6029      of the following conditions are true:
6030      - the insn that sets the giv is always executed on any iteration
6031        on which the giv is used at all
6032        (there are two ways to deduce this:
6033         either the insn is executed on every iteration,
6034         or all uses follow that insn in the same basic block),
6035      - its final value can be calculated (this condition is different
6036        than the one above in record_giv)
6037      - it's not used before the it's set
6038      - no assignments to the biv occur during the giv's lifetime.  */
6039
6040 #if 0
6041   /* This is only called now when replaceable is known to be false.  */
6042   /* Clear replaceable, so that it won't confuse final_giv_value.  */
6043   v->replaceable = 0;
6044 #endif
6045
6046   if ((final_value = final_giv_value (loop, v))
6047       && (v->always_executed
6048           || last_use_this_basic_block (v->dest_reg, v->insn)))
6049     {
6050       int biv_increment_seen = 0, before_giv_insn = 0;
6051       rtx p = v->insn;
6052       rtx last_giv_use;
6053
6054       v->replaceable = 1;
6055       v->not_replaceable = 0;
6056
6057       /* When trying to determine whether or not a biv increment occurs
6058          during the lifetime of the giv, we can ignore uses of the variable
6059          outside the loop because final_value is true.  Hence we can not
6060          use regno_last_uid and regno_first_uid as above in record_giv.  */
6061
6062       /* Search the loop to determine whether any assignments to the
6063          biv occur during the giv's lifetime.  Start with the insn
6064          that sets the giv, and search around the loop until we come
6065          back to that insn again.
6066
6067          Also fail if there is a jump within the giv's lifetime that jumps
6068          to somewhere outside the lifetime but still within the loop.  This
6069          catches spaghetti code where the execution order is not linear, and
6070          hence the above test fails.  Here we assume that the giv lifetime
6071          does not extend from one iteration of the loop to the next, so as
6072          to make the test easier.  Since the lifetime isn't known yet,
6073          this requires two loops.  See also record_giv above.  */
6074
6075       last_giv_use = v->insn;
6076
6077       while (1)
6078         {
6079           p = NEXT_INSN (p);
6080           if (p == loop->end)
6081             {
6082               before_giv_insn = 1;
6083               p = NEXT_INSN (loop->start);
6084             }
6085           if (p == v->insn)
6086             break;
6087
6088           if (GET_CODE (p) == INSN || GET_CODE (p) == JUMP_INSN
6089               || GET_CODE (p) == CALL_INSN)
6090             {
6091               /* It is possible for the BIV increment to use the GIV if we
6092                  have a cycle.  Thus we must be sure to check each insn for
6093                  both BIV and GIV uses, and we must check for BIV uses
6094                  first.  */
6095
6096               if (! biv_increment_seen
6097                   && reg_set_p (v->src_reg, PATTERN (p)))
6098                 biv_increment_seen = 1;
6099
6100               if (reg_mentioned_p (v->dest_reg, PATTERN (p)))
6101                 {
6102                   if (biv_increment_seen || before_giv_insn)
6103                     {
6104                       v->replaceable = 0;
6105                       v->not_replaceable = 1;
6106                       break;
6107                     }
6108                   last_giv_use = p;
6109                 }
6110             }
6111         }
6112
6113       /* Now that the lifetime of the giv is known, check for branches
6114          from within the lifetime to outside the lifetime if it is still
6115          replaceable.  */
6116
6117       if (v->replaceable)
6118         {
6119           p = v->insn;
6120           while (1)
6121             {
6122               p = NEXT_INSN (p);
6123               if (p == loop->end)
6124                 p = NEXT_INSN (loop->start);
6125               if (p == last_giv_use)
6126                 break;
6127
6128               if (GET_CODE (p) == JUMP_INSN && JUMP_LABEL (p)
6129                   && LABEL_NAME (JUMP_LABEL (p))
6130                   && ((loop_insn_first_p (JUMP_LABEL (p), v->insn)
6131                        && loop_insn_first_p (loop->start, JUMP_LABEL (p)))
6132                       || (loop_insn_first_p (last_giv_use, JUMP_LABEL (p))
6133                           && loop_insn_first_p (JUMP_LABEL (p), loop->end))))
6134                 {
6135                   v->replaceable = 0;
6136                   v->not_replaceable = 1;
6137
6138                   if (loop_dump_stream)
6139                     fprintf (loop_dump_stream,
6140                              "Found branch outside giv lifetime.\n");
6141
6142                   break;
6143                 }
6144             }
6145         }
6146
6147       /* If it is replaceable, then save the final value.  */
6148       if (v->replaceable)
6149         v->final_value = final_value;
6150     }
6151
6152   if (loop_dump_stream && v->replaceable)
6153     fprintf (loop_dump_stream, "Insn %d: giv reg %d final_value replaceable\n",
6154              INSN_UID (v->insn), REGNO (v->dest_reg));
6155 }
6156 \f
6157 /* Update the status of whether a giv can derive other givs.
6158
6159    We need to do something special if there is or may be an update to the biv
6160    between the time the giv is defined and the time it is used to derive
6161    another giv.
6162
6163    In addition, a giv that is only conditionally set is not allowed to
6164    derive another giv once a label has been passed.
6165
6166    The cases we look at are when a label or an update to a biv is passed.  */
6167
6168 static void
6169 update_giv_derive (loop, p)
6170      const struct loop *loop;
6171      rtx p;
6172 {
6173   struct loop_ivs *ivs = LOOP_IVS (loop);
6174   struct iv_class *bl;
6175   struct induction *biv, *giv;
6176   rtx tem;
6177   int dummy;
6178
6179   /* Search all IV classes, then all bivs, and finally all givs.
6180
6181      There are three cases we are concerned with.  First we have the situation
6182      of a giv that is only updated conditionally.  In that case, it may not
6183      derive any givs after a label is passed.
6184
6185      The second case is when a biv update occurs, or may occur, after the
6186      definition of a giv.  For certain biv updates (see below) that are
6187      known to occur between the giv definition and use, we can adjust the
6188      giv definition.  For others, or when the biv update is conditional,
6189      we must prevent the giv from deriving any other givs.  There are two
6190      sub-cases within this case.
6191
6192      If this is a label, we are concerned with any biv update that is done
6193      conditionally, since it may be done after the giv is defined followed by
6194      a branch here (actually, we need to pass both a jump and a label, but
6195      this extra tracking doesn't seem worth it).
6196
6197      If this is a jump, we are concerned about any biv update that may be
6198      executed multiple times.  We are actually only concerned about
6199      backward jumps, but it is probably not worth performing the test
6200      on the jump again here.
6201
6202      If this is a biv update, we must adjust the giv status to show that a
6203      subsequent biv update was performed.  If this adjustment cannot be done,
6204      the giv cannot derive further givs.  */
6205
6206   for (bl = ivs->list; bl; bl = bl->next)
6207     for (biv = bl->biv; biv; biv = biv->next_iv)
6208       if (GET_CODE (p) == CODE_LABEL || GET_CODE (p) == JUMP_INSN
6209           || biv->insn == p)
6210         {
6211           for (giv = bl->giv; giv; giv = giv->next_iv)
6212             {
6213               /* If cant_derive is already true, there is no point in
6214                  checking all of these conditions again.  */
6215               if (giv->cant_derive)
6216                 continue;
6217
6218               /* If this giv is conditionally set and we have passed a label,
6219                  it cannot derive anything.  */
6220               if (GET_CODE (p) == CODE_LABEL && ! giv->always_computable)
6221                 giv->cant_derive = 1;
6222
6223               /* Skip givs that have mult_val == 0, since
6224                  they are really invariants.  Also skip those that are
6225                  replaceable, since we know their lifetime doesn't contain
6226                  any biv update.  */
6227               else if (giv->mult_val == const0_rtx || giv->replaceable)
6228                 continue;
6229
6230               /* The only way we can allow this giv to derive another
6231                  is if this is a biv increment and we can form the product
6232                  of biv->add_val and giv->mult_val.  In this case, we will
6233                  be able to compute a compensation.  */
6234               else if (biv->insn == p)
6235                 {
6236                   rtx ext_val_dummy;
6237
6238                   tem = 0;
6239                   if (biv->mult_val == const1_rtx)
6240                     tem = simplify_giv_expr (loop,
6241                                              gen_rtx_MULT (giv->mode,
6242                                                            biv->add_val,
6243                                                            giv->mult_val),
6244                                              &ext_val_dummy, &dummy);
6245
6246                   if (tem && giv->derive_adjustment)
6247                     tem = simplify_giv_expr
6248                       (loop,
6249                        gen_rtx_PLUS (giv->mode, tem, giv->derive_adjustment),
6250                        &ext_val_dummy, &dummy);
6251
6252                   if (tem)
6253                     giv->derive_adjustment = tem;
6254                   else
6255                     giv->cant_derive = 1;
6256                 }
6257               else if ((GET_CODE (p) == CODE_LABEL && ! biv->always_computable)
6258                        || (GET_CODE (p) == JUMP_INSN && biv->maybe_multiple))
6259                 giv->cant_derive = 1;
6260             }
6261         }
6262 }
6263 \f
6264 /* Check whether an insn is an increment legitimate for a basic induction var.
6265    X is the source of insn P, or a part of it.
6266    MODE is the mode in which X should be interpreted.
6267
6268    DEST_REG is the putative biv, also the destination of the insn.
6269    We accept patterns of these forms:
6270      REG = REG + INVARIANT (includes REG = REG - CONSTANT)
6271      REG = INVARIANT + REG
6272
6273    If X is suitable, we return 1, set *MULT_VAL to CONST1_RTX,
6274    store the additive term into *INC_VAL, and store the place where
6275    we found the additive term into *LOCATION.
6276
6277    If X is an assignment of an invariant into DEST_REG, we set
6278    *MULT_VAL to CONST0_RTX, and store the invariant into *INC_VAL.
6279
6280    We also want to detect a BIV when it corresponds to a variable
6281    whose mode was promoted via PROMOTED_MODE.  In that case, an increment
6282    of the variable may be a PLUS that adds a SUBREG of that variable to
6283    an invariant and then sign- or zero-extends the result of the PLUS
6284    into the variable.
6285
6286    Most GIVs in such cases will be in the promoted mode, since that is the
6287    probably the natural computation mode (and almost certainly the mode
6288    used for addresses) on the machine.  So we view the pseudo-reg containing
6289    the variable as the BIV, as if it were simply incremented.
6290
6291    Note that treating the entire pseudo as a BIV will result in making
6292    simple increments to any GIVs based on it.  However, if the variable
6293    overflows in its declared mode but not its promoted mode, the result will
6294    be incorrect.  This is acceptable if the variable is signed, since
6295    overflows in such cases are undefined, but not if it is unsigned, since
6296    those overflows are defined.  So we only check for SIGN_EXTEND and
6297    not ZERO_EXTEND.
6298
6299    If we cannot find a biv, we return 0.  */
6300
6301 static int
6302 basic_induction_var (loop, x, mode, dest_reg, p, inc_val, mult_val, location)
6303      const struct loop *loop;
6304      rtx x;
6305      enum machine_mode mode;
6306      rtx dest_reg;
6307      rtx p;
6308      rtx *inc_val;
6309      rtx *mult_val;
6310      rtx **location;
6311 {
6312   enum rtx_code code;
6313   rtx *argp, arg;
6314   rtx insn, set = 0;
6315
6316   code = GET_CODE (x);
6317   *location = NULL;
6318   switch (code)
6319     {
6320     case PLUS:
6321       if (rtx_equal_p (XEXP (x, 0), dest_reg)
6322           || (GET_CODE (XEXP (x, 0)) == SUBREG
6323               && SUBREG_PROMOTED_VAR_P (XEXP (x, 0))
6324               && SUBREG_REG (XEXP (x, 0)) == dest_reg))
6325         {
6326           argp = &XEXP (x, 1);
6327         }
6328       else if (rtx_equal_p (XEXP (x, 1), dest_reg)
6329                || (GET_CODE (XEXP (x, 1)) == SUBREG
6330                    && SUBREG_PROMOTED_VAR_P (XEXP (x, 1))
6331                    && SUBREG_REG (XEXP (x, 1)) == dest_reg))
6332         {
6333           argp = &XEXP (x, 0);
6334         }
6335       else
6336         return 0;
6337
6338       arg = *argp;
6339       if (loop_invariant_p (loop, arg) != 1)
6340         return 0;
6341
6342       *inc_val = convert_modes (GET_MODE (dest_reg), GET_MODE (x), arg, 0);
6343       *mult_val = const1_rtx;
6344       *location = argp;
6345       return 1;
6346
6347     case SUBREG:
6348       /* If what's inside the SUBREG is a BIV, then the SUBREG.  This will
6349          handle addition of promoted variables.
6350          ??? The comment at the start of this function is wrong: promoted
6351          variable increments don't look like it says they do.  */
6352       return basic_induction_var (loop, SUBREG_REG (x),
6353                                   GET_MODE (SUBREG_REG (x)),
6354                                   dest_reg, p, inc_val, mult_val, location);
6355
6356     case REG:
6357       /* If this register is assigned in a previous insn, look at its
6358          source, but don't go outside the loop or past a label.  */
6359
6360       /* If this sets a register to itself, we would repeat any previous
6361          biv increment if we applied this strategy blindly.  */
6362       if (rtx_equal_p (dest_reg, x))
6363         return 0;
6364
6365       insn = p;
6366       while (1)
6367         {
6368           rtx dest;
6369           do
6370             {
6371               insn = PREV_INSN (insn);
6372             }
6373           while (insn && GET_CODE (insn) == NOTE
6374                  && NOTE_LINE_NUMBER (insn) != NOTE_INSN_LOOP_BEG);
6375
6376           if (!insn)
6377             break;
6378           set = single_set (insn);
6379           if (set == 0)
6380             break;
6381           dest = SET_DEST (set);
6382           if (dest == x
6383               || (GET_CODE (dest) == SUBREG
6384                   && (GET_MODE_SIZE (GET_MODE (dest)) <= UNITS_PER_WORD)
6385                   && (GET_MODE_CLASS (GET_MODE (dest)) == MODE_INT)
6386                   && SUBREG_REG (dest) == x))
6387             return basic_induction_var (loop, SET_SRC (set),
6388                                         (GET_MODE (SET_SRC (set)) == VOIDmode
6389                                          ? GET_MODE (x)
6390                                          : GET_MODE (SET_SRC (set))),
6391                                         dest_reg, insn,
6392                                         inc_val, mult_val, location);
6393
6394           while (GET_CODE (dest) == SIGN_EXTRACT
6395                  || GET_CODE (dest) == ZERO_EXTRACT
6396                  || GET_CODE (dest) == SUBREG
6397                  || GET_CODE (dest) == STRICT_LOW_PART)
6398             dest = XEXP (dest, 0);
6399           if (dest == x)
6400             break;
6401         }
6402       /* Fall through.  */
6403
6404       /* Can accept constant setting of biv only when inside inner most loop.
6405          Otherwise, a biv of an inner loop may be incorrectly recognized
6406          as a biv of the outer loop,
6407          causing code to be moved INTO the inner loop.  */
6408     case MEM:
6409       if (loop_invariant_p (loop, x) != 1)
6410         return 0;
6411     case CONST_INT:
6412     case SYMBOL_REF:
6413     case CONST:
6414       /* convert_modes aborts if we try to convert to or from CCmode, so just
6415          exclude that case.  It is very unlikely that a condition code value
6416          would be a useful iterator anyways.  convert_modes aborts if we try to
6417          convert a float mode to non-float or vice versa too.  */
6418       if (loop->level == 1
6419           && GET_MODE_CLASS (mode) == GET_MODE_CLASS (GET_MODE (dest_reg))
6420           && GET_MODE_CLASS (mode) != MODE_CC)
6421         {
6422           /* Possible bug here?  Perhaps we don't know the mode of X.  */
6423           *inc_val = convert_modes (GET_MODE (dest_reg), mode, x, 0);
6424           *mult_val = const0_rtx;
6425           return 1;
6426         }
6427       else
6428         return 0;
6429
6430     case SIGN_EXTEND:
6431       return basic_induction_var (loop, XEXP (x, 0), GET_MODE (XEXP (x, 0)),
6432                                   dest_reg, p, inc_val, mult_val, location);
6433
6434     case ASHIFTRT:
6435       /* Similar, since this can be a sign extension.  */
6436       for (insn = PREV_INSN (p);
6437            (insn && GET_CODE (insn) == NOTE
6438             && NOTE_LINE_NUMBER (insn) != NOTE_INSN_LOOP_BEG);
6439            insn = PREV_INSN (insn))
6440         ;
6441
6442       if (insn)
6443         set = single_set (insn);
6444
6445       if (! rtx_equal_p (dest_reg, XEXP (x, 0))
6446           && set && SET_DEST (set) == XEXP (x, 0)
6447           && GET_CODE (XEXP (x, 1)) == CONST_INT
6448           && INTVAL (XEXP (x, 1)) >= 0
6449           && GET_CODE (SET_SRC (set)) == ASHIFT
6450           && XEXP (x, 1) == XEXP (SET_SRC (set), 1))
6451         return basic_induction_var (loop, XEXP (SET_SRC (set), 0),
6452                                     GET_MODE (XEXP (x, 0)),
6453                                     dest_reg, insn, inc_val, mult_val,
6454                                     location);
6455       return 0;
6456
6457     default:
6458       return 0;
6459     }
6460 }
6461 \f
6462 /* A general induction variable (giv) is any quantity that is a linear
6463    function   of a basic induction variable,
6464    i.e. giv = biv * mult_val + add_val.
6465    The coefficients can be any loop invariant quantity.
6466    A giv need not be computed directly from the biv;
6467    it can be computed by way of other givs.  */
6468
6469 /* Determine whether X computes a giv.
6470    If it does, return a nonzero value
6471      which is the benefit from eliminating the computation of X;
6472    set *SRC_REG to the register of the biv that it is computed from;
6473    set *ADD_VAL and *MULT_VAL to the coefficients,
6474      such that the value of X is biv * mult + add;  */
6475
6476 static int
6477 general_induction_var (loop, x, src_reg, add_val, mult_val, ext_val,
6478                        is_addr, pbenefit, addr_mode)
6479      const struct loop *loop;
6480      rtx x;
6481      rtx *src_reg;
6482      rtx *add_val;
6483      rtx *mult_val;
6484      rtx *ext_val;
6485      int is_addr;
6486      int *pbenefit;
6487      enum machine_mode addr_mode;
6488 {
6489   struct loop_ivs *ivs = LOOP_IVS (loop);
6490   rtx orig_x = x;
6491
6492   /* If this is an invariant, forget it, it isn't a giv.  */
6493   if (loop_invariant_p (loop, x) == 1)
6494     return 0;
6495
6496   *pbenefit = 0;
6497   *ext_val = NULL_RTX;
6498   x = simplify_giv_expr (loop, x, ext_val, pbenefit);
6499   if (x == 0)
6500     return 0;
6501
6502   switch (GET_CODE (x))
6503     {
6504     case USE:
6505     case CONST_INT:
6506       /* Since this is now an invariant and wasn't before, it must be a giv
6507          with MULT_VAL == 0.  It doesn't matter which BIV we associate this
6508          with.  */
6509       *src_reg = ivs->list->biv->dest_reg;
6510       *mult_val = const0_rtx;
6511       *add_val = x;
6512       break;
6513
6514     case REG:
6515       /* This is equivalent to a BIV.  */
6516       *src_reg = x;
6517       *mult_val = const1_rtx;
6518       *add_val = const0_rtx;
6519       break;
6520
6521     case PLUS:
6522       /* Either (plus (biv) (invar)) or
6523          (plus (mult (biv) (invar_1)) (invar_2)).  */
6524       if (GET_CODE (XEXP (x, 0)) == MULT)
6525         {
6526           *src_reg = XEXP (XEXP (x, 0), 0);
6527           *mult_val = XEXP (XEXP (x, 0), 1);
6528         }
6529       else
6530         {
6531           *src_reg = XEXP (x, 0);
6532           *mult_val = const1_rtx;
6533         }
6534       *add_val = XEXP (x, 1);
6535       break;
6536
6537     case MULT:
6538       /* ADD_VAL is zero.  */
6539       *src_reg = XEXP (x, 0);
6540       *mult_val = XEXP (x, 1);
6541       *add_val = const0_rtx;
6542       break;
6543
6544     default:
6545       abort ();
6546     }
6547
6548   /* Remove any enclosing USE from ADD_VAL and MULT_VAL (there will be
6549      unless they are CONST_INT).  */
6550   if (GET_CODE (*add_val) == USE)
6551     *add_val = XEXP (*add_val, 0);
6552   if (GET_CODE (*mult_val) == USE)
6553     *mult_val = XEXP (*mult_val, 0);
6554
6555   if (is_addr)
6556     *pbenefit += address_cost (orig_x, addr_mode) - reg_address_cost;
6557   else
6558     *pbenefit += rtx_cost (orig_x, SET);
6559
6560   /* Always return true if this is a giv so it will be detected as such,
6561      even if the benefit is zero or negative.  This allows elimination
6562      of bivs that might otherwise not be eliminated.  */
6563   return 1;
6564 }
6565 \f
6566 /* Given an expression, X, try to form it as a linear function of a biv.
6567    We will canonicalize it to be of the form
6568         (plus (mult (BIV) (invar_1))
6569               (invar_2))
6570    with possible degeneracies.
6571
6572    The invariant expressions must each be of a form that can be used as a
6573    machine operand.  We surround then with a USE rtx (a hack, but localized
6574    and certainly unambiguous!) if not a CONST_INT for simplicity in this
6575    routine; it is the caller's responsibility to strip them.
6576
6577    If no such canonicalization is possible (i.e., two biv's are used or an
6578    expression that is neither invariant nor a biv or giv), this routine
6579    returns 0.
6580
6581    For a nonzero return, the result will have a code of CONST_INT, USE,
6582    REG (for a BIV), PLUS, or MULT.  No other codes will occur.
6583
6584    *BENEFIT will be incremented by the benefit of any sub-giv encountered.  */
6585
6586 static rtx sge_plus PARAMS ((enum machine_mode, rtx, rtx));
6587 static rtx sge_plus_constant PARAMS ((rtx, rtx));
6588
6589 static rtx
6590 simplify_giv_expr (loop, x, ext_val, benefit)
6591      const struct loop *loop;
6592      rtx x;
6593      rtx *ext_val;
6594      int *benefit;
6595 {
6596   struct loop_ivs *ivs = LOOP_IVS (loop);
6597   struct loop_regs *regs = LOOP_REGS (loop);
6598   enum machine_mode mode = GET_MODE (x);
6599   rtx arg0, arg1;
6600   rtx tem;
6601
6602   /* If this is not an integer mode, or if we cannot do arithmetic in this
6603      mode, this can't be a giv.  */
6604   if (mode != VOIDmode
6605       && (GET_MODE_CLASS (mode) != MODE_INT
6606           || GET_MODE_BITSIZE (mode) > HOST_BITS_PER_WIDE_INT))
6607     return NULL_RTX;
6608
6609   switch (GET_CODE (x))
6610     {
6611     case PLUS:
6612       arg0 = simplify_giv_expr (loop, XEXP (x, 0), ext_val, benefit);
6613       arg1 = simplify_giv_expr (loop, XEXP (x, 1), ext_val, benefit);
6614       if (arg0 == 0 || arg1 == 0)
6615         return NULL_RTX;
6616
6617       /* Put constant last, CONST_INT last if both constant.  */
6618       if ((GET_CODE (arg0) == USE
6619            || GET_CODE (arg0) == CONST_INT)
6620           && ! ((GET_CODE (arg0) == USE
6621                  && GET_CODE (arg1) == USE)
6622                 || GET_CODE (arg1) == CONST_INT))
6623         tem = arg0, arg0 = arg1, arg1 = tem;
6624
6625       /* Handle addition of zero, then addition of an invariant.  */
6626       if (arg1 == const0_rtx)
6627         return arg0;
6628       else if (GET_CODE (arg1) == CONST_INT || GET_CODE (arg1) == USE)
6629         switch (GET_CODE (arg0))
6630           {
6631           case CONST_INT:
6632           case USE:
6633             /* Adding two invariants must result in an invariant, so enclose
6634                addition operation inside a USE and return it.  */
6635             if (GET_CODE (arg0) == USE)
6636               arg0 = XEXP (arg0, 0);
6637             if (GET_CODE (arg1) == USE)
6638               arg1 = XEXP (arg1, 0);
6639
6640             if (GET_CODE (arg0) == CONST_INT)
6641               tem = arg0, arg0 = arg1, arg1 = tem;
6642             if (GET_CODE (arg1) == CONST_INT)
6643               tem = sge_plus_constant (arg0, arg1);
6644             else
6645               tem = sge_plus (mode, arg0, arg1);
6646
6647             if (GET_CODE (tem) != CONST_INT)
6648               tem = gen_rtx_USE (mode, tem);
6649             return tem;
6650
6651           case REG:
6652           case MULT:
6653             /* biv + invar or mult + invar.  Return sum.  */
6654             return gen_rtx_PLUS (mode, arg0, arg1);
6655
6656           case PLUS:
6657             /* (a + invar_1) + invar_2.  Associate.  */
6658             return
6659               simplify_giv_expr (loop,
6660                                  gen_rtx_PLUS (mode,
6661                                                XEXP (arg0, 0),
6662                                                gen_rtx_PLUS (mode,
6663                                                              XEXP (arg0, 1),
6664                                                              arg1)),
6665                                  ext_val, benefit);
6666
6667           default:
6668             abort ();
6669           }
6670
6671       /* Each argument must be either REG, PLUS, or MULT.  Convert REG to
6672          MULT to reduce cases.  */
6673       if (GET_CODE (arg0) == REG)
6674         arg0 = gen_rtx_MULT (mode, arg0, const1_rtx);
6675       if (GET_CODE (arg1) == REG)
6676         arg1 = gen_rtx_MULT (mode, arg1, const1_rtx);
6677
6678       /* Now have PLUS + PLUS, PLUS + MULT, MULT + PLUS, or MULT + MULT.
6679          Put a MULT first, leaving PLUS + PLUS, MULT + PLUS, or MULT + MULT.
6680          Recurse to associate the second PLUS.  */
6681       if (GET_CODE (arg1) == MULT)
6682         tem = arg0, arg0 = arg1, arg1 = tem;
6683
6684       if (GET_CODE (arg1) == PLUS)
6685         return
6686           simplify_giv_expr (loop,
6687                              gen_rtx_PLUS (mode,
6688                                            gen_rtx_PLUS (mode, arg0,
6689                                                          XEXP (arg1, 0)),
6690                                            XEXP (arg1, 1)),
6691                              ext_val, benefit);
6692
6693       /* Now must have MULT + MULT.  Distribute if same biv, else not giv.  */
6694       if (GET_CODE (arg0) != MULT || GET_CODE (arg1) != MULT)
6695         return NULL_RTX;
6696
6697       if (!rtx_equal_p (arg0, arg1))
6698         return NULL_RTX;
6699
6700       return simplify_giv_expr (loop,
6701                                 gen_rtx_MULT (mode,
6702                                               XEXP (arg0, 0),
6703                                               gen_rtx_PLUS (mode,
6704                                                             XEXP (arg0, 1),
6705                                                             XEXP (arg1, 1))),
6706                                 ext_val, benefit);
6707
6708     case MINUS:
6709       /* Handle "a - b" as "a + b * (-1)".  */
6710       return simplify_giv_expr (loop,
6711                                 gen_rtx_PLUS (mode,
6712                                               XEXP (x, 0),
6713                                               gen_rtx_MULT (mode,
6714                                                             XEXP (x, 1),
6715                                                             constm1_rtx)),
6716                                 ext_val, benefit);
6717
6718     case MULT:
6719       arg0 = simplify_giv_expr (loop, XEXP (x, 0), ext_val, benefit);
6720       arg1 = simplify_giv_expr (loop, XEXP (x, 1), ext_val, benefit);
6721       if (arg0 == 0 || arg1 == 0)
6722         return NULL_RTX;
6723
6724       /* Put constant last, CONST_INT last if both constant.  */
6725       if ((GET_CODE (arg0) == USE || GET_CODE (arg0) == CONST_INT)
6726           && GET_CODE (arg1) != CONST_INT)
6727         tem = arg0, arg0 = arg1, arg1 = tem;
6728
6729       /* If second argument is not now constant, not giv.  */
6730       if (GET_CODE (arg1) != USE && GET_CODE (arg1) != CONST_INT)
6731         return NULL_RTX;
6732
6733       /* Handle multiply by 0 or 1.  */
6734       if (arg1 == const0_rtx)
6735         return const0_rtx;
6736
6737       else if (arg1 == const1_rtx)
6738         return arg0;
6739
6740       switch (GET_CODE (arg0))
6741         {
6742         case REG:
6743           /* biv * invar.  Done.  */
6744           return gen_rtx_MULT (mode, arg0, arg1);
6745
6746         case CONST_INT:
6747           /* Product of two constants.  */
6748           return GEN_INT (INTVAL (arg0) * INTVAL (arg1));
6749
6750         case USE:
6751           /* invar * invar is a giv, but attempt to simplify it somehow.  */
6752           if (GET_CODE (arg1) != CONST_INT)
6753             return NULL_RTX;
6754
6755           arg0 = XEXP (arg0, 0);
6756           if (GET_CODE (arg0) == MULT)
6757             {
6758               /* (invar_0 * invar_1) * invar_2.  Associate.  */
6759               return simplify_giv_expr (loop,
6760                                         gen_rtx_MULT (mode,
6761                                                       XEXP (arg0, 0),
6762                                                       gen_rtx_MULT (mode,
6763                                                                     XEXP (arg0,
6764                                                                           1),
6765                                                                     arg1)),
6766                                         ext_val, benefit);
6767             }
6768           /* Propagate the MULT expressions to the intermost nodes.  */
6769           else if (GET_CODE (arg0) == PLUS)
6770             {
6771               /* (invar_0 + invar_1) * invar_2.  Distribute.  */
6772               return simplify_giv_expr (loop,
6773                                         gen_rtx_PLUS (mode,
6774                                                       gen_rtx_MULT (mode,
6775                                                                     XEXP (arg0,
6776                                                                           0),
6777                                                                     arg1),
6778                                                       gen_rtx_MULT (mode,
6779                                                                     XEXP (arg0,
6780                                                                           1),
6781                                                                     arg1)),
6782                                         ext_val, benefit);
6783             }
6784           return gen_rtx_USE (mode, gen_rtx_MULT (mode, arg0, arg1));
6785
6786         case MULT:
6787           /* (a * invar_1) * invar_2.  Associate.  */
6788           return simplify_giv_expr (loop,
6789                                     gen_rtx_MULT (mode,
6790                                                   XEXP (arg0, 0),
6791                                                   gen_rtx_MULT (mode,
6792                                                                 XEXP (arg0, 1),
6793                                                                 arg1)),
6794                                     ext_val, benefit);
6795
6796         case PLUS:
6797           /* (a + invar_1) * invar_2.  Distribute.  */
6798           return simplify_giv_expr (loop,
6799                                     gen_rtx_PLUS (mode,
6800                                                   gen_rtx_MULT (mode,
6801                                                                 XEXP (arg0, 0),
6802                                                                 arg1),
6803                                                   gen_rtx_MULT (mode,
6804                                                                 XEXP (arg0, 1),
6805                                                                 arg1)),
6806                                     ext_val, benefit);
6807
6808         default:
6809           abort ();
6810         }
6811
6812     case ASHIFT:
6813       /* Shift by constant is multiply by power of two.  */
6814       if (GET_CODE (XEXP (x, 1)) != CONST_INT)
6815         return 0;
6816
6817       return
6818         simplify_giv_expr (loop,
6819                            gen_rtx_MULT (mode,
6820                                          XEXP (x, 0),
6821                                          GEN_INT ((HOST_WIDE_INT) 1
6822                                                   << INTVAL (XEXP (x, 1)))),
6823                            ext_val, benefit);
6824
6825     case NEG:
6826       /* "-a" is "a * (-1)" */
6827       return simplify_giv_expr (loop,
6828                                 gen_rtx_MULT (mode, XEXP (x, 0), constm1_rtx),
6829                                 ext_val, benefit);
6830
6831     case NOT:
6832       /* "~a" is "-a - 1". Silly, but easy.  */
6833       return simplify_giv_expr (loop,
6834                                 gen_rtx_MINUS (mode,
6835                                                gen_rtx_NEG (mode, XEXP (x, 0)),
6836                                                const1_rtx),
6837                                 ext_val, benefit);
6838
6839     case USE:
6840       /* Already in proper form for invariant.  */
6841       return x;
6842
6843     case SIGN_EXTEND:
6844     case ZERO_EXTEND:
6845     case TRUNCATE:
6846       /* Conditionally recognize extensions of simple IVs.  After we've
6847          computed loop traversal counts and verified the range of the
6848          source IV, we'll reevaluate this as a GIV.  */
6849       if (*ext_val == NULL_RTX)
6850         {
6851           arg0 = simplify_giv_expr (loop, XEXP (x, 0), ext_val, benefit);
6852           if (arg0 && *ext_val == NULL_RTX && GET_CODE (arg0) == REG)
6853             {
6854               *ext_val = gen_rtx_fmt_e (GET_CODE (x), mode, arg0);
6855               return arg0;
6856             }
6857         }
6858       goto do_default;
6859
6860     case REG:
6861       /* If this is a new register, we can't deal with it.  */
6862       if (REGNO (x) >= max_reg_before_loop)
6863         return 0;
6864
6865       /* Check for biv or giv.  */
6866       switch (REG_IV_TYPE (ivs, REGNO (x)))
6867         {
6868         case BASIC_INDUCT:
6869           return x;
6870         case GENERAL_INDUCT:
6871           {
6872             struct induction *v = REG_IV_INFO (ivs, REGNO (x));
6873
6874             /* Form expression from giv and add benefit.  Ensure this giv
6875                can derive another and subtract any needed adjustment if so.  */
6876
6877             /* Increasing the benefit here is risky.  The only case in which it
6878                is arguably correct is if this is the only use of V.  In other
6879                cases, this will artificially inflate the benefit of the current
6880                giv, and lead to suboptimal code.  Thus, it is disabled, since
6881                potentially not reducing an only marginally beneficial giv is
6882                less harmful than reducing many givs that are not really
6883                beneficial.  */
6884             {
6885               rtx single_use = regs->array[REGNO (x)].single_usage;
6886               if (single_use && single_use != const0_rtx)
6887                 *benefit += v->benefit;
6888             }
6889
6890             if (v->cant_derive)
6891               return 0;
6892
6893             tem = gen_rtx_PLUS (mode, gen_rtx_MULT (mode,
6894                                                     v->src_reg, v->mult_val),
6895                                 v->add_val);
6896
6897             if (v->derive_adjustment)
6898               tem = gen_rtx_MINUS (mode, tem, v->derive_adjustment);
6899             arg0 = simplify_giv_expr (loop, tem, ext_val, benefit);
6900             if (*ext_val)
6901               {
6902                 if (!v->ext_dependent)
6903                   return arg0;
6904               }
6905             else
6906               {
6907                 *ext_val = v->ext_dependent;
6908                 return arg0;
6909               }
6910             return 0;
6911           }
6912
6913         default:
6914         do_default:
6915           /* If it isn't an induction variable, and it is invariant, we
6916              may be able to simplify things further by looking through
6917              the bits we just moved outside the loop.  */
6918           if (loop_invariant_p (loop, x) == 1)
6919             {
6920               struct movable *m;
6921               struct loop_movables *movables = LOOP_MOVABLES (loop);
6922
6923               for (m = movables->head; m; m = m->next)
6924                 if (rtx_equal_p (x, m->set_dest))
6925                   {
6926                     /* Ok, we found a match.  Substitute and simplify.  */
6927
6928                     /* If we match another movable, we must use that, as
6929                        this one is going away.  */
6930                     if (m->match)
6931                       return simplify_giv_expr (loop, m->match->set_dest,
6932                                                 ext_val, benefit);
6933
6934                     /* If consec is nonzero, this is a member of a group of
6935                        instructions that were moved together.  We handle this
6936                        case only to the point of seeking to the last insn and
6937                        looking for a REG_EQUAL.  Fail if we don't find one.  */
6938                     if (m->consec != 0)
6939                       {
6940                         int i = m->consec;
6941                         tem = m->insn;
6942                         do
6943                           {
6944                             tem = NEXT_INSN (tem);
6945                           }
6946                         while (--i > 0);
6947
6948                         tem = find_reg_note (tem, REG_EQUAL, NULL_RTX);
6949                         if (tem)
6950                           tem = XEXP (tem, 0);
6951                       }
6952                     else
6953                       {
6954                         tem = single_set (m->insn);
6955                         if (tem)
6956                           tem = SET_SRC (tem);
6957                       }
6958
6959                     if (tem)
6960                       {
6961                         /* What we are most interested in is pointer
6962                            arithmetic on invariants -- only take
6963                            patterns we may be able to do something with.  */
6964                         if (GET_CODE (tem) == PLUS
6965                             || GET_CODE (tem) == MULT
6966                             || GET_CODE (tem) == ASHIFT
6967                             || GET_CODE (tem) == CONST_INT
6968                             || GET_CODE (tem) == SYMBOL_REF)
6969                           {
6970                             tem = simplify_giv_expr (loop, tem, ext_val,
6971                                                      benefit);
6972                             if (tem)
6973                               return tem;
6974                           }
6975                         else if (GET_CODE (tem) == CONST
6976                                  && GET_CODE (XEXP (tem, 0)) == PLUS
6977                                  && GET_CODE (XEXP (XEXP (tem, 0), 0)) == SYMBOL_REF
6978                                  && GET_CODE (XEXP (XEXP (tem, 0), 1)) == CONST_INT)
6979                           {
6980                             tem = simplify_giv_expr (loop, XEXP (tem, 0),
6981                                                      ext_val, benefit);
6982                             if (tem)
6983                               return tem;
6984                           }
6985                       }
6986                     break;
6987                   }
6988             }
6989           break;
6990         }
6991
6992       /* Fall through to general case.  */
6993     default:
6994       /* If invariant, return as USE (unless CONST_INT).
6995          Otherwise, not giv.  */
6996       if (GET_CODE (x) == USE)
6997         x = XEXP (x, 0);
6998
6999       if (loop_invariant_p (loop, x) == 1)
7000         {
7001           if (GET_CODE (x) == CONST_INT)
7002             return x;
7003           if (GET_CODE (x) == CONST
7004               && GET_CODE (XEXP (x, 0)) == PLUS
7005               && GET_CODE (XEXP (XEXP (x, 0), 0)) == SYMBOL_REF
7006               && GET_CODE (XEXP (XEXP (x, 0), 1)) == CONST_INT)
7007             x = XEXP (x, 0);
7008           return gen_rtx_USE (mode, x);
7009         }
7010       else
7011         return 0;
7012     }
7013 }
7014
7015 /* This routine folds invariants such that there is only ever one
7016    CONST_INT in the summation.  It is only used by simplify_giv_expr.  */
7017
7018 static rtx
7019 sge_plus_constant (x, c)
7020      rtx x, c;
7021 {
7022   if (GET_CODE (x) == CONST_INT)
7023     return GEN_INT (INTVAL (x) + INTVAL (c));
7024   else if (GET_CODE (x) != PLUS)
7025     return gen_rtx_PLUS (GET_MODE (x), x, c);
7026   else if (GET_CODE (XEXP (x, 1)) == CONST_INT)
7027     {
7028       return gen_rtx_PLUS (GET_MODE (x), XEXP (x, 0),
7029                            GEN_INT (INTVAL (XEXP (x, 1)) + INTVAL (c)));
7030     }
7031   else if (GET_CODE (XEXP (x, 0)) == PLUS
7032            || GET_CODE (XEXP (x, 1)) != PLUS)
7033     {
7034       return gen_rtx_PLUS (GET_MODE (x),
7035                            sge_plus_constant (XEXP (x, 0), c), XEXP (x, 1));
7036     }
7037   else
7038     {
7039       return gen_rtx_PLUS (GET_MODE (x),
7040                            sge_plus_constant (XEXP (x, 1), c), XEXP (x, 0));
7041     }
7042 }
7043
7044 static rtx
7045 sge_plus (mode, x, y)
7046      enum machine_mode mode;
7047      rtx x, y;
7048 {
7049   while (GET_CODE (y) == PLUS)
7050     {
7051       rtx a = XEXP (y, 0);
7052       if (GET_CODE (a) == CONST_INT)
7053         x = sge_plus_constant (x, a);
7054       else
7055         x = gen_rtx_PLUS (mode, x, a);
7056       y = XEXP (y, 1);
7057     }
7058   if (GET_CODE (y) == CONST_INT)
7059     x = sge_plus_constant (x, y);
7060   else
7061     x = gen_rtx_PLUS (mode, x, y);
7062   return x;
7063 }
7064 \f
7065 /* Help detect a giv that is calculated by several consecutive insns;
7066    for example,
7067       giv = biv * M
7068       giv = giv + A
7069    The caller has already identified the first insn P as having a giv as dest;
7070    we check that all other insns that set the same register follow
7071    immediately after P, that they alter nothing else,
7072    and that the result of the last is still a giv.
7073
7074    The value is 0 if the reg set in P is not really a giv.
7075    Otherwise, the value is the amount gained by eliminating
7076    all the consecutive insns that compute the value.
7077
7078    FIRST_BENEFIT is the amount gained by eliminating the first insn, P.
7079    SRC_REG is the reg of the biv; DEST_REG is the reg of the giv.
7080
7081    The coefficients of the ultimate giv value are stored in
7082    *MULT_VAL and *ADD_VAL.  */
7083
7084 static int
7085 consec_sets_giv (loop, first_benefit, p, src_reg, dest_reg,
7086                  add_val, mult_val, ext_val, last_consec_insn)
7087      const struct loop *loop;
7088      int first_benefit;
7089      rtx p;
7090      rtx src_reg;
7091      rtx dest_reg;
7092      rtx *add_val;
7093      rtx *mult_val;
7094      rtx *ext_val;
7095      rtx *last_consec_insn;
7096 {
7097   struct loop_ivs *ivs = LOOP_IVS (loop);
7098   struct loop_regs *regs = LOOP_REGS (loop);
7099   int count;
7100   enum rtx_code code;
7101   int benefit;
7102   rtx temp;
7103   rtx set;
7104
7105   /* Indicate that this is a giv so that we can update the value produced in
7106      each insn of the multi-insn sequence.
7107
7108      This induction structure will be used only by the call to
7109      general_induction_var below, so we can allocate it on our stack.
7110      If this is a giv, our caller will replace the induct var entry with
7111      a new induction structure.  */
7112   struct induction *v;
7113
7114   if (REG_IV_TYPE (ivs, REGNO (dest_reg)) != UNKNOWN_INDUCT)
7115     return 0;
7116
7117   v = (struct induction *) alloca (sizeof (struct induction));
7118   v->src_reg = src_reg;
7119   v->mult_val = *mult_val;
7120   v->add_val = *add_val;
7121   v->benefit = first_benefit;
7122   v->cant_derive = 0;
7123   v->derive_adjustment = 0;
7124   v->ext_dependent = NULL_RTX;
7125
7126   REG_IV_TYPE (ivs, REGNO (dest_reg)) = GENERAL_INDUCT;
7127   REG_IV_INFO (ivs, REGNO (dest_reg)) = v;
7128
7129   count = regs->array[REGNO (dest_reg)].n_times_set - 1;
7130
7131   while (count > 0)
7132     {
7133       p = NEXT_INSN (p);
7134       code = GET_CODE (p);
7135
7136       /* If libcall, skip to end of call sequence.  */
7137       if (code == INSN && (temp = find_reg_note (p, REG_LIBCALL, NULL_RTX)))
7138         p = XEXP (temp, 0);
7139
7140       if (code == INSN
7141           && (set = single_set (p))
7142           && GET_CODE (SET_DEST (set)) == REG
7143           && SET_DEST (set) == dest_reg
7144           && (general_induction_var (loop, SET_SRC (set), &src_reg,
7145                                      add_val, mult_val, ext_val, 0,
7146                                      &benefit, VOIDmode)
7147               /* Giv created by equivalent expression.  */
7148               || ((temp = find_reg_note (p, REG_EQUAL, NULL_RTX))
7149                   && general_induction_var (loop, XEXP (temp, 0), &src_reg,
7150                                             add_val, mult_val, ext_val, 0,
7151                                             &benefit, VOIDmode)))
7152           && src_reg == v->src_reg)
7153         {
7154           if (find_reg_note (p, REG_RETVAL, NULL_RTX))
7155             benefit += libcall_benefit (p);
7156
7157           count--;
7158           v->mult_val = *mult_val;
7159           v->add_val = *add_val;
7160           v->benefit += benefit;
7161         }
7162       else if (code != NOTE)
7163         {
7164           /* Allow insns that set something other than this giv to a
7165              constant.  Such insns are needed on machines which cannot
7166              include long constants and should not disqualify a giv.  */
7167           if (code == INSN
7168               && (set = single_set (p))
7169               && SET_DEST (set) != dest_reg
7170               && CONSTANT_P (SET_SRC (set)))
7171             continue;
7172
7173           REG_IV_TYPE (ivs, REGNO (dest_reg)) = UNKNOWN_INDUCT;
7174           return 0;
7175         }
7176     }
7177
7178   REG_IV_TYPE (ivs, REGNO (dest_reg)) = UNKNOWN_INDUCT;
7179   *last_consec_insn = p;
7180   return v->benefit;
7181 }
7182 \f
7183 /* Return an rtx, if any, that expresses giv G2 as a function of the register
7184    represented by G1.  If no such expression can be found, or it is clear that
7185    it cannot possibly be a valid address, 0 is returned.
7186
7187    To perform the computation, we note that
7188         G1 = x * v + a          and
7189         G2 = y * v + b
7190    where `v' is the biv.
7191
7192    So G2 = (y/b) * G1 + (b - a*y/x).
7193
7194    Note that MULT = y/x.
7195
7196    Update: A and B are now allowed to be additive expressions such that
7197    B contains all variables in A.  That is, computing B-A will not require
7198    subtracting variables.  */
7199
7200 static rtx
7201 express_from_1 (a, b, mult)
7202      rtx a, b, mult;
7203 {
7204   /* If MULT is zero, then A*MULT is zero, and our expression is B.  */
7205
7206   if (mult == const0_rtx)
7207     return b;
7208
7209   /* If MULT is not 1, we cannot handle A with non-constants, since we
7210      would then be required to subtract multiples of the registers in A.
7211      This is theoretically possible, and may even apply to some Fortran
7212      constructs, but it is a lot of work and we do not attempt it here.  */
7213
7214   if (mult != const1_rtx && GET_CODE (a) != CONST_INT)
7215     return NULL_RTX;
7216
7217   /* In general these structures are sorted top to bottom (down the PLUS
7218      chain), but not left to right across the PLUS.  If B is a higher
7219      order giv than A, we can strip one level and recurse.  If A is higher
7220      order, we'll eventually bail out, but won't know that until the end.
7221      If they are the same, we'll strip one level around this loop.  */
7222
7223   while (GET_CODE (a) == PLUS && GET_CODE (b) == PLUS)
7224     {
7225       rtx ra, rb, oa, ob, tmp;
7226
7227       ra = XEXP (a, 0), oa = XEXP (a, 1);
7228       if (GET_CODE (ra) == PLUS)
7229         tmp = ra, ra = oa, oa = tmp;
7230
7231       rb = XEXP (b, 0), ob = XEXP (b, 1);
7232       if (GET_CODE (rb) == PLUS)
7233         tmp = rb, rb = ob, ob = tmp;
7234
7235       if (rtx_equal_p (ra, rb))
7236         /* We matched: remove one reg completely.  */
7237         a = oa, b = ob;
7238       else if (GET_CODE (ob) != PLUS && rtx_equal_p (ra, ob))
7239         /* An alternate match.  */
7240         a = oa, b = rb;
7241       else if (GET_CODE (oa) != PLUS && rtx_equal_p (oa, rb))
7242         /* An alternate match.  */
7243         a = ra, b = ob;
7244       else
7245         {
7246           /* Indicates an extra register in B.  Strip one level from B and
7247              recurse, hoping B was the higher order expression.  */
7248           ob = express_from_1 (a, ob, mult);
7249           if (ob == NULL_RTX)
7250             return NULL_RTX;
7251           return gen_rtx_PLUS (GET_MODE (b), rb, ob);
7252         }
7253     }
7254
7255   /* Here we are at the last level of A, go through the cases hoping to
7256      get rid of everything but a constant.  */
7257
7258   if (GET_CODE (a) == PLUS)
7259     {
7260       rtx ra, oa;
7261
7262       ra = XEXP (a, 0), oa = XEXP (a, 1);
7263       if (rtx_equal_p (oa, b))
7264         oa = ra;
7265       else if (!rtx_equal_p (ra, b))
7266         return NULL_RTX;
7267
7268       if (GET_CODE (oa) != CONST_INT)
7269         return NULL_RTX;
7270
7271       return GEN_INT (-INTVAL (oa) * INTVAL (mult));
7272     }
7273   else if (GET_CODE (a) == CONST_INT)
7274     {
7275       return plus_constant (b, -INTVAL (a) * INTVAL (mult));
7276     }
7277   else if (CONSTANT_P (a))
7278     {
7279       enum machine_mode mode_a = GET_MODE (a);
7280       enum machine_mode mode_b = GET_MODE (b);
7281       enum machine_mode mode = mode_b == VOIDmode ? mode_a : mode_b;
7282       return simplify_gen_binary (MINUS, mode, b, a);
7283     }
7284   else if (GET_CODE (b) == PLUS)
7285     {
7286       if (rtx_equal_p (a, XEXP (b, 0)))
7287         return XEXP (b, 1);
7288       else if (rtx_equal_p (a, XEXP (b, 1)))
7289         return XEXP (b, 0);
7290       else
7291         return NULL_RTX;
7292     }
7293   else if (rtx_equal_p (a, b))
7294     return const0_rtx;
7295
7296   return NULL_RTX;
7297 }
7298
7299 rtx
7300 express_from (g1, g2)
7301      struct induction *g1, *g2;
7302 {
7303   rtx mult, add;
7304
7305   /* The value that G1 will be multiplied by must be a constant integer.  Also,
7306      the only chance we have of getting a valid address is if b*c/a (see above
7307      for notation) is also an integer.  */
7308   if (GET_CODE (g1->mult_val) == CONST_INT
7309       && GET_CODE (g2->mult_val) == CONST_INT)
7310     {
7311       if (g1->mult_val == const0_rtx
7312           || INTVAL (g2->mult_val) % INTVAL (g1->mult_val) != 0)
7313         return NULL_RTX;
7314       mult = GEN_INT (INTVAL (g2->mult_val) / INTVAL (g1->mult_val));
7315     }
7316   else if (rtx_equal_p (g1->mult_val, g2->mult_val))
7317     mult = const1_rtx;
7318   else
7319     {
7320       /* ??? Find out if the one is a multiple of the other?  */
7321       return NULL_RTX;
7322     }
7323
7324   add = express_from_1 (g1->add_val, g2->add_val, mult);
7325   if (add == NULL_RTX)
7326     {
7327       /* Failed.  If we've got a multiplication factor between G1 and G2,
7328          scale G1's addend and try again.  */
7329       if (INTVAL (mult) > 1)
7330         {
7331           rtx g1_add_val = g1->add_val;
7332           if (GET_CODE (g1_add_val) == MULT
7333               && GET_CODE (XEXP (g1_add_val, 1)) == CONST_INT)
7334             {
7335               HOST_WIDE_INT m;
7336               m = INTVAL (mult) * INTVAL (XEXP (g1_add_val, 1));
7337               g1_add_val = gen_rtx_MULT (GET_MODE (g1_add_val),
7338                                          XEXP (g1_add_val, 0), GEN_INT (m));
7339             }
7340           else
7341             {
7342               g1_add_val = gen_rtx_MULT (GET_MODE (g1_add_val), g1_add_val,
7343                                          mult);
7344             }
7345
7346           add = express_from_1 (g1_add_val, g2->add_val, const1_rtx);
7347         }
7348     }
7349   if (add == NULL_RTX)
7350     return NULL_RTX;
7351
7352   /* Form simplified final result.  */
7353   if (mult == const0_rtx)
7354     return add;
7355   else if (mult == const1_rtx)
7356     mult = g1->dest_reg;
7357   else
7358     mult = gen_rtx_MULT (g2->mode, g1->dest_reg, mult);
7359
7360   if (add == const0_rtx)
7361     return mult;
7362   else
7363     {
7364       if (GET_CODE (add) == PLUS
7365           && CONSTANT_P (XEXP (add, 1)))
7366         {
7367           rtx tem = XEXP (add, 1);
7368           mult = gen_rtx_PLUS (g2->mode, mult, XEXP (add, 0));
7369           add = tem;
7370         }
7371
7372       return gen_rtx_PLUS (g2->mode, mult, add);
7373     }
7374 }
7375 \f
7376 /* Return an rtx, if any, that expresses giv G2 as a function of the register
7377    represented by G1.  This indicates that G2 should be combined with G1 and
7378    that G2 can use (either directly or via an address expression) a register
7379    used to represent G1.  */
7380
7381 static rtx
7382 combine_givs_p (g1, g2)
7383      struct induction *g1, *g2;
7384 {
7385   rtx comb, ret;
7386
7387   /* With the introduction of ext dependent givs, we must care for modes.
7388      G2 must not use a wider mode than G1.  */
7389   if (GET_MODE_SIZE (g1->mode) < GET_MODE_SIZE (g2->mode))
7390     return NULL_RTX;
7391
7392   ret = comb = express_from (g1, g2);
7393   if (comb == NULL_RTX)
7394     return NULL_RTX;
7395   if (g1->mode != g2->mode)
7396     ret = gen_lowpart (g2->mode, comb);
7397
7398   /* If these givs are identical, they can be combined.  We use the results
7399      of express_from because the addends are not in a canonical form, so
7400      rtx_equal_p is a weaker test.  */
7401   /* But don't combine a DEST_REG giv with a DEST_ADDR giv; we want the
7402      combination to be the other way round.  */
7403   if (comb == g1->dest_reg
7404       && (g1->giv_type == DEST_REG || g2->giv_type == DEST_ADDR))
7405     {
7406       return ret;
7407     }
7408
7409   /* If G2 can be expressed as a function of G1 and that function is valid
7410      as an address and no more expensive than using a register for G2,
7411      the expression of G2 in terms of G1 can be used.  */
7412   if (ret != NULL_RTX
7413       && g2->giv_type == DEST_ADDR
7414       && memory_address_p (GET_MODE (g2->mem), ret))
7415     return ret;
7416
7417   return NULL_RTX;
7418 }
7419 \f
7420 /* Check each extension dependent giv in this class to see if its
7421    root biv is safe from wrapping in the interior mode, which would
7422    make the giv illegal.  */
7423
7424 static void
7425 check_ext_dependent_givs (bl, loop_info)
7426      struct iv_class *bl;
7427      struct loop_info *loop_info;
7428 {
7429   int ze_ok = 0, se_ok = 0, info_ok = 0;
7430   enum machine_mode biv_mode = GET_MODE (bl->biv->src_reg);
7431   HOST_WIDE_INT start_val;
7432   unsigned HOST_WIDE_INT u_end_val = 0;
7433   unsigned HOST_WIDE_INT u_start_val = 0;
7434   rtx incr = pc_rtx;
7435   struct induction *v;
7436
7437   /* Make sure the iteration data is available.  We must have
7438      constants in order to be certain of no overflow.  */
7439   /* ??? An unknown iteration count with an increment of +-1
7440      combined with friendly exit tests of against an invariant
7441      value is also amenable to optimization.  Not implemented.  */
7442   if (loop_info->n_iterations > 0
7443       && bl->initial_value
7444       && GET_CODE (bl->initial_value) == CONST_INT
7445       && (incr = biv_total_increment (bl))
7446       && GET_CODE (incr) == CONST_INT
7447       /* Make sure the host can represent the arithmetic.  */
7448       && HOST_BITS_PER_WIDE_INT >= GET_MODE_BITSIZE (biv_mode))
7449     {
7450       unsigned HOST_WIDE_INT abs_incr, total_incr;
7451       HOST_WIDE_INT s_end_val;
7452       int neg_incr;
7453
7454       info_ok = 1;
7455       start_val = INTVAL (bl->initial_value);
7456       u_start_val = start_val;
7457
7458       neg_incr = 0, abs_incr = INTVAL (incr);
7459       if (INTVAL (incr) < 0)
7460         neg_incr = 1, abs_incr = -abs_incr;
7461       total_incr = abs_incr * loop_info->n_iterations;
7462
7463       /* Check for host arithmetic overflow.  */
7464       if (total_incr / loop_info->n_iterations == abs_incr)
7465         {
7466           unsigned HOST_WIDE_INT u_max;
7467           HOST_WIDE_INT s_max;
7468
7469           u_end_val = start_val + (neg_incr ? -total_incr : total_incr);
7470           s_end_val = u_end_val;
7471           u_max = GET_MODE_MASK (biv_mode);
7472           s_max = u_max >> 1;
7473
7474           /* Check zero extension of biv ok.  */
7475           if (start_val >= 0
7476               /* Check for host arithmetic overflow.  */
7477               && (neg_incr
7478                   ? u_end_val < u_start_val
7479                   : u_end_val > u_start_val)
7480               /* Check for target arithmetic overflow.  */
7481               && (neg_incr
7482                   ? 1 /* taken care of with host overflow */
7483                   : u_end_val <= u_max))
7484             {
7485               ze_ok = 1;
7486             }
7487
7488           /* Check sign extension of biv ok.  */
7489           /* ??? While it is true that overflow with signed and pointer
7490              arithmetic is undefined, I fear too many programmers don't
7491              keep this fact in mind -- myself included on occasion.
7492              So leave alone with the signed overflow optimizations.  */
7493           if (start_val >= -s_max - 1
7494               /* Check for host arithmetic overflow.  */
7495               && (neg_incr
7496                   ? s_end_val < start_val
7497                   : s_end_val > start_val)
7498               /* Check for target arithmetic overflow.  */
7499               && (neg_incr
7500                   ? s_end_val >= -s_max - 1
7501                   : s_end_val <= s_max))
7502             {
7503               se_ok = 1;
7504             }
7505         }
7506     }
7507
7508   /* Invalidate givs that fail the tests.  */
7509   for (v = bl->giv; v; v = v->next_iv)
7510     if (v->ext_dependent)
7511       {
7512         enum rtx_code code = GET_CODE (v->ext_dependent);
7513         int ok = 0;
7514
7515         switch (code)
7516           {
7517           case SIGN_EXTEND:
7518             ok = se_ok;
7519             break;
7520           case ZERO_EXTEND:
7521             ok = ze_ok;
7522             break;
7523
7524           case TRUNCATE:
7525             /* We don't know whether this value is being used as either
7526                signed or unsigned, so to safely truncate we must satisfy
7527                both.  The initial check here verifies the BIV itself;
7528                once that is successful we may check its range wrt the
7529                derived GIV.  */
7530             if (se_ok && ze_ok)
7531               {
7532                 enum machine_mode outer_mode = GET_MODE (v->ext_dependent);
7533                 unsigned HOST_WIDE_INT max = GET_MODE_MASK (outer_mode) >> 1;
7534
7535                 /* We know from the above that both endpoints are nonnegative,
7536                    and that there is no wrapping.  Verify that both endpoints
7537                    are within the (signed) range of the outer mode.  */
7538                 if (u_start_val <= max && u_end_val <= max)
7539                   ok = 1;
7540               }
7541             break;
7542
7543           default:
7544             abort ();
7545           }
7546
7547         if (ok)
7548           {
7549             if (loop_dump_stream)
7550               {
7551                 fprintf (loop_dump_stream,
7552                          "Verified ext dependent giv at %d of reg %d\n",
7553                          INSN_UID (v->insn), bl->regno);
7554               }
7555           }
7556         else
7557           {
7558             if (loop_dump_stream)
7559               {
7560                 const char *why;
7561
7562                 if (info_ok)
7563                   why = "biv iteration values overflowed";
7564                 else
7565                   {
7566                     if (incr == pc_rtx)
7567                       incr = biv_total_increment (bl);
7568                     if (incr == const1_rtx)
7569                       why = "biv iteration info incomplete; incr by 1";
7570                     else
7571                       why = "biv iteration info incomplete";
7572                   }
7573
7574                 fprintf (loop_dump_stream,
7575                          "Failed ext dependent giv at %d, %s\n",
7576                          INSN_UID (v->insn), why);
7577               }
7578             v->ignore = 1;
7579             bl->all_reduced = 0;
7580           }
7581       }
7582 }
7583
7584 /* Generate a version of VALUE in a mode appropriate for initializing V.  */
7585
7586 rtx
7587 extend_value_for_giv (v, value)
7588      struct induction *v;
7589      rtx value;
7590 {
7591   rtx ext_dep = v->ext_dependent;
7592
7593   if (! ext_dep)
7594     return value;
7595
7596   /* Recall that check_ext_dependent_givs verified that the known bounds
7597      of a biv did not overflow or wrap with respect to the extension for
7598      the giv.  Therefore, constants need no additional adjustment.  */
7599   if (CONSTANT_P (value) && GET_MODE (value) == VOIDmode)
7600     return value;
7601
7602   /* Otherwise, we must adjust the value to compensate for the
7603      differing modes of the biv and the giv.  */
7604   return gen_rtx_fmt_e (GET_CODE (ext_dep), GET_MODE (ext_dep), value);
7605 }
7606 \f
7607 struct combine_givs_stats
7608 {
7609   int giv_number;
7610   int total_benefit;
7611 };
7612
7613 static int
7614 cmp_combine_givs_stats (xp, yp)
7615      const PTR xp;
7616      const PTR yp;
7617 {
7618   const struct combine_givs_stats * const x =
7619     (const struct combine_givs_stats *) xp;
7620   const struct combine_givs_stats * const y =
7621     (const struct combine_givs_stats *) yp;
7622   int d;
7623   d = y->total_benefit - x->total_benefit;
7624   /* Stabilize the sort.  */
7625   if (!d)
7626     d = x->giv_number - y->giv_number;
7627   return d;
7628 }
7629
7630 /* Check all pairs of givs for iv_class BL and see if any can be combined with
7631    any other.  If so, point SAME to the giv combined with and set NEW_REG to
7632    be an expression (in terms of the other giv's DEST_REG) equivalent to the
7633    giv.  Also, update BENEFIT and related fields for cost/benefit analysis.  */
7634
7635 static void
7636 combine_givs (regs, bl)
7637      struct loop_regs *regs;
7638      struct iv_class *bl;
7639 {
7640   /* Additional benefit to add for being combined multiple times.  */
7641   const int extra_benefit = 3;
7642
7643   struct induction *g1, *g2, **giv_array;
7644   int i, j, k, giv_count;
7645   struct combine_givs_stats *stats;
7646   rtx *can_combine;
7647
7648   /* Count givs, because bl->giv_count is incorrect here.  */
7649   giv_count = 0;
7650   for (g1 = bl->giv; g1; g1 = g1->next_iv)
7651     if (!g1->ignore)
7652       giv_count++;
7653
7654   giv_array
7655     = (struct induction **) alloca (giv_count * sizeof (struct induction *));
7656   i = 0;
7657   for (g1 = bl->giv; g1; g1 = g1->next_iv)
7658     if (!g1->ignore)
7659       giv_array[i++] = g1;
7660
7661   stats = (struct combine_givs_stats *) xcalloc (giv_count, sizeof (*stats));
7662   can_combine = (rtx *) xcalloc (giv_count, giv_count * sizeof (rtx));
7663
7664   for (i = 0; i < giv_count; i++)
7665     {
7666       int this_benefit;
7667       rtx single_use;
7668
7669       g1 = giv_array[i];
7670       stats[i].giv_number = i;
7671
7672       /* If a DEST_REG GIV is used only once, do not allow it to combine
7673          with anything, for in doing so we will gain nothing that cannot
7674          be had by simply letting the GIV with which we would have combined
7675          to be reduced on its own.  The losage shows up in particular with
7676          DEST_ADDR targets on hosts with reg+reg addressing, though it can
7677          be seen elsewhere as well.  */
7678       if (g1->giv_type == DEST_REG
7679           && (single_use = regs->array[REGNO (g1->dest_reg)].single_usage)
7680           && single_use != const0_rtx)
7681         continue;
7682
7683       this_benefit = g1->benefit;
7684       /* Add an additional weight for zero addends.  */
7685       if (g1->no_const_addval)
7686         this_benefit += 1;
7687
7688       for (j = 0; j < giv_count; j++)
7689         {
7690           rtx this_combine;
7691
7692           g2 = giv_array[j];
7693           if (g1 != g2
7694               && (this_combine = combine_givs_p (g1, g2)) != NULL_RTX)
7695             {
7696               can_combine[i * giv_count + j] = this_combine;
7697               this_benefit += g2->benefit + extra_benefit;
7698             }
7699         }
7700       stats[i].total_benefit = this_benefit;
7701     }
7702
7703   /* Iterate, combining until we can't.  */
7704 restart:
7705   qsort (stats, giv_count, sizeof (*stats), cmp_combine_givs_stats);
7706
7707   if (loop_dump_stream)
7708     {
7709       fprintf (loop_dump_stream, "Sorted combine statistics:\n");
7710       for (k = 0; k < giv_count; k++)
7711         {
7712           g1 = giv_array[stats[k].giv_number];
7713           if (!g1->combined_with && !g1->same)
7714             fprintf (loop_dump_stream, " {%d, %d}",
7715                      INSN_UID (giv_array[stats[k].giv_number]->insn),
7716                      stats[k].total_benefit);
7717         }
7718       putc ('\n', loop_dump_stream);
7719     }
7720
7721   for (k = 0; k < giv_count; k++)
7722     {
7723       int g1_add_benefit = 0;
7724
7725       i = stats[k].giv_number;
7726       g1 = giv_array[i];
7727
7728       /* If it has already been combined, skip.  */
7729       if (g1->combined_with || g1->same)
7730         continue;
7731
7732       for (j = 0; j < giv_count; j++)
7733         {
7734           g2 = giv_array[j];
7735           if (g1 != g2 && can_combine[i * giv_count + j]
7736               /* If it has already been combined, skip.  */
7737               && ! g2->same && ! g2->combined_with)
7738             {
7739               int l;
7740
7741               g2->new_reg = can_combine[i * giv_count + j];
7742               g2->same = g1;
7743               /* For destination, we now may replace by mem expression instead
7744                  of register.  This changes the costs considerably, so add the
7745                  compensation.  */
7746               if (g2->giv_type == DEST_ADDR)
7747                 g2->benefit = (g2->benefit + reg_address_cost
7748                                - address_cost (g2->new_reg,
7749                                GET_MODE (g2->mem)));
7750               g1->combined_with++;
7751               g1->lifetime += g2->lifetime;
7752
7753               g1_add_benefit += g2->benefit;
7754
7755               /* ??? The new final_[bg]iv_value code does a much better job
7756                  of finding replaceable giv's, and hence this code may no
7757                  longer be necessary.  */
7758               if (! g2->replaceable && REG_USERVAR_P (g2->dest_reg))
7759                 g1_add_benefit -= copy_cost;
7760
7761               /* To help optimize the next set of combinations, remove
7762                  this giv from the benefits of other potential mates.  */
7763               for (l = 0; l < giv_count; ++l)
7764                 {
7765                   int m = stats[l].giv_number;
7766                   if (can_combine[m * giv_count + j])
7767                     stats[l].total_benefit -= g2->benefit + extra_benefit;
7768                 }
7769
7770               if (loop_dump_stream)
7771                 fprintf (loop_dump_stream,
7772                          "giv at %d combined with giv at %d; new benefit %d + %d, lifetime %d\n",
7773                          INSN_UID (g2->insn), INSN_UID (g1->insn),
7774                          g1->benefit, g1_add_benefit, g1->lifetime);
7775             }
7776         }
7777
7778       /* To help optimize the next set of combinations, remove
7779          this giv from the benefits of other potential mates.  */
7780       if (g1->combined_with)
7781         {
7782           for (j = 0; j < giv_count; ++j)
7783             {
7784               int m = stats[j].giv_number;
7785               if (can_combine[m * giv_count + i])
7786                 stats[j].total_benefit -= g1->benefit + extra_benefit;
7787             }
7788
7789           g1->benefit += g1_add_benefit;
7790
7791           /* We've finished with this giv, and everything it touched.
7792              Restart the combination so that proper weights for the
7793              rest of the givs are properly taken into account.  */
7794           /* ??? Ideally we would compact the arrays at this point, so
7795              as to not cover old ground.  But sanely compacting
7796              can_combine is tricky.  */
7797           goto restart;
7798         }
7799     }
7800
7801   /* Clean up.  */
7802   free (stats);
7803   free (can_combine);
7804 }
7805 \f
7806 /* Generate sequence for REG = B * M + A.  */
7807
7808 static rtx
7809 gen_add_mult (b, m, a, reg)
7810      rtx b;          /* initial value of basic induction variable */
7811      rtx m;          /* multiplicative constant */
7812      rtx a;          /* additive constant */
7813      rtx reg;        /* destination register */
7814 {
7815   rtx seq;
7816   rtx result;
7817
7818   start_sequence ();
7819   /* Use unsigned arithmetic.  */
7820   result = expand_mult_add (b, reg, m, a, GET_MODE (reg), 1);
7821   if (reg != result)
7822     emit_move_insn (reg, result);
7823   seq = get_insns ();
7824   end_sequence ();
7825
7826   return seq;
7827 }
7828
7829
7830 /* Update registers created in insn sequence SEQ.  */
7831
7832 static void
7833 loop_regs_update (loop, seq)
7834      const struct loop *loop ATTRIBUTE_UNUSED;
7835      rtx seq;
7836 {
7837   rtx insn;
7838
7839   /* Update register info for alias analysis.  */
7840
7841   if (seq == NULL_RTX)
7842     return;
7843
7844   if (INSN_P (seq))
7845     {
7846       insn = seq;
7847       while (insn != NULL_RTX)
7848         {
7849           rtx set = single_set (insn);
7850
7851           if (set && GET_CODE (SET_DEST (set)) == REG)
7852             record_base_value (REGNO (SET_DEST (set)), SET_SRC (set), 0);
7853
7854           insn = NEXT_INSN (insn);
7855         }
7856     }
7857   else if (GET_CODE (seq) == SET
7858            && GET_CODE (SET_DEST (seq)) == REG)
7859     record_base_value (REGNO (SET_DEST (seq)), SET_SRC (seq), 0);
7860 }
7861
7862
7863 /* EMIT code before BEFORE_BB/BEFORE_INSN to set REG = B * M + A.  */
7864
7865 void
7866 loop_iv_add_mult_emit_before (loop, b, m, a, reg, before_bb, before_insn)
7867      const struct loop *loop;
7868      rtx b;          /* initial value of basic induction variable */
7869      rtx m;          /* multiplicative constant */
7870      rtx a;          /* additive constant */
7871      rtx reg;        /* destination register */
7872      basic_block before_bb;
7873      rtx before_insn;
7874 {
7875   rtx seq;
7876
7877   if (! before_insn)
7878     {
7879       loop_iv_add_mult_hoist (loop, b, m, a, reg);
7880       return;
7881     }
7882
7883   /* Use copy_rtx to prevent unexpected sharing of these rtx.  */
7884   seq = gen_add_mult (copy_rtx (b), copy_rtx (m), copy_rtx (a), reg);
7885
7886   /* Increase the lifetime of any invariants moved further in code.  */
7887   update_reg_last_use (a, before_insn);
7888   update_reg_last_use (b, before_insn);
7889   update_reg_last_use (m, before_insn);
7890
7891   loop_insn_emit_before (loop, before_bb, before_insn, seq);
7892
7893   /* It is possible that the expansion created lots of new registers.
7894      Iterate over the sequence we just created and record them all.  */
7895   loop_regs_update (loop, seq);
7896 }
7897
7898
7899 /* Emit insns in loop pre-header to set REG = B * M + A.  */
7900
7901 void
7902 loop_iv_add_mult_sink (loop, b, m, a, reg)
7903      const struct loop *loop;
7904      rtx b;          /* initial value of basic induction variable */
7905      rtx m;          /* multiplicative constant */
7906      rtx a;          /* additive constant */
7907      rtx reg;        /* destination register */
7908 {
7909   rtx seq;
7910
7911   /* Use copy_rtx to prevent unexpected sharing of these rtx.  */
7912   seq = gen_add_mult (copy_rtx (b), copy_rtx (m), copy_rtx (a), reg);
7913
7914   /* Increase the lifetime of any invariants moved further in code.
7915      ???? Is this really necessary?  */
7916   update_reg_last_use (a, loop->sink);
7917   update_reg_last_use (b, loop->sink);
7918   update_reg_last_use (m, loop->sink);
7919
7920   loop_insn_sink (loop, seq);
7921
7922   /* It is possible that the expansion created lots of new registers.
7923      Iterate over the sequence we just created and record them all.  */
7924   loop_regs_update (loop, seq);
7925 }
7926
7927
7928 /* Emit insns after loop to set REG = B * M + A.  */
7929
7930 void
7931 loop_iv_add_mult_hoist (loop, b, m, a, reg)
7932      const struct loop *loop;
7933      rtx b;          /* initial value of basic induction variable */
7934      rtx m;          /* multiplicative constant */
7935      rtx a;          /* additive constant */
7936      rtx reg;        /* destination register */
7937 {
7938   rtx seq;
7939
7940   /* Use copy_rtx to prevent unexpected sharing of these rtx.  */
7941   seq = gen_add_mult (copy_rtx (b), copy_rtx (m), copy_rtx (a), reg);
7942
7943   loop_insn_hoist (loop, seq);
7944
7945   /* It is possible that the expansion created lots of new registers.
7946      Iterate over the sequence we just created and record them all.  */
7947   loop_regs_update (loop, seq);
7948 }
7949
7950
7951
7952 /* Similar to gen_add_mult, but compute cost rather than generating
7953    sequence.  */
7954
7955 static int
7956 iv_add_mult_cost (b, m, a, reg)
7957      rtx b;          /* initial value of basic induction variable */
7958      rtx m;          /* multiplicative constant */
7959      rtx a;          /* additive constant */
7960      rtx reg;        /* destination register */
7961 {
7962   int cost = 0;
7963   rtx last, result;
7964
7965   start_sequence ();
7966   result = expand_mult_add (b, reg, m, a, GET_MODE (reg), 1);
7967   if (reg != result)
7968     emit_move_insn (reg, result);
7969   last = get_last_insn ();
7970   while (last)
7971     {
7972       rtx t = single_set (last);
7973       if (t)
7974         cost += rtx_cost (SET_SRC (t), SET);
7975       last = PREV_INSN (last);
7976     }
7977   end_sequence ();
7978   return cost;
7979 }
7980 \f
7981 /* Test whether A * B can be computed without
7982    an actual multiply insn.  Value is 1 if so.
7983
7984   ??? This function stinks because it generates a ton of wasted RTL
7985   ??? and as a result fragments GC memory to no end.  There are other
7986   ??? places in the compiler which are invoked a lot and do the same
7987   ??? thing, generate wasted RTL just to see if something is possible.  */
7988
7989 static int
7990 product_cheap_p (a, b)
7991      rtx a;
7992      rtx b;
7993 {
7994   rtx tmp;
7995   int win, n_insns;
7996
7997   /* If only one is constant, make it B.  */
7998   if (GET_CODE (a) == CONST_INT)
7999     tmp = a, a = b, b = tmp;
8000
8001   /* If first constant, both constant, so don't need multiply.  */
8002   if (GET_CODE (a) == CONST_INT)
8003     return 1;
8004
8005   /* If second not constant, neither is constant, so would need multiply.  */
8006   if (GET_CODE (b) != CONST_INT)
8007     return 0;
8008
8009   /* One operand is constant, so might not need multiply insn.  Generate the
8010      code for the multiply and see if a call or multiply, or long sequence
8011      of insns is generated.  */
8012
8013   start_sequence ();
8014   expand_mult (GET_MODE (a), a, b, NULL_RTX, 1);
8015   tmp = get_insns ();
8016   end_sequence ();
8017
8018   win = 1;
8019   if (INSN_P (tmp))
8020     {
8021       n_insns = 0;
8022       while (tmp != NULL_RTX)
8023         {
8024           rtx next = NEXT_INSN (tmp);
8025
8026           if (++n_insns > 3
8027               || GET_CODE (tmp) != INSN
8028               || (GET_CODE (PATTERN (tmp)) == SET
8029                   && GET_CODE (SET_SRC (PATTERN (tmp))) == MULT)
8030               || (GET_CODE (PATTERN (tmp)) == PARALLEL
8031                   && GET_CODE (XVECEXP (PATTERN (tmp), 0, 0)) == SET
8032                   && GET_CODE (SET_SRC (XVECEXP (PATTERN (tmp), 0, 0))) == MULT))
8033             {
8034               win = 0;
8035               break;
8036             }
8037
8038           tmp = next;
8039         }
8040     }
8041   else if (GET_CODE (tmp) == SET
8042            && GET_CODE (SET_SRC (tmp)) == MULT)
8043     win = 0;
8044   else if (GET_CODE (tmp) == PARALLEL
8045            && GET_CODE (XVECEXP (tmp, 0, 0)) == SET
8046            && GET_CODE (SET_SRC (XVECEXP (tmp, 0, 0))) == MULT)
8047     win = 0;
8048
8049   return win;
8050 }
8051 \f
8052 /* Check to see if loop can be terminated by a "decrement and branch until
8053    zero" instruction.  If so, add a REG_NONNEG note to the branch insn if so.
8054    Also try reversing an increment loop to a decrement loop
8055    to see if the optimization can be performed.
8056    Value is nonzero if optimization was performed.  */
8057
8058 /* This is useful even if the architecture doesn't have such an insn,
8059    because it might change a loops which increments from 0 to n to a loop
8060    which decrements from n to 0.  A loop that decrements to zero is usually
8061    faster than one that increments from zero.  */
8062
8063 /* ??? This could be rewritten to use some of the loop unrolling procedures,
8064    such as approx_final_value, biv_total_increment, loop_iterations, and
8065    final_[bg]iv_value.  */
8066
8067 static int
8068 check_dbra_loop (loop, insn_count)
8069      struct loop *loop;
8070      int insn_count;
8071 {
8072   struct loop_info *loop_info = LOOP_INFO (loop);
8073   struct loop_regs *regs = LOOP_REGS (loop);
8074   struct loop_ivs *ivs = LOOP_IVS (loop);
8075   struct iv_class *bl;
8076   rtx reg;
8077   rtx jump_label;
8078   rtx final_value;
8079   rtx start_value;
8080   rtx new_add_val;
8081   rtx comparison;
8082   rtx before_comparison;
8083   rtx p;
8084   rtx jump;
8085   rtx first_compare;
8086   int compare_and_branch;
8087   rtx loop_start = loop->start;
8088   rtx loop_end = loop->end;
8089
8090   /* If last insn is a conditional branch, and the insn before tests a
8091      register value, try to optimize it.  Otherwise, we can't do anything.  */
8092
8093   jump = PREV_INSN (loop_end);
8094   comparison = get_condition_for_loop (loop, jump);
8095   if (comparison == 0)
8096     return 0;
8097   if (!onlyjump_p (jump))
8098     return 0;
8099
8100   /* Try to compute whether the compare/branch at the loop end is one or
8101      two instructions.  */
8102   get_condition (jump, &first_compare);
8103   if (first_compare == jump)
8104     compare_and_branch = 1;
8105   else if (first_compare == prev_nonnote_insn (jump))
8106     compare_and_branch = 2;
8107   else
8108     return 0;
8109
8110   {
8111     /* If more than one condition is present to control the loop, then
8112        do not proceed, as this function does not know how to rewrite
8113        loop tests with more than one condition.
8114
8115        Look backwards from the first insn in the last comparison
8116        sequence and see if we've got another comparison sequence.  */
8117
8118     rtx jump1;
8119     if ((jump1 = prev_nonnote_insn (first_compare)) != loop->cont)
8120       if (GET_CODE (jump1) == JUMP_INSN)
8121         return 0;
8122   }
8123
8124   /* Check all of the bivs to see if the compare uses one of them.
8125      Skip biv's set more than once because we can't guarantee that
8126      it will be zero on the last iteration.  Also skip if the biv is
8127      used between its update and the test insn.  */
8128
8129   for (bl = ivs->list; bl; bl = bl->next)
8130     {
8131       if (bl->biv_count == 1
8132           && ! bl->biv->maybe_multiple
8133           && bl->biv->dest_reg == XEXP (comparison, 0)
8134           && ! reg_used_between_p (regno_reg_rtx[bl->regno], bl->biv->insn,
8135                                    first_compare))
8136         break;
8137     }
8138
8139   if (! bl)
8140     return 0;
8141
8142   /* Look for the case where the basic induction variable is always
8143      nonnegative, and equals zero on the last iteration.
8144      In this case, add a reg_note REG_NONNEG, which allows the
8145      m68k DBRA instruction to be used.  */
8146
8147   if (((GET_CODE (comparison) == GT
8148         && GET_CODE (XEXP (comparison, 1)) == CONST_INT
8149         && INTVAL (XEXP (comparison, 1)) == -1)
8150        || (GET_CODE (comparison) == NE && XEXP (comparison, 1) == const0_rtx))
8151       && GET_CODE (bl->biv->add_val) == CONST_INT
8152       && INTVAL (bl->biv->add_val) < 0)
8153     {
8154       /* Initial value must be greater than 0,
8155          init_val % -dec_value == 0 to ensure that it equals zero on
8156          the last iteration */
8157
8158       if (GET_CODE (bl->initial_value) == CONST_INT
8159           && INTVAL (bl->initial_value) > 0
8160           && (INTVAL (bl->initial_value)
8161               % (-INTVAL (bl->biv->add_val))) == 0)
8162         {
8163           /* register always nonnegative, add REG_NOTE to branch */
8164           if (! find_reg_note (jump, REG_NONNEG, NULL_RTX))
8165             REG_NOTES (jump)
8166               = gen_rtx_EXPR_LIST (REG_NONNEG, bl->biv->dest_reg,
8167                                    REG_NOTES (jump));
8168           bl->nonneg = 1;
8169
8170           return 1;
8171         }
8172
8173       /* If the decrement is 1 and the value was tested as >= 0 before
8174          the loop, then we can safely optimize.  */
8175       for (p = loop_start; p; p = PREV_INSN (p))
8176         {
8177           if (GET_CODE (p) == CODE_LABEL)
8178             break;
8179           if (GET_CODE (p) != JUMP_INSN)
8180             continue;
8181
8182           before_comparison = get_condition_for_loop (loop, p);
8183           if (before_comparison
8184               && XEXP (before_comparison, 0) == bl->biv->dest_reg
8185               && GET_CODE (before_comparison) == LT
8186               && XEXP (before_comparison, 1) == const0_rtx
8187               && ! reg_set_between_p (bl->biv->dest_reg, p, loop_start)
8188               && INTVAL (bl->biv->add_val) == -1)
8189             {
8190               if (! find_reg_note (jump, REG_NONNEG, NULL_RTX))
8191                 REG_NOTES (jump)
8192                   = gen_rtx_EXPR_LIST (REG_NONNEG, bl->biv->dest_reg,
8193                                        REG_NOTES (jump));
8194               bl->nonneg = 1;
8195
8196               return 1;
8197             }
8198         }
8199     }
8200   else if (GET_CODE (bl->biv->add_val) == CONST_INT
8201            && INTVAL (bl->biv->add_val) > 0)
8202     {
8203       /* Try to change inc to dec, so can apply above optimization.  */
8204       /* Can do this if:
8205          all registers modified are induction variables or invariant,
8206          all memory references have non-overlapping addresses
8207          (obviously true if only one write)
8208          allow 2 insns for the compare/jump at the end of the loop.  */
8209       /* Also, we must avoid any instructions which use both the reversed
8210          biv and another biv.  Such instructions will fail if the loop is
8211          reversed.  We meet this condition by requiring that either
8212          no_use_except_counting is true, or else that there is only
8213          one biv.  */
8214       int num_nonfixed_reads = 0;
8215       /* 1 if the iteration var is used only to count iterations.  */
8216       int no_use_except_counting = 0;
8217       /* 1 if the loop has no memory store, or it has a single memory store
8218          which is reversible.  */
8219       int reversible_mem_store = 1;
8220
8221       if (bl->giv_count == 0
8222           && !loop->exit_count
8223           && !loop_info->has_multiple_exit_targets)
8224         {
8225           rtx bivreg = regno_reg_rtx[bl->regno];
8226           struct iv_class *blt;
8227
8228           /* If there are no givs for this biv, and the only exit is the
8229              fall through at the end of the loop, then
8230              see if perhaps there are no uses except to count.  */
8231           no_use_except_counting = 1;
8232           for (p = loop_start; p != loop_end; p = NEXT_INSN (p))
8233             if (INSN_P (p))
8234               {
8235                 rtx set = single_set (p);
8236
8237                 if (set && GET_CODE (SET_DEST (set)) == REG
8238                     && REGNO (SET_DEST (set)) == bl->regno)
8239                   /* An insn that sets the biv is okay.  */
8240                   ;
8241                 else if ((p == prev_nonnote_insn (prev_nonnote_insn (loop_end))
8242                           || p == prev_nonnote_insn (loop_end))
8243                          && reg_mentioned_p (bivreg, PATTERN (p)))
8244                   {
8245                     /* If either of these insns uses the biv and sets a pseudo
8246                        that has more than one usage, then the biv has uses
8247                        other than counting since it's used to derive a value
8248                        that is used more than one time.  */
8249                     note_stores (PATTERN (p), note_set_pseudo_multiple_uses,
8250                                  regs);
8251                     if (regs->multiple_uses)
8252                       {
8253                         no_use_except_counting = 0;
8254                         break;
8255                       }
8256                   }
8257                 else if (reg_mentioned_p (bivreg, PATTERN (p)))
8258                   {
8259                     no_use_except_counting = 0;
8260                     break;
8261                   }
8262               }
8263
8264           /* A biv has uses besides counting if it is used to set
8265              another biv.  */
8266           for (blt = ivs->list; blt; blt = blt->next)
8267             if (blt->init_set
8268                 && reg_mentioned_p (bivreg, SET_SRC (blt->init_set)))
8269               {
8270                 no_use_except_counting = 0;
8271                 break;
8272               }
8273         }
8274
8275       if (no_use_except_counting)
8276         /* No need to worry about MEMs.  */
8277         ;
8278       else if (loop_info->num_mem_sets <= 1)
8279         {
8280           for (p = loop_start; p != loop_end; p = NEXT_INSN (p))
8281             if (INSN_P (p))
8282               num_nonfixed_reads += count_nonfixed_reads (loop, PATTERN (p));
8283
8284           /* If the loop has a single store, and the destination address is
8285              invariant, then we can't reverse the loop, because this address
8286              might then have the wrong value at loop exit.
8287              This would work if the source was invariant also, however, in that
8288              case, the insn should have been moved out of the loop.  */
8289
8290           if (loop_info->num_mem_sets == 1)
8291             {
8292               struct induction *v;
8293
8294               /* If we could prove that each of the memory locations
8295                  written to was different, then we could reverse the
8296                  store -- but we don't presently have any way of
8297                  knowing that.  */
8298               reversible_mem_store = 0;
8299
8300               /* If the store depends on a register that is set after the
8301                  store, it depends on the initial value, and is thus not
8302                  reversible.  */
8303               for (v = bl->giv; reversible_mem_store && v; v = v->next_iv)
8304                 {
8305                   if (v->giv_type == DEST_REG
8306                       && reg_mentioned_p (v->dest_reg,
8307                                           PATTERN (loop_info->first_loop_store_insn))
8308                       && loop_insn_first_p (loop_info->first_loop_store_insn,
8309                                             v->insn))
8310                     reversible_mem_store = 0;
8311                 }
8312             }
8313         }
8314       else
8315         return 0;
8316
8317       /* This code only acts for innermost loops.  Also it simplifies
8318          the memory address check by only reversing loops with
8319          zero or one memory access.
8320          Two memory accesses could involve parts of the same array,
8321          and that can't be reversed.
8322          If the biv is used only for counting, than we don't need to worry
8323          about all these things.  */
8324
8325       if ((num_nonfixed_reads <= 1
8326            && ! loop_info->has_nonconst_call
8327            && ! loop_info->has_prefetch
8328            && ! loop_info->has_volatile
8329            && reversible_mem_store
8330            && (bl->giv_count + bl->biv_count + loop_info->num_mem_sets
8331                + num_unmoved_movables (loop) + compare_and_branch == insn_count)
8332            && (bl == ivs->list && bl->next == 0))
8333           || (no_use_except_counting && ! loop_info->has_prefetch))
8334         {
8335           rtx tem;
8336
8337           /* Loop can be reversed.  */
8338           if (loop_dump_stream)
8339             fprintf (loop_dump_stream, "Can reverse loop\n");
8340
8341           /* Now check other conditions:
8342
8343              The increment must be a constant, as must the initial value,
8344              and the comparison code must be LT.
8345
8346              This test can probably be improved since +/- 1 in the constant
8347              can be obtained by changing LT to LE and vice versa; this is
8348              confusing.  */
8349
8350           if (comparison
8351               /* for constants, LE gets turned into LT */
8352               && (GET_CODE (comparison) == LT
8353                   || (GET_CODE (comparison) == LE
8354                       && no_use_except_counting)))
8355             {
8356               HOST_WIDE_INT add_val, add_adjust, comparison_val = 0;
8357               rtx initial_value, comparison_value;
8358               int nonneg = 0;
8359               enum rtx_code cmp_code;
8360               int comparison_const_width;
8361               unsigned HOST_WIDE_INT comparison_sign_mask;
8362
8363               add_val = INTVAL (bl->biv->add_val);
8364               comparison_value = XEXP (comparison, 1);
8365               if (GET_MODE (comparison_value) == VOIDmode)
8366                 comparison_const_width
8367                   = GET_MODE_BITSIZE (GET_MODE (XEXP (comparison, 0)));
8368               else
8369                 comparison_const_width
8370                   = GET_MODE_BITSIZE (GET_MODE (comparison_value));
8371               if (comparison_const_width > HOST_BITS_PER_WIDE_INT)
8372                 comparison_const_width = HOST_BITS_PER_WIDE_INT;
8373               comparison_sign_mask
8374                 = (unsigned HOST_WIDE_INT) 1 << (comparison_const_width - 1);
8375
8376               /* If the comparison value is not a loop invariant, then we
8377                  can not reverse this loop.
8378
8379                  ??? If the insns which initialize the comparison value as
8380                  a whole compute an invariant result, then we could move
8381                  them out of the loop and proceed with loop reversal.  */
8382               if (! loop_invariant_p (loop, comparison_value))
8383                 return 0;
8384
8385               if (GET_CODE (comparison_value) == CONST_INT)
8386                 comparison_val = INTVAL (comparison_value);
8387               initial_value = bl->initial_value;
8388
8389               /* Normalize the initial value if it is an integer and
8390                  has no other use except as a counter.  This will allow
8391                  a few more loops to be reversed.  */
8392               if (no_use_except_counting
8393                   && GET_CODE (comparison_value) == CONST_INT
8394                   && GET_CODE (initial_value) == CONST_INT)
8395                 {
8396                   comparison_val = comparison_val - INTVAL (bl->initial_value);
8397                   /* The code below requires comparison_val to be a multiple
8398                      of add_val in order to do the loop reversal, so
8399                      round up comparison_val to a multiple of add_val.
8400                      Since comparison_value is constant, we know that the
8401                      current comparison code is LT.  */
8402                   comparison_val = comparison_val + add_val - 1;
8403                   comparison_val
8404                     -= (unsigned HOST_WIDE_INT) comparison_val % add_val;
8405                   /* We postpone overflow checks for COMPARISON_VAL here;
8406                      even if there is an overflow, we might still be able to
8407                      reverse the loop, if converting the loop exit test to
8408                      NE is possible.  */
8409                   initial_value = const0_rtx;
8410                 }
8411
8412               /* First check if we can do a vanilla loop reversal.  */
8413               if (initial_value == const0_rtx
8414                   /* If we have a decrement_and_branch_on_count,
8415                      prefer the NE test, since this will allow that
8416                      instruction to be generated.  Note that we must
8417                      use a vanilla loop reversal if the biv is used to
8418                      calculate a giv or has a non-counting use.  */
8419 #if ! defined (HAVE_decrement_and_branch_until_zero) \
8420 && defined (HAVE_decrement_and_branch_on_count)
8421                   && (! (add_val == 1 && loop->vtop
8422                          && (bl->biv_count == 0
8423                              || no_use_except_counting)))
8424 #endif
8425                   && GET_CODE (comparison_value) == CONST_INT
8426                      /* Now do postponed overflow checks on COMPARISON_VAL.  */
8427                   && ! (((comparison_val - add_val) ^ INTVAL (comparison_value))
8428                         & comparison_sign_mask))
8429                 {
8430                   /* Register will always be nonnegative, with value
8431                      0 on last iteration */
8432                   add_adjust = add_val;
8433                   nonneg = 1;
8434                   cmp_code = GE;
8435                 }
8436               else if (add_val == 1 && loop->vtop
8437                        && (bl->biv_count == 0
8438                            || no_use_except_counting))
8439                 {
8440                   add_adjust = 0;
8441                   cmp_code = NE;
8442                 }
8443               else
8444                 return 0;
8445
8446               if (GET_CODE (comparison) == LE)
8447                 add_adjust -= add_val;
8448
8449               /* If the initial value is not zero, or if the comparison
8450                  value is not an exact multiple of the increment, then we
8451                  can not reverse this loop.  */
8452               if (initial_value == const0_rtx
8453                   && GET_CODE (comparison_value) == CONST_INT)
8454                 {
8455                   if (((unsigned HOST_WIDE_INT) comparison_val % add_val) != 0)
8456                     return 0;
8457                 }
8458               else
8459                 {
8460                   if (! no_use_except_counting || add_val != 1)
8461                     return 0;
8462                 }
8463
8464               final_value = comparison_value;
8465
8466               /* Reset these in case we normalized the initial value
8467                  and comparison value above.  */
8468               if (GET_CODE (comparison_value) == CONST_INT
8469                   && GET_CODE (initial_value) == CONST_INT)
8470                 {
8471                   comparison_value = GEN_INT (comparison_val);
8472                   final_value
8473                     = GEN_INT (comparison_val + INTVAL (bl->initial_value));
8474                 }
8475               bl->initial_value = initial_value;
8476
8477               /* Save some info needed to produce the new insns.  */
8478               reg = bl->biv->dest_reg;
8479               jump_label = condjump_label (PREV_INSN (loop_end));
8480               new_add_val = GEN_INT (-INTVAL (bl->biv->add_val));
8481
8482               /* Set start_value; if this is not a CONST_INT, we need
8483                  to generate a SUB.
8484                  Initialize biv to start_value before loop start.
8485                  The old initializing insn will be deleted as a
8486                  dead store by flow.c.  */
8487               if (initial_value == const0_rtx
8488                   && GET_CODE (comparison_value) == CONST_INT)
8489                 {
8490                   start_value = GEN_INT (comparison_val - add_adjust);
8491                   loop_insn_hoist (loop, gen_move_insn (reg, start_value));
8492                 }
8493               else if (GET_CODE (initial_value) == CONST_INT)
8494                 {
8495                   enum machine_mode mode = GET_MODE (reg);
8496                   rtx offset = GEN_INT (-INTVAL (initial_value) - add_adjust);
8497                   rtx add_insn = gen_add3_insn (reg, comparison_value, offset);
8498
8499                   if (add_insn == 0)
8500                     return 0;
8501
8502                   start_value
8503                     = gen_rtx_PLUS (mode, comparison_value, offset);
8504                   loop_insn_hoist (loop, add_insn);
8505                   if (GET_CODE (comparison) == LE)
8506                     final_value = gen_rtx_PLUS (mode, comparison_value,
8507                                                 GEN_INT (add_val));
8508                 }
8509               else if (! add_adjust)
8510                 {
8511                   enum machine_mode mode = GET_MODE (reg);
8512                   rtx sub_insn = gen_sub3_insn (reg, comparison_value,
8513                                                 initial_value);
8514
8515                   if (sub_insn == 0)
8516                     return 0;
8517                   start_value
8518                     = gen_rtx_MINUS (mode, comparison_value, initial_value);
8519                   loop_insn_hoist (loop, sub_insn);
8520                 }
8521               else
8522                 /* We could handle the other cases too, but it'll be
8523                    better to have a testcase first.  */
8524                 return 0;
8525
8526               /* We may not have a single insn which can increment a reg, so
8527                  create a sequence to hold all the insns from expand_inc.  */
8528               start_sequence ();
8529               expand_inc (reg, new_add_val);
8530               tem = get_insns ();
8531               end_sequence ();
8532
8533               p = loop_insn_emit_before (loop, 0, bl->biv->insn, tem);
8534               delete_insn (bl->biv->insn);
8535
8536               /* Update biv info to reflect its new status.  */
8537               bl->biv->insn = p;
8538               bl->initial_value = start_value;
8539               bl->biv->add_val = new_add_val;
8540
8541               /* Update loop info.  */
8542               loop_info->initial_value = reg;
8543               loop_info->initial_equiv_value = reg;
8544               loop_info->final_value = const0_rtx;
8545               loop_info->final_equiv_value = const0_rtx;
8546               loop_info->comparison_value = const0_rtx;
8547               loop_info->comparison_code = cmp_code;
8548               loop_info->increment = new_add_val;
8549
8550               /* Inc LABEL_NUSES so that delete_insn will
8551                  not delete the label.  */
8552               LABEL_NUSES (XEXP (jump_label, 0))++;
8553
8554               /* Emit an insn after the end of the loop to set the biv's
8555                  proper exit value if it is used anywhere outside the loop.  */
8556               if ((REGNO_LAST_UID (bl->regno) != INSN_UID (first_compare))
8557                   || ! bl->init_insn
8558                   || REGNO_FIRST_UID (bl->regno) != INSN_UID (bl->init_insn))
8559                 loop_insn_sink (loop, gen_load_of_final_value (reg, final_value));
8560
8561               /* Delete compare/branch at end of loop.  */
8562               delete_related_insns (PREV_INSN (loop_end));
8563               if (compare_and_branch == 2)
8564                 delete_related_insns (first_compare);
8565
8566               /* Add new compare/branch insn at end of loop.  */
8567               start_sequence ();
8568               emit_cmp_and_jump_insns (reg, const0_rtx, cmp_code, NULL_RTX,
8569                                        GET_MODE (reg), 0,
8570                                        XEXP (jump_label, 0));
8571               tem = get_insns ();
8572               end_sequence ();
8573               emit_jump_insn_before (tem, loop_end);
8574
8575               for (tem = PREV_INSN (loop_end);
8576                    tem && GET_CODE (tem) != JUMP_INSN;
8577                    tem = PREV_INSN (tem))
8578                 ;
8579
8580               if (tem)
8581                 JUMP_LABEL (tem) = XEXP (jump_label, 0);
8582
8583               if (nonneg)
8584                 {
8585                   if (tem)
8586                     {
8587                       /* Increment of LABEL_NUSES done above.  */
8588                       /* Register is now always nonnegative,
8589                          so add REG_NONNEG note to the branch.  */
8590                       REG_NOTES (tem) = gen_rtx_EXPR_LIST (REG_NONNEG, reg,
8591                                                            REG_NOTES (tem));
8592                     }
8593                   bl->nonneg = 1;
8594                 }
8595
8596               /* No insn may reference both the reversed and another biv or it
8597                  will fail (see comment near the top of the loop reversal
8598                  code).
8599                  Earlier on, we have verified that the biv has no use except
8600                  counting, or it is the only biv in this function.
8601                  However, the code that computes no_use_except_counting does
8602                  not verify reg notes.  It's possible to have an insn that
8603                  references another biv, and has a REG_EQUAL note with an
8604                  expression based on the reversed biv.  To avoid this case,
8605                  remove all REG_EQUAL notes based on the reversed biv
8606                  here.  */
8607               for (p = loop_start; p != loop_end; p = NEXT_INSN (p))
8608                 if (INSN_P (p))
8609                   {
8610                     rtx *pnote;
8611                     rtx set = single_set (p);
8612                     /* If this is a set of a GIV based on the reversed biv, any
8613                        REG_EQUAL notes should still be correct.  */
8614                     if (! set
8615                         || GET_CODE (SET_DEST (set)) != REG
8616                         || (size_t) REGNO (SET_DEST (set)) >= ivs->n_regs
8617                         || REG_IV_TYPE (ivs, REGNO (SET_DEST (set))) != GENERAL_INDUCT
8618                         || REG_IV_INFO (ivs, REGNO (SET_DEST (set)))->src_reg != bl->biv->src_reg)
8619                       for (pnote = &REG_NOTES (p); *pnote;)
8620                         {
8621                           if (REG_NOTE_KIND (*pnote) == REG_EQUAL
8622                               && reg_mentioned_p (regno_reg_rtx[bl->regno],
8623                                                   XEXP (*pnote, 0)))
8624                             *pnote = XEXP (*pnote, 1);
8625                           else
8626                             pnote = &XEXP (*pnote, 1);
8627                         }
8628                   }
8629
8630               /* Mark that this biv has been reversed.  Each giv which depends
8631                  on this biv, and which is also live past the end of the loop
8632                  will have to be fixed up.  */
8633
8634               bl->reversed = 1;
8635
8636               if (loop_dump_stream)
8637                 {
8638                   fprintf (loop_dump_stream, "Reversed loop");
8639                   if (bl->nonneg)
8640                     fprintf (loop_dump_stream, " and added reg_nonneg\n");
8641                   else
8642                     fprintf (loop_dump_stream, "\n");
8643                 }
8644
8645               return 1;
8646             }
8647         }
8648     }
8649
8650   return 0;
8651 }
8652 \f
8653 /* Verify whether the biv BL appears to be eliminable,
8654    based on the insns in the loop that refer to it.
8655
8656    If ELIMINATE_P is nonzero, actually do the elimination.
8657
8658    THRESHOLD and INSN_COUNT are from loop_optimize and are used to
8659    determine whether invariant insns should be placed inside or at the
8660    start of the loop.  */
8661
8662 static int
8663 maybe_eliminate_biv (loop, bl, eliminate_p, threshold, insn_count)
8664      const struct loop *loop;
8665      struct iv_class *bl;
8666      int eliminate_p;
8667      int threshold, insn_count;
8668 {
8669   struct loop_ivs *ivs = LOOP_IVS (loop);
8670   rtx reg = bl->biv->dest_reg;
8671   rtx p;
8672
8673   /* Scan all insns in the loop, stopping if we find one that uses the
8674      biv in a way that we cannot eliminate.  */
8675
8676   for (p = loop->start; p != loop->end; p = NEXT_INSN (p))
8677     {
8678       enum rtx_code code = GET_CODE (p);
8679       basic_block where_bb = 0;
8680       rtx where_insn = threshold >= insn_count ? 0 : p;
8681       rtx note;
8682
8683       /* If this is a libcall that sets a giv, skip ahead to its end.  */
8684       if (GET_RTX_CLASS (code) == 'i')
8685         {
8686           note = find_reg_note (p, REG_LIBCALL, NULL_RTX);
8687
8688           if (note)
8689             {
8690               rtx last = XEXP (note, 0);
8691               rtx set = single_set (last);
8692
8693               if (set && GET_CODE (SET_DEST (set)) == REG)
8694                 {
8695                   unsigned int regno = REGNO (SET_DEST (set));
8696
8697                   if (regno < ivs->n_regs
8698                       && REG_IV_TYPE (ivs, regno) == GENERAL_INDUCT
8699                       && REG_IV_INFO (ivs, regno)->src_reg == bl->biv->src_reg)
8700                     p = last;
8701                 }
8702             }
8703         }
8704
8705       /* Closely examine the insn if the biv is mentioned.  */
8706       if ((code == INSN || code == JUMP_INSN || code == CALL_INSN)
8707           && reg_mentioned_p (reg, PATTERN (p))
8708           && ! maybe_eliminate_biv_1 (loop, PATTERN (p), p, bl,
8709                                       eliminate_p, where_bb, where_insn))
8710         {
8711           if (loop_dump_stream)
8712             fprintf (loop_dump_stream,
8713                      "Cannot eliminate biv %d: biv used in insn %d.\n",
8714                      bl->regno, INSN_UID (p));
8715           break;
8716         }
8717
8718       /* If we are eliminating, kill REG_EQUAL notes mentioning the biv.  */
8719       if (eliminate_p
8720           && (note = find_reg_note (p, REG_EQUAL, NULL_RTX)) != NULL_RTX
8721           && reg_mentioned_p (reg, XEXP (note, 0)))
8722         remove_note (p, note);
8723     }
8724
8725   if (p == loop->end)
8726     {
8727       if (loop_dump_stream)
8728         fprintf (loop_dump_stream, "biv %d %s eliminated.\n",
8729                  bl->regno, eliminate_p ? "was" : "can be");
8730       return 1;
8731     }
8732
8733   return 0;
8734 }
8735 \f
8736 /* INSN and REFERENCE are instructions in the same insn chain.
8737    Return nonzero if INSN is first.  */
8738
8739 int
8740 loop_insn_first_p (insn, reference)
8741      rtx insn, reference;
8742 {
8743   rtx p, q;
8744
8745   for (p = insn, q = reference;;)
8746     {
8747       /* Start with test for not first so that INSN == REFERENCE yields not
8748          first.  */
8749       if (q == insn || ! p)
8750         return 0;
8751       if (p == reference || ! q)
8752         return 1;
8753
8754       /* Either of P or Q might be a NOTE.  Notes have the same LUID as the
8755          previous insn, hence the <= comparison below does not work if
8756          P is a note.  */
8757       if (INSN_UID (p) < max_uid_for_loop
8758           && INSN_UID (q) < max_uid_for_loop
8759           && GET_CODE (p) != NOTE)
8760         return INSN_LUID (p) <= INSN_LUID (q);
8761
8762       if (INSN_UID (p) >= max_uid_for_loop
8763           || GET_CODE (p) == NOTE)
8764         p = NEXT_INSN (p);
8765       if (INSN_UID (q) >= max_uid_for_loop)
8766         q = NEXT_INSN (q);
8767     }
8768 }
8769
8770 /* We are trying to eliminate BIV in INSN using GIV.  Return nonzero if
8771    the offset that we have to take into account due to auto-increment /
8772    div derivation is zero.  */
8773 static int
8774 biv_elimination_giv_has_0_offset (biv, giv, insn)
8775      struct induction *biv, *giv;
8776      rtx insn;
8777 {
8778   /* If the giv V had the auto-inc address optimization applied
8779      to it, and INSN occurs between the giv insn and the biv
8780      insn, then we'd have to adjust the value used here.
8781      This is rare, so we don't bother to make this possible.  */
8782   if (giv->auto_inc_opt
8783       && ((loop_insn_first_p (giv->insn, insn)
8784            && loop_insn_first_p (insn, biv->insn))
8785           || (loop_insn_first_p (biv->insn, insn)
8786               && loop_insn_first_p (insn, giv->insn))))
8787     return 0;
8788
8789   return 1;
8790 }
8791
8792 /* If BL appears in X (part of the pattern of INSN), see if we can
8793    eliminate its use.  If so, return 1.  If not, return 0.
8794
8795    If BIV does not appear in X, return 1.
8796
8797    If ELIMINATE_P is nonzero, actually do the elimination.
8798    WHERE_INSN/WHERE_BB indicate where extra insns should be added.
8799    Depending on how many items have been moved out of the loop, it
8800    will either be before INSN (when WHERE_INSN is nonzero) or at the
8801    start of the loop (when WHERE_INSN is zero).  */
8802
8803 static int
8804 maybe_eliminate_biv_1 (loop, x, insn, bl, eliminate_p, where_bb, where_insn)
8805      const struct loop *loop;
8806      rtx x, insn;
8807      struct iv_class *bl;
8808      int eliminate_p;
8809      basic_block where_bb;
8810      rtx where_insn;
8811 {
8812   enum rtx_code code = GET_CODE (x);
8813   rtx reg = bl->biv->dest_reg;
8814   enum machine_mode mode = GET_MODE (reg);
8815   struct induction *v;
8816   rtx arg, tem;
8817 #ifdef HAVE_cc0
8818   rtx new;
8819 #endif
8820   int arg_operand;
8821   const char *fmt;
8822   int i, j;
8823
8824   switch (code)
8825     {
8826     case REG:
8827       /* If we haven't already been able to do something with this BIV,
8828          we can't eliminate it.  */
8829       if (x == reg)
8830         return 0;
8831       return 1;
8832
8833     case SET:
8834       /* If this sets the BIV, it is not a problem.  */
8835       if (SET_DEST (x) == reg)
8836         return 1;
8837
8838       /* If this is an insn that defines a giv, it is also ok because
8839          it will go away when the giv is reduced.  */
8840       for (v = bl->giv; v; v = v->next_iv)
8841         if (v->giv_type == DEST_REG && SET_DEST (x) == v->dest_reg)
8842           return 1;
8843
8844 #ifdef HAVE_cc0
8845       if (SET_DEST (x) == cc0_rtx && SET_SRC (x) == reg)
8846         {
8847           /* Can replace with any giv that was reduced and
8848              that has (MULT_VAL != 0) and (ADD_VAL == 0).
8849              Require a constant for MULT_VAL, so we know it's nonzero.
8850              ??? We disable this optimization to avoid potential
8851              overflows.  */
8852
8853           for (v = bl->giv; v; v = v->next_iv)
8854             if (GET_CODE (v->mult_val) == CONST_INT && v->mult_val != const0_rtx
8855                 && v->add_val == const0_rtx
8856                 && ! v->ignore && ! v->maybe_dead && v->always_computable
8857                 && v->mode == mode
8858                 && 0)
8859               {
8860                 if (! biv_elimination_giv_has_0_offset (bl->biv, v, insn))
8861                   continue;
8862
8863                 if (! eliminate_p)
8864                   return 1;
8865
8866                 /* If the giv has the opposite direction of change,
8867                    then reverse the comparison.  */
8868                 if (INTVAL (v->mult_val) < 0)
8869                   new = gen_rtx_COMPARE (GET_MODE (v->new_reg),
8870                                          const0_rtx, v->new_reg);
8871                 else
8872                   new = v->new_reg;
8873
8874                 /* We can probably test that giv's reduced reg.  */
8875                 if (validate_change (insn, &SET_SRC (x), new, 0))
8876                   return 1;
8877               }
8878
8879           /* Look for a giv with (MULT_VAL != 0) and (ADD_VAL != 0);
8880              replace test insn with a compare insn (cmp REDUCED_GIV ADD_VAL).
8881              Require a constant for MULT_VAL, so we know it's nonzero.
8882              ??? Do this only if ADD_VAL is a pointer to avoid a potential
8883              overflow problem.  */
8884
8885           for (v = bl->giv; v; v = v->next_iv)
8886             if (GET_CODE (v->mult_val) == CONST_INT
8887                 && v->mult_val != const0_rtx
8888                 && ! v->ignore && ! v->maybe_dead && v->always_computable
8889                 && v->mode == mode
8890                 && (GET_CODE (v->add_val) == SYMBOL_REF
8891                     || GET_CODE (v->add_val) == LABEL_REF
8892                     || GET_CODE (v->add_val) == CONST
8893                     || (GET_CODE (v->add_val) == REG
8894                         && REG_POINTER (v->add_val))))
8895               {
8896                 if (! biv_elimination_giv_has_0_offset (bl->biv, v, insn))
8897                   continue;
8898
8899                 if (! eliminate_p)
8900                   return 1;
8901
8902                 /* If the giv has the opposite direction of change,
8903                    then reverse the comparison.  */
8904                 if (INTVAL (v->mult_val) < 0)
8905                   new = gen_rtx_COMPARE (VOIDmode, copy_rtx (v->add_val),
8906                                          v->new_reg);
8907                 else
8908                   new = gen_rtx_COMPARE (VOIDmode, v->new_reg,
8909                                          copy_rtx (v->add_val));
8910
8911                 /* Replace biv with the giv's reduced register.  */
8912                 update_reg_last_use (v->add_val, insn);
8913                 if (validate_change (insn, &SET_SRC (PATTERN (insn)), new, 0))
8914                   return 1;
8915
8916                 /* Insn doesn't support that constant or invariant.  Copy it
8917                    into a register (it will be a loop invariant.)  */
8918                 tem = gen_reg_rtx (GET_MODE (v->new_reg));
8919
8920                 loop_insn_emit_before (loop, 0, where_insn,
8921                                        gen_move_insn (tem,
8922                                                       copy_rtx (v->add_val)));
8923
8924                 /* Substitute the new register for its invariant value in
8925                    the compare expression.  */
8926                 XEXP (new, (INTVAL (v->mult_val) < 0) ? 0 : 1) = tem;
8927                 if (validate_change (insn, &SET_SRC (PATTERN (insn)), new, 0))
8928                   return 1;
8929               }
8930         }
8931 #endif
8932       break;
8933
8934     case COMPARE:
8935     case EQ:  case NE:
8936     case GT:  case GE:  case GTU:  case GEU:
8937     case LT:  case LE:  case LTU:  case LEU:
8938       /* See if either argument is the biv.  */
8939       if (XEXP (x, 0) == reg)
8940         arg = XEXP (x, 1), arg_operand = 1;
8941       else if (XEXP (x, 1) == reg)
8942         arg = XEXP (x, 0), arg_operand = 0;
8943       else
8944         break;
8945
8946       if (CONSTANT_P (arg))
8947         {
8948           /* First try to replace with any giv that has constant positive
8949              mult_val and constant add_val.  We might be able to support
8950              negative mult_val, but it seems complex to do it in general.  */
8951
8952           for (v = bl->giv; v; v = v->next_iv)
8953             if (GET_CODE (v->mult_val) == CONST_INT
8954                 && INTVAL (v->mult_val) > 0
8955                 && (GET_CODE (v->add_val) == SYMBOL_REF
8956                     || GET_CODE (v->add_val) == LABEL_REF
8957                     || GET_CODE (v->add_val) == CONST
8958                     || (GET_CODE (v->add_val) == REG
8959                         && REG_POINTER (v->add_val)))
8960                 && ! v->ignore && ! v->maybe_dead && v->always_computable
8961                 && v->mode == mode)
8962               {
8963                 if (! biv_elimination_giv_has_0_offset (bl->biv, v, insn))
8964                   continue;
8965
8966                 /* Don't eliminate if the linear combination that makes up
8967                    the giv overflows when it is applied to ARG.  */
8968                 if (GET_CODE (arg) == CONST_INT)
8969                   {
8970                     rtx add_val;
8971
8972                     if (GET_CODE (v->add_val) == CONST_INT)
8973                       add_val = v->add_val;
8974                     else
8975                       add_val = const0_rtx;
8976
8977                     if (const_mult_add_overflow_p (arg, v->mult_val,
8978                                                    add_val, mode, 1))
8979                       continue;
8980                   }
8981
8982                 if (! eliminate_p)
8983                   return 1;
8984
8985                 /* Replace biv with the giv's reduced reg.  */
8986                 validate_change (insn, &XEXP (x, 1 - arg_operand), v->new_reg, 1);
8987
8988                 /* If all constants are actually constant integers and
8989                    the derived constant can be directly placed in the COMPARE,
8990                    do so.  */
8991                 if (GET_CODE (arg) == CONST_INT
8992                     && GET_CODE (v->add_val) == CONST_INT)
8993                   {
8994                     tem = expand_mult_add (arg, NULL_RTX, v->mult_val,
8995                                            v->add_val, mode, 1);
8996                   }
8997                 else
8998                   {
8999                     /* Otherwise, load it into a register.  */
9000                     tem = gen_reg_rtx (mode);
9001                     loop_iv_add_mult_emit_before (loop, arg,
9002                                                   v->mult_val, v->add_val,
9003                                                   tem, where_bb, where_insn);
9004                   }
9005
9006                 validate_change (insn, &XEXP (x, arg_operand), tem, 1);
9007
9008                 if (apply_change_group ())
9009                   return 1;
9010               }
9011
9012           /* Look for giv with positive constant mult_val and nonconst add_val.
9013              Insert insns to calculate new compare value.
9014              ??? Turn this off due to possible overflow.  */
9015
9016           for (v = bl->giv; v; v = v->next_iv)
9017             if (GET_CODE (v->mult_val) == CONST_INT
9018                 && INTVAL (v->mult_val) > 0
9019                 && ! v->ignore && ! v->maybe_dead && v->always_computable
9020                 && v->mode == mode
9021                 && 0)
9022               {
9023                 rtx tem;
9024
9025                 if (! biv_elimination_giv_has_0_offset (bl->biv, v, insn))
9026                   continue;
9027
9028                 if (! eliminate_p)
9029                   return 1;
9030
9031                 tem = gen_reg_rtx (mode);
9032
9033                 /* Replace biv with giv's reduced register.  */
9034                 validate_change (insn, &XEXP (x, 1 - arg_operand),
9035                                  v->new_reg, 1);
9036
9037                 /* Compute value to compare against.  */
9038                 loop_iv_add_mult_emit_before (loop, arg,
9039                                               v->mult_val, v->add_val,
9040                                               tem, where_bb, where_insn);
9041                 /* Use it in this insn.  */
9042                 validate_change (insn, &XEXP (x, arg_operand), tem, 1);
9043                 if (apply_change_group ())
9044                   return 1;
9045               }
9046         }
9047       else if (GET_CODE (arg) == REG || GET_CODE (arg) == MEM)
9048         {
9049           if (loop_invariant_p (loop, arg) == 1)
9050             {
9051               /* Look for giv with constant positive mult_val and nonconst
9052                  add_val. Insert insns to compute new compare value.
9053                  ??? Turn this off due to possible overflow.  */
9054
9055               for (v = bl->giv; v; v = v->next_iv)
9056                 if (GET_CODE (v->mult_val) == CONST_INT && INTVAL (v->mult_val) > 0
9057                     && ! v->ignore && ! v->maybe_dead && v->always_computable
9058                     && v->mode == mode
9059                     && 0)
9060                   {
9061                     rtx tem;
9062
9063                     if (! biv_elimination_giv_has_0_offset (bl->biv, v, insn))
9064                       continue;
9065
9066                     if (! eliminate_p)
9067                       return 1;
9068
9069                     tem = gen_reg_rtx (mode);
9070
9071                     /* Replace biv with giv's reduced register.  */
9072                     validate_change (insn, &XEXP (x, 1 - arg_operand),
9073                                      v->new_reg, 1);
9074
9075                     /* Compute value to compare against.  */
9076                     loop_iv_add_mult_emit_before (loop, arg,
9077                                                   v->mult_val, v->add_val,
9078                                                   tem, where_bb, where_insn);
9079                     validate_change (insn, &XEXP (x, arg_operand), tem, 1);
9080                     if (apply_change_group ())
9081                       return 1;
9082                   }
9083             }
9084
9085           /* This code has problems.  Basically, you can't know when
9086              seeing if we will eliminate BL, whether a particular giv
9087              of ARG will be reduced.  If it isn't going to be reduced,
9088              we can't eliminate BL.  We can try forcing it to be reduced,
9089              but that can generate poor code.
9090
9091              The problem is that the benefit of reducing TV, below should
9092              be increased if BL can actually be eliminated, but this means
9093              we might have to do a topological sort of the order in which
9094              we try to process biv.  It doesn't seem worthwhile to do
9095              this sort of thing now.  */
9096
9097 #if 0
9098           /* Otherwise the reg compared with had better be a biv.  */
9099           if (GET_CODE (arg) != REG
9100               || REG_IV_TYPE (ivs, REGNO (arg)) != BASIC_INDUCT)
9101             return 0;
9102
9103           /* Look for a pair of givs, one for each biv,
9104              with identical coefficients.  */
9105           for (v = bl->giv; v; v = v->next_iv)
9106             {
9107               struct induction *tv;
9108
9109               if (v->ignore || v->maybe_dead || v->mode != mode)
9110                 continue;
9111
9112               for (tv = REG_IV_CLASS (ivs, REGNO (arg))->giv; tv;
9113                    tv = tv->next_iv)
9114                 if (! tv->ignore && ! tv->maybe_dead
9115                     && rtx_equal_p (tv->mult_val, v->mult_val)
9116                     && rtx_equal_p (tv->add_val, v->add_val)
9117                     && tv->mode == mode)
9118                   {
9119                     if (! biv_elimination_giv_has_0_offset (bl->biv, v, insn))
9120                       continue;
9121
9122                     if (! eliminate_p)
9123                       return 1;
9124
9125                     /* Replace biv with its giv's reduced reg.  */
9126                     XEXP (x, 1 - arg_operand) = v->new_reg;
9127                     /* Replace other operand with the other giv's
9128                        reduced reg.  */
9129                     XEXP (x, arg_operand) = tv->new_reg;
9130                     return 1;
9131                   }
9132             }
9133 #endif
9134         }
9135
9136       /* If we get here, the biv can't be eliminated.  */
9137       return 0;
9138
9139     case MEM:
9140       /* If this address is a DEST_ADDR giv, it doesn't matter if the
9141          biv is used in it, since it will be replaced.  */
9142       for (v = bl->giv; v; v = v->next_iv)
9143         if (v->giv_type == DEST_ADDR && v->location == &XEXP (x, 0))
9144           return 1;
9145       break;
9146
9147     default:
9148       break;
9149     }
9150
9151   /* See if any subexpression fails elimination.  */
9152   fmt = GET_RTX_FORMAT (code);
9153   for (i = GET_RTX_LENGTH (code) - 1; i >= 0; i--)
9154     {
9155       switch (fmt[i])
9156         {
9157         case 'e':
9158           if (! maybe_eliminate_biv_1 (loop, XEXP (x, i), insn, bl,
9159                                        eliminate_p, where_bb, where_insn))
9160             return 0;
9161           break;
9162
9163         case 'E':
9164           for (j = XVECLEN (x, i) - 1; j >= 0; j--)
9165             if (! maybe_eliminate_biv_1 (loop, XVECEXP (x, i, j), insn, bl,
9166                                          eliminate_p, where_bb, where_insn))
9167               return 0;
9168           break;
9169         }
9170     }
9171
9172   return 1;
9173 }
9174 \f
9175 /* Return nonzero if the last use of REG
9176    is in an insn following INSN in the same basic block.  */
9177
9178 static int
9179 last_use_this_basic_block (reg, insn)
9180      rtx reg;
9181      rtx insn;
9182 {
9183   rtx n;
9184   for (n = insn;
9185        n && GET_CODE (n) != CODE_LABEL && GET_CODE (n) != JUMP_INSN;
9186        n = NEXT_INSN (n))
9187     {
9188       if (REGNO_LAST_UID (REGNO (reg)) == INSN_UID (n))
9189         return 1;
9190     }
9191   return 0;
9192 }
9193 \f
9194 /* Called via `note_stores' to record the initial value of a biv.  Here we
9195    just record the location of the set and process it later.  */
9196
9197 static void
9198 record_initial (dest, set, data)
9199      rtx dest;
9200      rtx set;
9201      void *data ATTRIBUTE_UNUSED;
9202 {
9203   struct loop_ivs *ivs = (struct loop_ivs *) data;
9204   struct iv_class *bl;
9205
9206   if (GET_CODE (dest) != REG
9207       || REGNO (dest) >= ivs->n_regs
9208       || REG_IV_TYPE (ivs, REGNO (dest)) != BASIC_INDUCT)
9209     return;
9210
9211   bl = REG_IV_CLASS (ivs, REGNO (dest));
9212
9213   /* If this is the first set found, record it.  */
9214   if (bl->init_insn == 0)
9215     {
9216       bl->init_insn = note_insn;
9217       bl->init_set = set;
9218     }
9219 }
9220 \f
9221 /* If any of the registers in X are "old" and currently have a last use earlier
9222    than INSN, update them to have a last use of INSN.  Their actual last use
9223    will be the previous insn but it will not have a valid uid_luid so we can't
9224    use it.  X must be a source expression only.  */
9225
9226 static void
9227 update_reg_last_use (x, insn)
9228      rtx x;
9229      rtx insn;
9230 {
9231   /* Check for the case where INSN does not have a valid luid.  In this case,
9232      there is no need to modify the regno_last_uid, as this can only happen
9233      when code is inserted after the loop_end to set a pseudo's final value,
9234      and hence this insn will never be the last use of x.
9235      ???? This comment is not correct.  See for example loop_givs_reduce.
9236      This may insert an insn before another new insn.  */
9237   if (GET_CODE (x) == REG && REGNO (x) < max_reg_before_loop
9238       && INSN_UID (insn) < max_uid_for_loop
9239       && REGNO_LAST_LUID (REGNO (x)) < INSN_LUID (insn))
9240     {
9241       REGNO_LAST_UID (REGNO (x)) = INSN_UID (insn);
9242     }
9243   else
9244     {
9245       int i, j;
9246       const char *fmt = GET_RTX_FORMAT (GET_CODE (x));
9247       for (i = GET_RTX_LENGTH (GET_CODE (x)) - 1; i >= 0; i--)
9248         {
9249           if (fmt[i] == 'e')
9250             update_reg_last_use (XEXP (x, i), insn);
9251           else if (fmt[i] == 'E')
9252             for (j = XVECLEN (x, i) - 1; j >= 0; j--)
9253               update_reg_last_use (XVECEXP (x, i, j), insn);
9254         }
9255     }
9256 }
9257 \f
9258 /* Given an insn INSN and condition COND, return the condition in a
9259    canonical form to simplify testing by callers.  Specifically:
9260
9261    (1) The code will always be a comparison operation (EQ, NE, GT, etc.).
9262    (2) Both operands will be machine operands; (cc0) will have been replaced.
9263    (3) If an operand is a constant, it will be the second operand.
9264    (4) (LE x const) will be replaced with (LT x <const+1>) and similarly
9265        for GE, GEU, and LEU.
9266
9267    If the condition cannot be understood, or is an inequality floating-point
9268    comparison which needs to be reversed, 0 will be returned.
9269
9270    If REVERSE is nonzero, then reverse the condition prior to canonizing it.
9271
9272    If EARLIEST is nonzero, it is a pointer to a place where the earliest
9273    insn used in locating the condition was found.  If a replacement test
9274    of the condition is desired, it should be placed in front of that
9275    insn and we will be sure that the inputs are still valid.
9276
9277    If WANT_REG is nonzero, we wish the condition to be relative to that
9278    register, if possible.  Therefore, do not canonicalize the condition
9279    further.  */
9280
9281 rtx
9282 canonicalize_condition (insn, cond, reverse, earliest, want_reg)
9283      rtx insn;
9284      rtx cond;
9285      int reverse;
9286      rtx *earliest;
9287      rtx want_reg;
9288 {
9289   enum rtx_code code;
9290   rtx prev = insn;
9291   rtx set;
9292   rtx tem;
9293   rtx op0, op1;
9294   int reverse_code = 0;
9295   enum machine_mode mode;
9296
9297   code = GET_CODE (cond);
9298   mode = GET_MODE (cond);
9299   op0 = XEXP (cond, 0);
9300   op1 = XEXP (cond, 1);
9301
9302   if (reverse)
9303     code = reversed_comparison_code (cond, insn);
9304   if (code == UNKNOWN)
9305     return 0;
9306
9307   if (earliest)
9308     *earliest = insn;
9309
9310   /* If we are comparing a register with zero, see if the register is set
9311      in the previous insn to a COMPARE or a comparison operation.  Perform
9312      the same tests as a function of STORE_FLAG_VALUE as find_comparison_args
9313      in cse.c  */
9314
9315   while (GET_RTX_CLASS (code) == '<'
9316          && op1 == CONST0_RTX (GET_MODE (op0))
9317          && op0 != want_reg)
9318     {
9319       /* Set nonzero when we find something of interest.  */
9320       rtx x = 0;
9321
9322 #ifdef HAVE_cc0
9323       /* If comparison with cc0, import actual comparison from compare
9324          insn.  */
9325       if (op0 == cc0_rtx)
9326         {
9327           if ((prev = prev_nonnote_insn (prev)) == 0
9328               || GET_CODE (prev) != INSN
9329               || (set = single_set (prev)) == 0
9330               || SET_DEST (set) != cc0_rtx)
9331             return 0;
9332
9333           op0 = SET_SRC (set);
9334           op1 = CONST0_RTX (GET_MODE (op0));
9335           if (earliest)
9336             *earliest = prev;
9337         }
9338 #endif
9339
9340       /* If this is a COMPARE, pick up the two things being compared.  */
9341       if (GET_CODE (op0) == COMPARE)
9342         {
9343           op1 = XEXP (op0, 1);
9344           op0 = XEXP (op0, 0);
9345           continue;
9346         }
9347       else if (GET_CODE (op0) != REG)
9348         break;
9349
9350       /* Go back to the previous insn.  Stop if it is not an INSN.  We also
9351          stop if it isn't a single set or if it has a REG_INC note because
9352          we don't want to bother dealing with it.  */
9353
9354       if ((prev = prev_nonnote_insn (prev)) == 0
9355           || GET_CODE (prev) != INSN
9356           || FIND_REG_INC_NOTE (prev, NULL_RTX))
9357         break;
9358
9359       set = set_of (op0, prev);
9360
9361       if (set
9362           && (GET_CODE (set) != SET
9363               || !rtx_equal_p (SET_DEST (set), op0)))
9364         break;
9365
9366       /* If this is setting OP0, get what it sets it to if it looks
9367          relevant.  */
9368       if (set)
9369         {
9370           enum machine_mode inner_mode = GET_MODE (SET_DEST (set));
9371 #ifdef FLOAT_STORE_FLAG_VALUE
9372           REAL_VALUE_TYPE fsfv;
9373 #endif
9374
9375           /* ??? We may not combine comparisons done in a CCmode with
9376              comparisons not done in a CCmode.  This is to aid targets
9377              like Alpha that have an IEEE compliant EQ instruction, and
9378              a non-IEEE compliant BEQ instruction.  The use of CCmode is
9379              actually artificial, simply to prevent the combination, but
9380              should not affect other platforms.
9381
9382              However, we must allow VOIDmode comparisons to match either
9383              CCmode or non-CCmode comparison, because some ports have
9384              modeless comparisons inside branch patterns.
9385
9386              ??? This mode check should perhaps look more like the mode check
9387              in simplify_comparison in combine.  */
9388
9389           if ((GET_CODE (SET_SRC (set)) == COMPARE
9390                || (((code == NE
9391                      || (code == LT
9392                          && GET_MODE_CLASS (inner_mode) == MODE_INT
9393                          && (GET_MODE_BITSIZE (inner_mode)
9394                              <= HOST_BITS_PER_WIDE_INT)
9395                          && (STORE_FLAG_VALUE
9396                              & ((HOST_WIDE_INT) 1
9397                                 << (GET_MODE_BITSIZE (inner_mode) - 1))))
9398 #ifdef FLOAT_STORE_FLAG_VALUE
9399                      || (code == LT
9400                          && GET_MODE_CLASS (inner_mode) == MODE_FLOAT
9401                          && (fsfv = FLOAT_STORE_FLAG_VALUE (inner_mode),
9402                              REAL_VALUE_NEGATIVE (fsfv)))
9403 #endif
9404                      ))
9405                    && GET_RTX_CLASS (GET_CODE (SET_SRC (set))) == '<'))
9406               && (((GET_MODE_CLASS (mode) == MODE_CC)
9407                    == (GET_MODE_CLASS (inner_mode) == MODE_CC))
9408                   || mode == VOIDmode || inner_mode == VOIDmode))
9409             x = SET_SRC (set);
9410           else if (((code == EQ
9411                      || (code == GE
9412                          && (GET_MODE_BITSIZE (inner_mode)
9413                              <= HOST_BITS_PER_WIDE_INT)
9414                          && GET_MODE_CLASS (inner_mode) == MODE_INT
9415                          && (STORE_FLAG_VALUE
9416                              & ((HOST_WIDE_INT) 1
9417                                 << (GET_MODE_BITSIZE (inner_mode) - 1))))
9418 #ifdef FLOAT_STORE_FLAG_VALUE
9419                      || (code == GE
9420                          && GET_MODE_CLASS (inner_mode) == MODE_FLOAT
9421                          && (fsfv = FLOAT_STORE_FLAG_VALUE (inner_mode),
9422                              REAL_VALUE_NEGATIVE (fsfv)))
9423 #endif
9424                      ))
9425                    && GET_RTX_CLASS (GET_CODE (SET_SRC (set))) == '<'
9426                    && (((GET_MODE_CLASS (mode) == MODE_CC)
9427                         == (GET_MODE_CLASS (inner_mode) == MODE_CC))
9428                        || mode == VOIDmode || inner_mode == VOIDmode))
9429
9430             {
9431               reverse_code = 1;
9432               x = SET_SRC (set);
9433             }
9434           else
9435             break;
9436         }
9437
9438       else if (reg_set_p (op0, prev))
9439         /* If this sets OP0, but not directly, we have to give up.  */
9440         break;
9441
9442       if (x)
9443         {
9444           if (GET_RTX_CLASS (GET_CODE (x)) == '<')
9445             code = GET_CODE (x);
9446           if (reverse_code)
9447             {
9448               code = reversed_comparison_code (x, prev);
9449               if (code == UNKNOWN)
9450                 return 0;
9451               reverse_code = 0;
9452             }
9453
9454           op0 = XEXP (x, 0), op1 = XEXP (x, 1);
9455           if (earliest)
9456             *earliest = prev;
9457         }
9458     }
9459
9460   /* If constant is first, put it last.  */
9461   if (CONSTANT_P (op0))
9462     code = swap_condition (code), tem = op0, op0 = op1, op1 = tem;
9463
9464   /* If OP0 is the result of a comparison, we weren't able to find what
9465      was really being compared, so fail.  */
9466   if (GET_MODE_CLASS (GET_MODE (op0)) == MODE_CC)
9467     return 0;
9468
9469   /* Canonicalize any ordered comparison with integers involving equality
9470      if we can do computations in the relevant mode and we do not
9471      overflow.  */
9472
9473   if (GET_CODE (op1) == CONST_INT
9474       && GET_MODE (op0) != VOIDmode
9475       && GET_MODE_BITSIZE (GET_MODE (op0)) <= HOST_BITS_PER_WIDE_INT)
9476     {
9477       HOST_WIDE_INT const_val = INTVAL (op1);
9478       unsigned HOST_WIDE_INT uconst_val = const_val;
9479       unsigned HOST_WIDE_INT max_val
9480         = (unsigned HOST_WIDE_INT) GET_MODE_MASK (GET_MODE (op0));
9481
9482       switch (code)
9483         {
9484         case LE:
9485           if ((unsigned HOST_WIDE_INT) const_val != max_val >> 1)
9486             code = LT, op1 = gen_int_mode (const_val + 1, GET_MODE (op0));
9487           break;
9488
9489         /* When cross-compiling, const_val might be sign-extended from
9490            BITS_PER_WORD to HOST_BITS_PER_WIDE_INT */
9491         case GE:
9492           if ((HOST_WIDE_INT) (const_val & max_val)
9493               != (((HOST_WIDE_INT) 1
9494                    << (GET_MODE_BITSIZE (GET_MODE (op0)) - 1))))
9495             code = GT, op1 = gen_int_mode (const_val - 1, GET_MODE (op0));
9496           break;
9497
9498         case LEU:
9499           if (uconst_val < max_val)
9500             code = LTU, op1 = gen_int_mode (uconst_val + 1, GET_MODE (op0));
9501           break;
9502
9503         case GEU:
9504           if (uconst_val != 0)
9505             code = GTU, op1 = gen_int_mode (uconst_val - 1, GET_MODE (op0));
9506           break;
9507
9508         default:
9509           break;
9510         }
9511     }
9512
9513   /* Never return CC0; return zero instead.  */
9514   if (CC0_P (op0))
9515     return 0;
9516
9517   return gen_rtx_fmt_ee (code, VOIDmode, op0, op1);
9518 }
9519
9520 /* Given a jump insn JUMP, return the condition that will cause it to branch
9521    to its JUMP_LABEL.  If the condition cannot be understood, or is an
9522    inequality floating-point comparison which needs to be reversed, 0 will
9523    be returned.
9524
9525    If EARLIEST is nonzero, it is a pointer to a place where the earliest
9526    insn used in locating the condition was found.  If a replacement test
9527    of the condition is desired, it should be placed in front of that
9528    insn and we will be sure that the inputs are still valid.  */
9529
9530 rtx
9531 get_condition (jump, earliest)
9532      rtx jump;
9533      rtx *earliest;
9534 {
9535   rtx cond;
9536   int reverse;
9537   rtx set;
9538
9539   /* If this is not a standard conditional jump, we can't parse it.  */
9540   if (GET_CODE (jump) != JUMP_INSN
9541       || ! any_condjump_p (jump))
9542     return 0;
9543   set = pc_set (jump);
9544
9545   cond = XEXP (SET_SRC (set), 0);
9546
9547   /* If this branches to JUMP_LABEL when the condition is false, reverse
9548      the condition.  */
9549   reverse
9550     = GET_CODE (XEXP (SET_SRC (set), 2)) == LABEL_REF
9551       && XEXP (XEXP (SET_SRC (set), 2), 0) == JUMP_LABEL (jump);
9552
9553   return canonicalize_condition (jump, cond, reverse, earliest, NULL_RTX);
9554 }
9555
9556 /* Similar to above routine, except that we also put an invariant last
9557    unless both operands are invariants.  */
9558
9559 rtx
9560 get_condition_for_loop (loop, x)
9561      const struct loop *loop;
9562      rtx x;
9563 {
9564   rtx comparison = get_condition (x, (rtx*) 0);
9565
9566   if (comparison == 0
9567       || ! loop_invariant_p (loop, XEXP (comparison, 0))
9568       || loop_invariant_p (loop, XEXP (comparison, 1)))
9569     return comparison;
9570
9571   return gen_rtx_fmt_ee (swap_condition (GET_CODE (comparison)), VOIDmode,
9572                          XEXP (comparison, 1), XEXP (comparison, 0));
9573 }
9574
9575 /* Scan the function and determine whether it has indirect (computed) jumps.
9576
9577    This is taken mostly from flow.c; similar code exists elsewhere
9578    in the compiler.  It may be useful to put this into rtlanal.c.  */
9579 static int
9580 indirect_jump_in_function_p (start)
9581      rtx start;
9582 {
9583   rtx insn;
9584
9585   for (insn = start; insn; insn = NEXT_INSN (insn))
9586     if (computed_jump_p (insn))
9587       return 1;
9588
9589   return 0;
9590 }
9591
9592 /* Add MEM to the LOOP_MEMS array, if appropriate.  See the
9593    documentation for LOOP_MEMS for the definition of `appropriate'.
9594    This function is called from prescan_loop via for_each_rtx.  */
9595
9596 static int
9597 insert_loop_mem (mem, data)
9598      rtx *mem;
9599      void *data ATTRIBUTE_UNUSED;
9600 {
9601   struct loop_info *loop_info = data;
9602   int i;
9603   rtx m = *mem;
9604
9605   if (m == NULL_RTX)
9606     return 0;
9607
9608   switch (GET_CODE (m))
9609     {
9610     case MEM:
9611       break;
9612
9613     case CLOBBER:
9614       /* We're not interested in MEMs that are only clobbered.  */
9615       return -1;
9616
9617     case CONST_DOUBLE:
9618       /* We're not interested in the MEM associated with a
9619          CONST_DOUBLE, so there's no need to traverse into this.  */
9620       return -1;
9621
9622     case EXPR_LIST:
9623       /* We're not interested in any MEMs that only appear in notes.  */
9624       return -1;
9625
9626     default:
9627       /* This is not a MEM.  */
9628       return 0;
9629     }
9630
9631   /* See if we've already seen this MEM.  */
9632   for (i = 0; i < loop_info->mems_idx; ++i)
9633     if (rtx_equal_p (m, loop_info->mems[i].mem))
9634       {
9635         if (GET_MODE (m) != GET_MODE (loop_info->mems[i].mem))
9636           /* The modes of the two memory accesses are different.  If
9637              this happens, something tricky is going on, and we just
9638              don't optimize accesses to this MEM.  */
9639           loop_info->mems[i].optimize = 0;
9640
9641         return 0;
9642       }
9643
9644   /* Resize the array, if necessary.  */
9645   if (loop_info->mems_idx == loop_info->mems_allocated)
9646     {
9647       if (loop_info->mems_allocated != 0)
9648         loop_info->mems_allocated *= 2;
9649       else
9650         loop_info->mems_allocated = 32;
9651
9652       loop_info->mems = (loop_mem_info *)
9653         xrealloc (loop_info->mems,
9654                   loop_info->mems_allocated * sizeof (loop_mem_info));
9655     }
9656
9657   /* Actually insert the MEM.  */
9658   loop_info->mems[loop_info->mems_idx].mem = m;
9659   /* We can't hoist this MEM out of the loop if it's a BLKmode MEM
9660      because we can't put it in a register.  We still store it in the
9661      table, though, so that if we see the same address later, but in a
9662      non-BLK mode, we'll not think we can optimize it at that point.  */
9663   loop_info->mems[loop_info->mems_idx].optimize = (GET_MODE (m) != BLKmode);
9664   loop_info->mems[loop_info->mems_idx].reg = NULL_RTX;
9665   ++loop_info->mems_idx;
9666
9667   return 0;
9668 }
9669
9670
9671 /* Allocate REGS->ARRAY or reallocate it if it is too small.
9672
9673    Increment REGS->ARRAY[I].SET_IN_LOOP at the index I of each
9674    register that is modified by an insn between FROM and TO.  If the
9675    value of an element of REGS->array[I].SET_IN_LOOP becomes 127 or
9676    more, stop incrementing it, to avoid overflow.
9677
9678    Store in REGS->ARRAY[I].SINGLE_USAGE the single insn in which
9679    register I is used, if it is only used once.  Otherwise, it is set
9680    to 0 (for no uses) or const0_rtx for more than one use.  This
9681    parameter may be zero, in which case this processing is not done.
9682
9683    Set REGS->ARRAY[I].MAY_NOT_OPTIMIZE nonzero if we should not
9684    optimize register I.  */
9685
9686 static void
9687 loop_regs_scan (loop, extra_size)
9688      const struct loop *loop;
9689      int extra_size;
9690 {
9691   struct loop_regs *regs = LOOP_REGS (loop);
9692   int old_nregs;
9693   /* last_set[n] is nonzero iff reg n has been set in the current
9694    basic block.  In that case, it is the insn that last set reg n.  */
9695   rtx *last_set;
9696   rtx insn;
9697   int i;
9698
9699   old_nregs = regs->num;
9700   regs->num = max_reg_num ();
9701
9702   /* Grow the regs array if not allocated or too small.  */
9703   if (regs->num >= regs->size)
9704     {
9705       regs->size = regs->num + extra_size;
9706
9707       regs->array = (struct loop_reg *)
9708         xrealloc (regs->array, regs->size * sizeof (*regs->array));
9709
9710       /* Zero the new elements.  */
9711       memset (regs->array + old_nregs, 0,
9712               (regs->size - old_nregs) * sizeof (*regs->array));
9713     }
9714
9715   /* Clear previously scanned fields but do not clear n_times_set.  */
9716   for (i = 0; i < old_nregs; i++)
9717     {
9718       regs->array[i].set_in_loop = 0;
9719       regs->array[i].may_not_optimize = 0;
9720       regs->array[i].single_usage = NULL_RTX;
9721     }
9722
9723   last_set = (rtx *) xcalloc (regs->num, sizeof (rtx));
9724
9725   /* Scan the loop, recording register usage.  */
9726   for (insn = loop->top ? loop->top : loop->start; insn != loop->end;
9727        insn = NEXT_INSN (insn))
9728     {
9729       if (INSN_P (insn))
9730         {
9731           /* Record registers that have exactly one use.  */
9732           find_single_use_in_loop (regs, insn, PATTERN (insn));
9733
9734           /* Include uses in REG_EQUAL notes.  */
9735           if (REG_NOTES (insn))
9736             find_single_use_in_loop (regs, insn, REG_NOTES (insn));
9737
9738           if (GET_CODE (PATTERN (insn)) == SET
9739               || GET_CODE (PATTERN (insn)) == CLOBBER)
9740             count_one_set (regs, insn, PATTERN (insn), last_set);
9741           else if (GET_CODE (PATTERN (insn)) == PARALLEL)
9742             {
9743               int i;
9744               for (i = XVECLEN (PATTERN (insn), 0) - 1; i >= 0; i--)
9745                 count_one_set (regs, insn, XVECEXP (PATTERN (insn), 0, i),
9746                                last_set);
9747             }
9748         }
9749
9750       if (GET_CODE (insn) == CODE_LABEL || GET_CODE (insn) == JUMP_INSN)
9751         memset (last_set, 0, regs->num * sizeof (rtx));
9752
9753       /* Invalidate all registers used for function argument passing.
9754          We check rtx_varies_p for the same reason as below, to allow
9755          optimizing PIC calculations.  */
9756       if (GET_CODE (insn) == CALL_INSN)
9757         {
9758           rtx link;
9759           for (link = CALL_INSN_FUNCTION_USAGE (insn);
9760                link;
9761                link = XEXP (link, 1))
9762             {
9763               rtx op, reg;
9764
9765               if (GET_CODE (op = XEXP (link, 0)) == USE
9766                   && GET_CODE (reg = XEXP (op, 0)) == REG
9767                   && rtx_varies_p (reg, 1))
9768                 regs->array[REGNO (reg)].may_not_optimize = 1;
9769             }
9770         }
9771     }
9772
9773   /* Invalidate all hard registers clobbered by calls.  With one exception:
9774      a call-clobbered PIC register is still function-invariant for our
9775      purposes, since we can hoist any PIC calculations out of the loop.
9776      Thus the call to rtx_varies_p.  */
9777   if (LOOP_INFO (loop)->has_call)
9778     for (i = 0; i < FIRST_PSEUDO_REGISTER; i++)
9779       if (TEST_HARD_REG_BIT (regs_invalidated_by_call, i)
9780           && rtx_varies_p (regno_reg_rtx[i], 1))
9781         {
9782           regs->array[i].may_not_optimize = 1;
9783           regs->array[i].set_in_loop = 1;
9784         }
9785
9786 #ifdef AVOID_CCMODE_COPIES
9787   /* Don't try to move insns which set CC registers if we should not
9788      create CCmode register copies.  */
9789   for (i = regs->num - 1; i >= FIRST_PSEUDO_REGISTER; i--)
9790     if (GET_MODE_CLASS (GET_MODE (regno_reg_rtx[i])) == MODE_CC)
9791       regs->array[i].may_not_optimize = 1;
9792 #endif
9793
9794   /* Set regs->array[I].n_times_set for the new registers.  */
9795   for (i = old_nregs; i < regs->num; i++)
9796     regs->array[i].n_times_set = regs->array[i].set_in_loop;
9797
9798   free (last_set);
9799 }
9800
9801 /* Returns the number of real INSNs in the LOOP.  */
9802
9803 static int
9804 count_insns_in_loop (loop)
9805      const struct loop *loop;
9806 {
9807   int count = 0;
9808   rtx insn;
9809
9810   for (insn = loop->top ? loop->top : loop->start; insn != loop->end;
9811        insn = NEXT_INSN (insn))
9812     if (INSN_P (insn))
9813       ++count;
9814
9815   return count;
9816 }
9817
9818 /* Move MEMs into registers for the duration of the loop.  */
9819
9820 static void
9821 load_mems (loop)
9822      const struct loop *loop;
9823 {
9824   struct loop_info *loop_info = LOOP_INFO (loop);
9825   struct loop_regs *regs = LOOP_REGS (loop);
9826   int maybe_never = 0;
9827   int i;
9828   rtx p, prev_ebb_head;
9829   rtx label = NULL_RTX;
9830   rtx end_label;
9831   /* Nonzero if the next instruction may never be executed.  */
9832   int next_maybe_never = 0;
9833   unsigned int last_max_reg = max_reg_num ();
9834
9835   if (loop_info->mems_idx == 0)
9836     return;
9837
9838   /* We cannot use next_label here because it skips over normal insns.  */
9839   end_label = next_nonnote_insn (loop->end);
9840   if (end_label && GET_CODE (end_label) != CODE_LABEL)
9841     end_label = NULL_RTX;
9842
9843   /* Check to see if it's possible that some instructions in the loop are
9844      never executed.  Also check if there is a goto out of the loop other
9845      than right after the end of the loop.  */
9846   for (p = next_insn_in_loop (loop, loop->scan_start);
9847        p != NULL_RTX;
9848        p = next_insn_in_loop (loop, p))
9849     {
9850       if (GET_CODE (p) == CODE_LABEL)
9851         maybe_never = 1;
9852       else if (GET_CODE (p) == JUMP_INSN
9853                /* If we enter the loop in the middle, and scan
9854                   around to the beginning, don't set maybe_never
9855                   for that.  This must be an unconditional jump,
9856                   otherwise the code at the top of the loop might
9857                   never be executed.  Unconditional jumps are
9858                   followed a by barrier then loop end.  */
9859                && ! (GET_CODE (p) == JUMP_INSN
9860                      && JUMP_LABEL (p) == loop->top
9861                      && NEXT_INSN (NEXT_INSN (p)) == loop->end
9862                      && any_uncondjump_p (p)))
9863         {
9864           /* If this is a jump outside of the loop but not right
9865              after the end of the loop, we would have to emit new fixup
9866              sequences for each such label.  */
9867           if (/* If we can't tell where control might go when this
9868                  JUMP_INSN is executed, we must be conservative.  */
9869               !JUMP_LABEL (p)
9870               || (JUMP_LABEL (p) != end_label
9871                   && (INSN_UID (JUMP_LABEL (p)) >= max_uid_for_loop
9872                       || INSN_LUID (JUMP_LABEL (p)) < INSN_LUID (loop->start)
9873                       || INSN_LUID (JUMP_LABEL (p)) > INSN_LUID (loop->end))))
9874             return;
9875
9876           if (!any_condjump_p (p))
9877             /* Something complicated.  */
9878             maybe_never = 1;
9879           else
9880             /* If there are any more instructions in the loop, they
9881                might not be reached.  */
9882             next_maybe_never = 1;
9883         }
9884       else if (next_maybe_never)
9885         maybe_never = 1;
9886     }
9887
9888   /* Find start of the extended basic block that enters the loop.  */
9889   for (p = loop->start;
9890        PREV_INSN (p) && GET_CODE (p) != CODE_LABEL;
9891        p = PREV_INSN (p))
9892     ;
9893   prev_ebb_head = p;
9894
9895   cselib_init ();
9896
9897   /* Build table of mems that get set to constant values before the
9898      loop.  */
9899   for (; p != loop->start; p = NEXT_INSN (p))
9900     cselib_process_insn (p);
9901
9902   /* Actually move the MEMs.  */
9903   for (i = 0; i < loop_info->mems_idx; ++i)
9904     {
9905       regset_head load_copies;
9906       regset_head store_copies;
9907       int written = 0;
9908       rtx reg;
9909       rtx mem = loop_info->mems[i].mem;
9910       rtx mem_list_entry;
9911
9912       if (MEM_VOLATILE_P (mem)
9913           || loop_invariant_p (loop, XEXP (mem, 0)) != 1)
9914         /* There's no telling whether or not MEM is modified.  */
9915         loop_info->mems[i].optimize = 0;
9916
9917       /* Go through the MEMs written to in the loop to see if this
9918          one is aliased by one of them.  */
9919       mem_list_entry = loop_info->store_mems;
9920       while (mem_list_entry)
9921         {
9922           if (rtx_equal_p (mem, XEXP (mem_list_entry, 0)))
9923             written = 1;
9924           else if (true_dependence (XEXP (mem_list_entry, 0), VOIDmode,
9925                                     mem, rtx_varies_p))
9926             {
9927               /* MEM is indeed aliased by this store.  */
9928               loop_info->mems[i].optimize = 0;
9929               break;
9930             }
9931           mem_list_entry = XEXP (mem_list_entry, 1);
9932         }
9933
9934       if (flag_float_store && written
9935           && GET_MODE_CLASS (GET_MODE (mem)) == MODE_FLOAT)
9936         loop_info->mems[i].optimize = 0;
9937
9938       /* If this MEM is written to, we must be sure that there
9939          are no reads from another MEM that aliases this one.  */
9940       if (loop_info->mems[i].optimize && written)
9941         {
9942           int j;
9943
9944           for (j = 0; j < loop_info->mems_idx; ++j)
9945             {
9946               if (j == i)
9947                 continue;
9948               else if (true_dependence (mem,
9949                                         VOIDmode,
9950                                         loop_info->mems[j].mem,
9951                                         rtx_varies_p))
9952                 {
9953                   /* It's not safe to hoist loop_info->mems[i] out of
9954                      the loop because writes to it might not be
9955                      seen by reads from loop_info->mems[j].  */
9956                   loop_info->mems[i].optimize = 0;
9957                   break;
9958                 }
9959             }
9960         }
9961
9962       if (maybe_never && may_trap_p (mem))
9963         /* We can't access the MEM outside the loop; it might
9964            cause a trap that wouldn't have happened otherwise.  */
9965         loop_info->mems[i].optimize = 0;
9966
9967       if (!loop_info->mems[i].optimize)
9968         /* We thought we were going to lift this MEM out of the
9969            loop, but later discovered that we could not.  */
9970         continue;
9971
9972       INIT_REG_SET (&load_copies);
9973       INIT_REG_SET (&store_copies);
9974
9975       /* Allocate a pseudo for this MEM.  We set REG_USERVAR_P in
9976          order to keep scan_loop from moving stores to this MEM
9977          out of the loop just because this REG is neither a
9978          user-variable nor used in the loop test.  */
9979       reg = gen_reg_rtx (GET_MODE (mem));
9980       REG_USERVAR_P (reg) = 1;
9981       loop_info->mems[i].reg = reg;
9982
9983       /* Now, replace all references to the MEM with the
9984          corresponding pseudos.  */
9985       maybe_never = 0;
9986       for (p = next_insn_in_loop (loop, loop->scan_start);
9987            p != NULL_RTX;
9988            p = next_insn_in_loop (loop, p))
9989         {
9990           if (INSN_P (p))
9991             {
9992               rtx set;
9993
9994               set = single_set (p);
9995
9996               /* See if this copies the mem into a register that isn't
9997                  modified afterwards.  We'll try to do copy propagation
9998                  a little further on.  */
9999               if (set
10000                   /* @@@ This test is _way_ too conservative.  */
10001                   && ! maybe_never
10002                   && GET_CODE (SET_DEST (set)) == REG
10003                   && REGNO (SET_DEST (set)) >= FIRST_PSEUDO_REGISTER
10004                   && REGNO (SET_DEST (set)) < last_max_reg
10005                   && regs->array[REGNO (SET_DEST (set))].n_times_set == 1
10006                   && rtx_equal_p (SET_SRC (set), mem))
10007                 SET_REGNO_REG_SET (&load_copies, REGNO (SET_DEST (set)));
10008
10009               /* See if this copies the mem from a register that isn't
10010                  modified afterwards.  We'll try to remove the
10011                  redundant copy later on by doing a little register
10012                  renaming and copy propagation.   This will help
10013                  to untangle things for the BIV detection code.  */
10014               if (set
10015                   && ! maybe_never
10016                   && GET_CODE (SET_SRC (set)) == REG
10017                   && REGNO (SET_SRC (set)) >= FIRST_PSEUDO_REGISTER
10018                   && REGNO (SET_SRC (set)) < last_max_reg
10019                   && regs->array[REGNO (SET_SRC (set))].n_times_set == 1
10020                   && rtx_equal_p (SET_DEST (set), mem))
10021                 SET_REGNO_REG_SET (&store_copies, REGNO (SET_SRC (set)));
10022
10023               /* If this is a call which uses / clobbers this memory
10024                  location, we must not change the interface here.  */
10025               if (GET_CODE (p) == CALL_INSN
10026                   && reg_mentioned_p (loop_info->mems[i].mem,
10027                                       CALL_INSN_FUNCTION_USAGE (p)))
10028                 {
10029                   cancel_changes (0);
10030                   loop_info->mems[i].optimize = 0;
10031                   break;
10032                 }
10033               else
10034                 /* Replace the memory reference with the shadow register.  */
10035                 replace_loop_mems (p, loop_info->mems[i].mem,
10036                                    loop_info->mems[i].reg);
10037             }
10038
10039           if (GET_CODE (p) == CODE_LABEL
10040               || GET_CODE (p) == JUMP_INSN)
10041             maybe_never = 1;
10042         }
10043
10044       if (! loop_info->mems[i].optimize)
10045         ; /* We found we couldn't do the replacement, so do nothing.  */
10046       else if (! apply_change_group ())
10047         /* We couldn't replace all occurrences of the MEM.  */
10048         loop_info->mems[i].optimize = 0;
10049       else
10050         {
10051           /* Load the memory immediately before LOOP->START, which is
10052              the NOTE_LOOP_BEG.  */
10053           cselib_val *e = cselib_lookup (mem, VOIDmode, 0);
10054           rtx set;
10055           rtx best = mem;
10056           int j;
10057           struct elt_loc_list *const_equiv = 0;
10058
10059           if (e)
10060             {
10061               struct elt_loc_list *equiv;
10062               struct elt_loc_list *best_equiv = 0;
10063               for (equiv = e->locs; equiv; equiv = equiv->next)
10064                 {
10065                   if (CONSTANT_P (equiv->loc))
10066                     const_equiv = equiv;
10067                   else if (GET_CODE (equiv->loc) == REG
10068                            /* Extending hard register lifetimes causes crash
10069                               on SRC targets.  Doing so on non-SRC is
10070                               probably also not good idea, since we most
10071                               probably have pseudoregister equivalence as
10072                               well.  */
10073                            && REGNO (equiv->loc) >= FIRST_PSEUDO_REGISTER)
10074                     best_equiv = equiv;
10075                 }
10076               /* Use the constant equivalence if that is cheap enough.  */
10077               if (! best_equiv)
10078                 best_equiv = const_equiv;
10079               else if (const_equiv
10080                        && (rtx_cost (const_equiv->loc, SET)
10081                            <= rtx_cost (best_equiv->loc, SET)))
10082                 {
10083                   best_equiv = const_equiv;
10084                   const_equiv = 0;
10085                 }
10086
10087               /* If best_equiv is nonzero, we know that MEM is set to a
10088                  constant or register before the loop.  We will use this
10089                  knowledge to initialize the shadow register with that
10090                  constant or reg rather than by loading from MEM.  */
10091               if (best_equiv)
10092                 best = copy_rtx (best_equiv->loc);
10093             }
10094
10095           set = gen_move_insn (reg, best);
10096           set = loop_insn_hoist (loop, set);
10097           if (REG_P (best))
10098             {
10099               for (p = prev_ebb_head; p != loop->start; p = NEXT_INSN (p))
10100                 if (REGNO_LAST_UID (REGNO (best)) == INSN_UID (p))
10101                   {
10102                     REGNO_LAST_UID (REGNO (best)) = INSN_UID (set);
10103                     break;
10104                   }
10105             }
10106
10107           if (const_equiv)
10108             set_unique_reg_note (set, REG_EQUAL, copy_rtx (const_equiv->loc));
10109
10110           if (written)
10111             {
10112               if (label == NULL_RTX)
10113                 {
10114                   label = gen_label_rtx ();
10115                   emit_label_after (label, loop->end);
10116                 }
10117
10118               /* Store the memory immediately after END, which is
10119                  the NOTE_LOOP_END.  */
10120               set = gen_move_insn (copy_rtx (mem), reg);
10121               loop_insn_emit_after (loop, 0, label, set);
10122             }
10123
10124           if (loop_dump_stream)
10125             {
10126               fprintf (loop_dump_stream, "Hoisted regno %d %s from ",
10127                        REGNO (reg), (written ? "r/w" : "r/o"));
10128               print_rtl (loop_dump_stream, mem);
10129               fputc ('\n', loop_dump_stream);
10130             }
10131
10132           /* Attempt a bit of copy propagation.  This helps untangle the
10133              data flow, and enables {basic,general}_induction_var to find
10134              more bivs/givs.  */
10135           EXECUTE_IF_SET_IN_REG_SET
10136             (&load_copies, FIRST_PSEUDO_REGISTER, j,
10137              {
10138                try_copy_prop (loop, reg, j);
10139              });
10140           CLEAR_REG_SET (&load_copies);
10141
10142           EXECUTE_IF_SET_IN_REG_SET
10143             (&store_copies, FIRST_PSEUDO_REGISTER, j,
10144              {
10145                try_swap_copy_prop (loop, reg, j);
10146              });
10147           CLEAR_REG_SET (&store_copies);
10148         }
10149     }
10150
10151   if (label != NULL_RTX && end_label != NULL_RTX)
10152     {
10153       /* Now, we need to replace all references to the previous exit
10154          label with the new one.  */
10155       replace_label_data rr;
10156       rr.r1 = end_label;
10157       rr.r2 = label;
10158       rr.update_label_nuses = true;
10159
10160       for (p = loop->start; p != loop->end; p = NEXT_INSN (p))
10161         {
10162           for_each_rtx (&p, replace_label, &rr);
10163         }
10164     }
10165
10166   cselib_finish ();
10167 }
10168
10169 /* For communication between note_reg_stored and its caller.  */
10170 struct note_reg_stored_arg
10171 {
10172   int set_seen;
10173   rtx reg;
10174 };
10175
10176 /* Called via note_stores, record in SET_SEEN whether X, which is written,
10177    is equal to ARG.  */
10178 static void
10179 note_reg_stored (x, setter, arg)
10180      rtx x, setter ATTRIBUTE_UNUSED;
10181      void *arg;
10182 {
10183   struct note_reg_stored_arg *t = (struct note_reg_stored_arg *) arg;
10184   if (t->reg == x)
10185     t->set_seen = 1;
10186 }
10187
10188 /* Try to replace every occurrence of pseudo REGNO with REPLACEMENT.
10189    There must be exactly one insn that sets this pseudo; it will be
10190    deleted if all replacements succeed and we can prove that the register
10191    is not used after the loop.  */
10192
10193 static void
10194 try_copy_prop (loop, replacement, regno)
10195      const struct loop *loop;
10196      rtx replacement;
10197      unsigned int regno;
10198 {
10199   /* This is the reg that we are copying from.  */
10200   rtx reg_rtx = regno_reg_rtx[regno];
10201   rtx init_insn = 0;
10202   rtx insn;
10203   /* These help keep track of whether we replaced all uses of the reg.  */
10204   int replaced_last = 0;
10205   int store_is_first = 0;
10206
10207   for (insn = next_insn_in_loop (loop, loop->scan_start);
10208        insn != NULL_RTX;
10209        insn = next_insn_in_loop (loop, insn))
10210     {
10211       rtx set;
10212
10213       /* Only substitute within one extended basic block from the initializing
10214          insn.  */
10215       if (GET_CODE (insn) == CODE_LABEL && init_insn)
10216         break;
10217
10218       if (! INSN_P (insn))
10219         continue;
10220
10221       /* Is this the initializing insn?  */
10222       set = single_set (insn);
10223       if (set
10224           && GET_CODE (SET_DEST (set)) == REG
10225           && REGNO (SET_DEST (set)) == regno)
10226         {
10227           if (init_insn)
10228             abort ();
10229
10230           init_insn = insn;
10231           if (REGNO_FIRST_UID (regno) == INSN_UID (insn))
10232             store_is_first = 1;
10233         }
10234
10235       /* Only substitute after seeing the initializing insn.  */
10236       if (init_insn && insn != init_insn)
10237         {
10238           struct note_reg_stored_arg arg;
10239
10240           replace_loop_regs (insn, reg_rtx, replacement);
10241           if (REGNO_LAST_UID (regno) == INSN_UID (insn))
10242             replaced_last = 1;
10243
10244           /* Stop replacing when REPLACEMENT is modified.  */
10245           arg.reg = replacement;
10246           arg.set_seen = 0;
10247           note_stores (PATTERN (insn), note_reg_stored, &arg);
10248           if (arg.set_seen)
10249             {
10250               rtx note = find_reg_note (insn, REG_EQUAL, NULL);
10251
10252               /* It is possible that we've turned previously valid REG_EQUAL to
10253                  invalid, as we change the REGNO to REPLACEMENT and unlike REGNO,
10254                  REPLACEMENT is modified, we get different meaning.  */
10255               if (note && reg_mentioned_p (replacement, XEXP (note, 0)))
10256                 remove_note (insn, note);
10257               break;
10258             }
10259         }
10260     }
10261   if (! init_insn)
10262     abort ();
10263   if (apply_change_group ())
10264     {
10265       if (loop_dump_stream)
10266         fprintf (loop_dump_stream, "  Replaced reg %d", regno);
10267       if (store_is_first && replaced_last)
10268         {
10269           rtx first;
10270           rtx retval_note;
10271
10272           /* Assume we're just deleting INIT_INSN.  */
10273           first = init_insn;
10274           /* Look for REG_RETVAL note.  If we're deleting the end of
10275              the libcall sequence, the whole sequence can go.  */
10276           retval_note = find_reg_note (init_insn, REG_RETVAL, NULL_RTX);
10277           /* If we found a REG_RETVAL note, find the first instruction
10278              in the sequence.  */
10279           if (retval_note)
10280             first = XEXP (retval_note, 0);
10281
10282           /* Delete the instructions.  */
10283           loop_delete_insns (first, init_insn);
10284         }
10285       if (loop_dump_stream)
10286         fprintf (loop_dump_stream, ".\n");
10287     }
10288 }
10289
10290 /* Replace all the instructions from FIRST up to and including LAST
10291    with NOTE_INSN_DELETED notes.  */
10292
10293 static void
10294 loop_delete_insns (first, last)
10295      rtx first;
10296      rtx last;
10297 {
10298   while (1)
10299     {
10300       if (loop_dump_stream)
10301         fprintf (loop_dump_stream, ", deleting init_insn (%d)",
10302                  INSN_UID (first));
10303       delete_insn (first);
10304
10305       /* If this was the LAST instructions we're supposed to delete,
10306          we're done.  */
10307       if (first == last)
10308         break;
10309
10310       first = NEXT_INSN (first);
10311     }
10312 }
10313
10314 /* Try to replace occurrences of pseudo REGNO with REPLACEMENT within
10315    loop LOOP if the order of the sets of these registers can be
10316    swapped.  There must be exactly one insn within the loop that sets
10317    this pseudo followed immediately by a move insn that sets
10318    REPLACEMENT with REGNO.  */
10319 static void
10320 try_swap_copy_prop (loop, replacement, regno)
10321      const struct loop *loop;
10322      rtx replacement;
10323      unsigned int regno;
10324 {
10325   rtx insn;
10326   rtx set = NULL_RTX;
10327   unsigned int new_regno;
10328
10329   new_regno = REGNO (replacement);
10330
10331   for (insn = next_insn_in_loop (loop, loop->scan_start);
10332        insn != NULL_RTX;
10333        insn = next_insn_in_loop (loop, insn))
10334     {
10335       /* Search for the insn that copies REGNO to NEW_REGNO?  */
10336       if (INSN_P (insn)
10337           && (set = single_set (insn))
10338           && GET_CODE (SET_DEST (set)) == REG
10339           && REGNO (SET_DEST (set)) == new_regno
10340           && GET_CODE (SET_SRC (set)) == REG
10341           && REGNO (SET_SRC (set)) == regno)
10342         break;
10343     }
10344
10345   if (insn != NULL_RTX)
10346     {
10347       rtx prev_insn;
10348       rtx prev_set;
10349
10350       /* Some DEF-USE info would come in handy here to make this
10351          function more general.  For now, just check the previous insn
10352          which is the most likely candidate for setting REGNO.  */
10353
10354       prev_insn = PREV_INSN (insn);
10355
10356       if (INSN_P (insn)
10357           && (prev_set = single_set (prev_insn))
10358           && GET_CODE (SET_DEST (prev_set)) == REG
10359           && REGNO (SET_DEST (prev_set)) == regno)
10360         {
10361           /* We have:
10362              (set (reg regno) (expr))
10363              (set (reg new_regno) (reg regno))
10364
10365              so try converting this to:
10366              (set (reg new_regno) (expr))
10367              (set (reg regno) (reg new_regno))
10368
10369              The former construct is often generated when a global
10370              variable used for an induction variable is shadowed by a
10371              register (NEW_REGNO).  The latter construct improves the
10372              chances of GIV replacement and BIV elimination.  */
10373
10374           validate_change (prev_insn, &SET_DEST (prev_set),
10375                            replacement, 1);
10376           validate_change (insn, &SET_DEST (set),
10377                            SET_SRC (set), 1);
10378           validate_change (insn, &SET_SRC (set),
10379                            replacement, 1);
10380
10381           if (apply_change_group ())
10382             {
10383               if (loop_dump_stream)
10384                 fprintf (loop_dump_stream,
10385                          "  Swapped set of reg %d at %d with reg %d at %d.\n",
10386                          regno, INSN_UID (insn),
10387                          new_regno, INSN_UID (prev_insn));
10388
10389               /* Update first use of REGNO.  */
10390               if (REGNO_FIRST_UID (regno) == INSN_UID (prev_insn))
10391                 REGNO_FIRST_UID (regno) = INSN_UID (insn);
10392
10393               /* Now perform copy propagation to hopefully
10394                  remove all uses of REGNO within the loop.  */
10395               try_copy_prop (loop, replacement, regno);
10396             }
10397         }
10398     }
10399 }
10400
10401 /* Replace MEM with its associated pseudo register.  This function is
10402    called from load_mems via for_each_rtx.  DATA is actually a pointer
10403    to a structure describing the instruction currently being scanned
10404    and the MEM we are currently replacing.  */
10405
10406 static int
10407 replace_loop_mem (mem, data)
10408      rtx *mem;
10409      void *data;
10410 {
10411   loop_replace_args *args = (loop_replace_args *) data;
10412   rtx m = *mem;
10413
10414   if (m == NULL_RTX)
10415     return 0;
10416
10417   switch (GET_CODE (m))
10418     {
10419     case MEM:
10420       break;
10421
10422     case CONST_DOUBLE:
10423       /* We're not interested in the MEM associated with a
10424          CONST_DOUBLE, so there's no need to traverse into one.  */
10425       return -1;
10426
10427     default:
10428       /* This is not a MEM.  */
10429       return 0;
10430     }
10431
10432   if (!rtx_equal_p (args->match, m))
10433     /* This is not the MEM we are currently replacing.  */
10434     return 0;
10435
10436   /* Actually replace the MEM.  */
10437   validate_change (args->insn, mem, args->replacement, 1);
10438
10439   return 0;
10440 }
10441
10442 static void
10443 replace_loop_mems (insn, mem, reg)
10444      rtx insn;
10445      rtx mem;
10446      rtx reg;
10447 {
10448   loop_replace_args args;
10449
10450   args.insn = insn;
10451   args.match = mem;
10452   args.replacement = reg;
10453
10454   for_each_rtx (&insn, replace_loop_mem, &args);
10455 }
10456
10457 /* Replace one register with another.  Called through for_each_rtx; PX points
10458    to the rtx being scanned.  DATA is actually a pointer to
10459    a structure of arguments.  */
10460
10461 static int
10462 replace_loop_reg (px, data)
10463      rtx *px;
10464      void *data;
10465 {
10466   rtx x = *px;
10467   loop_replace_args *args = (loop_replace_args *) data;
10468
10469   if (x == NULL_RTX)
10470     return 0;
10471
10472   if (x == args->match)
10473     validate_change (args->insn, px, args->replacement, 1);
10474
10475   return 0;
10476 }
10477
10478 static void
10479 replace_loop_regs (insn, reg, replacement)
10480      rtx insn;
10481      rtx reg;
10482      rtx replacement;
10483 {
10484   loop_replace_args args;
10485
10486   args.insn = insn;
10487   args.match = reg;
10488   args.replacement = replacement;
10489
10490   for_each_rtx (&insn, replace_loop_reg, &args);
10491 }
10492 \f
10493 /* Emit insn for PATTERN after WHERE_INSN in basic block WHERE_BB
10494    (ignored in the interim).  */
10495
10496 static rtx
10497 loop_insn_emit_after (loop, where_bb, where_insn, pattern)
10498      const struct loop *loop ATTRIBUTE_UNUSED;
10499      basic_block where_bb ATTRIBUTE_UNUSED;
10500      rtx where_insn;
10501      rtx pattern;
10502 {
10503   return emit_insn_after (pattern, where_insn);
10504 }
10505
10506
10507 /* If WHERE_INSN is nonzero emit insn for PATTERN before WHERE_INSN
10508    in basic block WHERE_BB (ignored in the interim) within the loop
10509    otherwise hoist PATTERN into the loop pre-header.  */
10510
10511 rtx
10512 loop_insn_emit_before (loop, where_bb, where_insn, pattern)
10513      const struct loop *loop;
10514      basic_block where_bb ATTRIBUTE_UNUSED;
10515      rtx where_insn;
10516      rtx pattern;
10517 {
10518   if (! where_insn)
10519     return loop_insn_hoist (loop, pattern);
10520   return emit_insn_before (pattern, where_insn);
10521 }
10522
10523
10524 /* Emit call insn for PATTERN before WHERE_INSN in basic block
10525    WHERE_BB (ignored in the interim) within the loop.  */
10526
10527 static rtx
10528 loop_call_insn_emit_before (loop, where_bb, where_insn, pattern)
10529      const struct loop *loop ATTRIBUTE_UNUSED;
10530      basic_block where_bb ATTRIBUTE_UNUSED;
10531      rtx where_insn;
10532      rtx pattern;
10533 {
10534   return emit_call_insn_before (pattern, where_insn);
10535 }
10536
10537
10538 /* Hoist insn for PATTERN into the loop pre-header.  */
10539
10540 rtx
10541 loop_insn_hoist (loop, pattern)
10542      const struct loop *loop;
10543      rtx pattern;
10544 {
10545   return loop_insn_emit_before (loop, 0, loop->start, pattern);
10546 }
10547
10548
10549 /* Hoist call insn for PATTERN into the loop pre-header.  */
10550
10551 static rtx
10552 loop_call_insn_hoist (loop, pattern)
10553      const struct loop *loop;
10554      rtx pattern;
10555 {
10556   return loop_call_insn_emit_before (loop, 0, loop->start, pattern);
10557 }
10558
10559
10560 /* Sink insn for PATTERN after the loop end.  */
10561
10562 rtx
10563 loop_insn_sink (loop, pattern)
10564      const struct loop *loop;
10565      rtx pattern;
10566 {
10567   return loop_insn_emit_before (loop, 0, loop->sink, pattern);
10568 }
10569
10570 /* bl->final_value can be eighter general_operand or PLUS of general_operand
10571    and constant.  Emit sequence of instructions to load it into REG.  */
10572 static rtx
10573 gen_load_of_final_value (reg, final_value)
10574      rtx reg, final_value;
10575 {
10576   rtx seq;
10577   start_sequence ();
10578   final_value = force_operand (final_value, reg);
10579   if (final_value != reg)
10580     emit_move_insn (reg, final_value);
10581   seq = get_insns ();
10582   end_sequence ();
10583   return seq;
10584 }
10585
10586 /* If the loop has multiple exits, emit insn for PATTERN before the
10587    loop to ensure that it will always be executed no matter how the
10588    loop exits.  Otherwise, emit the insn for PATTERN after the loop,
10589    since this is slightly more efficient.  */
10590
10591 static rtx
10592 loop_insn_sink_or_swim (loop, pattern)
10593      const struct loop *loop;
10594      rtx pattern;
10595 {
10596   if (loop->exit_count)
10597     return loop_insn_hoist (loop, pattern);
10598   else
10599     return loop_insn_sink (loop, pattern);
10600 }
10601 \f
10602 static void
10603 loop_ivs_dump (loop, file, verbose)
10604      const struct loop *loop;
10605      FILE *file;
10606      int verbose;
10607 {
10608   struct iv_class *bl;
10609   int iv_num = 0;
10610
10611   if (! loop || ! file)
10612     return;
10613
10614   for (bl = LOOP_IVS (loop)->list; bl; bl = bl->next)
10615     iv_num++;
10616
10617   fprintf (file, "Loop %d: %d IV classes\n", loop->num, iv_num);
10618
10619   for (bl = LOOP_IVS (loop)->list; bl; bl = bl->next)
10620     {
10621       loop_iv_class_dump (bl, file, verbose);
10622       fputc ('\n', file);
10623     }
10624 }
10625
10626
10627 static void
10628 loop_iv_class_dump (bl, file, verbose)
10629      const struct iv_class *bl;
10630      FILE *file;
10631      int verbose ATTRIBUTE_UNUSED;
10632 {
10633   struct induction *v;
10634   rtx incr;
10635   int i;
10636
10637   if (! bl || ! file)
10638     return;
10639
10640   fprintf (file, "IV class for reg %d, benefit %d\n",
10641            bl->regno, bl->total_benefit);
10642
10643   fprintf (file, " Init insn %d", INSN_UID (bl->init_insn));
10644   if (bl->initial_value)
10645     {
10646       fprintf (file, ", init val: ");
10647       print_simple_rtl (file, bl->initial_value);
10648     }
10649   if (bl->initial_test)
10650     {
10651       fprintf (file, ", init test: ");
10652       print_simple_rtl (file, bl->initial_test);
10653     }
10654   fputc ('\n', file);
10655
10656   if (bl->final_value)
10657     {
10658       fprintf (file, " Final val: ");
10659       print_simple_rtl (file, bl->final_value);
10660       fputc ('\n', file);
10661     }
10662
10663   if ((incr = biv_total_increment (bl)))
10664     {
10665       fprintf (file, " Total increment: ");
10666       print_simple_rtl (file, incr);
10667       fputc ('\n', file);
10668     }
10669
10670   /* List the increments.  */
10671   for (i = 0, v = bl->biv; v; v = v->next_iv, i++)
10672     {
10673       fprintf (file, " Inc%d: insn %d, incr: ", i, INSN_UID (v->insn));
10674       print_simple_rtl (file, v->add_val);
10675       fputc ('\n', file);
10676     }
10677
10678   /* List the givs.  */
10679   for (i = 0, v = bl->giv; v; v = v->next_iv, i++)
10680     {
10681       fprintf (file, " Giv%d: insn %d, benefit %d, ",
10682                i, INSN_UID (v->insn), v->benefit);
10683       if (v->giv_type == DEST_ADDR)
10684         print_simple_rtl (file, v->mem);
10685       else
10686         print_simple_rtl (file, single_set (v->insn));
10687       fputc ('\n', file);
10688     }
10689 }
10690
10691
10692 static void
10693 loop_biv_dump (v, file, verbose)
10694      const struct induction *v;
10695      FILE *file;
10696      int verbose;
10697 {
10698   if (! v || ! file)
10699     return;
10700
10701   fprintf (file,
10702            "Biv %d: insn %d",
10703            REGNO (v->dest_reg), INSN_UID (v->insn));
10704   fprintf (file, " const ");
10705   print_simple_rtl (file, v->add_val);
10706
10707   if (verbose && v->final_value)
10708     {
10709       fputc ('\n', file);
10710       fprintf (file, " final ");
10711       print_simple_rtl (file, v->final_value);
10712     }
10713
10714   fputc ('\n', file);
10715 }
10716
10717
10718 static void
10719 loop_giv_dump (v, file, verbose)
10720      const struct induction *v;
10721      FILE *file;
10722      int verbose;
10723 {
10724   if (! v || ! file)
10725     return;
10726
10727   if (v->giv_type == DEST_REG)
10728     fprintf (file, "Giv %d: insn %d",
10729              REGNO (v->dest_reg), INSN_UID (v->insn));
10730   else
10731     fprintf (file, "Dest address: insn %d",
10732              INSN_UID (v->insn));
10733
10734   fprintf (file, " src reg %d benefit %d",
10735            REGNO (v->src_reg), v->benefit);
10736   fprintf (file, " lifetime %d",
10737            v->lifetime);
10738
10739   if (v->replaceable)
10740     fprintf (file, " replaceable");
10741
10742   if (v->no_const_addval)
10743     fprintf (file, " ncav");
10744
10745   if (v->ext_dependent)
10746     {
10747       switch (GET_CODE (v->ext_dependent))
10748         {
10749         case SIGN_EXTEND:
10750           fprintf (file, " ext se");
10751           break;
10752         case ZERO_EXTEND:
10753           fprintf (file, " ext ze");
10754           break;
10755         case TRUNCATE:
10756           fprintf (file, " ext tr");
10757           break;
10758         default:
10759           abort ();
10760         }
10761     }
10762
10763   fputc ('\n', file);
10764   fprintf (file, " mult ");
10765   print_simple_rtl (file, v->mult_val);
10766
10767   fputc ('\n', file);
10768   fprintf (file, " add  ");
10769   print_simple_rtl (file, v->add_val);
10770
10771   if (verbose && v->final_value)
10772     {
10773       fputc ('\n', file);
10774       fprintf (file, " final ");
10775       print_simple_rtl (file, v->final_value);
10776     }
10777
10778   fputc ('\n', file);
10779 }
10780
10781
10782 void
10783 debug_ivs (loop)
10784      const struct loop *loop;
10785 {
10786   loop_ivs_dump (loop, stderr, 1);
10787 }
10788
10789
10790 void
10791 debug_iv_class (bl)
10792      const struct iv_class *bl;
10793 {
10794   loop_iv_class_dump (bl, stderr, 1);
10795 }
10796
10797
10798 void
10799 debug_biv (v)
10800      const struct induction *v;
10801 {
10802   loop_biv_dump (v, stderr, 1);
10803 }
10804
10805
10806 void
10807 debug_giv (v)
10808      const struct induction *v;
10809 {
10810   loop_giv_dump (v, stderr, 1);
10811 }
10812
10813
10814 #define LOOP_BLOCK_NUM_1(INSN) \
10815 ((INSN) ? (BLOCK_FOR_INSN (INSN) ? BLOCK_NUM (INSN) : - 1) : -1)
10816
10817 /* The notes do not have an assigned block, so look at the next insn.  */
10818 #define LOOP_BLOCK_NUM(INSN) \
10819 ((INSN) ? (GET_CODE (INSN) == NOTE \
10820             ? LOOP_BLOCK_NUM_1 (next_nonnote_insn (INSN)) \
10821             : LOOP_BLOCK_NUM_1 (INSN)) \
10822         : -1)
10823
10824 #define LOOP_INSN_UID(INSN) ((INSN) ? INSN_UID (INSN) : -1)
10825
10826 static void
10827 loop_dump_aux (loop, file, verbose)
10828      const struct loop *loop;
10829      FILE *file;
10830      int verbose ATTRIBUTE_UNUSED;
10831 {
10832   rtx label;
10833
10834   if (! loop || ! file)
10835     return;
10836
10837   /* Print diagnostics to compare our concept of a loop with
10838      what the loop notes say.  */
10839   if (! PREV_INSN (loop->first->head)
10840       || GET_CODE (PREV_INSN (loop->first->head)) != NOTE
10841       || NOTE_LINE_NUMBER (PREV_INSN (loop->first->head))
10842       != NOTE_INSN_LOOP_BEG)
10843     fprintf (file, ";;  No NOTE_INSN_LOOP_BEG at %d\n",
10844              INSN_UID (PREV_INSN (loop->first->head)));
10845   if (! NEXT_INSN (loop->last->end)
10846       || GET_CODE (NEXT_INSN (loop->last->end)) != NOTE
10847       || NOTE_LINE_NUMBER (NEXT_INSN (loop->last->end))
10848       != NOTE_INSN_LOOP_END)
10849     fprintf (file, ";;  No NOTE_INSN_LOOP_END at %d\n",
10850              INSN_UID (NEXT_INSN (loop->last->end)));
10851
10852   if (loop->start)
10853     {
10854       fprintf (file,
10855                ";;  start %d (%d), cont dom %d (%d), cont %d (%d), vtop %d (%d), end %d (%d)\n",
10856                LOOP_BLOCK_NUM (loop->start),
10857                LOOP_INSN_UID (loop->start),
10858                LOOP_BLOCK_NUM (loop->cont),
10859                LOOP_INSN_UID (loop->cont),
10860                LOOP_BLOCK_NUM (loop->cont),
10861                LOOP_INSN_UID (loop->cont),
10862                LOOP_BLOCK_NUM (loop->vtop),
10863                LOOP_INSN_UID (loop->vtop),
10864                LOOP_BLOCK_NUM (loop->end),
10865                LOOP_INSN_UID (loop->end));
10866       fprintf (file, ";;  top %d (%d), scan start %d (%d)\n",
10867                LOOP_BLOCK_NUM (loop->top),
10868                LOOP_INSN_UID (loop->top),
10869                LOOP_BLOCK_NUM (loop->scan_start),
10870                LOOP_INSN_UID (loop->scan_start));
10871       fprintf (file, ";;  exit_count %d", loop->exit_count);
10872       if (loop->exit_count)
10873         {
10874           fputs (", labels:", file);
10875           for (label = loop->exit_labels; label; label = LABEL_NEXTREF (label))
10876             {
10877               fprintf (file, " %d ",
10878                        LOOP_INSN_UID (XEXP (label, 0)));
10879             }
10880         }
10881       fputs ("\n", file);
10882
10883       /* This can happen when a marked loop appears as two nested loops,
10884          say from while (a || b) {}.  The inner loop won't match
10885          the loop markers but the outer one will.  */
10886       if (LOOP_BLOCK_NUM (loop->cont) != loop->latch->index)
10887         fprintf (file, ";;  NOTE_INSN_LOOP_CONT not in loop latch\n");
10888     }
10889 }
10890
10891 /* Call this function from the debugger to dump LOOP.  */
10892
10893 void
10894 debug_loop (loop)
10895      const struct loop *loop;
10896 {
10897   flow_loop_dump (loop, stderr, loop_dump_aux, 1);
10898 }
10899
10900 /* Call this function from the debugger to dump LOOPS.  */
10901
10902 void
10903 debug_loops (loops)
10904      const struct loops *loops;
10905 {
10906   flow_loops_dump (loops, stderr, loop_dump_aux, 1);
10907 }