1 /* Common subexpression elimination for GNU compiler.
2 Copyright (C) 1987, 88, 89, 92, 93, 1994 Free Software Foundation, Inc.
3
4 This file is part of GNU CC.
5
6 GNU CC is free software; you can redistribute it and/or modify
7 it under the terms of the GNU General Public License as published by
8 the Free Software Foundation; either version 2, or (at your option)
9 any later version.
10
11 GNU CC is distributed in the hope that it will be useful,
12 but WITHOUT ANY WARRANTY; without even the implied warranty of
13 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
14 GNU General Public License for more details.
15
16 You should have received a copy of the GNU General Public License
17 along with GNU CC; see the file COPYING. If not, write to
18 the Free Software Foundation, 675 Mass Ave, Cambridge, MA 02139, USA. */
19
20
21 #include "config.h"
22 /* Must precede rtl.h for FFS. */
23 #include <stdio.h>
24
25 #include "rtl.h"
26 #include "regs.h"
27 #include "hard-reg-set.h"
28 #include "flags.h"
29 #include "real.h"
30 #include "insn-config.h"
31 #include "recog.h"
32
33 #include <setjmp.h>
34
35 /* The basic idea of common subexpression elimination is to go
36 through the code, keeping a record of expressions that would
37 have the same value at the current scan point, and replacing
38 expressions encountered with the cheapest equivalent expression.
39
40 It is too complicated to keep track of the different possibilities
41 when control paths merge; so, at each label, we forget all that is
42 known and start fresh. This can be described as processing each
43 basic block separately. Note, however, that these are not quite
44 the same as the basic blocks found by a later pass and used for
45 data flow analysis and register packing. We do not need to start fresh
46 after a conditional jump instruction if there is no label there.
47
48 We use two data structures to record the equivalent expressions:
49 a hash table for most expressions, and several vectors together
50 with "quantity numbers" to record equivalent (pseudo) registers.
51
52 The use of the special data structure for registers is desirable
53      because it is faster.  It is possible because register references
54 contain a fairly small number, the register number, taken from
55 a contiguously allocated series, and two register references are
56 identical if they have the same number. General expressions
57 do not have any such thing, so the only way to retrieve the
58 information recorded on an expression other than a register
59 is to keep it in a hash table.
60
61 Registers and "quantity numbers":
62
63 At the start of each basic block, all of the (hardware and pseudo)
64 registers used in the function are given distinct quantity
65 numbers to indicate their contents. During scan, when the code
66 copies one register into another, we copy the quantity number.
67 When a register is loaded in any other way, we allocate a new
68 quantity number to describe the value generated by this operation.
69 `reg_qty' records what quantity a register is currently thought
70 of as containing.
71
72 All real quantity numbers are greater than or equal to `max_reg'.
73 If register N has not been assigned a quantity, reg_qty[N] will equal N.
74
75 Quantity numbers below `max_reg' do not exist and none of the `qty_...'
76 variables should be referenced with an index below `max_reg'.
77
78 We also maintain a bidirectional chain of registers for each
79 quantity number. `qty_first_reg', `qty_last_reg',
80 `reg_next_eqv' and `reg_prev_eqv' hold these chains.
81
82 The first register in a chain is the one whose lifespan is least local.
83 Among equals, it is the one that was seen first.
84 We replace any equivalent register with that one.
85
86      If two registers have the same quantity number, REG expressions with
87      the quantity's mode (`qty_mode') must be in the hash table for both
88      registers, and both must be in the same equivalence class.
89
90      The converse is not true.  Since hard registers may be referenced in
91      any mode, two REG expressions might be equivalent in the hash table
92      but not have the same quantity number if the quantity of one of the
93      registers does not have the same mode as those expressions.
94
95      Constants and quantity numbers:
96
97 When a quantity has a known constant value, that value is stored
98 in the appropriate element of qty_const. This is in addition to
99 putting the constant in the hash table as is usual for non-regs.
100
101 Whether a reg or a constant is preferred is determined by the configuration
102 macro CONST_COSTS and will often depend on the constant value. In any
103      event, expressions containing constants can be simplified by fold_rtx.
104
105 When a quantity has a known nearly constant value (such as an address
106 of a stack slot), that value is stored in the appropriate element
107 of qty_const.
108
109 Integer constants don't have a machine mode. However, cse
110 determines the intended machine mode from the destination
111 of the instruction that moves the constant. The machine mode
112 is recorded in the hash table along with the actual RTL
113 constant expression so that different modes are kept separate.
114
115 Other expressions:
116
117 To record known equivalences among expressions in general
118 we use a hash table called `table'. It has a fixed number of buckets
119 that contain chains of `struct table_elt' elements for expressions.
120 These chains connect the elements whose expressions have the same
121 hash codes.
122
123 Other chains through the same elements connect the elements which
124 currently have equivalent values.
125
126 Register references in an expression are canonicalized before hashing
127 the expression. This is done using `reg_qty' and `qty_first_reg'.
128 The hash code of a register reference is computed using the quantity
129 number, not the register number.
130
131 When the value of an expression changes, it is necessary to remove from the
132 hash table not just that expression but all expressions whose values
133 could be different as a result.
134
135 1. If the value changing is in memory, except in special cases
136 ANYTHING referring to memory could be changed. That is because
137 nobody knows where a pointer does not point.
138 The function `invalidate_memory' removes what is necessary.
139
140 The special cases are when the address is constant or is
141 a constant plus a fixed register such as the frame pointer
142 or a static chain pointer. When such addresses are stored in,
143 we can tell exactly which other such addresses must be invalidated
144 due to overlap. `invalidate' does this.
145 All expressions that refer to non-constant
146 memory addresses are also invalidated. `invalidate_memory' does this.
147
148 2. If the value changing is a register, all expressions
149 containing references to that register, and only those,
150 must be removed.
151
152 Because searching the entire hash table for expressions that contain
153 a register is very slow, we try to figure out when it isn't necessary.
154 Precisely, this is necessary only when expressions have been
155 entered in the hash table using this register, and then the value has
156 changed, and then another expression wants to be added to refer to
157 the register's new value. This sequence of circumstances is rare
158 within any one basic block.
159
160 The vectors `reg_tick' and `reg_in_table' are used to detect this case.
161 reg_tick[i] is incremented whenever a value is stored in register i.
162 reg_in_table[i] holds -1 if no references to register i have been
163 entered in the table; otherwise, it contains the value reg_tick[i] had
164 when the references were entered. If we want to enter a reference
165 and reg_in_table[i] != reg_tick[i], we must scan and remove old references.
166      Until we want to enter a new entry, the mere fact that the two vectors
167      don't match causes existing entries to be ignored by anyone trying to match them.
168
169 Registers themselves are entered in the hash table as well as in
170 the equivalent-register chains. However, the vectors `reg_tick'
171 and `reg_in_table' do not apply to expressions which are simple
172 register references. These expressions are removed from the table
173 immediately when they become invalid, and this can be done even if
174 we do not immediately search for all the expressions that refer to
175 the register.
176
177 A CLOBBER rtx in an instruction invalidates its operand for further
178 reuse. A CLOBBER or SET rtx whose operand is a MEM:BLK
179 invalidates everything that resides in memory.
180
181 Related expressions:
182
183 Constant expressions that differ only by an additive integer
184 are called related. When a constant expression is put in
185 the table, the related expression with no constant term
186 is also entered. These are made to point at each other
187 so that it is possible to find out if there exists any
188 register equivalent to an expression related to a given expression. */
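 
 /* An illustrative sketch of the quantity-number mechanism (the register
    numbers here are hypothetical, not actual compiler output).  Given the
    sequence
 
 	(set (reg 100) (reg 99))
 	(set (reg 101) (plus:SI (reg 100) (const_int 4)))
 
    the copy gives reg 100 the same quantity number as reg 99, so the
    PLUS is hashed using that quantity.  A later (plus:SI (reg 99)
    (const_int 4)) then hashes to the same bucket and is recognized as
    equivalent to reg 101, even though it mentions a different register.
    When reg 99 is next stored into, reg_tick[99] is incremented and the
    stale PLUS entry is swept out lazily, as described above.  */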
189
190 /* One plus largest register number used in this function. */
191
192 static int max_reg;
193
194 /* Length of vectors indexed by quantity number.
195 We know in advance we will not need a quantity number this big. */
196
197 static int max_qty;
198
199 /* Next quantity number to be allocated.
200 This is 1 + the largest number needed so far. */
201
202 static int next_qty;
203
204 /* Indexed by quantity number, gives the first (or last) (pseudo) register
205 in the chain of registers that currently contain this quantity. */
206
207 static int *qty_first_reg;
208 static int *qty_last_reg;
209
210  /* Indexed by quantity number, gives the mode of the quantity.  */
211
212 static enum machine_mode *qty_mode;
213
214 /* Indexed by quantity number, gives the rtx of the constant value of the
215 quantity, or zero if it does not have a known value.
216 A sum of the frame pointer (or arg pointer) plus a constant
217 can also be entered here. */
218
219 static rtx *qty_const;
220
221 /* Indexed by qty number, gives the insn that stored the constant value
222 recorded in `qty_const'. */
223
224 static rtx *qty_const_insn;
225
226 /* The next three variables are used to track when a comparison between a
227 quantity and some constant or register has been passed. In that case, we
228 know the results of the comparison in case we see it again. These variables
229 record a comparison that is known to be true. */
230
231 /* Indexed by qty number, gives the rtx code of a comparison with a known
232 result involving this quantity. If none, it is UNKNOWN. */
233 static enum rtx_code *qty_comparison_code;
234
235 /* Indexed by qty number, gives the constant being compared against in a
236 comparison of known result. If no such comparison, it is undefined.
237 If the comparison is not with a constant, it is zero. */
238
239 static rtx *qty_comparison_const;
240
241 /* Indexed by qty number, gives the quantity being compared against in a
242     comparison of known result.  If no such comparison, it is undefined.
243 If the comparison is not with a register, it is -1. */
244
245 static int *qty_comparison_qty;
246
247 #ifdef HAVE_cc0
248 /* For machines that have a CC0, we do not record its value in the hash
249 table since its use is guaranteed to be the insn immediately following
250 its definition and any other insn is presumed to invalidate it.
251
252 Instead, we store below the value last assigned to CC0. If it should
253 happen to be a constant, it is stored in preference to the actual
254 assigned value. In case it is a constant, we store the mode in which
255 the constant should be interpreted. */
256
257 static rtx prev_insn_cc0;
258 static enum machine_mode prev_insn_cc0_mode;
259 #endif
260
261 /* Previous actual insn. 0 if at first insn of basic block. */
262
263 static rtx prev_insn;
264
265 /* Insn being scanned. */
266
267 static rtx this_insn;
268
269  /* Indexed by (pseudo) register number, gives the quantity number
270 of the register's current contents. */
271
272 static int *reg_qty;
273
274  /* Indexed by (pseudo) register number, gives the number of the next (or
275 previous) (pseudo) register in the chain of registers sharing the same
276 value.
277
278 Or -1 if this register is at the end of the chain.
279
280 If reg_qty[N] == N, reg_next_eqv[N] is undefined. */
281
282 static int *reg_next_eqv;
283 static int *reg_prev_eqv;
284
285  /* Indexed by (pseudo) register number, gives the number of times
286 that register has been altered in the current basic block. */
287
288 static int *reg_tick;
289
290  /* Indexed by (pseudo) register number, gives the reg_tick value at which
291 rtx's containing this register are valid in the hash table.
292 If this does not equal the current reg_tick value, such expressions
293 existing in the hash table are invalid.
294 If this is -1, no expressions containing this register have been
295 entered in the table. */
296
297 static int *reg_in_table;
298
299 /* A HARD_REG_SET containing all the hard registers for which there is
300 currently a REG expression in the hash table. Note the difference
301 from the above variables, which indicate if the REG is mentioned in some
302 expression in the table. */
303
304 static HARD_REG_SET hard_regs_in_table;
305
306 /* A HARD_REG_SET containing all the hard registers that are invalidated
307 by a CALL_INSN. */
308
309 static HARD_REG_SET regs_invalidated_by_call;
310
311  /* Two vectors of ints:
312     one with max_reg elements, all set to -1; the other with max_reg + 500
313     elements (an approximation for max_qty), where element i contains i.
314     These are used to initialize various other vectors fast.  */
315
316 static int *all_minus_one;
317 static int *consec_ints;
318
319 /* CUID of insn that starts the basic block currently being cse-processed. */
320
321 static int cse_basic_block_start;
322
323 /* CUID of insn that ends the basic block currently being cse-processed. */
324
325 static int cse_basic_block_end;
326
327 /* Vector mapping INSN_UIDs to cuids.
328     The cuids are like uids but always increase monotonically.
329 We use them to see whether a reg is used outside a given basic block. */
330
331 static int *uid_cuid;
332
333 /* Highest UID in UID_CUID. */
334 static int max_uid;
335
336 /* Get the cuid of an insn. */
337
338 #define INSN_CUID(INSN) (uid_cuid[INSN_UID (INSN)])
339
340 /* Nonzero if cse has altered conditional jump insns
341 in such a way that jump optimization should be redone. */
342
343 static int cse_jumps_altered;
344
345 /* canon_hash stores 1 in do_not_record
346 if it notices a reference to CC0, PC, or some other volatile
347 subexpression. */
348
349 static int do_not_record;
350
351 #ifdef LOAD_EXTEND_OP
352
353 /* Scratch rtl used when looking for load-extended copy of a MEM. */
354 static rtx memory_extend_rtx;
355 #endif
356
357 /* canon_hash stores 1 in hash_arg_in_memory
358 if it notices a reference to memory within the expression being hashed. */
359
360 static int hash_arg_in_memory;
361
362 /* canon_hash stores 1 in hash_arg_in_struct
363 if it notices a reference to memory that's part of a structure. */
364
365 static int hash_arg_in_struct;
366
367 /* The hash table contains buckets which are chains of `struct table_elt's,
368 each recording one expression's information.
369 That expression is in the `exp' field.
370
371 Those elements with the same hash code are chained in both directions
372 through the `next_same_hash' and `prev_same_hash' fields.
373
374 Each set of expressions with equivalent values
375 are on a two-way chain through the `next_same_value'
376 and `prev_same_value' fields, and all point with
377 the `first_same_value' field at the first element in
378 that chain. The chain is in order of increasing cost.
379 Each element's cost value is in its `cost' field.
380
381 The `in_memory' field is nonzero for elements that
382 involve any reference to memory. These elements are removed
383 whenever a write is done to an unidentified location in memory.
384 To be safe, we assume that a memory address is unidentified unless
385 the address is either a symbol constant or a constant plus
386 the frame pointer or argument pointer.
387
388 The `in_struct' field is nonzero for elements that
389 involve any reference to memory inside a structure or array.
390
391 The `related_value' field is used to connect related expressions
392 (that differ by adding an integer).
393 The related expressions are chained in a circular fashion.
394 `related_value' is zero for expressions for which this
395 chain is not useful.
396
397 The `cost' field stores the cost of this element's expression.
398
399 The `is_const' flag is set if the element is a constant (including
400 a fixed address).
401
402 The `flag' field is used as a temporary during some search routines.
403
404 The `mode' field is usually the same as GET_MODE (`exp'), but
405 if `exp' is a CONST_INT and has no machine mode then the `mode'
406 field is the mode it was being used as. Each constant is
407 recorded separately for each mode it is used with. */
408
409
410 struct table_elt
411 {
412 rtx exp;
413 struct table_elt *next_same_hash;
414 struct table_elt *prev_same_hash;
415 struct table_elt *next_same_value;
416 struct table_elt *prev_same_value;
417 struct table_elt *first_same_value;
418 struct table_elt *related_value;
419 int cost;
420 enum machine_mode mode;
421 char in_memory;
422 char in_struct;
423 char is_const;
424 char flag;
425 };
426
427  /* We don't want a lot of buckets, because we rarely have very many
428     things stored in the hash table, and extra buckets slow down the many
429     frequently executed loops that scan every bucket.  */
430 #define NBUCKETS 31
431
432  /* Compute hash code of X in mode M.  Special-case the case where X is a pseudo
433 register (hard registers may require `do_not_record' to be set). */
434
435 #define HASH(X, M) \
436 (GET_CODE (X) == REG && REGNO (X) >= FIRST_PSEUDO_REGISTER \
437 ? (((unsigned) REG << 7) + (unsigned) reg_qty[REGNO (X)]) % NBUCKETS \
438 : canon_hash (X, M) % NBUCKETS)
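 
 /* For example (an illustrative sketch): if pseudo regs 99 and 100
    currently share quantity Q, then (reg 99) and (reg 100) both hash to
    (((unsigned) REG << 7) + Q) % NBUCKETS, so equivalent registers
    always land in the same bucket even though their register numbers
    differ.  */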
439
440 /* Determine whether register number N is considered a fixed register for CSE.
441 It is desirable to replace other regs with fixed regs, to reduce need for
442 non-fixed hard regs.
443 A reg wins if it is either the frame pointer or designated as fixed,
444 but not if it is an overlapping register. */
445 #ifdef OVERLAPPING_REGNO_P
446 #define FIXED_REGNO_P(N) \
447 (((N) == FRAME_POINTER_REGNUM || (N) == HARD_FRAME_POINTER_REGNUM \
448 || fixed_regs[N] || global_regs[N]) \
449 && ! OVERLAPPING_REGNO_P ((N)))
450 #else
451 #define FIXED_REGNO_P(N) \
452 ((N) == FRAME_POINTER_REGNUM || (N) == HARD_FRAME_POINTER_REGNUM \
453 || fixed_regs[N] || global_regs[N])
454 #endif
455
456 /* Compute cost of X, as stored in the `cost' field of a table_elt. Fixed
457 hard registers and pointers into the frame are the cheapest with a cost
458     of 0.  Next come pseudos with a cost of 1 and other hard registers with
459 a cost of 2. Aside from these special cases, call `rtx_cost'. */
460
461 #define CHEAP_REGNO(N) \
462 ((N) == FRAME_POINTER_REGNUM || (N) == HARD_FRAME_POINTER_REGNUM \
463 || (N) == STACK_POINTER_REGNUM || (N) == ARG_POINTER_REGNUM \
464 || ((N) >= FIRST_VIRTUAL_REGISTER && (N) <= LAST_VIRTUAL_REGISTER) \
465 || ((N) < FIRST_PSEUDO_REGISTER \
466 && FIXED_REGNO_P (N) && REGNO_REG_CLASS (N) != NO_REGS))
467
468 /* A register is cheap if it is a user variable assigned to the register
469 or if its register number always corresponds to a cheap register. */
470
471 #define CHEAP_REG(N) \
472 ((REG_USERVAR_P (N) && REGNO (N) < FIRST_PSEUDO_REGISTER) \
473 || CHEAP_REGNO (REGNO (N)))
474
475 #define COST(X) \
476 (GET_CODE (X) == REG \
477 ? (CHEAP_REG (X) ? 0 \
478 : REGNO (X) >= FIRST_PSEUDO_REGISTER ? 1 \
479 : 2) \
480 : rtx_cost (X, SET) * 2)
481
482 /* Determine if the quantity number for register X represents a valid index
483 into the `qty_...' variables. */
484
485 #define REGNO_QTY_VALID_P(N) (reg_qty[N] != (N))
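 
 /* Note: reg_qty starts out as the identity mapping (new_basic_block
    copies `consec_ints' into it), and make_new_qty assigns only quantity
    numbers >= max_reg, so reg_qty[N] != N exactly when register N has
    been given a real quantity in this basic block.  */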
486
487 static struct table_elt *table[NBUCKETS];
488
489 /* Chain of `struct table_elt's made so far for this function
490 but currently removed from the table. */
491
492 static struct table_elt *free_element_chain;
493
494 /* Number of `struct table_elt' structures made so far for this function. */
495
496 static int n_elements_made;
497
498 /* Maximum value `n_elements_made' has had so far in this compilation
499 for functions previously processed. */
500
501 static int max_elements_made;
502
503 /* Surviving equivalence class when two equivalence classes are merged
504 by recording the effects of a jump in the last insn. Zero if the
505 last insn was not a conditional jump. */
506
507 static struct table_elt *last_jump_equiv_class;
508
509 /* Set to the cost of a constant pool reference if one was found for a
510 symbolic constant. If this was found, it means we should try to
511 convert constants into constant pool entries if they don't fit in
512 the insn. */
513
514 static int constant_pool_entries_cost;
515
516 /* Bits describing what kind of values in memory must be invalidated
517     for a particular instruction.  If the `var', `nonscalar' and `all' bits
518     are all zero, no memory refs need to be invalidated.  Each bit is more powerful
519 than the preceding ones, and if a bit is set then the preceding
520 bits are also set.
521
522 Here is how the bits are set:
523 Pushing onto the stack invalidates only the stack pointer,
524 writing at a fixed address invalidates only variable addresses,
525 writing in a structure element at variable address
526 invalidates all but scalar variables,
527 and writing in anything else at variable address invalidates everything. */
528
529 struct write_data
530 {
531 int sp : 1; /* Invalidate stack pointer. */
532 int var : 1; /* Invalidate variable addresses. */
533 int nonscalar : 1; /* Invalidate all but scalar variables. */
534 int all : 1; /* Invalidate all memory refs. */
535 };
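 
 /* For example (illustrative): a push would set only `sp'; a store to a
    fixed address would set `var' (and, by the convention above, `sp');
    a store into a structure element at a variable address would add
    `nonscalar'; and a store through an arbitrary pointer sets all four
    bits.  */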
536
537 /* Define maximum length of a branch path. */
538
539 #define PATHLENGTH 10
540
541 /* This data describes a block that will be processed by cse_basic_block. */
542
543 struct cse_basic_block_data {
544 /* Lowest CUID value of insns in block. */
545 int low_cuid;
546 /* Highest CUID value of insns in block. */
547 int high_cuid;
548 /* Total number of SETs in block. */
549 int nsets;
550 /* Last insn in the block. */
551 rtx last;
552 /* Size of current branch path, if any. */
553 int path_size;
554 /* Current branch path, indicating which branches will be taken. */
555 struct branch_path {
556 /* The branch insn. */
557 rtx branch;
558 /* Whether it should be taken or not. AROUND is the same as taken
559 except that it is used when the destination label is not preceded
560 by a BARRIER. */
561 enum taken {TAKEN, NOT_TAKEN, AROUND} status;
562 } path[PATHLENGTH];
563 };
564
565 /* Nonzero if X has the form (PLUS frame-pointer integer). We check for
566 virtual regs here because the simplify_*_operation routines are called
567 by integrate.c, which is called before virtual register instantiation. */
568
569 #define FIXED_BASE_PLUS_P(X) \
570 ((X) == frame_pointer_rtx || (X) == hard_frame_pointer_rtx \
571 || (X) == arg_pointer_rtx \
572 || (X) == virtual_stack_vars_rtx \
573 || (X) == virtual_incoming_args_rtx \
574 || (GET_CODE (X) == PLUS && GET_CODE (XEXP (X, 1)) == CONST_INT \
575 && (XEXP (X, 0) == frame_pointer_rtx \
576 || XEXP (X, 0) == hard_frame_pointer_rtx \
577 || XEXP (X, 0) == arg_pointer_rtx \
578 || XEXP (X, 0) == virtual_stack_vars_rtx \
579 || XEXP (X, 0) == virtual_incoming_args_rtx)))
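 
 /* For example, frame_pointer_rtx itself and
    (plus frame_pointer_rtx (const_int 8)) both satisfy FIXED_BASE_PLUS_P,
    while (plus (reg 99) (const_int 8)) does not.  */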
580
581 /* Similar, but also allows reference to the stack pointer.
582
583     This used to include FIXED_BASE_PLUS_P; however, we can't assume that
584 arg_pointer_rtx by itself is nonzero, because on at least one machine,
585 the i960, the arg pointer is zero when it is unused. */
586
587 #define NONZERO_BASE_PLUS_P(X) \
588 ((X) == frame_pointer_rtx || (X) == hard_frame_pointer_rtx \
589 || (X) == virtual_stack_vars_rtx \
590 || (X) == virtual_incoming_args_rtx \
591 || (GET_CODE (X) == PLUS && GET_CODE (XEXP (X, 1)) == CONST_INT \
592 && (XEXP (X, 0) == frame_pointer_rtx \
593 || XEXP (X, 0) == hard_frame_pointer_rtx \
594 || XEXP (X, 0) == arg_pointer_rtx \
595 || XEXP (X, 0) == virtual_stack_vars_rtx \
596 || XEXP (X, 0) == virtual_incoming_args_rtx)) \
597 || (X) == stack_pointer_rtx \
598 || (X) == virtual_stack_dynamic_rtx \
599 || (X) == virtual_outgoing_args_rtx \
600 || (GET_CODE (X) == PLUS && GET_CODE (XEXP (X, 1)) == CONST_INT \
601 && (XEXP (X, 0) == stack_pointer_rtx \
602 || XEXP (X, 0) == virtual_stack_dynamic_rtx \
603 || XEXP (X, 0) == virtual_outgoing_args_rtx)))
604
605 static void new_basic_block PROTO((void));
606 static void make_new_qty PROTO((int));
607 static void make_regs_eqv PROTO((int, int));
608 static void delete_reg_equiv PROTO((int));
609 static int mention_regs PROTO((rtx));
610 static int insert_regs PROTO((rtx, struct table_elt *, int));
611 static void free_element PROTO((struct table_elt *));
612 static void remove_from_table PROTO((struct table_elt *, unsigned));
613 static struct table_elt *get_element PROTO((void));
614 static struct table_elt *lookup PROTO((rtx, unsigned, enum machine_mode)),
615 *lookup_for_remove PROTO((rtx, unsigned, enum machine_mode));
616 static rtx lookup_as_function PROTO((rtx, enum rtx_code));
617 static struct table_elt *insert PROTO((rtx, struct table_elt *, unsigned,
618 enum machine_mode));
619 static void merge_equiv_classes PROTO((struct table_elt *,
620 struct table_elt *));
621 static void invalidate PROTO((rtx));
622 static void remove_invalid_refs PROTO((int));
623 static void rehash_using_reg PROTO((rtx));
624 static void invalidate_memory PROTO((struct write_data *));
625 static void invalidate_for_call PROTO((void));
626 static rtx use_related_value PROTO((rtx, struct table_elt *));
627 static unsigned canon_hash PROTO((rtx, enum machine_mode));
628 static unsigned safe_hash PROTO((rtx, enum machine_mode));
629 static int exp_equiv_p PROTO((rtx, rtx, int, int));
630 static void set_nonvarying_address_components PROTO((rtx, int, rtx *,
631 HOST_WIDE_INT *,
632 HOST_WIDE_INT *));
633 static int refers_to_p PROTO((rtx, rtx));
634 static int refers_to_mem_p PROTO((rtx, rtx, HOST_WIDE_INT,
635 HOST_WIDE_INT));
636 static int cse_rtx_addr_varies_p PROTO((rtx));
637 static rtx canon_reg PROTO((rtx, rtx));
638 static void find_best_addr PROTO((rtx, rtx *));
639 static enum rtx_code find_comparison_args PROTO((enum rtx_code, rtx *, rtx *,
640 enum machine_mode *,
641 enum machine_mode *));
642 static rtx cse_gen_binary PROTO((enum rtx_code, enum machine_mode,
643 rtx, rtx));
644 static rtx simplify_plus_minus PROTO((enum rtx_code, enum machine_mode,
645 rtx, rtx));
646 static rtx fold_rtx PROTO((rtx, rtx));
647 static rtx equiv_constant PROTO((rtx));
648 static void record_jump_equiv PROTO((rtx, int));
649 static void record_jump_cond PROTO((enum rtx_code, enum machine_mode,
650 rtx, rtx, int));
651 static void cse_insn PROTO((rtx, int));
652 static void note_mem_written PROTO((rtx, struct write_data *));
653 static void invalidate_from_clobbers PROTO((struct write_data *, rtx));
654 static rtx cse_process_notes PROTO((rtx, rtx));
655 static void cse_around_loop PROTO((rtx));
656 static void invalidate_skipped_set PROTO((rtx, rtx));
657 static void invalidate_skipped_block PROTO((rtx));
658 static void cse_check_loop_start PROTO((rtx, rtx));
659 static void cse_set_around_loop PROTO((rtx, rtx, rtx));
660 static rtx cse_basic_block PROTO((rtx, rtx, struct branch_path *, int));
661 static void count_reg_usage PROTO((rtx, int *, rtx, int));
662
663 extern int rtx_equal_function_value_matters;
664 \f
665 /* Return an estimate of the cost of computing rtx X.
666 One use is in cse, to decide which expression to keep in the hash table.
667 Another is in rtl generation, to pick the cheapest way to multiply.
668 Other uses like the latter are expected in the future. */
669
670 /* Return the right cost to give to an operation
671 to make the cost of the corresponding register-to-register instruction
672 N times that of a fast register-to-register instruction. */
673
674 #define COSTS_N_INSNS(N) ((N) * 4 - 2)
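 
 /* So COSTS_N_INSNS (1) == 2, matching the default `total' of 2 used
    below for a simple operation.  Presumably the formula is 4*N - 2
    rather than 2*N so that, once two pseudo-register operands (cost 1
    each) are added in, an N-insn operation costs 4*N, exactly N times
    the 4 of a fast single-insn register-to-register operation.  */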
675
676 int
677 rtx_cost (x, outer_code)
678 rtx x;
679 enum rtx_code outer_code;
680 {
681 register int i, j;
682 register enum rtx_code code;
683 register char *fmt;
684 register int total;
685
686 if (x == 0)
687 return 0;
688
689 /* Compute the default costs of certain things.
690 Note that RTX_COSTS can override the defaults. */
691
692 code = GET_CODE (x);
693 switch (code)
694 {
695 case MULT:
696 /* Count multiplication by 2**n as a shift,
697 because if we are considering it, we would output it as a shift. */
698 if (GET_CODE (XEXP (x, 1)) == CONST_INT
699 && exact_log2 (INTVAL (XEXP (x, 1))) >= 0)
700 total = 2;
701 else
702 total = COSTS_N_INSNS (5);
703 break;
704 case DIV:
705 case UDIV:
706 case MOD:
707 case UMOD:
708 total = COSTS_N_INSNS (7);
709 break;
710 case USE:
711 /* Used in loop.c and combine.c as a marker. */
712 total = 0;
713 break;
714 case ASM_OPERANDS:
715 /* We don't want these to be used in substitutions because
716 we have no way of validating the resulting insn. So assign
717 anything containing an ASM_OPERANDS a very high cost. */
718 total = 1000;
719 break;
720 default:
721 total = 2;
722 }
723
724 switch (code)
725 {
726 case REG:
727 return ! CHEAP_REG (x);
728
729 case SUBREG:
730 /* If we can't tie these modes, make this expensive. The larger
731 the mode, the more expensive it is. */
732 if (! MODES_TIEABLE_P (GET_MODE (x), GET_MODE (SUBREG_REG (x))))
733 return COSTS_N_INSNS (2
734 + GET_MODE_SIZE (GET_MODE (x)) / UNITS_PER_WORD);
735 return 2;
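       /* The RTX_COSTS and CONST_COSTS machine-description macros expand
 	 into additional `case' labels with their own `return'
 	 statements, so the lines below are reachable even though they
 	 follow a `return'.  */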
736 #ifdef RTX_COSTS
737 RTX_COSTS (x, code, outer_code);
738 #endif
739 CONST_COSTS (x, code, outer_code);
740 }
741
742 /* Sum the costs of the sub-rtx's, plus cost of this operation,
743 which is already in total. */
744
745 fmt = GET_RTX_FORMAT (code);
746 for (i = GET_RTX_LENGTH (code) - 1; i >= 0; i--)
747 if (fmt[i] == 'e')
748 total += rtx_cost (XEXP (x, i), code);
749 else if (fmt[i] == 'E')
750 for (j = 0; j < XVECLEN (x, i); j++)
751 total += rtx_cost (XVECEXP (x, i, j), code);
752
753 return total;
754 }
755 \f
756 /* Clear the hash table and initialize each register with its own quantity,
757 for a new basic block. */
758
759 static void
760 new_basic_block ()
761 {
762 register int i;
763
764 next_qty = max_reg;
765
766 bzero ((char *) reg_tick, max_reg * sizeof (int));
767
768 bcopy ((char *) all_minus_one, (char *) reg_in_table,
769 max_reg * sizeof (int));
770 bcopy ((char *) consec_ints, (char *) reg_qty, max_reg * sizeof (int));
771 CLEAR_HARD_REG_SET (hard_regs_in_table);
772
773 /* The per-quantity values used to be initialized here, but it is
774 much faster to initialize each as it is made in `make_new_qty'. */
775
776 for (i = 0; i < NBUCKETS; i++)
777 {
778 register struct table_elt *this, *next;
779 for (this = table[i]; this; this = next)
780 {
781 next = this->next_same_hash;
782 free_element (this);
783 }
784 }
785
786 bzero ((char *) table, sizeof table);
787
788 prev_insn = 0;
789
790 #ifdef HAVE_cc0
791 prev_insn_cc0 = 0;
792 #endif
793 }
794
795 /* Say that register REG contains a quantity not in any register before
796 and initialize that quantity. */
797
798 static void
799 make_new_qty (reg)
800 register int reg;
801 {
802 register int q;
803
804 if (next_qty >= max_qty)
805 abort ();
806
807 q = reg_qty[reg] = next_qty++;
808 qty_first_reg[q] = reg;
809 qty_last_reg[q] = reg;
810 qty_const[q] = qty_const_insn[q] = 0;
811 qty_comparison_code[q] = UNKNOWN;
812
813 reg_next_eqv[reg] = reg_prev_eqv[reg] = -1;
814 }
815
816 /* Make reg NEW equivalent to reg OLD.
817 OLD is not changing; NEW is. */
818
819 static void
820 make_regs_eqv (new, old)
821 register int new, old;
822 {
823 register int lastr, firstr;
824 register int q = reg_qty[old];
825
826 /* Nothing should become eqv until it has a "non-invalid" qty number. */
827 if (! REGNO_QTY_VALID_P (old))
828 abort ();
829
830 reg_qty[new] = q;
831 firstr = qty_first_reg[q];
832 lastr = qty_last_reg[q];
833
834 /* Prefer fixed hard registers to anything. Prefer pseudo regs to other
835 hard regs. Among pseudos, if NEW will live longer than any other reg
836 of the same qty, and that is beyond the current basic block,
837 make it the new canonical replacement for this qty. */
838 if (! (firstr < FIRST_PSEUDO_REGISTER && FIXED_REGNO_P (firstr))
839 /* Certain fixed registers might be of the class NO_REGS. This means
840 that not only can they not be allocated by the compiler, but
841 they cannot be used in substitutions or canonicalizations
842 either. */
843 && (new >= FIRST_PSEUDO_REGISTER || REGNO_REG_CLASS (new) != NO_REGS)
844 && ((new < FIRST_PSEUDO_REGISTER && FIXED_REGNO_P (new))
845 || (new >= FIRST_PSEUDO_REGISTER
846 && (firstr < FIRST_PSEUDO_REGISTER
847 || ((uid_cuid[regno_last_uid[new]] > cse_basic_block_end
848 || (uid_cuid[regno_first_uid[new]]
849 < cse_basic_block_start))
850 && (uid_cuid[regno_last_uid[new]]
851 > uid_cuid[regno_last_uid[firstr]]))))))
852 {
853 reg_prev_eqv[firstr] = new;
854 reg_next_eqv[new] = firstr;
855 reg_prev_eqv[new] = -1;
856 qty_first_reg[q] = new;
857 }
858 else
859 {
860 /* If NEW is a hard reg (known to be non-fixed), insert at end.
861 Otherwise, insert before any non-fixed hard regs that are at the
862 end. Registers of class NO_REGS cannot be used as an
863 equivalent for anything. */
864 while (lastr < FIRST_PSEUDO_REGISTER && reg_prev_eqv[lastr] >= 0
865 && (REGNO_REG_CLASS (lastr) == NO_REGS || ! FIXED_REGNO_P (lastr))
866 && new >= FIRST_PSEUDO_REGISTER)
867 lastr = reg_prev_eqv[lastr];
868 reg_next_eqv[new] = reg_next_eqv[lastr];
869 if (reg_next_eqv[lastr] >= 0)
870 reg_prev_eqv[reg_next_eqv[lastr]] = new;
871 else
872 qty_last_reg[q] = new;
873 reg_next_eqv[lastr] = new;
874 reg_prev_eqv[new] = lastr;
875 }
876 }
877
878 /* Remove REG from its equivalence class. */
879
880 static void
881 delete_reg_equiv (reg)
882 register int reg;
883 {
884 register int q = reg_qty[reg];
885 register int p, n;
886
887 /* If invalid, do nothing. */
888 if (q == reg)
889 return;
890
891 p = reg_prev_eqv[reg];
892 n = reg_next_eqv[reg];
893
894 if (n != -1)
895 reg_prev_eqv[n] = p;
896 else
897 qty_last_reg[q] = p;
898 if (p != -1)
899 reg_next_eqv[p] = n;
900 else
901 qty_first_reg[q] = n;
902
903 reg_qty[reg] = reg;
904 }
905
906 /* Remove any invalid expressions from the hash table
907 that refer to any of the registers contained in expression X.
908
909 Make sure that newly inserted references to those registers
910 as subexpressions will be considered valid.
911
912 mention_regs is not called when a register itself
913 is being stored in the table.
914
915 Return 1 if we have done something that may have changed the hash code
916 of X. */
917
918 static int
919 mention_regs (x)
920 rtx x;
921 {
922 register enum rtx_code code;
923 register int i, j;
924 register char *fmt;
925 register int changed = 0;
926
927 if (x == 0)
928 return 0;
929
930 code = GET_CODE (x);
931 if (code == REG)
932 {
933 register int regno = REGNO (x);
934 register int endregno
935 = regno + (regno >= FIRST_PSEUDO_REGISTER ? 1
936 : HARD_REGNO_NREGS (regno, GET_MODE (x)));
937 int i;
938
939 for (i = regno; i < endregno; i++)
940 {
941 if (reg_in_table[i] >= 0 && reg_in_table[i] != reg_tick[i])
942 remove_invalid_refs (i);
943
944 reg_in_table[i] = reg_tick[i];
945 }
946
947 return 0;
948 }
949
950 /* If X is a comparison or a COMPARE and either operand is a register
951 that does not have a quantity, give it one. This is so that a later
952 call to record_jump_equiv won't cause X to be assigned a different
953 hash code and not found in the table after that call.
954
955 It is not necessary to do this here, since rehash_using_reg can
956 fix up the table later, but doing this here eliminates the need to
957 call that expensive function in the most common case where the only
958 use of the register is in the comparison. */
959
960 if (code == COMPARE || GET_RTX_CLASS (code) == '<')
961 {
962 if (GET_CODE (XEXP (x, 0)) == REG
963 && ! REGNO_QTY_VALID_P (REGNO (XEXP (x, 0))))
964 if (insert_regs (XEXP (x, 0), NULL_PTR, 0))
965 {
966 rehash_using_reg (XEXP (x, 0));
967 changed = 1;
968 }
969
970 if (GET_CODE (XEXP (x, 1)) == REG
971 && ! REGNO_QTY_VALID_P (REGNO (XEXP (x, 1))))
972 if (insert_regs (XEXP (x, 1), NULL_PTR, 0))
973 {
974 rehash_using_reg (XEXP (x, 1));
975 changed = 1;
976 }
977 }
978
979 fmt = GET_RTX_FORMAT (code);
980 for (i = GET_RTX_LENGTH (code) - 1; i >= 0; i--)
981 if (fmt[i] == 'e')
982 changed |= mention_regs (XEXP (x, i));
983 else if (fmt[i] == 'E')
984 for (j = 0; j < XVECLEN (x, i); j++)
985 changed |= mention_regs (XVECEXP (x, i, j));
986
987 return changed;
988 }
989
990 /* Update the register quantities for inserting X into the hash table
991 with a value equivalent to CLASSP.
992 (If the class does not contain a REG, it is irrelevant.)
993 If MODIFIED is nonzero, X is a destination; it is being modified.
994 Note that delete_reg_equiv should be called on a register
995 before insert_regs is done on that register with MODIFIED != 0.
996
997     A nonzero return value means that elements of reg_qty have changed
998 so X's hash code may be different. */
999
1000 static int
1001 insert_regs (x, classp, modified)
1002 rtx x;
1003 struct table_elt *classp;
1004 int modified;
1005 {
1006 if (GET_CODE (x) == REG)
1007 {
1008 register int regno = REGNO (x);
1009
1010 /* If REGNO is in the equivalence table already but is of the
1011 wrong mode for that equivalence, don't do anything here. */
1012
1013 if (REGNO_QTY_VALID_P (regno)
1014 && qty_mode[reg_qty[regno]] != GET_MODE (x))
1015 return 0;
1016
1017 if (modified || ! REGNO_QTY_VALID_P (regno))
1018 {
1019 if (classp)
1020 for (classp = classp->first_same_value;
1021 classp != 0;
1022 classp = classp->next_same_value)
1023 if (GET_CODE (classp->exp) == REG
1024 && GET_MODE (classp->exp) == GET_MODE (x))
1025 {
1026 make_regs_eqv (regno, REGNO (classp->exp));
1027 return 1;
1028 }
1029
1030 make_new_qty (regno);
1031 qty_mode[reg_qty[regno]] = GET_MODE (x);
1032 return 1;
1033 }
1034
1035 return 0;
1036 }
1037
1038 /* If X is a SUBREG, we will likely be inserting the inner register in the
1039 table. If that register doesn't have an assigned quantity number at
1040 this point but does later, the insertion that we will be doing now will
1041 not be accessible because its hash code will have changed. So assign
1042 a quantity number now. */
1043
1044 else if (GET_CODE (x) == SUBREG && GET_CODE (SUBREG_REG (x)) == REG
1045 && ! REGNO_QTY_VALID_P (REGNO (SUBREG_REG (x))))
1046 {
1047 insert_regs (SUBREG_REG (x), NULL_PTR, 0);
1048 mention_regs (SUBREG_REG (x));
1049 return 1;
1050 }
1051 else
1052 return mention_regs (x);
1053 }
1054 \f
1055 /* Look in or update the hash table. */
1056
1057 /* Put the element ELT on the list of free elements. */
1058
1059 static void
1060 free_element (elt)
1061 struct table_elt *elt;
1062 {
1063 elt->next_same_hash = free_element_chain;
1064 free_element_chain = elt;
1065 }
1066
1067 /* Return an element that is free for use. */
1068
1069 static struct table_elt *
1070 get_element ()
1071 {
1072 struct table_elt *elt = free_element_chain;
1073 if (elt)
1074 {
1075 free_element_chain = elt->next_same_hash;
1076 return elt;
1077 }
1078 n_elements_made++;
1079 return (struct table_elt *) oballoc (sizeof (struct table_elt));
1080 }
1081
1082 /* Remove table element ELT from use in the table.
1083 HASH is its hash code, made using the HASH macro.
1084 It's an argument because often that is known in advance
1085 and we save much time not recomputing it. */
1086
1087 static void
1088 remove_from_table (elt, hash)
1089 register struct table_elt *elt;
1090 unsigned hash;
1091 {
1092 if (elt == 0)
1093 return;
1094
1095 /* Mark this element as removed. See cse_insn. */
1096 elt->first_same_value = 0;
1097
1098 /* Remove the table element from its equivalence class. */
1099
1100 {
1101 register struct table_elt *prev = elt->prev_same_value;
1102 register struct table_elt *next = elt->next_same_value;
1103
1104 if (next) next->prev_same_value = prev;
1105
1106 if (prev)
1107 prev->next_same_value = next;
1108 else
1109 {
1110 register struct table_elt *newfirst = next;
1111 while (next)
1112 {
1113 next->first_same_value = newfirst;
1114 next = next->next_same_value;
1115 }
1116 }
1117 }
1118
1119 /* Remove the table element from its hash bucket. */
1120
1121 {
1122 register struct table_elt *prev = elt->prev_same_hash;
1123 register struct table_elt *next = elt->next_same_hash;
1124
1125 if (next) next->prev_same_hash = prev;
1126
1127 if (prev)
1128 prev->next_same_hash = next;
1129 else if (table[hash] == elt)
1130 table[hash] = next;
1131 else
1132 {
1133 /* This entry is not in the proper hash bucket. This can happen
1134 when two classes were merged by `merge_equiv_classes'. Search
1135 for the hash bucket that it heads. This happens only very
1136 rarely, so the cost is acceptable. */
1137 for (hash = 0; hash < NBUCKETS; hash++)
1138 if (table[hash] == elt)
1139 table[hash] = next;
1140 }
1141 }
1142
1143 /* Remove the table element from its related-value circular chain. */
1144
1145 if (elt->related_value != 0 && elt->related_value != elt)
1146 {
1147 register struct table_elt *p = elt->related_value;
1148 while (p->related_value != elt)
1149 p = p->related_value;
1150 p->related_value = elt->related_value;
1151 if (p->related_value == p)
1152 p->related_value = 0;
1153 }
1154
1155 free_element (elt);
1156 }
1157
1158 /* Look up X in the hash table and return its table element,
1159 or 0 if X is not in the table.
1160
1161 MODE is the machine-mode of X, or if X is an integer constant
1162 with VOIDmode then MODE is the mode with which X will be used.
1163
1164 Here we are satisfied to find an expression whose tree structure
1165 looks like X. */
1166
1167 static struct table_elt *
1168 lookup (x, hash, mode)
1169 rtx x;
1170 unsigned hash;
1171 enum machine_mode mode;
1172 {
1173 register struct table_elt *p;
1174
1175 for (p = table[hash]; p; p = p->next_same_hash)
1176 if (mode == p->mode && ((x == p->exp && GET_CODE (x) == REG)
1177 || exp_equiv_p (x, p->exp, GET_CODE (x) != REG, 0)))
1178 return p;
1179
1180 return 0;
1181 }
1182
1183 /* Like `lookup' but don't care whether the table element uses invalid regs.
1184 Also ignore discrepancies in the machine mode of a register. */
1185
1186 static struct table_elt *
1187 lookup_for_remove (x, hash, mode)
1188 rtx x;
1189 unsigned hash;
1190 enum machine_mode mode;
1191 {
1192 register struct table_elt *p;
1193
1194 if (GET_CODE (x) == REG)
1195 {
1196 int regno = REGNO (x);
1197 /* Don't check the machine mode when comparing registers;
1198 invalidating (REG:SI 0) also invalidates (REG:DF 0). */
1199 for (p = table[hash]; p; p = p->next_same_hash)
1200 if (GET_CODE (p->exp) == REG
1201 && REGNO (p->exp) == regno)
1202 return p;
1203 }
1204 else
1205 {
1206 for (p = table[hash]; p; p = p->next_same_hash)
1207 if (mode == p->mode && (x == p->exp || exp_equiv_p (x, p->exp, 0, 0)))
1208 return p;
1209 }
1210
1211 return 0;
1212 }
1213
1214 /* Look for an expression equivalent to X and with code CODE.
1215 If one is found, return that expression. */
1216
1217 static rtx
1218 lookup_as_function (x, code)
1219 rtx x;
1220 enum rtx_code code;
1221 {
1222 register struct table_elt *p = lookup (x, safe_hash (x, VOIDmode) % NBUCKETS,
1223 GET_MODE (x));
1224 if (p == 0)
1225 return 0;
1226
1227 for (p = p->first_same_value; p; p = p->next_same_value)
1228 {
1229 if (GET_CODE (p->exp) == code
1230 /* Make sure this is a valid entry in the table. */
1231 && exp_equiv_p (p->exp, p->exp, 1, 0))
1232 return p->exp;
1233 }
1234
1235 return 0;
1236 }
1237
1238 /* Insert X in the hash table, assuming HASH is its hash code
1239 and CLASSP is an element of the class it should go in
1240 (or 0 if a new class should be made).
1241 It is inserted at the proper position to keep the class in
1242 the order cheapest first.
1243
1244 MODE is the machine-mode of X, or if X is an integer constant
1245 with VOIDmode then MODE is the mode with which X will be used.
1246
1247 For elements of equal cheapness, the most recent one
1248 goes in front, except that the first element in the list
1249 remains first unless a cheaper element is added. The order of
1250 pseudo-registers does not matter, as canon_reg will be called to
1251 find the cheapest when a register is retrieved from the table.
1252
1253 The in_memory field in the hash table element is set to 0.
1254 The caller must set it nonzero if appropriate.
1255
1256 You should call insert_regs (X, CLASSP, MODIFY) before calling here,
1257 and if insert_regs returns a nonzero value
1258 you must then recompute its hash code before calling here.
1259
1260 If necessary, update table showing constant values of quantities. */
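 
 /* A typical call sequence (a sketch; compare merge_equiv_classes below):
 
 	hash = HASH (x, mode);
 	if (insert_regs (x, classp, 0))
 	  hash = HASH (x, mode);
 	elt = insert (x, classp, hash, mode);  */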
1261
1262 #define CHEAPER(X,Y) ((X)->cost < (Y)->cost)
1263
1264 static struct table_elt *
1265 insert (x, classp, hash, mode)
1266 register rtx x;
1267 register struct table_elt *classp;
1268 unsigned hash;
1269 enum machine_mode mode;
1270 {
1271 register struct table_elt *elt;
1272
1273 /* If X is a register and we haven't made a quantity for it,
1274 something is wrong. */
1275 if (GET_CODE (x) == REG && ! REGNO_QTY_VALID_P (REGNO (x)))
1276 abort ();
1277
1278 /* If X is a hard register, show it is being put in the table. */
1279 if (GET_CODE (x) == REG && REGNO (x) < FIRST_PSEUDO_REGISTER)
1280 {
1281 int regno = REGNO (x);
1282 int endregno = regno + HARD_REGNO_NREGS (regno, GET_MODE (x));
1283 int i;
1284
1285 for (i = regno; i < endregno; i++)
1286 SET_HARD_REG_BIT (hard_regs_in_table, i);
1287 }
1288
1289
1290 /* Put an element for X into the right hash bucket. */
1291
1292 elt = get_element ();
1293 elt->exp = x;
1294 elt->cost = COST (x);
1295 elt->next_same_value = 0;
1296 elt->prev_same_value = 0;
1297 elt->next_same_hash = table[hash];
1298 elt->prev_same_hash = 0;
1299 elt->related_value = 0;
1300 elt->in_memory = 0;
1301 elt->mode = mode;
1302 elt->is_const = (CONSTANT_P (x)
1303 /* GNU C++ takes advantage of this for `this'
1304 (and other const values). */
1305 || (RTX_UNCHANGING_P (x)
1306 && GET_CODE (x) == REG
1307 && REGNO (x) >= FIRST_PSEUDO_REGISTER)
1308 || FIXED_BASE_PLUS_P (x));
1309
1310 if (table[hash])
1311 table[hash]->prev_same_hash = elt;
1312 table[hash] = elt;
1313
1314 /* Put it into the proper value-class. */
1315 if (classp)
1316 {
1317 classp = classp->first_same_value;
1318 if (CHEAPER (elt, classp))
1319 	/* Insert at the head of the class.  */
1320 {
1321 register struct table_elt *p;
1322 elt->next_same_value = classp;
1323 classp->prev_same_value = elt;
1324 elt->first_same_value = elt;
1325
1326 for (p = classp; p; p = p->next_same_value)
1327 p->first_same_value = elt;
1328 }
1329 else
1330 {
1331 /* Insert not at head of the class. */
1332 /* Put it after the last element cheaper than X. */
1333 register struct table_elt *p, *next;
1334 for (p = classp; (next = p->next_same_value) && CHEAPER (next, elt);
1335 p = next);
1336 /* Put it after P and before NEXT. */
1337 elt->next_same_value = next;
1338 if (next)
1339 next->prev_same_value = elt;
1340 elt->prev_same_value = p;
1341 p->next_same_value = elt;
1342 elt->first_same_value = classp;
1343 }
1344 }
1345 else
1346 elt->first_same_value = elt;
1347
1348 /* If this is a constant being set equivalent to a register or a register
1349 being set equivalent to a constant, note the constant equivalence.
1350
1351 If this is a constant, it cannot be equivalent to a different constant,
1352 and a constant is the only thing that can be cheaper than a register. So
1353 we know the register is the head of the class (before the constant was
1354 inserted).
1355
1356 If this is a register that is not already known equivalent to a
1357 constant, we must check the entire class.
1358
1359 If this is a register that is already known equivalent to an insn,
1360 update `qty_const_insn' to show that `this_insn' is the latest
1361 insn making that quantity equivalent to the constant. */
1362
1363 if (elt->is_const && classp && GET_CODE (classp->exp) == REG)
1364 {
1365 qty_const[reg_qty[REGNO (classp->exp)]]
1366 = gen_lowpart_if_possible (qty_mode[reg_qty[REGNO (classp->exp)]], x);
1367 qty_const_insn[reg_qty[REGNO (classp->exp)]] = this_insn;
1368 }
1369
1370 else if (GET_CODE (x) == REG && classp && ! qty_const[reg_qty[REGNO (x)]])
1371 {
1372 register struct table_elt *p;
1373
1374 for (p = classp; p != 0; p = p->next_same_value)
1375 {
1376 if (p->is_const)
1377 {
1378 qty_const[reg_qty[REGNO (x)]]
1379 = gen_lowpart_if_possible (GET_MODE (x), p->exp);
1380 qty_const_insn[reg_qty[REGNO (x)]] = this_insn;
1381 break;
1382 }
1383 }
1384 }
1385
1386 else if (GET_CODE (x) == REG && qty_const[reg_qty[REGNO (x)]]
1387 && GET_MODE (x) == qty_mode[reg_qty[REGNO (x)]])
1388 qty_const_insn[reg_qty[REGNO (x)]] = this_insn;
1389
1390 /* If this is a constant with symbolic value,
1391 and it has a term with an explicit integer value,
1392 link it up with related expressions. */
1393 if (GET_CODE (x) == CONST)
1394 {
1395 rtx subexp = get_related_value (x);
1396 unsigned subhash;
1397 struct table_elt *subelt, *subelt_prev;
1398
1399 if (subexp != 0)
1400 {
1401 /* Get the integer-free subexpression in the hash table. */
1402 subhash = safe_hash (subexp, mode) % NBUCKETS;
1403 subelt = lookup (subexp, subhash, mode);
1404 if (subelt == 0)
1405 subelt = insert (subexp, NULL_PTR, subhash, mode);
1406 /* Initialize SUBELT's circular chain if it has none. */
1407 if (subelt->related_value == 0)
1408 subelt->related_value = subelt;
1409 /* Find the element in the circular chain that precedes SUBELT. */
1410 subelt_prev = subelt;
1411 while (subelt_prev->related_value != subelt)
1412 subelt_prev = subelt_prev->related_value;
1413 /* Put new ELT into SUBELT's circular chain just before SUBELT.
1414 This way the element that follows SUBELT is the oldest one. */
1415 elt->related_value = subelt_prev->related_value;
1416 subelt_prev->related_value = elt;
1417 }
1418 }
1419
1420 return elt;
1421 }
1422 \f
1423 /* Given two equivalence classes, CLASS1 and CLASS2, put all the entries from
1424 CLASS2 into CLASS1. This is done when we have reached an insn which makes
1425 the two classes equivalent.
1426
1427 CLASS1 will be the surviving class; CLASS2 should not be used after this
1428 call.
1429
1430 Any invalid entries in CLASS2 will not be copied. */
1431
1432 static void
1433 merge_equiv_classes (class1, class2)
1434 struct table_elt *class1, *class2;
1435 {
1436 struct table_elt *elt, *next, *new;
1437
1438 /* Ensure we start with the head of the classes. */
1439 class1 = class1->first_same_value;
1440 class2 = class2->first_same_value;
1441
1442 /* If they were already equal, forget it. */
1443 if (class1 == class2)
1444 return;
1445
1446 for (elt = class2; elt; elt = next)
1447 {
1448 unsigned hash;
1449 rtx exp = elt->exp;
1450 enum machine_mode mode = elt->mode;
1451
1452 next = elt->next_same_value;
1453
1454 /* Remove old entry, make a new one in CLASS1's class.
1455 Don't do this for invalid entries as we cannot find their
1456 hash code (it also isn't necessary). */
1457 if (GET_CODE (exp) == REG || exp_equiv_p (exp, exp, 1, 0))
1458 {
1459 hash_arg_in_memory = 0;
1460 hash_arg_in_struct = 0;
1461 hash = HASH (exp, mode);
1462
1463 if (GET_CODE (exp) == REG)
1464 delete_reg_equiv (REGNO (exp));
1465
1466 remove_from_table (elt, hash);
1467
1468 if (insert_regs (exp, class1, 0))
1469 hash = HASH (exp, mode);
1470 new = insert (exp, class1, hash, mode);
1471 new->in_memory = hash_arg_in_memory;
1472 new->in_struct = hash_arg_in_struct;
1473 }
1474 }
1475 }
1476 \f
1477 /* Remove from the hash table, or mark as invalid,
1478 all expressions whose values could be altered by storing in X.
1479 X is a register, a subreg, or a memory reference with nonvarying address
1480 (because, when a memory reference with a varying address is stored in,
1481 all memory references are removed by invalidate_memory
1482 so specific invalidation is superfluous).
1483
1484 A nonvarying address may be just a register or just
1485 a symbol reference, or it may be either of those plus
1486 a numeric offset. */
1487
1488 static void
1489 invalidate (x)
1490 rtx x;
1491 {
1492 register int i;
1493 register struct table_elt *p;
1494 rtx base;
1495 HOST_WIDE_INT start, end;
1496
1497 /* If X is a register, dependencies on its contents
1498 are recorded through the qty number mechanism.
1499 Just change the qty number of the register,
1500 mark it as invalid for expressions that refer to it,
1501 and remove it itself. */
1502
1503 if (GET_CODE (x) == REG)
1504 {
1505 register int regno = REGNO (x);
1506 register unsigned hash = HASH (x, GET_MODE (x));
1507
1508 /* Remove REGNO from any quantity list it might be on and indicate
1509      that its value might have changed.  If it is a pseudo, remove its
1510 entry from the hash table.
1511
1512 For a hard register, we do the first two actions above for any
1513 additional hard registers corresponding to X. Then, if any of these
1514 registers are in the table, we must remove any REG entries that
1515 overlap these registers. */
1516
1517 delete_reg_equiv (regno);
1518 reg_tick[regno]++;
1519
1520 if (regno >= FIRST_PSEUDO_REGISTER)
1521 remove_from_table (lookup_for_remove (x, hash, GET_MODE (x)), hash);
1522 else
1523 {
1524 HOST_WIDE_INT in_table
1525 = TEST_HARD_REG_BIT (hard_regs_in_table, regno);
1526 int endregno = regno + HARD_REGNO_NREGS (regno, GET_MODE (x));
1527 int tregno, tendregno;
1528 register struct table_elt *p, *next;
1529
1530 CLEAR_HARD_REG_BIT (hard_regs_in_table, regno);
1531
1532 for (i = regno + 1; i < endregno; i++)
1533 {
1534 in_table |= TEST_HARD_REG_BIT (hard_regs_in_table, i);
1535 CLEAR_HARD_REG_BIT (hard_regs_in_table, i);
1536 delete_reg_equiv (i);
1537 reg_tick[i]++;
1538 }
1539
1540 if (in_table)
1541 for (hash = 0; hash < NBUCKETS; hash++)
1542 for (p = table[hash]; p; p = next)
1543 {
1544 next = p->next_same_hash;
1545
1546 if (GET_CODE (p->exp) != REG
1547 || REGNO (p->exp) >= FIRST_PSEUDO_REGISTER)
1548 continue;
1549
1550 tregno = REGNO (p->exp);
1551 tendregno
1552 = tregno + HARD_REGNO_NREGS (tregno, GET_MODE (p->exp));
1553 if (tendregno > regno && tregno < endregno)
1554 remove_from_table (p, hash);
1555 }
1556 }
1557
1558 return;
1559 }
1560
1561 if (GET_CODE (x) == SUBREG)
1562 {
1563 if (GET_CODE (SUBREG_REG (x)) != REG)
1564 abort ();
1565 invalidate (SUBREG_REG (x));
1566 return;
1567 }
1568
1569 /* X is not a register; it must be a memory reference with
1570 a nonvarying address. Remove all hash table elements
1571 that refer to overlapping pieces of memory. */
1572
1573 if (GET_CODE (x) != MEM)
1574 abort ();
1575
1576 set_nonvarying_address_components (XEXP (x, 0), GET_MODE_SIZE (GET_MODE (x)),
1577 &base, &start, &end);
1578
1579 for (i = 0; i < NBUCKETS; i++)
1580 {
1581 register struct table_elt *next;
1582 for (p = table[i]; p; p = next)
1583 {
1584 next = p->next_same_hash;
1585 if (refers_to_mem_p (p->exp, base, start, end))
1586 remove_from_table (p, i);
1587 }
1588 }
1589 }
1590
1591 /* Remove all expressions that refer to register REGNO,
1592 since they are already invalid, and we are about to
1593 mark that register valid again and don't want the old
1594 expressions to reappear as valid. */
1595
1596 static void
1597 remove_invalid_refs (regno)
1598 int regno;
1599 {
1600 register int i;
1601 register struct table_elt *p, *next;
1602
1603 for (i = 0; i < NBUCKETS; i++)
1604 for (p = table[i]; p; p = next)
1605 {
1606 next = p->next_same_hash;
1607 if (GET_CODE (p->exp) != REG
1608 && refers_to_regno_p (regno, regno + 1, p->exp, NULL_PTR))
1609 remove_from_table (p, i);
1610 }
1611 }
1612 \f
1613 /* Recompute the hash codes of any valid entries in the hash table that
1614 reference X, if X is a register, or SUBREG_REG (X) if X is a SUBREG.
1615
1616 This is called when we make a jump equivalence. */
1617
1618 static void
1619 rehash_using_reg (x)
1620 rtx x;
1621 {
1622 int i;
1623 struct table_elt *p, *next;
1624 unsigned hash;
1625
1626 if (GET_CODE (x) == SUBREG)
1627 x = SUBREG_REG (x);
1628
1629 /* If X is not a register or if the register is known not to be in any
1630 valid entries in the table, we have no work to do. */
1631
1632 if (GET_CODE (x) != REG
1633 || reg_in_table[REGNO (x)] < 0
1634 || reg_in_table[REGNO (x)] != reg_tick[REGNO (x)])
1635 return;
1636
1637 /* Scan all hash chains looking for valid entries that mention X.
1638 If we find one and it is in the wrong hash chain, move it. We can skip
1639 objects that are registers, since they are handled specially. */
1640
1641 for (i = 0; i < NBUCKETS; i++)
1642 for (p = table[i]; p; p = next)
1643 {
1644 next = p->next_same_hash;
1645 if (GET_CODE (p->exp) != REG && reg_mentioned_p (x, p->exp)
1646 && exp_equiv_p (p->exp, p->exp, 1, 0)
1647 && i != (hash = safe_hash (p->exp, p->mode) % NBUCKETS))
1648 {
1649 if (p->next_same_hash)
1650 p->next_same_hash->prev_same_hash = p->prev_same_hash;
1651
1652 if (p->prev_same_hash)
1653 p->prev_same_hash->next_same_hash = p->next_same_hash;
1654 else
1655 table[i] = p->next_same_hash;
1656
1657 p->next_same_hash = table[hash];
1658 p->prev_same_hash = 0;
1659 if (table[hash])
1660 table[hash]->prev_same_hash = p;
1661 table[hash] = p;
1662 }
1663 }
1664 }
1665 \f
1666 /* Remove from the hash table all expressions that reference memory,
1667 or some of them as specified by *WRITES. */
1668
1669 static void
1670 invalidate_memory (writes)
1671 struct write_data *writes;
1672 {
1673 register int i;
1674 register struct table_elt *p, *next;
1675 int all = writes->all;
1676 int nonscalar = writes->nonscalar;
1677
1678 for (i = 0; i < NBUCKETS; i++)
1679 for (p = table[i]; p; p = next)
1680 {
1681 next = p->next_same_hash;
1682 if (p->in_memory
1683 && (all
1684 || (nonscalar && p->in_struct)
1685 || cse_rtx_addr_varies_p (p->exp)))
1686 remove_from_table (p, i);
1687 }
1688 }
1689 \f
1690 /* Remove from the hash table any expression that overlaps a call-clobbered
1691    register.  Also update the TICK values of the clobbered registers. */
1692
1693 static void
1694 invalidate_for_call ()
1695 {
1696 int regno, endregno;
1697 int i;
1698 unsigned hash;
1699 struct table_elt *p, *next;
1700 int in_table = 0;
1701
1702 /* Go through all the hard registers. For each that is clobbered in
1703 a CALL_INSN, remove the register from quantity chains and update
1704 reg_tick if defined. Also see if any of these registers is currently
1705 in the table. */
1706
1707 for (regno = 0; regno < FIRST_PSEUDO_REGISTER; regno++)
1708 if (TEST_HARD_REG_BIT (regs_invalidated_by_call, regno))
1709 {
1710 delete_reg_equiv (regno);
1711 if (reg_tick[regno] >= 0)
1712 reg_tick[regno]++;
1713
1714 in_table |= TEST_HARD_REG_BIT (hard_regs_in_table, regno);
1715 }
1716
1717 /* In the case where we have no call-clobbered hard registers in the
1718 table, we are done. Otherwise, scan the table and remove any
1719 entry that overlaps a call-clobbered register. */
1720
1721 if (in_table)
1722 for (hash = 0; hash < NBUCKETS; hash++)
1723 for (p = table[hash]; p; p = next)
1724 {
1725 next = p->next_same_hash;
1726
1727 if (GET_CODE (p->exp) != REG
1728 || REGNO (p->exp) >= FIRST_PSEUDO_REGISTER)
1729 continue;
1730
1731 regno = REGNO (p->exp);
1732 endregno = regno + HARD_REGNO_NREGS (regno, GET_MODE (p->exp));
1733
1734 for (i = regno; i < endregno; i++)
1735 if (TEST_HARD_REG_BIT (regs_invalidated_by_call, i))
1736 {
1737 remove_from_table (p, hash);
1738 break;
1739 }
1740 }
1741 }
1742 \f
1743 /* Given an expression X of type CONST,
1744 and ELT which is its table entry (or 0 if it
1745 is not in the hash table),
1746 return an alternate expression for X as a register plus integer.
1747 If none can be found, return 0. */
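/* As an illustration (made-up symbol and register): if X is
   (const (plus (symbol_ref "s") (const_int 8))) and the table records that
   register R holds (const (plus (symbol_ref "s") (const_int 4))), this
   returns (plus R (const_int 4)), i.e. OFFSET is 8 - 4 = 4.  */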
1748
1749 static rtx
1750 use_related_value (x, elt)
1751 rtx x;
1752 struct table_elt *elt;
1753 {
1754 register struct table_elt *relt = 0;
1755 register struct table_elt *p, *q;
1756 HOST_WIDE_INT offset;
1757
1758 /* First, is there anything related known?
1759 If we have a table element, we can tell from that.
1760 Otherwise, must look it up. */
1761
1762 if (elt != 0 && elt->related_value != 0)
1763 relt = elt;
1764 else if (elt == 0 && GET_CODE (x) == CONST)
1765 {
1766 rtx subexp = get_related_value (x);
1767 if (subexp != 0)
1768 relt = lookup (subexp,
1769 safe_hash (subexp, GET_MODE (subexp)) % NBUCKETS,
1770 GET_MODE (subexp));
1771 }
1772
1773 if (relt == 0)
1774 return 0;
1775
1776 /* Search all related table entries for one that has an
1777 equivalent register. */
1778
1779 p = relt;
1780 while (1)
1781 {
1782 /* This loop is strange in that it is executed in two different cases.
1783 The first is when X is already in the table. Then it is searching
1784 the RELATED_VALUE list of X's class (RELT). The second case is when
1785 X is not in the table. Then RELT points to a class for the related
1786 value.
1787
1788       Ensure that, whatever case we are in, we ignore classes that have
1789 the same value as X. */
1790
1791 if (rtx_equal_p (x, p->exp))
1792 q = 0;
1793 else
1794 for (q = p->first_same_value; q; q = q->next_same_value)
1795 if (GET_CODE (q->exp) == REG)
1796 break;
1797
1798 if (q)
1799 break;
1800
1801 p = p->related_value;
1802
1803 /* We went all the way around, so there is nothing to be found.
1804 Alternatively, perhaps RELT was in the table for some other reason
1805 and it has no related values recorded. */
1806 if (p == relt || p == 0)
1807 break;
1808 }
1809
1810 if (q == 0)
1811 return 0;
1812
1813 offset = (get_integer_term (x) - get_integer_term (p->exp));
1814   /* Note: OFFSET may be 0 if P->exp and X are related by commutativity. */
1815 return plus_constant (q->exp, offset);
1816 }
1817 \f
1818 /* Hash an rtx. We are careful to make sure the value is never negative.
1819 Equivalent registers hash identically.
1820 MODE is used in hashing for CONST_INTs only;
1821 otherwise the mode of X is used.
1822
1823 Store 1 in do_not_record if any subexpression is volatile.
1824
1825 Store 1 in hash_arg_in_memory if X contains a MEM rtx
1826 which does not have the RTX_UNCHANGING_P bit set.
1827 In this case, also store 1 in hash_arg_in_struct
1828 if there is a MEM rtx which has the MEM_IN_STRUCT_P bit set.
1829
1830 Note that cse_insn knows that the hash code of a MEM expression
1831 is just (int) MEM plus the hash code of the address. */
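/* As a concrete illustration of "equivalent registers hash identically"
   (register numbers invented): a REG is hashed through reg_qty rather than
   its register number, so (plus (reg 66) (const_int 4)) and
   (plus (reg 70) (const_int 4)) fall into the same bucket whenever regs
   66 and 70 share a quantity.  */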
1832
1833 static unsigned
1834 canon_hash (x, mode)
1835 rtx x;
1836 enum machine_mode mode;
1837 {
1838 register int i, j;
1839 register unsigned hash = 0;
1840 register enum rtx_code code;
1841 register char *fmt;
1842
1843 /* repeat is used to turn tail-recursion into iteration. */
1844 repeat:
1845 if (x == 0)
1846 return hash;
1847
1848 code = GET_CODE (x);
1849 switch (code)
1850 {
1851 case REG:
1852 {
1853 register int regno = REGNO (x);
1854
1855 /* On some machines, we can't record any non-fixed hard register,
1856 because extending its life will cause reload problems. We
1857 consider ap, fp, and sp to be fixed for this purpose.
1858 On all machines, we can't record any global registers. */
1859
1860 if (regno < FIRST_PSEUDO_REGISTER
1861 && (global_regs[regno]
1862 #ifdef SMALL_REGISTER_CLASSES
1863 || (! fixed_regs[regno]
1864 && regno != FRAME_POINTER_REGNUM
1865 && regno != HARD_FRAME_POINTER_REGNUM
1866 && regno != ARG_POINTER_REGNUM
1867 && regno != STACK_POINTER_REGNUM)
1868 #endif
1869 ))
1870 {
1871 do_not_record = 1;
1872 return 0;
1873 }
1874 hash += ((unsigned) REG << 7) + (unsigned) reg_qty[regno];
1875 return hash;
1876 }
1877
1878 case CONST_INT:
1879 {
1880 unsigned HOST_WIDE_INT tem = INTVAL (x);
1881 hash += ((unsigned) CONST_INT << 7) + (unsigned) mode + tem;
1882 return hash;
1883 }
1884
1885 case CONST_DOUBLE:
1886 /* This is like the general case, except that it only counts
1887 the integers representing the constant. */
1888 hash += (unsigned) code + (unsigned) GET_MODE (x);
1889 for (i = 2; i < GET_RTX_LENGTH (CONST_DOUBLE); i++)
1890 {
1891 unsigned tem = XINT (x, i);
1892 hash += tem;
1893 }
1894 return hash;
1895
1896 /* Assume there is only one rtx object for any given label. */
1897 case LABEL_REF:
1898 hash
1899 += ((unsigned) LABEL_REF << 7) + (unsigned HOST_WIDE_INT) XEXP (x, 0);
1900 return hash;
1901
1902 case SYMBOL_REF:
1903 hash
1904 += ((unsigned) SYMBOL_REF << 7) + (unsigned HOST_WIDE_INT) XSTR (x, 0);
1905 return hash;
1906
1907 case MEM:
1908 if (MEM_VOLATILE_P (x))
1909 {
1910 do_not_record = 1;
1911 return 0;
1912 }
1913 if (! RTX_UNCHANGING_P (x))
1914 {
1915 hash_arg_in_memory = 1;
1916 if (MEM_IN_STRUCT_P (x)) hash_arg_in_struct = 1;
1917 }
1918 /* Now that we have already found this special case,
1919 might as well speed it up as much as possible. */
1920 hash += (unsigned) MEM;
1921 x = XEXP (x, 0);
1922 goto repeat;
1923
1924 case PRE_DEC:
1925 case PRE_INC:
1926 case POST_DEC:
1927 case POST_INC:
1928 case PC:
1929 case CC0:
1930 case CALL:
1931 case UNSPEC_VOLATILE:
1932 do_not_record = 1;
1933 return 0;
1934
1935 case ASM_OPERANDS:
1936 if (MEM_VOLATILE_P (x))
1937 {
1938 do_not_record = 1;
1939 return 0;
1940 }
1941 }
1942
1943 i = GET_RTX_LENGTH (code) - 1;
1944 hash += (unsigned) code + (unsigned) GET_MODE (x);
1945 fmt = GET_RTX_FORMAT (code);
1946 for (; i >= 0; i--)
1947 {
1948 if (fmt[i] == 'e')
1949 {
1950 rtx tem = XEXP (x, i);
1951 rtx tem1;
1952
1953 /* If the operand is a REG that is equivalent to a constant, hash
1954 as if we were hashing the constant, since we will be comparing
1955 that way. */
1956 if (tem != 0 && GET_CODE (tem) == REG
1957 && REGNO_QTY_VALID_P (REGNO (tem))
1958 && qty_mode[reg_qty[REGNO (tem)]] == GET_MODE (tem)
1959 && (tem1 = qty_const[reg_qty[REGNO (tem)]]) != 0
1960 && CONSTANT_P (tem1))
1961 tem = tem1;
1962
1963 /* If we are about to do the last recursive call
1964 needed at this level, change it into iteration.
1965 This function is called enough to be worth it. */
1966 if (i == 0)
1967 {
1968 x = tem;
1969 goto repeat;
1970 }
1971 hash += canon_hash (tem, 0);
1972 }
1973 else if (fmt[i] == 'E')
1974 for (j = 0; j < XVECLEN (x, i); j++)
1975 hash += canon_hash (XVECEXP (x, i, j), 0);
1976 else if (fmt[i] == 's')
1977 {
1978 register unsigned char *p = (unsigned char *) XSTR (x, i);
1979 if (p)
1980 while (*p)
1981 hash += *p++;
1982 }
1983 else if (fmt[i] == 'i')
1984 {
1985 register unsigned tem = XINT (x, i);
1986 hash += tem;
1987 }
1988 else
1989 abort ();
1990 }
1991 return hash;
1992 }
1993
1994 /* Like canon_hash but with no side effects. */
1995
1996 static unsigned
1997 safe_hash (x, mode)
1998 rtx x;
1999 enum machine_mode mode;
2000 {
2001 int save_do_not_record = do_not_record;
2002 int save_hash_arg_in_memory = hash_arg_in_memory;
2003 int save_hash_arg_in_struct = hash_arg_in_struct;
2004 unsigned hash = canon_hash (x, mode);
2005 hash_arg_in_memory = save_hash_arg_in_memory;
2006 hash_arg_in_struct = save_hash_arg_in_struct;
2007 do_not_record = save_do_not_record;
2008 return hash;
2009 }
2010 \f
2011 /* Return 1 iff X and Y would canonicalize into the same thing,
2012 without actually constructing the canonicalization of either one.
2013 If VALIDATE is nonzero,
2014 we assume X is an expression being processed from the rtl
2015 and Y was found in the hash table. We check register refs
2016 in Y for being marked as valid.
2017
2018 If EQUAL_VALUES is nonzero, we allow a register to match a constant value
2019 that is known to be in the register. Ordinarily, we don't allow them
2020 to match, because letting them match would cause unpredictable results
2021 in all the places that search a hash table chain for an equivalent
2022 for a given value. A possible equivalent that has different structure
2023 has its hash code computed from different data. Whether the hash code
2024    is the same as that of the given value is pure luck. */
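/* For example (register number invented): with EQUAL_VALUES nonzero,
   (const_int 4) can match (reg 66) provided qty_const records that the
   register currently holds 4 in the register's own mode, and, if VALIDATE
   is set, the register's table entries are still valid.  */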
2025
2026 static int
2027 exp_equiv_p (x, y, validate, equal_values)
2028 rtx x, y;
2029 int validate;
2030 int equal_values;
2031 {
2032 register int i, j;
2033 register enum rtx_code code;
2034 register char *fmt;
2035
2036 /* Note: it is incorrect to assume an expression is equivalent to itself
2037 if VALIDATE is nonzero. */
2038 if (x == y && !validate)
2039 return 1;
2040 if (x == 0 || y == 0)
2041 return x == y;
2042
2043 code = GET_CODE (x);
2044 if (code != GET_CODE (y))
2045 {
2046 if (!equal_values)
2047 return 0;
2048
2049 /* If X is a constant and Y is a register or vice versa, they may be
2050 equivalent. We only have to validate if Y is a register. */
2051 if (CONSTANT_P (x) && GET_CODE (y) == REG
2052 && REGNO_QTY_VALID_P (REGNO (y))
2053 && GET_MODE (y) == qty_mode[reg_qty[REGNO (y)]]
2054 && rtx_equal_p (x, qty_const[reg_qty[REGNO (y)]])
2055 && (! validate || reg_in_table[REGNO (y)] == reg_tick[REGNO (y)]))
2056 return 1;
2057
2058 if (CONSTANT_P (y) && code == REG
2059 && REGNO_QTY_VALID_P (REGNO (x))
2060 && GET_MODE (x) == qty_mode[reg_qty[REGNO (x)]]
2061 && rtx_equal_p (y, qty_const[reg_qty[REGNO (x)]]))
2062 return 1;
2063
2064 return 0;
2065 }
2066
2067 /* (MULT:SI x y) and (MULT:HI x y) are NOT equivalent. */
2068 if (GET_MODE (x) != GET_MODE (y))
2069 return 0;
2070
2071 switch (code)
2072 {
2073 case PC:
2074 case CC0:
2075 return x == y;
2076
2077 case CONST_INT:
2078 return INTVAL (x) == INTVAL (y);
2079
2080 case LABEL_REF:
2081 return XEXP (x, 0) == XEXP (y, 0);
2082
2083 case SYMBOL_REF:
2084 return XSTR (x, 0) == XSTR (y, 0);
2085
2086 case REG:
2087 {
2088 int regno = REGNO (y);
2089 int endregno
2090 = regno + (regno >= FIRST_PSEUDO_REGISTER ? 1
2091 : HARD_REGNO_NREGS (regno, GET_MODE (y)));
2092 int i;
2093
2094 /* If the quantities are not the same, the expressions are not
2095        equivalent.  If they are and we are not to validate, they
2096 are equivalent. Otherwise, ensure all regs are up-to-date. */
2097
2098 if (reg_qty[REGNO (x)] != reg_qty[regno])
2099 return 0;
2100
2101 if (! validate)
2102 return 1;
2103
2104 for (i = regno; i < endregno; i++)
2105 if (reg_in_table[i] != reg_tick[i])
2106 return 0;
2107
2108 return 1;
2109 }
2110
2111 /* For commutative operations, check both orders. */
2112 case PLUS:
2113 case MULT:
2114 case AND:
2115 case IOR:
2116 case XOR:
2117 case NE:
2118 case EQ:
2119 return ((exp_equiv_p (XEXP (x, 0), XEXP (y, 0), validate, equal_values)
2120 && exp_equiv_p (XEXP (x, 1), XEXP (y, 1),
2121 validate, equal_values))
2122 || (exp_equiv_p (XEXP (x, 0), XEXP (y, 1),
2123 validate, equal_values)
2124 && exp_equiv_p (XEXP (x, 1), XEXP (y, 0),
2125 validate, equal_values)));
2126 }
2127
2128 /* Compare the elements. If any pair of corresponding elements
2129    fail to match, return 0 for the whole thing. */
2130
2131 fmt = GET_RTX_FORMAT (code);
2132 for (i = GET_RTX_LENGTH (code) - 1; i >= 0; i--)
2133 {
2134 switch (fmt[i])
2135 {
2136 case 'e':
2137 if (! exp_equiv_p (XEXP (x, i), XEXP (y, i), validate, equal_values))
2138 return 0;
2139 break;
2140
2141 case 'E':
2142 if (XVECLEN (x, i) != XVECLEN (y, i))
2143 return 0;
2144 for (j = 0; j < XVECLEN (x, i); j++)
2145 if (! exp_equiv_p (XVECEXP (x, i, j), XVECEXP (y, i, j),
2146 validate, equal_values))
2147 return 0;
2148 break;
2149
2150 case 's':
2151 if (strcmp (XSTR (x, i), XSTR (y, i)))
2152 return 0;
2153 break;
2154
2155 case 'i':
2156 if (XINT (x, i) != XINT (y, i))
2157 return 0;
2158 break;
2159
2160 case 'w':
2161 if (XWINT (x, i) != XWINT (y, i))
2162 return 0;
2163 break;
2164
2165 case '0':
2166 break;
2167
2168 default:
2169 abort ();
2170 }
2171 }
2172
2173 return 1;
2174 }
2175 \f
2176 /* Return 1 iff any subexpression of X matches Y.
2177 Here we do not require that X or Y be valid (for registers referred to)
2178 for being in the hash table. */
2179
2180 static int
2181 refers_to_p (x, y)
2182 rtx x, y;
2183 {
2184 register int i;
2185 register enum rtx_code code;
2186 register char *fmt;
2187
2188 repeat:
2189 if (x == y)
2190 return 1;
2191 if (x == 0 || y == 0)
2192 return 0;
2193
2194 code = GET_CODE (x);
2195 /* If X as a whole has the same code as Y, they may match.
2196 If so, return 1. */
2197 if (code == GET_CODE (y))
2198 {
2199 if (exp_equiv_p (x, y, 0, 1))
2200 return 1;
2201 }
2202
2203 /* X does not match, so try its subexpressions. */
2204
2205 fmt = GET_RTX_FORMAT (code);
2206 for (i = GET_RTX_LENGTH (code) - 1; i >= 0; i--)
2207 if (fmt[i] == 'e')
2208 {
2209 if (i == 0)
2210 {
2211 x = XEXP (x, 0);
2212 goto repeat;
2213 }
2214 else
2215 if (refers_to_p (XEXP (x, i), y))
2216 return 1;
2217 }
2218 else if (fmt[i] == 'E')
2219 {
2220 int j;
2221 for (j = 0; j < XVECLEN (x, i); j++)
2222 if (refers_to_p (XVECEXP (x, i, j), y))
2223 return 1;
2224 }
2225
2226 return 0;
2227 }
2228 \f
2229 /* Given ADDR and SIZE (a memory address, and the size of the memory reference),
2230 set PBASE, PSTART, and PEND which correspond to the base of the address,
2231 the starting offset, and ending offset respectively.
2232
2233 ADDR is known to be a nonvarying address.
2234
2235 cse_address_varies_p returns zero for nonvarying addresses. */
2236
2237 static void
2238 set_nonvarying_address_components (addr, size, pbase, pstart, pend)
2239 rtx addr;
2240 int size;
2241 rtx *pbase;
2242 HOST_WIDE_INT *pstart, *pend;
2243 {
2244 rtx base;
2245 HOST_WIDE_INT start, end;
2246
2247 base = addr;
2248 start = 0;
2249 end = 0;
2250
2251 /* Registers with nonvarying addresses usually have constant equivalents;
2252 but the frame pointer register is also possible. */
2253 if (GET_CODE (base) == REG
2254 && qty_const != 0
2255 && REGNO_QTY_VALID_P (REGNO (base))
2256 && qty_mode[reg_qty[REGNO (base)]] == GET_MODE (base)
2257 && qty_const[reg_qty[REGNO (base)]] != 0)
2258 base = qty_const[reg_qty[REGNO (base)]];
2259 else if (GET_CODE (base) == PLUS
2260 && GET_CODE (XEXP (base, 1)) == CONST_INT
2261 && GET_CODE (XEXP (base, 0)) == REG
2262 && qty_const != 0
2263 && REGNO_QTY_VALID_P (REGNO (XEXP (base, 0)))
2264 && (qty_mode[reg_qty[REGNO (XEXP (base, 0))]]
2265 == GET_MODE (XEXP (base, 0)))
2266 && qty_const[reg_qty[REGNO (XEXP (base, 0))]])
2267 {
2268 start = INTVAL (XEXP (base, 1));
2269 base = qty_const[reg_qty[REGNO (XEXP (base, 0))]];
2270 }
2271
2272 /* Handle everything that we can find inside an address that has been
2273 viewed as constant. */
2274
2275 while (1)
2276 {
2277 /* If no part of this switch does a "continue", the code outside
2278 will exit this loop. */
2279
2280 switch (GET_CODE (base))
2281 {
2282 case LO_SUM:
2283 /* By definition, operand1 of a LO_SUM is the associated constant
2284 address. Use the associated constant address as the base
2285 instead. */
2286 base = XEXP (base, 1);
2287 continue;
2288
2289 case CONST:
2290 /* Strip off CONST. */
2291 base = XEXP (base, 0);
2292 continue;
2293
2294 case PLUS:
2295 if (GET_CODE (XEXP (base, 1)) == CONST_INT)
2296 {
2297 start += INTVAL (XEXP (base, 1));
2298 base = XEXP (base, 0);
2299 continue;
2300 }
2301 break;
2302
2303 case AND:
2304 /* Handle the case of an AND which is the negative of a power of
2305 two. This is used to represent unaligned memory operations. */
2306 if (GET_CODE (XEXP (base, 1)) == CONST_INT
2307 && exact_log2 (- INTVAL (XEXP (base, 1))) > 0)
2308 {
2309 set_nonvarying_address_components (XEXP (base, 0), size,
2310 pbase, pstart, pend);
2311
2312 /* Assume the worst misalignment. START is affected, but not
2313 	     END, so compensate by adjusting SIZE.  Don't lose any
2314 constant we already had. */
2315
2316 size = *pend - *pstart - INTVAL (XEXP (base, 1)) - 1;
2317 start += *pstart - INTVAL (XEXP (base, 1)) - 1;
2318 base = *pbase;
2319 }
2320 break;
2321 }
2322
2323 break;
2324 }
2325
2326 end = start + size;
2327
2328 /* Set the return values. */
2329 *pbase = base;
2330 *pstart = start;
2331 *pend = end;
2332 }
2333
2334 /* Return 1 iff any subexpression of X refers to memory
2335 at an address of BASE plus some offset
2336 such that any of the bytes' offsets fall between START (inclusive)
2337 and END (exclusive).
2338
2339 The value is undefined if X is a varying address (as determined by
2340 cse_rtx_addr_varies_p). This function is not used in such cases.
2341
2342 When used in the cse pass, `qty_const' is nonzero, and it is used
2343 to treat an address that is a register with a known constant value
2344 as if it were that constant value.
2345 In the loop pass, `qty_const' is zero, so this is not done. */
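/* For example, with START 8 and END 12, a 4-byte MEM at offset 10 from
   BASE overlaps: its bytes are 10..13, and 14 > 8 && 10 < 12.  A MEM at
   offset 12 does not overlap, since END is exclusive.  */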
2346
2347 static int
2348 refers_to_mem_p (x, base, start, end)
2349 rtx x, base;
2350 HOST_WIDE_INT start, end;
2351 {
2352 register HOST_WIDE_INT i;
2353 register enum rtx_code code;
2354 register char *fmt;
2355
2356 if (GET_CODE (base) == CONST_INT)
2357 {
2358 start += INTVAL (base);
2359 end += INTVAL (base);
2360 base = const0_rtx;
2361 }
2362
2363 repeat:
2364 if (x == 0)
2365 return 0;
2366
2367 code = GET_CODE (x);
2368 if (code == MEM)
2369 {
2370 register rtx addr = XEXP (x, 0); /* Get the address. */
2371 rtx mybase;
2372 HOST_WIDE_INT mystart, myend;
2373
2374 set_nonvarying_address_components (addr, GET_MODE_SIZE (GET_MODE (x)),
2375 &mybase, &mystart, &myend);
2376
2378 /* refers_to_mem_p is never called with varying addresses.
2379 If the base addresses are not equal, there is no chance
2380 of the memory addresses conflicting. */
2381 if (! rtx_equal_p (mybase, base))
2382 return 0;
2383
2384 return myend > start && mystart < end;
2385 }
2386
2387 /* X does not match, so try its subexpressions. */
2388
2389 fmt = GET_RTX_FORMAT (code);
2390 for (i = GET_RTX_LENGTH (code) - 1; i >= 0; i--)
2391 if (fmt[i] == 'e')
2392 {
2393 if (i == 0)
2394 {
2395 x = XEXP (x, 0);
2396 goto repeat;
2397 }
2398 else
2399 if (refers_to_mem_p (XEXP (x, i), base, start, end))
2400 return 1;
2401 }
2402 else if (fmt[i] == 'E')
2403 {
2404 int j;
2405 for (j = 0; j < XVECLEN (x, i); j++)
2406 if (refers_to_mem_p (XVECEXP (x, i, j), base, start, end))
2407 return 1;
2408 }
2409
2410 return 0;
2411 }
2412
2413 /* Nonzero if X refers to memory at a varying address;
2414    except that a register which currently has a known constant value
2415 isn't considered variable. */
2416
2417 static int
2418 cse_rtx_addr_varies_p (x)
2419 rtx x;
2420 {
2421 /* We need not check for X and the equivalence class being of the same
2422 mode because if X is equivalent to a constant in some mode, it
2423 doesn't vary in any mode. */
2424
2425 if (GET_CODE (x) == MEM
2426 && GET_CODE (XEXP (x, 0)) == REG
2427 && REGNO_QTY_VALID_P (REGNO (XEXP (x, 0)))
2428 && GET_MODE (XEXP (x, 0)) == qty_mode[reg_qty[REGNO (XEXP (x, 0))]]
2429 && qty_const[reg_qty[REGNO (XEXP (x, 0))]] != 0)
2430 return 0;
2431
2432 if (GET_CODE (x) == MEM
2433 && GET_CODE (XEXP (x, 0)) == PLUS
2434 && GET_CODE (XEXP (XEXP (x, 0), 1)) == CONST_INT
2435 && GET_CODE (XEXP (XEXP (x, 0), 0)) == REG
2436 && REGNO_QTY_VALID_P (REGNO (XEXP (XEXP (x, 0), 0)))
2437 && (GET_MODE (XEXP (XEXP (x, 0), 0))
2438 == qty_mode[reg_qty[REGNO (XEXP (XEXP (x, 0), 0))]])
2439 && qty_const[reg_qty[REGNO (XEXP (XEXP (x, 0), 0))]])
2440 return 0;
2441
2442 return rtx_addr_varies_p (x);
2443 }
2444 \f
2445 /* Canonicalize an expression:
2446 replace each register reference inside it
2447 with the "oldest" equivalent register.
2448
2449 If INSN is non-zero and we are replacing a pseudo with a hard register
2450 or vice versa, validate_change is used to ensure that INSN remains valid
2451 after we make our substitution. The calls are made with IN_GROUP non-zero
2452 so apply_change_group must be called upon the outermost return from this
2453 function (unless INSN is zero). The result of apply_change_group can
2454 generally be discarded since the changes we are making are optional. */
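/* For example (register numbers invented): if pseudo 70 is in the same
   quantity as pseudo 66, and 66 is the first (oldest) register of that
   quantity, (plus (reg 70) (const_int 4)) is rewritten as
   (plus (reg 66) (const_int 4)), making equivalent expressions textually
   identical.  */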
2455
2456 static rtx
2457 canon_reg (x, insn)
2458 rtx x;
2459 rtx insn;
2460 {
2461 register int i;
2462 register enum rtx_code code;
2463 register char *fmt;
2464
2465 if (x == 0)
2466 return x;
2467
2468 code = GET_CODE (x);
2469 switch (code)
2470 {
2471 case PC:
2472 case CC0:
2473 case CONST:
2474 case CONST_INT:
2475 case CONST_DOUBLE:
2476 case SYMBOL_REF:
2477 case LABEL_REF:
2478 case ADDR_VEC:
2479 case ADDR_DIFF_VEC:
2480 return x;
2481
2482 case REG:
2483 {
2484 register int first;
2485
2486 /* Never replace a hard reg, because hard regs can appear
2487 in more than one machine mode, and we must preserve the mode
2488 of each occurrence. Also, some hard regs appear in
2489 MEMs that are shared and mustn't be altered. Don't try to
2490 replace any reg that maps to a reg of class NO_REGS. */
2491 if (REGNO (x) < FIRST_PSEUDO_REGISTER
2492 || ! REGNO_QTY_VALID_P (REGNO (x)))
2493 return x;
2494
2495 first = qty_first_reg[reg_qty[REGNO (x)]];
2496 return (first >= FIRST_PSEUDO_REGISTER ? regno_reg_rtx[first]
2497 : REGNO_REG_CLASS (first) == NO_REGS ? x
2498 : gen_rtx (REG, qty_mode[reg_qty[REGNO (x)]], first));
2499 }
2500 }
2501
2502 fmt = GET_RTX_FORMAT (code);
2503 for (i = GET_RTX_LENGTH (code) - 1; i >= 0; i--)
2504 {
2505 register int j;
2506
2507 if (fmt[i] == 'e')
2508 {
2509 rtx new = canon_reg (XEXP (x, i), insn);
2510
2511 /* If replacing pseudo with hard reg or vice versa, ensure the
2512 insn remains valid. Likewise if the insn has MATCH_DUPs. */
2513 if (insn != 0 && new != 0
2514 && GET_CODE (new) == REG && GET_CODE (XEXP (x, i)) == REG
2515 && (((REGNO (new) < FIRST_PSEUDO_REGISTER)
2516 != (REGNO (XEXP (x, i)) < FIRST_PSEUDO_REGISTER))
2517 || insn_n_dups[recog_memoized (insn)] > 0))
2518 validate_change (insn, &XEXP (x, i), new, 1);
2519 else
2520 XEXP (x, i) = new;
2521 }
2522 else if (fmt[i] == 'E')
2523 for (j = 0; j < XVECLEN (x, i); j++)
2524 XVECEXP (x, i, j) = canon_reg (XVECEXP (x, i, j), insn);
2525 }
2526
2527 return x;
2528 }
2529 \f
2530 /* LOC is a location with INSN that is an operand address (the contents of
2531 a MEM). Find the best equivalent address to use that is valid for this
2532 insn.
2533
2534 On most CISC machines, complicated address modes are costly, and rtx_cost
2535 is a good approximation for that cost. However, most RISC machines have
2536 only a few (usually only one) memory reference formats. If an address is
2537 valid at all, it is often just as cheap as any other address. Hence, for
2538 RISC machines, we use the configuration macro `ADDRESS_COST' to compare the
2539 costs of various addresses. For two addresses of equal cost, choose the one
2540 with the highest `rtx_cost' value as that has the potential of eliminating
2541 the most insns. For equal costs, we choose the first in the equivalence
2542 class. Note that we ignore the fact that pseudo registers are cheaper
2543 than hard registers here because we would also prefer the pseudo registers.
2544 */
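/* As an illustration of the tie-breaking rule above (operands invented,
   and costs are target-specific): if (reg 65) and
   (plus (reg 66) (const_int 8)) are equivalent addresses with equal
   ADDRESS_COST, we pick the PLUS form, since its higher rtx_cost means
   that substituting it elsewhere may let the addition insn be deleted.  */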
2545
2546 static void
2547 find_best_addr (insn, loc)
2548 rtx insn;
2549 rtx *loc;
2550 {
2551 struct table_elt *elt, *p;
2552 rtx addr = *loc;
2553 int our_cost;
2554 int found_better = 1;
2555 int save_do_not_record = do_not_record;
2556 int save_hash_arg_in_memory = hash_arg_in_memory;
2557 int save_hash_arg_in_struct = hash_arg_in_struct;
2558 int addr_volatile;
2559 int regno;
2560 unsigned hash;
2561
2562 /* Do not try to replace constant addresses or addresses of local and
2563 argument slots. These MEM expressions are made only once and inserted
2564 in many instructions, as well as being used to control symbol table
2565 output. It is not safe to clobber them.
2566
2567 There are some uncommon cases where the address is already in a register
2568 for some reason, but we cannot take advantage of that because we have
2569 no easy way to unshare the MEM. In addition, looking up all stack
2570 addresses is costly. */
2571 if ((GET_CODE (addr) == PLUS
2572 && GET_CODE (XEXP (addr, 0)) == REG
2573 && GET_CODE (XEXP (addr, 1)) == CONST_INT
2574 && (regno = REGNO (XEXP (addr, 0)),
2575 regno == FRAME_POINTER_REGNUM || regno == HARD_FRAME_POINTER_REGNUM
2576 || regno == ARG_POINTER_REGNUM))
2577 || (GET_CODE (addr) == REG
2578 && (regno = REGNO (addr), regno == FRAME_POINTER_REGNUM
2579 || regno == HARD_FRAME_POINTER_REGNUM
2580 || regno == ARG_POINTER_REGNUM))
2581 || CONSTANT_ADDRESS_P (addr))
2582 return;
2583
2584 /* If this address is not simply a register, try to fold it. This will
2585 sometimes simplify the expression. Many simplifications
2586 will not be valid, but some, usually applying the associative rule, will
2587 be valid and produce better code. */
2588 if (GET_CODE (addr) != REG
2589 && validate_change (insn, loc, fold_rtx (addr, insn), 0))
2590 addr = *loc;
2591
2592 /* If this address is not in the hash table, we can't look for equivalences
2593 of the whole address. Also, ignore if volatile. */
2594
2595 do_not_record = 0;
2596 hash = HASH (addr, Pmode);
2597 addr_volatile = do_not_record;
2598 do_not_record = save_do_not_record;
2599 hash_arg_in_memory = save_hash_arg_in_memory;
2600 hash_arg_in_struct = save_hash_arg_in_struct;
2601
2602 if (addr_volatile)
2603 return;
2604
2605 elt = lookup (addr, hash, Pmode);
2606
2607 #ifndef ADDRESS_COST
2608 if (elt)
2609 {
2610 our_cost = elt->cost;
2611
2612 /* Find the lowest cost below ours that works. */
2613 for (elt = elt->first_same_value; elt; elt = elt->next_same_value)
2614 if (elt->cost < our_cost
2615 && (GET_CODE (elt->exp) == REG
2616 || exp_equiv_p (elt->exp, elt->exp, 1, 0))
2617 && validate_change (insn, loc,
2618 canon_reg (copy_rtx (elt->exp), NULL_RTX), 0))
2619 return;
2620 }
2621 #else
2622
2623 if (elt)
2624 {
2625 /* We need to find the best (under the criteria documented above) entry
2626 in the class that is valid. We use the `flag' field to indicate
2627 choices that were invalid and iterate until we can't find a better
2628 one that hasn't already been tried. */
2629
2630 for (p = elt->first_same_value; p; p = p->next_same_value)
2631 p->flag = 0;
2632
2633 while (found_better)
2634 {
2635 int best_addr_cost = ADDRESS_COST (*loc);
2636 int best_rtx_cost = (elt->cost + 1) >> 1;
2637 struct table_elt *best_elt = elt;
2638
2639 found_better = 0;
2640 for (p = elt->first_same_value; p; p = p->next_same_value)
2641 if (! p->flag
2642 && (GET_CODE (p->exp) == REG
2643 || exp_equiv_p (p->exp, p->exp, 1, 0))
2644 && (ADDRESS_COST (p->exp) < best_addr_cost
2645 || (ADDRESS_COST (p->exp) == best_addr_cost
2646 && (p->cost + 1) >> 1 > best_rtx_cost)))
2647 {
2648 found_better = 1;
2649 best_addr_cost = ADDRESS_COST (p->exp);
2650 best_rtx_cost = (p->cost + 1) >> 1;
2651 best_elt = p;
2652 }
2653
2654 if (found_better)
2655 {
2656 if (validate_change (insn, loc,
2657 canon_reg (copy_rtx (best_elt->exp),
2658 NULL_RTX), 0))
2659 return;
2660 else
2661 best_elt->flag = 1;
2662 }
2663 }
2664 }
2665
2666 /* If the address is a binary operation with the first operand a register
2667 and the second a constant, do the same as above, but looking for
2668 equivalences of the register. Then try to simplify before checking for
2669 the best address to use. This catches a few cases: First is when we
2670 have REG+const and the register is another REG+const. We can often merge
2671 the constants and eliminate one insn and one register. It may also be
2672 that a machine has a cheap REG+REG+const. Finally, this improves the
2673 code on the Alpha for unaligned byte stores. */
2674
2675 if (flag_expensive_optimizations
2676 && (GET_RTX_CLASS (GET_CODE (*loc)) == '2'
2677 || GET_RTX_CLASS (GET_CODE (*loc)) == 'c')
2678 && GET_CODE (XEXP (*loc, 0)) == REG
2679 && GET_CODE (XEXP (*loc, 1)) == CONST_INT)
2680 {
2681 rtx c = XEXP (*loc, 1);
2682
2683 do_not_record = 0;
2684 hash = HASH (XEXP (*loc, 0), Pmode);
2685 do_not_record = save_do_not_record;
2686 hash_arg_in_memory = save_hash_arg_in_memory;
2687 hash_arg_in_struct = save_hash_arg_in_struct;
2688
2689 elt = lookup (XEXP (*loc, 0), hash, Pmode);
2690 if (elt == 0)
2691 return;
2692
2693 /* We need to find the best (under the criteria documented above) entry
2694 in the class that is valid. We use the `flag' field to indicate
2695 choices that were invalid and iterate until we can't find a better
2696 one that hasn't already been tried. */
2697
2698 for (p = elt->first_same_value; p; p = p->next_same_value)
2699 p->flag = 0;
2700
2701 while (found_better)
2702 {
2703 int best_addr_cost = ADDRESS_COST (*loc);
2704 int best_rtx_cost = (COST (*loc) + 1) >> 1;
2705 struct table_elt *best_elt = elt;
2706 rtx best_rtx = *loc;
2707 int count;
2708
2709 	  /* This is, in the worst case, an O(n^2) algorithm, so limit our search
2710 to the first 32 elements on the list. This avoids trouble
2711 compiling code with very long basic blocks that can easily
2712 call cse_gen_binary so many times that we run out of memory. */
2713
2714 found_better = 0;
2715 for (p = elt->first_same_value, count = 0;
2716 p && count < 32;
2717 p = p->next_same_value, count++)
2718 if (! p->flag
2719 && (GET_CODE (p->exp) == REG
2720 || exp_equiv_p (p->exp, p->exp, 1, 0)))
2721 {
2722 rtx new = cse_gen_binary (GET_CODE (*loc), Pmode, p->exp, c);
2723
2724 if ((ADDRESS_COST (new) < best_addr_cost
2725 || (ADDRESS_COST (new) == best_addr_cost
2726 && (COST (new) + 1) >> 1 > best_rtx_cost)))
2727 {
2728 found_better = 1;
2729 best_addr_cost = ADDRESS_COST (new);
2730 best_rtx_cost = (COST (new) + 1) >> 1;
2731 best_elt = p;
2732 best_rtx = new;
2733 }
2734 }
2735
2736 if (found_better)
2737 {
2738 if (validate_change (insn, loc,
2739 canon_reg (copy_rtx (best_rtx),
2740 NULL_RTX), 0))
2741 return;
2742 else
2743 best_elt->flag = 1;
2744 }
2745 }
2746 }
2747 #endif
2748 }
2749 \f
2750 /* Given an operation (CODE, *PARG1, *PARG2), where CODE is a comparison
2751    operation (EQ, NE, GT, etc.), follow it back through the hash table to
2752    find what values are actually being compared.
2753
2754 *PARG1 and *PARG2 are updated to contain the rtx representing the values
2755 actually being compared. For example, if *PARG1 was (cc0) and *PARG2
2756 was (const_int 0), *PARG1 and *PARG2 will be set to the objects that were
2757 compared to produce cc0.
2758
2759    The return value is the comparison operator: either CODE itself, or the
2760    code corresponding to the inverse of the comparison. */
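/* For example (register numbers invented): on a machine whose compare
   instruction sets (reg 66) to STORE_FLAG_VALUE for (gt (reg 67) (reg 68)),
   a query about (eq (reg 66) (const_int 0)) comes back with
   *PARG1 == (reg 67), *PARG2 == (reg 68) and code LE, the inverse of GT.  */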
2761
2762 static enum rtx_code
2763 find_comparison_args (code, parg1, parg2, pmode1, pmode2)
2764 enum rtx_code code;
2765 rtx *parg1, *parg2;
2766 enum machine_mode *pmode1, *pmode2;
2767 {
2768 rtx arg1, arg2;
2769
2770 arg1 = *parg1, arg2 = *parg2;
2771
2772 /* If ARG2 is const0_rtx, see what ARG1 is equivalent to. */
2773
2774 while (arg2 == CONST0_RTX (GET_MODE (arg1)))
2775 {
2776 /* Set non-zero when we find something of interest. */
2777 rtx x = 0;
2778 int reverse_code = 0;
2779 struct table_elt *p = 0;
2780
2781 /* If arg1 is a COMPARE, extract the comparison arguments from it.
2782 On machines with CC0, this is the only case that can occur, since
2783 	 fold_rtx will return the COMPARE or the item being compared with zero
2784 when given CC0. */
2785
2786 if (GET_CODE (arg1) == COMPARE && arg2 == const0_rtx)
2787 x = arg1;
2788
2789 /* If ARG1 is a comparison operator and CODE is testing for
2790 STORE_FLAG_VALUE, get the inner arguments. */
2791
2792 else if (GET_RTX_CLASS (GET_CODE (arg1)) == '<')
2793 {
2794 if (code == NE
2795 || (GET_MODE_CLASS (GET_MODE (arg1)) == MODE_INT
2796 && code == LT && STORE_FLAG_VALUE == -1)
2797 #ifdef FLOAT_STORE_FLAG_VALUE
2798 || (GET_MODE_CLASS (GET_MODE (arg1)) == MODE_FLOAT
2799 && FLOAT_STORE_FLAG_VALUE < 0)
2800 #endif
2801 )
2802 x = arg1;
2803 else if (code == EQ
2804 || (GET_MODE_CLASS (GET_MODE (arg1)) == MODE_INT
2805 && code == GE && STORE_FLAG_VALUE == -1)
2806 #ifdef FLOAT_STORE_FLAG_VALUE
2807 || (GET_MODE_CLASS (GET_MODE (arg1)) == MODE_FLOAT
2808 && FLOAT_STORE_FLAG_VALUE < 0)
2809 #endif
2810 )
2811 x = arg1, reverse_code = 1;
2812 }
2813
2814 /* ??? We could also check for
2815
2816 (ne (and (eq (...) (const_int 1))) (const_int 0))
2817
2818 and related forms, but let's wait until we see them occurring. */
2819
2820 if (x == 0)
2821 /* Look up ARG1 in the hash table and see if it has an equivalence
2822 that lets us see what is being compared. */
2823 p = lookup (arg1, safe_hash (arg1, GET_MODE (arg1)) % NBUCKETS,
2824 GET_MODE (arg1));
2825 if (p) p = p->first_same_value;
2826
2827 for (; p; p = p->next_same_value)
2828 {
2829 enum machine_mode inner_mode = GET_MODE (p->exp);
2830
2831 /* If the entry isn't valid, skip it. */
2832 if (! exp_equiv_p (p->exp, p->exp, 1, 0))
2833 continue;
2834
2835 if (GET_CODE (p->exp) == COMPARE
2836 /* Another possibility is that this machine has a compare insn
2837 that includes the comparison code. In that case, ARG1 would
2838 be equivalent to a comparison operation that would set ARG1 to
2839 either STORE_FLAG_VALUE or zero. If this is an NE operation,
2840 		 CODE is the actual comparison being done; if it is an EQ,
2841 		 we must reverse CODE.  On machines with a negative value
2842 for STORE_FLAG_VALUE, also look at LT and GE operations. */
2843 || ((code == NE
2844 || (code == LT
2845 && GET_MODE_CLASS (inner_mode) == MODE_INT
2846 && (GET_MODE_BITSIZE (inner_mode)
2847 <= HOST_BITS_PER_WIDE_INT)
2848 && (STORE_FLAG_VALUE
2849 & ((HOST_WIDE_INT) 1
2850 << (GET_MODE_BITSIZE (inner_mode) - 1))))
2851 #ifdef FLOAT_STORE_FLAG_VALUE
2852 || (code == LT
2853 && GET_MODE_CLASS (inner_mode) == MODE_FLOAT
2854 && FLOAT_STORE_FLAG_VALUE < 0)
2855 #endif
2856 )
2857 && GET_RTX_CLASS (GET_CODE (p->exp)) == '<'))
2858 {
2859 x = p->exp;
2860 break;
2861 }
2862 else if ((code == EQ
2863 || (code == GE
2864 && GET_MODE_CLASS (inner_mode) == MODE_INT
2865 && (GET_MODE_BITSIZE (inner_mode)
2866 <= HOST_BITS_PER_WIDE_INT)
2867 && (STORE_FLAG_VALUE
2868 & ((HOST_WIDE_INT) 1
2869 << (GET_MODE_BITSIZE (inner_mode) - 1))))
2870 #ifdef FLOAT_STORE_FLAG_VALUE
2871 || (code == GE
2872 && GET_MODE_CLASS (inner_mode) == MODE_FLOAT
2873 && FLOAT_STORE_FLAG_VALUE < 0)
2874 #endif
2875 )
2876 && GET_RTX_CLASS (GET_CODE (p->exp)) == '<')
2877 {
2878 reverse_code = 1;
2879 x = p->exp;
2880 break;
2881 }
2882
2883 /* If this is fp + constant, the equivalent is a better operand since
2884 it may let us predict the value of the comparison. */
2885 else if (NONZERO_BASE_PLUS_P (p->exp))
2886 {
2887 arg1 = p->exp;
2888 continue;
2889 }
2890 }
2891
2892 /* If we didn't find a useful equivalence for ARG1, we are done.
2893 Otherwise, set up for the next iteration. */
2894 if (x == 0)
2895 break;
2896
2897 arg1 = XEXP (x, 0), arg2 = XEXP (x, 1);
2898 if (GET_RTX_CLASS (GET_CODE (x)) == '<')
2899 code = GET_CODE (x);
2900
2901 if (reverse_code)
2902 code = reverse_condition (code);
2903 }
2904
2905   /* Return our results.  Use the modes from before fold_rtx, because
2906      folding might produce a CONST_INT, whose VOIDmode would lose the mode. */
2907 *pmode1 = GET_MODE (arg1), *pmode2 = GET_MODE (arg2);
2908 *parg1 = fold_rtx (arg1, 0), *parg2 = fold_rtx (arg2, 0);
2909
2910 return code;
2911 }
2912 \f
2913 /* Try to simplify a unary operation CODE whose output mode is to be
2914 MODE with input operand OP whose mode was originally OP_MODE.
2915 Return zero if no simplification can be made. */
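/* For example, (neg:SI (const_int 5)) folds to (const_int -5), and a
   SImode ZERO_EXTEND of (const_int -1) with OP_MODE QImode folds to
   (const_int 255).  */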
2916
2917 rtx
2918 simplify_unary_operation (code, mode, op, op_mode)
2919 enum rtx_code code;
2920 enum machine_mode mode;
2921 rtx op;
2922 enum machine_mode op_mode;
2923 {
2924 register int width = GET_MODE_BITSIZE (mode);
2925
2926 /* The order of these tests is critical so that, for example, we don't
2927 check the wrong mode (input vs. output) for a conversion operation,
2928 such as FIX. At some point, this should be simplified. */
2929
2930 #if !defined(REAL_IS_NOT_DOUBLE) || defined(REAL_ARITHMETIC)
2931
2932 if (code == FLOAT && GET_MODE (op) == VOIDmode
2933 && (GET_CODE (op) == CONST_DOUBLE || GET_CODE (op) == CONST_INT))
2934 {
2935 HOST_WIDE_INT hv, lv;
2936 REAL_VALUE_TYPE d;
2937
2938 if (GET_CODE (op) == CONST_INT)
2939 lv = INTVAL (op), hv = INTVAL (op) < 0 ? -1 : 0;
2940 else
2941 lv = CONST_DOUBLE_LOW (op), hv = CONST_DOUBLE_HIGH (op);
2942
2943 #ifdef REAL_ARITHMETIC
2944 REAL_VALUE_FROM_INT (d, lv, hv);
2945 #else
2946 if (hv < 0)
2947 {
2948 d = (double) (~ hv);
2949 d *= ((double) ((HOST_WIDE_INT) 1 << (HOST_BITS_PER_WIDE_INT / 2))
2950 * (double) ((HOST_WIDE_INT) 1 << (HOST_BITS_PER_WIDE_INT / 2)));
2951 d += (double) (unsigned HOST_WIDE_INT) (~ lv);
2952 d = (- d - 1.0);
2953 }
2954 else
2955 {
2956 d = (double) hv;
2957 d *= ((double) ((HOST_WIDE_INT) 1 << (HOST_BITS_PER_WIDE_INT / 2))
2958 * (double) ((HOST_WIDE_INT) 1 << (HOST_BITS_PER_WIDE_INT / 2)));
2959 d += (double) (unsigned HOST_WIDE_INT) lv;
2960 }
2961 #endif /* REAL_ARITHMETIC */
2962
2963 return CONST_DOUBLE_FROM_REAL_VALUE (d, mode);
2964 }
2965 else if (code == UNSIGNED_FLOAT && GET_MODE (op) == VOIDmode
2966 && (GET_CODE (op) == CONST_DOUBLE || GET_CODE (op) == CONST_INT))
2967 {
2968 HOST_WIDE_INT hv, lv;
2969 REAL_VALUE_TYPE d;
2970
2971 if (GET_CODE (op) == CONST_INT)
2972 lv = INTVAL (op), hv = INTVAL (op) < 0 ? -1 : 0;
2973 else
2974 lv = CONST_DOUBLE_LOW (op), hv = CONST_DOUBLE_HIGH (op);
2975
2976 if (GET_MODE_BITSIZE (op_mode) >= HOST_BITS_PER_WIDE_INT * 2)
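	/* The operand fills both words, so there is nothing to mask.  */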
2977 ;
2978 else
2979 hv = 0, lv &= GET_MODE_MASK (op_mode);
2980
2981 #ifdef REAL_ARITHMETIC
2982 REAL_VALUE_FROM_UNSIGNED_INT (d, lv, hv);
2983 #else
2984
2985 d = (double) (unsigned HOST_WIDE_INT) hv;
2986 d *= ((double) ((HOST_WIDE_INT) 1 << (HOST_BITS_PER_WIDE_INT / 2))
2987 * (double) ((HOST_WIDE_INT) 1 << (HOST_BITS_PER_WIDE_INT / 2)));
2988 d += (double) (unsigned HOST_WIDE_INT) lv;
2989 #endif /* REAL_ARITHMETIC */
2990
2991 return CONST_DOUBLE_FROM_REAL_VALUE (d, mode);
2992 }
2993 #endif
2994
2995 if (GET_CODE (op) == CONST_INT
2996 && width <= HOST_BITS_PER_WIDE_INT && width > 0)
2997 {
2998 register HOST_WIDE_INT arg0 = INTVAL (op);
2999 register HOST_WIDE_INT val;
3000
3001 switch (code)
3002 {
3003 case NOT:
3004 val = ~ arg0;
3005 break;
3006
3007 case NEG:
3008 val = - arg0;
3009 break;
3010
3011 case ABS:
3012 val = (arg0 >= 0 ? arg0 : - arg0);
3013 break;
3014
3015 case FFS:
3016 	  /* Don't use ffs here.  Instead, get the low-order bit and then its
3017 	     number; e.g., arg0 == 12 (binary 1100) gives val == 3.  If arg0
	     is zero, exact_log2 returns -1 and val is 0, as desired. */
3018 arg0 &= GET_MODE_MASK (mode);
3019 val = exact_log2 (arg0 & (- arg0)) + 1;
3020 break;
3021
3022 case TRUNCATE:
3023 val = arg0;
3024 break;
3025
3026 case ZERO_EXTEND:
3027 if (op_mode == VOIDmode)
3028 op_mode = mode;
3029 if (GET_MODE_BITSIZE (op_mode) == HOST_BITS_PER_WIDE_INT)
3030 {
3031 /* If we were really extending the mode,
3032 we would have to distinguish between zero-extension
3033 and sign-extension. */
3034 if (width != GET_MODE_BITSIZE (op_mode))
3035 abort ();
3036 val = arg0;
3037 }
3038 else if (GET_MODE_BITSIZE (op_mode) < HOST_BITS_PER_WIDE_INT)
3039 val = arg0 & ~((HOST_WIDE_INT) (-1) << GET_MODE_BITSIZE (op_mode));
3040 else
3041 return 0;
3042 break;
3043
3044 case SIGN_EXTEND:
3045 if (op_mode == VOIDmode)
3046 op_mode = mode;
3047 if (GET_MODE_BITSIZE (op_mode) == HOST_BITS_PER_WIDE_INT)
3048 {
3049 /* If we were really extending the mode,
3050 we would have to distinguish between zero-extension
3051 and sign-extension. */
3052 if (width != GET_MODE_BITSIZE (op_mode))
3053 abort ();
3054 val = arg0;
3055 }
3056 else if (GET_MODE_BITSIZE (op_mode) < HOST_BITS_PER_WIDE_INT)
3057 {
3058 val
3059 = arg0 & ~((HOST_WIDE_INT) (-1) << GET_MODE_BITSIZE (op_mode));
3060 if (val
3061 & ((HOST_WIDE_INT) 1 << (GET_MODE_BITSIZE (op_mode) - 1)))
3062 val -= (HOST_WIDE_INT) 1 << GET_MODE_BITSIZE (op_mode);
3063 }
3064 else
3065 return 0;
3066 break;
3067
3068 case SQRT:
3069 return 0;
3070
3071 default:
3072 abort ();
3073 }
3074
3075 /* Clear the bits that don't belong in our mode,
3076 unless they and our sign bit are all one.
3077 So we get either a reasonable negative value or a reasonable
3078 unsigned value for this mode. */
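      /* E.g., for width 8, the value 0x1f0 becomes 0xf0, while -16, whose
	 discarded bits all equal its sign bit, is left unchanged.  */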
3079 if (width < HOST_BITS_PER_WIDE_INT
3080 && ((val & ((HOST_WIDE_INT) (-1) << (width - 1)))
3081 != ((HOST_WIDE_INT) (-1) << (width - 1))))
3082 	val &= ((HOST_WIDE_INT) 1 << width) - 1;
3083
3084 return GEN_INT (val);
3085 }
3086
3087 /* We can do some operations on integer CONST_DOUBLEs. Also allow
3088 for a DImode operation on a CONST_INT. */
3089   else if (GET_MODE (op) == VOIDmode && width <= HOST_BITS_PER_WIDE_INT * 2
3090 && (GET_CODE (op) == CONST_DOUBLE || GET_CODE (op) == CONST_INT))
3091 {
3092 HOST_WIDE_INT l1, h1, lv, hv;
3093
3094 if (GET_CODE (op) == CONST_DOUBLE)
3095 l1 = CONST_DOUBLE_LOW (op), h1 = CONST_DOUBLE_HIGH (op);
3096 else
3097 l1 = INTVAL (op), h1 = l1 < 0 ? -1 : 0;
3098
3099 switch (code)
3100 {
3101 case NOT:
3102 lv = ~ l1;
3103 hv = ~ h1;
3104 break;
3105
3106 case NEG:
3107 neg_double (l1, h1, &lv, &hv);
3108 break;
3109
3110 case ABS:
3111 if (h1 < 0)
3112 neg_double (l1, h1, &lv, &hv);
3113 else
3114 lv = l1, hv = h1;
3115 break;
3116
3117 case FFS:
3118 hv = 0;
3119 if (l1 == 0)
3120 lv = HOST_BITS_PER_WIDE_INT + exact_log2 (h1 & (-h1)) + 1;
3121 else
3122 lv = exact_log2 (l1 & (-l1)) + 1;
3123 break;
3124
3125 case TRUNCATE:
3126 /* This is just a change-of-mode, so do nothing. */
3127 break;
3128
3129 case ZERO_EXTEND:
3130 if (op_mode == VOIDmode
3131 || GET_MODE_BITSIZE (op_mode) > HOST_BITS_PER_WIDE_INT)
3132 return 0;
3133
3134 hv = 0;
3135 lv = l1 & GET_MODE_MASK (op_mode);
3136 break;
3137
3138 case SIGN_EXTEND:
3139 if (op_mode == VOIDmode
3140 || GET_MODE_BITSIZE (op_mode) > HOST_BITS_PER_WIDE_INT)
3141 return 0;
3142 else
3143 {
3144 lv = l1 & GET_MODE_MASK (op_mode);
3145 if (GET_MODE_BITSIZE (op_mode) < HOST_BITS_PER_WIDE_INT
3146 && (lv & ((HOST_WIDE_INT) 1
3147 << (GET_MODE_BITSIZE (op_mode) - 1))) != 0)
3148 lv -= (HOST_WIDE_INT) 1 << GET_MODE_BITSIZE (op_mode);
3149
3150 hv = (lv < 0) ? ~ (HOST_WIDE_INT) 0 : 0;
3151 }
3152 break;
3153
3154 case SQRT:
3155 return 0;
3156
3157 default:
3158 return 0;
3159 }
3160
3161 return immed_double_const (lv, hv, mode);
3162 }
3163
3164 #if ! defined (REAL_IS_NOT_DOUBLE) || defined (REAL_ARITHMETIC)
3165 else if (GET_CODE (op) == CONST_DOUBLE
3166 && GET_MODE_CLASS (mode) == MODE_FLOAT)
3167 {
3168 REAL_VALUE_TYPE d;
3169 jmp_buf handler;
3170 rtx x;
3171
3172 if (setjmp (handler))
3173 /* There used to be a warning here, but that is inadvisable.
3174 People may want to cause traps, and the natural way
3175 to do it should not get a warning. */
3176 return 0;
3177
3178 set_float_handler (handler);
3179
3180 REAL_VALUE_FROM_CONST_DOUBLE (d, op);
3181
3182 switch (code)
3183 {
3184 case NEG:
3185 d = REAL_VALUE_NEGATE (d);
3186 break;
3187
3188 case ABS:
3189 if (REAL_VALUE_NEGATIVE (d))
3190 d = REAL_VALUE_NEGATE (d);
3191 break;
3192
3193 case FLOAT_TRUNCATE:
3194 d = real_value_truncate (mode, d);
3195 break;
3196
3197 case FLOAT_EXTEND:
3198 /* All this does is change the mode. */
3199 break;
3200
3201 case FIX:
3202 d = REAL_VALUE_RNDZINT (d);
3203 break;
3204
3205 case UNSIGNED_FIX:
3206 d = REAL_VALUE_UNSIGNED_RNDZINT (d);
3207 break;
3208
3209 case SQRT:
3210 return 0;
3211
3212 default:
3213 abort ();
3214 }
3215
3216 x = CONST_DOUBLE_FROM_REAL_VALUE (d, mode);
3217 set_float_handler (NULL_PTR);
3218 return x;
3219 }
3220
3221 else if (GET_CODE (op) == CONST_DOUBLE
3222 && GET_MODE_CLASS (GET_MODE (op)) == MODE_FLOAT
3223 && GET_MODE_CLASS (mode) == MODE_INT
3224 && width <= HOST_BITS_PER_WIDE_INT && width > 0)
3225 {
3226 REAL_VALUE_TYPE d;
3227 jmp_buf handler;
3228 HOST_WIDE_INT val;
3229
3230 if (setjmp (handler))
3231 return 0;
3232
3233 set_float_handler (handler);
3234
3235 REAL_VALUE_FROM_CONST_DOUBLE (d, op);
3236
3237 switch (code)
3238 {
3239 case FIX:
3240 val = REAL_VALUE_FIX (d);
3241 break;
3242
3243 case UNSIGNED_FIX:
3244 val = REAL_VALUE_UNSIGNED_FIX (d);
3245 break;
3246
3247 default:
3248 abort ();
3249 }
3250
3251 set_float_handler (NULL_PTR);
3252
3253 /* Clear the bits that don't belong in our mode,
3254 unless they and our sign bit are all one.
3255 So we get either a reasonable negative value or a reasonable
3256 unsigned value for this mode. */
3257 if (width < HOST_BITS_PER_WIDE_INT
3258 && ((val & ((HOST_WIDE_INT) (-1) << (width - 1)))
3259 != ((HOST_WIDE_INT) (-1) << (width - 1))))
3260 val &= ((HOST_WIDE_INT) 1 << width) - 1;
3261
3262 return GEN_INT (val);
3263 }
3264 #endif
3265 /* This was formerly used only for non-IEEE float.
3266 eggert@twinsun.com says it is safe for IEEE also. */
3267 else
3268 {
3269 /* There are some simplifications we can do even if the operands
3270 aren't constant. */
3271 switch (code)
3272 {
3273 case NEG:
3274 case NOT:
3275 /* (not (not X)) == X, similarly for NEG. */
3276 if (GET_CODE (op) == code)
3277 return XEXP (op, 0);
3278 break;
3279
3280 case SIGN_EXTEND:
3281 /* (sign_extend (truncate (minus (label_ref L1) (label_ref L2))))
3282 becomes just the MINUS if its mode is MODE. This allows
3283 folding switch statements on machines using casesi (such as
3284 the Vax). */
3285 if (GET_CODE (op) == TRUNCATE
3286 && GET_MODE (XEXP (op, 0)) == mode
3287 && GET_CODE (XEXP (op, 0)) == MINUS
3288 && GET_CODE (XEXP (XEXP (op, 0), 0)) == LABEL_REF
3289 && GET_CODE (XEXP (XEXP (op, 0), 1)) == LABEL_REF)
3290 return XEXP (op, 0);
3291 break;
3292 }
3293
3294 return 0;
3295 }
3296 }
3297 \f
3298 /* Simplify a binary operation CODE with result mode MODE, operating on OP0
3299 and OP1. Return 0 if no simplification is possible.
3300
3301 Don't use this for relational operations such as EQ or LT.
3302 Use simplify_relational_operation instead. */
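/* For example, (plus:SI (const_int 2) (const_int 3)) folds to
   (const_int 5), and (minus:SI X X) folds to (const_int 0) in integral
   modes (for float modes only under -ffast-math).  */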
3303
3304 rtx
3305 simplify_binary_operation (code, mode, op0, op1)
3306 enum rtx_code code;
3307 enum machine_mode mode;
3308 rtx op0, op1;
3309 {
3310 register HOST_WIDE_INT arg0, arg1, arg0s, arg1s;
3311 HOST_WIDE_INT val;
3312 int width = GET_MODE_BITSIZE (mode);
3313 rtx tem;
3314
3315 /* Relational operations don't work here. We must know the mode
3316 of the operands in order to do the comparison correctly.
3317 Assuming a full word can give incorrect results.
3318 Consider comparing 128 with -128 in QImode. */
3319
3320 if (GET_RTX_CLASS (code) == '<')
3321 abort ();
3322
3323 #if ! defined (REAL_IS_NOT_DOUBLE) || defined (REAL_ARITHMETIC)
3324 if (GET_MODE_CLASS (mode) == MODE_FLOAT
3325 && GET_CODE (op0) == CONST_DOUBLE && GET_CODE (op1) == CONST_DOUBLE
3326 && mode == GET_MODE (op0) && mode == GET_MODE (op1))
3327 {
3328 REAL_VALUE_TYPE f0, f1, value;
3329 jmp_buf handler;
3330
3331 if (setjmp (handler))
3332 return 0;
3333
3334 set_float_handler (handler);
3335
3336 REAL_VALUE_FROM_CONST_DOUBLE (f0, op0);
3337 REAL_VALUE_FROM_CONST_DOUBLE (f1, op1);
3338 f0 = real_value_truncate (mode, f0);
3339 f1 = real_value_truncate (mode, f1);
3340
3341 #ifdef REAL_ARITHMETIC
3342 REAL_ARITHMETIC (value, rtx_to_tree_code (code), f0, f1);
3343 #else
3344 switch (code)
3345 {
3346 case PLUS:
3347 value = f0 + f1;
3348 break;
3349 case MINUS:
3350 value = f0 - f1;
3351 break;
3352 case MULT:
3353 value = f0 * f1;
3354 break;
3355 case DIV:
3356 #ifndef REAL_INFINITY
3357 if (f1 == 0)
3358 return 0;
3359 #endif
3360 value = f0 / f1;
3361 break;
3362 case SMIN:
3363 value = MIN (f0, f1);
3364 break;
3365 case SMAX:
3366 value = MAX (f0, f1);
3367 break;
3368 default:
3369 abort ();
3370 }
3371 #endif
3372
3373 value = real_value_truncate (mode, value);
3374 set_float_handler (NULL_PTR);
3375 return CONST_DOUBLE_FROM_REAL_VALUE (value, mode);
3376 }
3377 #endif /* not REAL_IS_NOT_DOUBLE, or REAL_ARITHMETIC */
3378
3379 /* We can fold some multi-word operations. */
3380 if (GET_MODE_CLASS (mode) == MODE_INT
3381 && width == HOST_BITS_PER_WIDE_INT * 2
3382 && (GET_CODE (op0) == CONST_DOUBLE || GET_CODE (op0) == CONST_INT)
3383 && (GET_CODE (op1) == CONST_DOUBLE || GET_CODE (op1) == CONST_INT))
3384 {
3385 HOST_WIDE_INT l1, l2, h1, h2, lv, hv;
3386
3387 if (GET_CODE (op0) == CONST_DOUBLE)
3388 l1 = CONST_DOUBLE_LOW (op0), h1 = CONST_DOUBLE_HIGH (op0);
3389 else
3390 l1 = INTVAL (op0), h1 = l1 < 0 ? -1 : 0;
3391
3392 if (GET_CODE (op1) == CONST_DOUBLE)
3393 l2 = CONST_DOUBLE_LOW (op1), h2 = CONST_DOUBLE_HIGH (op1);
3394 else
3395 l2 = INTVAL (op1), h2 = l2 < 0 ? -1 : 0;
3396
3397 switch (code)
3398 {
3399 case MINUS:
3400 /* A - B == A + (-B). */
3401 neg_double (l2, h2, &lv, &hv);
3402 l2 = lv, h2 = hv;
3403
3404 	  /* ... fall through ... */
3405
3406 case PLUS:
3407 add_double (l1, h1, l2, h2, &lv, &hv);
3408 break;
3409
3410 case MULT:
3411 mul_double (l1, h1, l2, h2, &lv, &hv);
3412 break;
3413
3414 case DIV: case MOD: case UDIV: case UMOD:
3415 /* We'd need to include tree.h to do this and it doesn't seem worth
3416 it. */
3417 return 0;
3418
3419 case AND:
3420 lv = l1 & l2, hv = h1 & h2;
3421 break;
3422
3423 case IOR:
3424 lv = l1 | l2, hv = h1 | h2;
3425 break;
3426
3427 case XOR:
3428 lv = l1 ^ l2, hv = h1 ^ h2;
3429 break;
3430
3431 case SMIN:
3432 if (h1 < h2
3433 || (h1 == h2
3434 && ((unsigned HOST_WIDE_INT) l1
3435 < (unsigned HOST_WIDE_INT) l2)))
3436 lv = l1, hv = h1;
3437 else
3438 lv = l2, hv = h2;
3439 break;
3440
3441 case SMAX:
3442 if (h1 > h2
3443 || (h1 == h2
3444 && ((unsigned HOST_WIDE_INT) l1
3445 > (unsigned HOST_WIDE_INT) l2)))
3446 lv = l1, hv = h1;
3447 else
3448 lv = l2, hv = h2;
3449 break;
3450
3451 case UMIN:
3452 if ((unsigned HOST_WIDE_INT) h1 < (unsigned HOST_WIDE_INT) h2
3453 || (h1 == h2
3454 && ((unsigned HOST_WIDE_INT) l1
3455 < (unsigned HOST_WIDE_INT) l2)))
3456 lv = l1, hv = h1;
3457 else
3458 lv = l2, hv = h2;
3459 break;
3460
3461 case UMAX:
3462 if ((unsigned HOST_WIDE_INT) h1 > (unsigned HOST_WIDE_INT) h2
3463 || (h1 == h2
3464 && ((unsigned HOST_WIDE_INT) l1
3465 > (unsigned HOST_WIDE_INT) l2)))
3466 lv = l1, hv = h1;
3467 else
3468 lv = l2, hv = h2;
3469 break;
3470
3471 case LSHIFTRT: case ASHIFTRT:
3472 case ASHIFT:
3473 case ROTATE: case ROTATERT:
3474 #ifdef SHIFT_COUNT_TRUNCATED
3475 if (SHIFT_COUNT_TRUNCATED)
3476 l2 &= (GET_MODE_BITSIZE (mode) - 1), h2 = 0;
3477 #endif
3478
3479 if (h2 != 0 || l2 < 0 || l2 >= GET_MODE_BITSIZE (mode))
3480 return 0;
3481
3482 if (code == LSHIFTRT || code == ASHIFTRT)
3483 rshift_double (l1, h1, l2, GET_MODE_BITSIZE (mode), &lv, &hv,
3484 code == ASHIFTRT);
3485 else if (code == ASHIFT)
3486 lshift_double (l1, h1, l2, GET_MODE_BITSIZE (mode), &lv, &hv, 1);
3487 else if (code == ROTATE)
3488 lrotate_double (l1, h1, l2, GET_MODE_BITSIZE (mode), &lv, &hv);
3489 else /* code == ROTATERT */
3490 rrotate_double (l1, h1, l2, GET_MODE_BITSIZE (mode), &lv, &hv);
3491 break;
3492
3493 default:
3494 return 0;
3495 }
3496
3497 return immed_double_const (lv, hv, mode);
3498 }
3499
3500 if (GET_CODE (op0) != CONST_INT || GET_CODE (op1) != CONST_INT
3501 || width > HOST_BITS_PER_WIDE_INT || width == 0)
3502 {
3503 /* Even if we can't compute a constant result,
3504 there are some cases worth simplifying. */
3505
3506 switch (code)
3507 {
3508 case PLUS:
3509 /* In IEEE floating point, x+0 is not the same as x. Similarly
3510 for the other optimizations below. */
3511 if (TARGET_FLOAT_FORMAT == IEEE_FLOAT_FORMAT
3512 && FLOAT_MODE_P (mode) && ! flag_fast_math)
3513 break;
3514
3515 if (op1 == CONST0_RTX (mode))
3516 return op0;
3517
3518 /* ((-a) + b) -> (b - a) and similarly for (a + (-b)) */
3519 if (GET_CODE (op0) == NEG)
3520 return cse_gen_binary (MINUS, mode, op1, XEXP (op0, 0));
3521 else if (GET_CODE (op1) == NEG)
3522 return cse_gen_binary (MINUS, mode, op0, XEXP (op1, 0));
3523
3524 /* Handle both-operands-constant cases. We can only add
3525 CONST_INTs to constants since the sum of relocatable symbols
3526 can't be handled by most assemblers. Don't add CONST_INT
3527 to CONST_INT since overflow won't be computed properly if wider
3528 than HOST_BITS_PER_WIDE_INT. */
3529
3530 if (CONSTANT_P (op0) && GET_MODE (op0) != VOIDmode
3531 && GET_CODE (op1) == CONST_INT)
3532 return plus_constant (op0, INTVAL (op1));
3533 else if (CONSTANT_P (op1) && GET_MODE (op1) != VOIDmode
3534 && GET_CODE (op0) == CONST_INT)
3535 return plus_constant (op1, INTVAL (op0));
3536
3537 /* See if this is something like X * C - X or vice versa or
3538 if the multiplication is written as a shift. If so, we can
3539 distribute and make a new multiply, shift, or maybe just
3540 	     have X (if C is 2 in the example above).  But don't make a
3541 	     real multiply if we didn't have one before. */
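	  /* E.g., (plus (mult X (const_int 3)) X) becomes
	     (mult X (const_int 4)); but (plus (ashift X (const_int 2)) X)
	     is left alone, since simplifying it would create a multiply
	     that was not there before.  */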
3542
3543 if (! FLOAT_MODE_P (mode))
3544 {
3545 HOST_WIDE_INT coeff0 = 1, coeff1 = 1;
3546 rtx lhs = op0, rhs = op1;
3547 int had_mult = 0;
3548
3549 if (GET_CODE (lhs) == NEG)
3550 coeff0 = -1, lhs = XEXP (lhs, 0);
3551 else if (GET_CODE (lhs) == MULT
3552 && GET_CODE (XEXP (lhs, 1)) == CONST_INT)
3553 {
3554 coeff0 = INTVAL (XEXP (lhs, 1)), lhs = XEXP (lhs, 0);
3555 had_mult = 1;
3556 }
3557 else if (GET_CODE (lhs) == ASHIFT
3558 && GET_CODE (XEXP (lhs, 1)) == CONST_INT
3559 && INTVAL (XEXP (lhs, 1)) >= 0
3560 && INTVAL (XEXP (lhs, 1)) < HOST_BITS_PER_WIDE_INT)
3561 {
3562 coeff0 = ((HOST_WIDE_INT) 1) << INTVAL (XEXP (lhs, 1));
3563 lhs = XEXP (lhs, 0);
3564 }
3565
3566 if (GET_CODE (rhs) == NEG)
3567 coeff1 = -1, rhs = XEXP (rhs, 0);
3568 else if (GET_CODE (rhs) == MULT
3569 && GET_CODE (XEXP (rhs, 1)) == CONST_INT)
3570 {
3571 coeff1 = INTVAL (XEXP (rhs, 1)), rhs = XEXP (rhs, 0);
3572 had_mult = 1;
3573 }
3574 else if (GET_CODE (rhs) == ASHIFT
3575 && GET_CODE (XEXP (rhs, 1)) == CONST_INT
3576 && INTVAL (XEXP (rhs, 1)) >= 0
3577 && INTVAL (XEXP (rhs, 1)) < HOST_BITS_PER_WIDE_INT)
3578 {
3579 coeff1 = ((HOST_WIDE_INT) 1) << INTVAL (XEXP (rhs, 1));
3580 rhs = XEXP (rhs, 0);
3581 }
3582
3583 if (rtx_equal_p (lhs, rhs))
3584 {
3585 tem = cse_gen_binary (MULT, mode, lhs,
3586 GEN_INT (coeff0 + coeff1));
3587 return (GET_CODE (tem) == MULT && ! had_mult) ? 0 : tem;
3588 }
3589 }
3590
3591 /* If one of the operands is a PLUS or a MINUS, see if we can
3592 simplify this by the associative law.
3593 Don't use the associative law for floating point.
3594 The inaccuracy makes it nonassociative,
3595 and subtle programs can break if operations are associated. */
3596
3597 if (INTEGRAL_MODE_P (mode)
3598 && (GET_CODE (op0) == PLUS || GET_CODE (op0) == MINUS
3599 || GET_CODE (op1) == PLUS || GET_CODE (op1) == MINUS)
3600 && (tem = simplify_plus_minus (code, mode, op0, op1)) != 0)
3601 return tem;
3602 break;
3603
3604 case COMPARE:
3605 #ifdef HAVE_cc0
3606 /* Convert (compare FOO (const_int 0)) to FOO unless we aren't
3607 using cc0, in which case we want to leave it as a COMPARE
3608 so we can distinguish it from a register-register-copy.
3609
3610 In IEEE floating point, x-0 is not the same as x. */
3611
3612 if ((TARGET_FLOAT_FORMAT != IEEE_FLOAT_FORMAT
3613 || ! FLOAT_MODE_P (mode) || flag_fast_math)
3614 && op1 == CONST0_RTX (mode))
3615 return op0;
3616 #else
3617 /* Do nothing here. */
3618 #endif
3619 break;
3620
3621 case MINUS:
3622 /* None of these optimizations can be done for IEEE
3623 floating point. */
3624 if (TARGET_FLOAT_FORMAT == IEEE_FLOAT_FORMAT
3625 && FLOAT_MODE_P (mode) && ! flag_fast_math)
3626 break;
3627
3628 /* We can't assume x-x is 0 even with non-IEEE floating point,
3629 but since it is zero except in very strange circumstances, we
3630 will treat it as zero with -ffast-math. */
3631 if (rtx_equal_p (op0, op1)
3632 && ! side_effects_p (op0)
3633 && (! FLOAT_MODE_P (mode) || flag_fast_math))
3634 return CONST0_RTX (mode);
3635
3636 /* Change subtraction from zero into negation. */
3637 if (op0 == CONST0_RTX (mode))
3638 return gen_rtx (NEG, mode, op1);
3639
3640 /* (-1 - a) is ~a. */
3641 if (op0 == constm1_rtx)
3642 return gen_rtx (NOT, mode, op1);
3643
3644 /* Subtracting 0 has no effect. */
3645 if (op1 == CONST0_RTX (mode))
3646 return op0;
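/* Sketch (hypothetical helper, not in the original source): the integer
   identities behind the three folds above hold for any two's-complement
   value, since -a == 0 - a and ~a == -1 - a.  */
#if 0
static int
model_minus_identities_ok (long a)
{
  return (0L - a) == -a && (-1L - a) == ~a && (a - 0L) == a;
}
#endif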
3647
3648 /* See if this is something like X * C - X or vice versa or
3649 if the multiplication is written as a shift. If so, we can
3650 distribute and make a new multiply, shift, or maybe just
3651 have X (if C is 2 in the example above). But don't make a
3652 real multiply if we didn't have one before. */
3653
3654 if (! FLOAT_MODE_P (mode))
3655 {
3656 HOST_WIDE_INT coeff0 = 1, coeff1 = 1;
3657 rtx lhs = op0, rhs = op1;
3658 int had_mult = 0;
3659
3660 if (GET_CODE (lhs) == NEG)
3661 coeff0 = -1, lhs = XEXP (lhs, 0);
3662 else if (GET_CODE (lhs) == MULT
3663 && GET_CODE (XEXP (lhs, 1)) == CONST_INT)
3664 {
3665 coeff0 = INTVAL (XEXP (lhs, 1)), lhs = XEXP (lhs, 0);
3666 had_mult = 1;
3667 }
3668 else if (GET_CODE (lhs) == ASHIFT
3669 && GET_CODE (XEXP (lhs, 1)) == CONST_INT
3670 && INTVAL (XEXP (lhs, 1)) >= 0
3671 && INTVAL (XEXP (lhs, 1)) < HOST_BITS_PER_WIDE_INT)
3672 {
3673 coeff0 = ((HOST_WIDE_INT) 1) << INTVAL (XEXP (lhs, 1));
3674 lhs = XEXP (lhs, 0);
3675 }
3676
3677 if (GET_CODE (rhs) == NEG)
3678 coeff1 = -1, rhs = XEXP (rhs, 0);
3679 else if (GET_CODE (rhs) == MULT
3680 && GET_CODE (XEXP (rhs, 1)) == CONST_INT)
3681 {
3682 coeff1 = INTVAL (XEXP (rhs, 1)), rhs = XEXP (rhs, 0);
3683 had_mult = 1;
3684 }
3685 else if (GET_CODE (rhs) == ASHIFT
3686 && GET_CODE (XEXP (rhs, 1)) == CONST_INT
3687 && INTVAL (XEXP (rhs, 1)) >= 0
3688 && INTVAL (XEXP (rhs, 1)) < HOST_BITS_PER_WIDE_INT)
3689 {
3690 coeff1 = ((HOST_WIDE_INT) 1) << INTVAL (XEXP (rhs, 1));
3691 rhs = XEXP (rhs, 0);
3692 }
3693
3694 if (rtx_equal_p (lhs, rhs))
3695 {
3696 tem = cse_gen_binary (MULT, mode, lhs,
3697 GEN_INT (coeff0 - coeff1));
3698 return (GET_CODE (tem) == MULT && ! had_mult) ? 0 : tem;
3699 }
3700 }
3701
3702 /* (a - (-b)) -> (a + b). */
3703 if (GET_CODE (op1) == NEG)
3704 return cse_gen_binary (PLUS, mode, op0, XEXP (op1, 0));
3705
3706 /* If one of the operands is a PLUS or a MINUS, see if we can
3707 simplify this by the associative law.
3708 Don't use the associative law for floating point.
3709 The inaccuracy makes it nonassociative,
3710 and subtle programs can break if operations are associated. */
3711
3712 if (INTEGRAL_MODE_P (mode)
3713 && (GET_CODE (op0) == PLUS || GET_CODE (op0) == MINUS
3714 || GET_CODE (op1) == PLUS || GET_CODE (op1) == MINUS)
3715 && (tem = simplify_plus_minus (code, mode, op0, op1)) != 0)
3716 return tem;
3717
3718 /* Don't let a relocatable value get a negative coeff. */
3719 if (GET_CODE (op1) == CONST_INT && GET_MODE (op0) != VOIDmode)
3720 return plus_constant (op0, - INTVAL (op1));
3721 break;
3722
3723 case MULT:
3724 if (op1 == constm1_rtx)
3725 {
3726 tem = simplify_unary_operation (NEG, mode, op0, mode);
3727
3728 return tem ? tem : gen_rtx (NEG, mode, op0);
3729 }
3730
3731 /* In IEEE floating point, x*0 is not always 0. */
3732 if ((TARGET_FLOAT_FORMAT != IEEE_FLOAT_FORMAT
3733 || ! FLOAT_MODE_P (mode) || flag_fast_math)
3734 && op1 == CONST0_RTX (mode)
3735 && ! side_effects_p (op0))
3736 return op1;
3737
3738 /* In IEEE floating point, x*1 is not equivalent to x for nans.
3739 However, ANSI says we can drop signals,
3740 so we can do this anyway. */
3741 if (op1 == CONST1_RTX (mode))
3742 return op0;
3743
3744 /* Convert multiply by constant power of two into shift unless
3745 we are still generating RTL. This test is a kludge. */
3746 if (GET_CODE (op1) == CONST_INT
3747 && (val = exact_log2 (INTVAL (op1))) >= 0
3748 && ! rtx_equal_function_value_matters)
3749 return gen_rtx (ASHIFT, mode, op0, GEN_INT (val));
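/* For instance, (mult:SI r (const_int 8)) becomes
   (ashift:SI r (const_int 3)).  A host-side model of exact_log2
   (hypothetical name; the real function lives elsewhere in GCC) might
   look like this:  */
#if 0
static int
model_exact_log2 (unsigned long x)
{
  int n = 0;

  if (x == 0 || (x & (x - 1)) != 0)
    return -1;			/* Not a power of two.  */
  while ((x >>= 1) != 0)
    n++;
  return n;
}
#endif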
3750
3751 if (GET_CODE (op1) == CONST_DOUBLE
3752 && GET_MODE_CLASS (GET_MODE (op1)) == MODE_FLOAT)
3753 {
3754 REAL_VALUE_TYPE d;
3755 jmp_buf handler;
3756 int op1is2, op1ism1;
3757
3758 if (setjmp (handler))
3759 return 0;
3760
3761 set_float_handler (handler);
3762 REAL_VALUE_FROM_CONST_DOUBLE (d, op1);
3763 op1is2 = REAL_VALUES_EQUAL (d, dconst2);
3764 op1ism1 = REAL_VALUES_EQUAL (d, dconstm1);
3765 set_float_handler (NULL_PTR);
3766
3767 /* x*2 is x+x and x*(-1) is -x */
3768 if (op1is2 && GET_MODE (op0) == mode)
3769 return gen_rtx (PLUS, mode, op0, copy_rtx (op0));
3770
3771 else if (op1ism1 && GET_MODE (op0) == mode)
3772 return gen_rtx (NEG, mode, op0);
3773 }
3774 break;
3775
3776 case IOR:
3777 if (op1 == const0_rtx)
3778 return op0;
3779 if (GET_CODE (op1) == CONST_INT
3780 && (INTVAL (op1) & GET_MODE_MASK (mode)) == GET_MODE_MASK (mode))
3781 return op1;
3782 if (rtx_equal_p (op0, op1) && ! side_effects_p (op0))
3783 return op0;
3784 /* A | (~A) -> -1 */
3785 if (((GET_CODE (op0) == NOT && rtx_equal_p (XEXP (op0, 0), op1))
3786 || (GET_CODE (op1) == NOT && rtx_equal_p (XEXP (op1, 0), op0)))
3787 && ! side_effects_p (op0)
3788 && GET_MODE_CLASS (mode) != MODE_CC)
3789 return constm1_rtx;
3790 break;
3791
3792 case XOR:
3793 if (op1 == const0_rtx)
3794 return op0;
3795 if (GET_CODE (op1) == CONST_INT
3796 && (INTVAL (op1) & GET_MODE_MASK (mode)) == GET_MODE_MASK (mode))
3797 return gen_rtx (NOT, mode, op0);
3798 if (op0 == op1 && ! side_effects_p (op0)
3799 && GET_MODE_CLASS (mode) != MODE_CC)
3800 return const0_rtx;
3801 break;
3802
3803 case AND:
3804 if (op1 == const0_rtx && ! side_effects_p (op0))
3805 return const0_rtx;
3806 if (GET_CODE (op1) == CONST_INT
3807 && (INTVAL (op1) & GET_MODE_MASK (mode)) == GET_MODE_MASK (mode))
3808 return op0;
3809 if (op0 == op1 && ! side_effects_p (op0)
3810 && GET_MODE_CLASS (mode) != MODE_CC)
3811 return op0;
3812 /* A & (~A) -> 0 */
3813 if (((GET_CODE (op0) == NOT && rtx_equal_p (XEXP (op0, 0), op1))
3814 || (GET_CODE (op1) == NOT && rtx_equal_p (XEXP (op1, 0), op0)))
3815 && ! side_effects_p (op0)
3816 && GET_MODE_CLASS (mode) != MODE_CC)
3817 return const0_rtx;
3818 break;
3819
3820 case UDIV:
3821 /* Convert divide by power of two into shift (divide by 1 handled
3822 below). */
3823 if (GET_CODE (op1) == CONST_INT
3824 && (arg1 = exact_log2 (INTVAL (op1))) > 0)
3825 return gen_rtx (LSHIFTRT, mode, op0, GEN_INT (arg1));
3826
3827 /* ... fall through ... */
3828
3829 case DIV:
3830 if (op1 == CONST1_RTX (mode))
3831 return op0;
3832
3833 /* In IEEE floating point, 0/x is not always 0. */
3834 if ((TARGET_FLOAT_FORMAT != IEEE_FLOAT_FORMAT
3835 || ! FLOAT_MODE_P (mode) || flag_fast_math)
3836 && op0 == CONST0_RTX (mode)
3837 && ! side_effects_p (op1))
3838 return op0;
3839
3840 #if ! defined (REAL_IS_NOT_DOUBLE) || defined (REAL_ARITHMETIC)
3841 /* Change division by a constant into multiplication. Only do
3842 this with -ffast-math until an expert says it is safe in
3843 general. */
3844 else if (GET_CODE (op1) == CONST_DOUBLE
3845 && GET_MODE_CLASS (GET_MODE (op1)) == MODE_FLOAT
3846 && op1 != CONST0_RTX (mode)
3847 && flag_fast_math)
3848 {
3849 REAL_VALUE_TYPE d;
3850 REAL_VALUE_FROM_CONST_DOUBLE (d, op1);
3851
3852 if (! REAL_VALUES_EQUAL (d, dconst0))
3853 {
3854 #if defined (REAL_ARITHMETIC)
3855 REAL_ARITHMETIC (d, rtx_to_tree_code (DIV), dconst1, d);
3856 return gen_rtx (MULT, mode, op0,
3857 CONST_DOUBLE_FROM_REAL_VALUE (d, mode));
3858 #else
3859 return gen_rtx (MULT, mode, op0,
3860 CONST_DOUBLE_FROM_REAL_VALUE (1./d, mode));
3861 #endif
3862 }
3863 }
3864 #endif
3865 break;
3866
3867 case UMOD:
3868 /* Handle modulus by power of two (mod with 1 handled below). */
3869 if (GET_CODE (op1) == CONST_INT
3870 && exact_log2 (INTVAL (op1)) > 0)
3871 return gen_rtx (AND, mode, op0, GEN_INT (INTVAL (op1) - 1));
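/* Sketch: for a power-of-two modulus the remainder is just the low bits,
   e.g. x % 8 == (x & 7) for unsigned x.  Hypothetical model:  */
#if 0
static unsigned long
model_umod_pow2 (unsigned long x, unsigned long m)
{
  return x & (m - 1);		/* Valid only when M is a power of two.  */
}
#endif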
3872
3873 /* ... fall through ... */
3874
3875 case MOD:
3876 if ((op0 == const0_rtx || op1 == const1_rtx)
3877 && ! side_effects_p (op0) && ! side_effects_p (op1))
3878 return const0_rtx;
3879 break;
3880
3881 case ROTATERT:
3882 case ROTATE:
3883 /* Rotating ~0 always results in ~0. */
3884 if (GET_CODE (op0) == CONST_INT && width <= HOST_BITS_PER_WIDE_INT
3885 && INTVAL (op0) == GET_MODE_MASK (mode)
3886 && ! side_effects_p (op1))
3887 return op0;
3888
3889 /* ... fall through ... */
3890
3891 case ASHIFT:
3892 case ASHIFTRT:
3893 case LSHIFTRT:
3894 if (op1 == const0_rtx)
3895 return op0;
3896 if (op0 == const0_rtx && ! side_effects_p (op1))
3897 return op0;
3898 break;
3899
3900 case SMIN:
3901 if (width <= HOST_BITS_PER_WIDE_INT && GET_CODE (op1) == CONST_INT
3902 && INTVAL (op1) == (HOST_WIDE_INT) 1 << (width - 1)
3903 && ! side_effects_p (op0))
3904 return op1;
3905 else if (rtx_equal_p (op0, op1) && ! side_effects_p (op0))
3906 return op0;
3907 break;
3908
3909 case SMAX:
3910 if (width <= HOST_BITS_PER_WIDE_INT && GET_CODE (op1) == CONST_INT
3911 && (INTVAL (op1)
3912 == (unsigned HOST_WIDE_INT) GET_MODE_MASK (mode) >> 1)
3913 && ! side_effects_p (op0))
3914 return op1;
3915 else if (rtx_equal_p (op0, op1) && ! side_effects_p (op0))
3916 return op0;
3917 break;
3918
3919 case UMIN:
3920 if (op1 == const0_rtx && ! side_effects_p (op0))
3921 return op1;
3922 else if (rtx_equal_p (op0, op1) && ! side_effects_p (op0))
3923 return op0;
3924 break;
3925
3926 case UMAX:
3927 if (op1 == constm1_rtx && ! side_effects_p (op0))
3928 return op1;
3929 else if (rtx_equal_p (op0, op1) && ! side_effects_p (op0))
3930 return op0;
3931 break;
3932
3933 default:
3934 abort ();
3935 }
3936
3937 return 0;
3938 }
3939
3940 /* Get the integer argument values in two forms:
3941 zero-extended in ARG0, ARG1 and sign-extended in ARG0S, ARG1S. */
3942
3943 arg0 = INTVAL (op0);
3944 arg1 = INTVAL (op1);
3945
3946 if (width < HOST_BITS_PER_WIDE_INT)
3947 {
3948 arg0 &= ((HOST_WIDE_INT) 1 << width) - 1;
3949 arg1 &= ((HOST_WIDE_INT) 1 << width) - 1;
3950
3951 arg0s = arg0;
3952 if (arg0s & ((HOST_WIDE_INT) 1 << (width - 1)))
3953 arg0s |= ((HOST_WIDE_INT) (-1) << width);
3954
3955 arg1s = arg1;
3956 if (arg1s & ((HOST_WIDE_INT) 1 << (width - 1)))
3957 arg1s |= ((HOST_WIDE_INT) (-1) << width);
3958 }
3959 else
3960 {
3961 arg0s = arg0;
3962 arg1s = arg1;
3963 }
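/* Sketch of the extension above (hypothetical helper): for width == 8,
   the byte 0xff zero-extends to 255 in ARG0 and sign-extends to -1 in
   ARG0S.  Assumes WIDTH is nonzero and less than the host word width,
   as guaranteed by the test above.  */
#if 0
static void
model_extend (unsigned long a, int width, unsigned long *zext, long *sext)
{
  unsigned long mask = ((unsigned long) 1 << width) - 1;

  *zext = a & mask;
  *sext = (long) *zext;
  if (*zext & ((unsigned long) 1 << (width - 1)))
    *sext |= (long) (~0UL << width);	/* Propagate the sign bit.  */
}
#endif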
3964
3965 /* Compute the value of the arithmetic. */
3966
3967 switch (code)
3968 {
3969 case PLUS:
3970 val = arg0s + arg1s;
3971 break;
3972
3973 case MINUS:
3974 val = arg0s - arg1s;
3975 break;
3976
3977 case MULT:
3978 val = arg0s * arg1s;
3979 break;
3980
3981 case DIV:
3982 if (arg1s == 0)
3983 return 0;
3984 val = arg0s / arg1s;
3985 break;
3986
3987 case MOD:
3988 if (arg1s == 0)
3989 return 0;
3990 val = arg0s % arg1s;
3991 break;
3992
3993 case UDIV:
3994 if (arg1 == 0)
3995 return 0;
3996 val = (unsigned HOST_WIDE_INT) arg0 / arg1;
3997 break;
3998
3999 case UMOD:
4000 if (arg1 == 0)
4001 return 0;
4002 val = (unsigned HOST_WIDE_INT) arg0 % arg1;
4003 break;
4004
4005 case AND:
4006 val = arg0 & arg1;
4007 break;
4008
4009 case IOR:
4010 val = arg0 | arg1;
4011 break;
4012
4013 case XOR:
4014 val = arg0 ^ arg1;
4015 break;
4016
4017 case LSHIFTRT:
4018 /* If shift count is undefined, don't fold it; let the machine do
4019 what it wants. But truncate it if the machine will do that. */
4020 if (arg1 < 0)
4021 return 0;
4022
4023 #ifdef SHIFT_COUNT_TRUNCATED
4024 if (SHIFT_COUNT_TRUNCATED)
4025 arg1 %= width;
4026 #endif
4027
4028 val = ((unsigned HOST_WIDE_INT) arg0) >> arg1;
4029 break;
4030
4031 case ASHIFT:
4032 if (arg1 < 0)
4033 return 0;
4034
4035 #ifdef SHIFT_COUNT_TRUNCATED
4036 if (SHIFT_COUNT_TRUNCATED)
4037 arg1 %= width;
4038 #endif
4039
4040 val = ((unsigned HOST_WIDE_INT) arg0) << arg1;
4041 break;
4042
4043 case ASHIFTRT:
4044 if (arg1 < 0)
4045 return 0;
4046
4047 #ifdef SHIFT_COUNT_TRUNCATED
4048 if (SHIFT_COUNT_TRUNCATED)
4049 arg1 %= width;
4050 #endif
4051
4052 val = arg0s >> arg1;
4053
4054 /* The bootstrap compiler may not have sign-extended the right shift.
4055 Manually extend the sign to ensure the bootstrap cc matches gcc. */
4056 if (arg0s < 0 && arg1 > 0)
4057 val |= ((HOST_WIDE_INT) -1) << (HOST_BITS_PER_WIDE_INT - arg1);
4058
4059 break;
4060
4061 case ROTATERT:
4062 if (arg1 < 0)
4063 return 0;
4064
4065 arg1 %= width;
4066 val = ((((unsigned HOST_WIDE_INT) arg0) << (width - arg1))
4067 | (((unsigned HOST_WIDE_INT) arg0) >> arg1));
4068 break;
4069
4070 case ROTATE:
4071 if (arg1 < 0)
4072 return 0;
4073
4074 arg1 %= width;
4075 val = ((((unsigned HOST_WIDE_INT) arg0) << arg1)
4076 | (((unsigned HOST_WIDE_INT) arg0) >> (width - arg1)));
4077 break;
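/* Sketch of the rotate computation above (hypothetical helper): an
   8-bit left rotate of 0xb1 by 4 gives 0x1b.  Assumes WIDTH is less
   than the host word width; the guard avoids the undefined full-width
   shift that would arise when the count is a multiple of WIDTH.  */
#if 0
static unsigned long
model_rotate_left (unsigned long x, int n, int width)
{
  unsigned long mask = ((unsigned long) 1 << width) - 1;

  n %= width;
  x &= mask;
  if (n == 0)
    return x;
  return ((x << n) | (x >> (width - n))) & mask;
}
#endif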
4078
4079 case COMPARE:
4080 /* Do nothing here. */
4081 return 0;
4082
4083 case SMIN:
4084 val = arg0s <= arg1s ? arg0s : arg1s;
4085 break;
4086
4087 case UMIN:
4088 val = ((unsigned HOST_WIDE_INT) arg0
4089 <= (unsigned HOST_WIDE_INT) arg1 ? arg0 : arg1);
4090 break;
4091
4092 case SMAX:
4093 val = arg0s > arg1s ? arg0s : arg1s;
4094 break;
4095
4096 case UMAX:
4097 val = ((unsigned HOST_WIDE_INT) arg0
4098 > (unsigned HOST_WIDE_INT) arg1 ? arg0 : arg1);
4099 break;
4100
4101 default:
4102 abort ();
4103 }
4104
4105 /* Clear the bits that don't belong in our mode, unless they and our sign
4106 bit are all one. So we get either a reasonable negative value or a
4107 reasonable unsigned value for this mode. */
4108 if (width < HOST_BITS_PER_WIDE_INT
4109 && ((val & ((HOST_WIDE_INT) (-1) << (width - 1)))
4110 != ((HOST_WIDE_INT) (-1) << (width - 1))))
4111 val &= ((HOST_WIDE_INT) 1 << width) - 1;
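/* For example, with width == 8 the value 0x105 is masked down to 0x05,
   while -3 (whose high bits are all one) is left alone, so VAL is
   always representable in MODE.  */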
4112
4113 return GEN_INT (val);
4114 }
4115 \f
4116 /* Simplify a PLUS or MINUS, at least one of whose operands may be another
4117 PLUS or MINUS.
4118
4119 Rather than test for specific cases, we do this by a brute-force method
4120 and do all possible simplifications until no more changes occur. Then
4121 we rebuild the operation. */
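/* For example, (minus (plus a (const_int 3)) (minus a (const_int 1)))
   expands to the operand list a, 3, a, 1 with signs +, +, -, + tracked
   in NEGS[]; a and -a cancel and the constants fold, leaving
   (const_int 4).  */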
4122
4123 static rtx
4124 simplify_plus_minus (code, mode, op0, op1)
4125 enum rtx_code code;
4126 enum machine_mode mode;
4127 rtx op0, op1;
4128 {
4129 rtx ops[8];
4130 int negs[8];
4131 rtx result, tem;
4132 int n_ops = 2, input_ops = 2, input_consts = 0, n_consts = 0;
4133 int first = 1, negate = 0, changed;
4134 int i, j;
4135
4136 bzero ((char *) ops, sizeof ops);
4137
4138 /* Set up the two operands and then expand them until nothing has been
4139 changed. If we run out of room in our array, give up; this should
4140 almost never happen. */
4141
4142 ops[0] = op0, ops[1] = op1, negs[0] = 0, negs[1] = (code == MINUS);
4143
4144 changed = 1;
4145 while (changed)
4146 {
4147 changed = 0;
4148
4149 for (i = 0; i < n_ops; i++)
4150 switch (GET_CODE (ops[i]))
4151 {
4152 case PLUS:
4153 case MINUS:
4154 if (n_ops == 7)
4155 return 0;
4156
4157 ops[n_ops] = XEXP (ops[i], 1);
4158 negs[n_ops++] = GET_CODE (ops[i]) == MINUS ? !negs[i] : negs[i];
4159 ops[i] = XEXP (ops[i], 0);
4160 input_ops++;
4161 changed = 1;
4162 break;
4163
4164 case NEG:
4165 ops[i] = XEXP (ops[i], 0);
4166 negs[i] = ! negs[i];
4167 changed = 1;
4168 break;
4169
4170 case CONST:
4171 ops[i] = XEXP (ops[i], 0);
4172 input_consts++;
4173 changed = 1;
4174 break;
4175
4176 case NOT:
4177 /* ~a -> (-a - 1) */
4178 if (n_ops != 7)
4179 {
4180 ops[n_ops] = constm1_rtx;
4181 negs[n_ops++] = negs[i];
4182 ops[i] = XEXP (ops[i], 0);
4183 negs[i] = ! negs[i];
4184 changed = 1;
4185 }
4186 break;
4187
4188 case CONST_INT:
4189 if (negs[i])
4190 ops[i] = GEN_INT (- INTVAL (ops[i])), negs[i] = 0, changed = 1;
4191 break;
4192 }
4193 }
4194
4195 /* If we only have two operands, we can't do anything. */
4196 if (n_ops <= 2)
4197 return 0;
4198
4199 /* Now simplify each pair of operands until nothing changes. The first
4200 time through just simplify constants against each other. */
4201
4202 changed = 1;
4203 while (changed)
4204 {
4205 changed = first;
4206
4207 for (i = 0; i < n_ops - 1; i++)
4208 for (j = i + 1; j < n_ops; j++)
4209 if (ops[i] != 0 && ops[j] != 0
4210 && (! first || (CONSTANT_P (ops[i]) && CONSTANT_P (ops[j]))))
4211 {
4212 rtx lhs = ops[i], rhs = ops[j];
4213 enum rtx_code ncode = PLUS;
4214
4215 if (negs[i] && ! negs[j])
4216 lhs = ops[j], rhs = ops[i], ncode = MINUS;
4217 else if (! negs[i] && negs[j])
4218 ncode = MINUS;
4219
4220 tem = simplify_binary_operation (ncode, mode, lhs, rhs);
4221 if (tem)
4222 {
4223 ops[i] = tem, ops[j] = 0;
4224 negs[i] = negs[i] && negs[j];
4225 if (GET_CODE (tem) == NEG)
4226 ops[i] = XEXP (tem, 0), negs[i] = ! negs[i];
4227
4228 if (GET_CODE (ops[i]) == CONST_INT && negs[i])
4229 ops[i] = GEN_INT (- INTVAL (ops[i])), negs[i] = 0;
4230 changed = 1;
4231 }
4232 }
4233
4234 first = 0;
4235 }
4236
4237 /* Pack all the operands to the lower-numbered entries and give up if
4238 we didn't reduce the number of operands we had. Make sure we
4239 count a CONST as two operands. If we have the same number of
4240 operands, but have made more CONSTs than we had, this is also
4241 an improvement, so accept it. */
4242
4243 for (i = 0, j = 0; j < n_ops; j++)
4244 if (ops[j] != 0)
4245 {
4246 ops[i] = ops[j], negs[i++] = negs[j];
4247 if (GET_CODE (ops[j]) == CONST)
4248 n_consts++;
4249 }
4250
4251 if (i + n_consts > input_ops
4252 || (i + n_consts == input_ops && n_consts <= input_consts))
4253 return 0;
4254
4255 n_ops = i;
4256
4257 /* If we have a CONST_INT, put it last. */
4258 for (i = 0; i < n_ops - 1; i++)
4259 if (GET_CODE (ops[i]) == CONST_INT)
4260 {
4261 tem = ops[n_ops - 1], ops[n_ops - 1] = ops[i], ops[i] = tem;
4262 j = negs[n_ops - 1], negs[n_ops - 1] = negs[i], negs[i] = j;
4263 }
4264
4265 /* Put a non-negated operand first. If there aren't any, make all
4266 operands positive and negate the whole thing later. */
4267 for (i = 0; i < n_ops && negs[i]; i++)
4268 ;
4269
4270 if (i == n_ops)
4271 {
4272 for (i = 0; i < n_ops; i++)
4273 negs[i] = 0;
4274 negate = 1;
4275 }
4276 else if (i != 0)
4277 {
4278 tem = ops[0], ops[0] = ops[i], ops[i] = tem;
4279 j = negs[0], negs[0] = negs[i], negs[i] = j;
4280 }
4281
4282 /* Now make the result by performing the requested operations. */
4283 result = ops[0];
4284 for (i = 1; i < n_ops; i++)
4285 result = cse_gen_binary (negs[i] ? MINUS : PLUS, mode, result, ops[i]);
4286
4287 return negate ? gen_rtx (NEG, mode, result) : result;
4288 }
4289 \f
4290 /* Make a binary operation by properly ordering the operands and
4291 seeing if the expression folds. */
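/* For a commutative CODE, a constant first operand is moved second, so
   (plus (const_int 4) r) is canonicalized to (plus r (const_int 4))
   before any folding is attempted.  */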
4292
4293 static rtx
4294 cse_gen_binary (code, mode, op0, op1)
4295 enum rtx_code code;
4296 enum machine_mode mode;
4297 rtx op0, op1;
4298 {
4299 rtx tem;
4300
4301 /* Put complex operands first and constants second if commutative. */
4302 if (GET_RTX_CLASS (code) == 'c'
4303 && ((CONSTANT_P (op0) && GET_CODE (op1) != CONST_INT)
4304 || (GET_RTX_CLASS (GET_CODE (op0)) == 'o'
4305 && GET_RTX_CLASS (GET_CODE (op1)) != 'o')
4306 || (GET_CODE (op0) == SUBREG
4307 && GET_RTX_CLASS (GET_CODE (SUBREG_REG (op0))) == 'o'
4308 && GET_RTX_CLASS (GET_CODE (op1)) != 'o')))
4309 tem = op0, op0 = op1, op1 = tem;
4310
4311 /* If this simplifies, do it. */
4312 tem = simplify_binary_operation (code, mode, op0, op1);
4313
4314 if (tem)
4315 return tem;
4316
4317 /* Handle addition and subtraction of CONST_INT specially. Otherwise,
4318 just form the operation. */
4319
4320 if (code == PLUS && GET_CODE (op1) == CONST_INT
4321 && GET_MODE (op0) != VOIDmode)
4322 return plus_constant (op0, INTVAL (op1));
4323 else if (code == MINUS && GET_CODE (op1) == CONST_INT
4324 && GET_MODE (op0) != VOIDmode)
4325 return plus_constant (op0, - INTVAL (op1));
4326 else
4327 return gen_rtx (code, mode, op0, op1);
4328 }
4329 \f
4330 /* Like simplify_binary_operation except used for relational operators.
4331 MODE is the mode of the operands, not that of the result. If MODE
4332 is VOIDmode, both operands must also be VOIDmode and we compare the
4333 operands in "infinite precision".
4334
4335 If no simplification is possible, this function returns zero. Otherwise,
4336 it returns either const_true_rtx or const0_rtx. */
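/* For example, (gt (const_int 7) (const_int 3)) with MODE == VOIDmode
   compares the operands in infinite precision and yields
   const_true_rtx.  */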
4337
4338 rtx
4339 simplify_relational_operation (code, mode, op0, op1)
4340 enum rtx_code code;
4341 enum machine_mode mode;
4342 rtx op0, op1;
4343 {
4344 int equal, op0lt, op0ltu, op1lt, op1ltu;
4345 rtx tem;
4346
4347 /* If op0 is a compare, extract the comparison arguments from it. */
4348 if (GET_CODE (op0) == COMPARE && op1 == const0_rtx)
4349 op1 = XEXP (op0, 1), op0 = XEXP (op0, 0);
4350
4351 /* We can't simplify MODE_CC values since we don't know what the
4352 actual comparison is. */
4353 if (GET_MODE_CLASS (GET_MODE (op0)) == MODE_CC
4354 #ifdef HAVE_cc0
4355 || op0 == cc0_rtx
4356 #endif
4357 )
4358 return 0;
4359
4360 /* For integer comparisons of A and B maybe we can simplify A - B and can
4361 then simplify a comparison of that with zero. If A and B are both either
4362 a register or a CONST_INT, this can't help; testing for these cases will
4363 prevent infinite recursion here and speed things up.
4364
4365 If CODE is an unsigned comparison, we can only do this if A - B is a
4366 constant integer, and then we have to compare that integer with zero as a
4367 signed comparison. Note that this will give the incorrect result for
4368 comparisons that overflow. Since these are undefined, this is probably
4369 OK. If it causes a problem, we can check for A or B being an address
4370 (fp + const or SYMBOL_REF) and only do it in that case. */
4371
4372 if (INTEGRAL_MODE_P (mode) && op1 != const0_rtx
4373 && ! ((GET_CODE (op0) == REG || GET_CODE (op0) == CONST_INT)
4374 && (GET_CODE (op1) == REG || GET_CODE (op1) == CONST_INT))
4375 && 0 != (tem = simplify_binary_operation (MINUS, mode, op0, op1))
4376 && (GET_CODE (tem) == CONST_INT
4377 || (code != GTU && code != GEU &&
4378 code != LTU && code != LEU)))
4379 return simplify_relational_operation (signed_condition (code),
4380 mode, tem, const0_rtx);
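/* For instance, comparing (plus (reg X) (const_int 4)) with
   (plus (reg X) (const_int 1)) using GT reduces, via the subtraction
   above, to comparing (const_int 3) with zero, which folds to
   const_true_rtx.  */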
4381
4382 /* For non-IEEE floating-point, if the two operands are equal, we know the
4383 result. */
4384 if (rtx_equal_p (op0, op1)
4385 && (TARGET_FLOAT_FORMAT != IEEE_FLOAT_FORMAT
4386 || ! FLOAT_MODE_P (GET_MODE (op0)) || flag_fast_math))
4387 equal = 1, op0lt = 0, op0ltu = 0, op1lt = 0, op1ltu = 0;
4388
4389 /* If the operands are floating-point constants, see if we can fold
4390 the result. */
4391 #if ! defined (REAL_IS_NOT_DOUBLE) || defined (REAL_ARITHMETIC)
4392 else if (GET_CODE (op0) == CONST_DOUBLE && GET_CODE (op1) == CONST_DOUBLE
4393 && GET_MODE_CLASS (GET_MODE (op0)) == MODE_FLOAT)
4394 {
4395 REAL_VALUE_TYPE d0, d1;
4396 jmp_buf handler;
4397
4398 if (setjmp (handler))
4399 return 0;
4400
4401 set_float_handler (handler);
4402 REAL_VALUE_FROM_CONST_DOUBLE (d0, op0);
4403 REAL_VALUE_FROM_CONST_DOUBLE (d1, op1);
4404 equal = REAL_VALUES_EQUAL (d0, d1);
4405 op0lt = op0ltu = REAL_VALUES_LESS (d0, d1);
4406 op1lt = op1ltu = REAL_VALUES_LESS (d1, d0);
4407 set_float_handler (NULL_PTR);
4408 }
4409 #endif /* not REAL_IS_NOT_DOUBLE, or REAL_ARITHMETIC */
4410
4411 /* Otherwise, see if the operands are both integers. */
4412 else if ((GET_MODE_CLASS (mode) == MODE_INT || mode == VOIDmode)
4413 && (GET_CODE (op0) == CONST_DOUBLE || GET_CODE (op0) == CONST_INT)
4414 && (GET_CODE (op1) == CONST_DOUBLE || GET_CODE (op1) == CONST_INT))
4415 {
4416 int width = GET_MODE_BITSIZE (mode);
4417 HOST_WIDE_INT l0s, h0s, l1s, h1s;
4418 unsigned HOST_WIDE_INT l0u, h0u, l1u, h1u;
4419
4420 /* Get the two words comprising each integer constant. */
4421 if (GET_CODE (op0) == CONST_DOUBLE)
4422 {
4423 l0u = l0s = CONST_DOUBLE_LOW (op0);
4424 h0u = h0s = CONST_DOUBLE_HIGH (op0);
4425 }
4426 else
4427 {
4428 l0u = l0s = INTVAL (op0);
4429 h0u = 0, h0s = l0s < 0 ? -1 : 0;
4430 }
4431
4432 if (GET_CODE (op1) == CONST_DOUBLE)
4433 {
4434 l1u = l1s = CONST_DOUBLE_LOW (op1);
4435 h1u = h1s = CONST_DOUBLE_HIGH (op1);
4436 }
4437 else
4438 {
4439 l1u = l1s = INTVAL (op1);
4440 h1u = 0, h1s = l1s < 0 ? -1 : 0;
4441 }
4442
4443 /* If WIDTH is nonzero and no wider than HOST_BITS_PER_WIDE_INT,
4444 we have to sign- or zero-extend the values. */
4445 if (width != 0 && width <= HOST_BITS_PER_WIDE_INT)
4446 h0u = h1u = 0, h0s = l0s < 0 ? -1 : 0, h1s = l1s < 0 ? -1 : 0;
4447
4448 if (width != 0 && width < HOST_BITS_PER_WIDE_INT)
4449 {
4450 l0u &= ((HOST_WIDE_INT) 1 << width) - 1;
4451 l1u &= ((HOST_WIDE_INT) 1 << width) - 1;
4452
4453 if (l0s & ((HOST_WIDE_INT) 1 << (width - 1)))
4454 l0s |= ((HOST_WIDE_INT) (-1) << width);
4455
4456 if (l1s & ((HOST_WIDE_INT) 1 << (width - 1)))
4457 l1s |= ((HOST_WIDE_INT) (-1) << width);
4458 }
4459
4460 equal = (h0u == h1u && l0u == l1u);
4461 op0lt = (h0s < h1s || (h0s == h1s && l0s < l1s));
4462 op1lt = (h1s < h0s || (h1s == h0s && l1s < l0s));
4463 op0ltu = (h0u < h1u || (h0u == h1u && l0u < l1u));
4464 op1ltu = (h1u < h0u || (h1u == h0u && l1u < l0u));
4465 }
4466
4467 /* Otherwise, there are some code-specific tests we can make. */
4468 else
4469 {
4470 switch (code)
4471 {
4472 case EQ:
4473 /* References to the frame plus a constant or labels cannot
4474 be zero, but a SYMBOL_REF can be, due to #pragma weak. */
4475 if (((NONZERO_BASE_PLUS_P (op0) && op1 == const0_rtx)
4476 || GET_CODE (op0) == LABEL_REF)
4477 #if FRAME_POINTER_REGNUM != ARG_POINTER_REGNUM
4478 /* On some machines, the ap reg can be 0 sometimes. */
4479 && op0 != arg_pointer_rtx
4480 #endif
4481 )
4482 return const0_rtx;
4483 break;
4484
4485 case NE:
4486 if (((NONZERO_BASE_PLUS_P (op0) && op1 == const0_rtx)
4487 || GET_CODE (op0) == LABEL_REF)
4488 #if FRAME_POINTER_REGNUM != ARG_POINTER_REGNUM
4489 && op0 != arg_pointer_rtx
4490 #endif
4491 )
4492 return const_true_rtx;
4493 break;
4494
4495 case GEU:
4496 /* Unsigned values are never negative. */
4497 if (op1 == const0_rtx)
4498 return const_true_rtx;
4499 break;
4500
4501 case LTU:
4502 if (op1 == const0_rtx)
4503 return const0_rtx;
4504 break;
4505
4506 case LEU:
4507 /* Unsigned values are never greater than the largest
4508 unsigned value. */
4509 if (GET_CODE (op1) == CONST_INT
4510 && INTVAL (op1) == GET_MODE_MASK (mode)
4511 && INTEGRAL_MODE_P (mode))
4512 return const_true_rtx;
4513 break;
4514
4515 case GTU:
4516 if (GET_CODE (op1) == CONST_INT
4517 && INTVAL (op1) == GET_MODE_MASK (mode)
4518 && INTEGRAL_MODE_P (mode))
4519 return const0_rtx;
4520 break;
4521 }
4522
4523 return 0;
4524 }
4525
4526 /* If we reach here, EQUAL, OP0LT, OP0LTU, OP1LT, and OP1LTU are set
4527 as appropriate. */
4528 switch (code)
4529 {
4530 case EQ:
4531 return equal ? const_true_rtx : const0_rtx;
4532 case NE:
4533 return ! equal ? const_true_rtx : const0_rtx;
4534 case LT:
4535 return op0lt ? const_true_rtx : const0_rtx;
4536 case GT:
4537 return op1lt ? const_true_rtx : const0_rtx;
4538 case LTU:
4539 return op0ltu ? const_true_rtx : const0_rtx;
4540 case GTU:
4541 return op1ltu ? const_true_rtx : const0_rtx;
4542 case LE:
4543 return equal || op0lt ? const_true_rtx : const0_rtx;
4544 case GE:
4545 return equal || op1lt ? const_true_rtx : const0_rtx;
4546 case LEU:
4547 return equal || op0ltu ? const_true_rtx : const0_rtx;
4548 case GEU:
4549 return equal || op1ltu ? const_true_rtx : const0_rtx;
4550 }
4551
4552 abort ();
4553 }
4554 \f
4555 /* Simplify CODE, an operation with result mode MODE and three operands,
4556 OP0, OP1, and OP2. OP0_MODE was the mode of OP0 before it became
4557 a constant. Return 0 if no simplification is possible. */
4558
4559 rtx
4560 simplify_ternary_operation (code, mode, op0_mode, op0, op1, op2)
4561 enum rtx_code code;
4562 enum machine_mode mode, op0_mode;
4563 rtx op0, op1, op2;
4564 {
4565 int width = GET_MODE_BITSIZE (mode);
4566
4567 /* VOIDmode means "infinite" precision. */
4568 if (width == 0)
4569 width = HOST_BITS_PER_WIDE_INT;
4570
4571 switch (code)
4572 {
4573 case SIGN_EXTRACT:
4574 case ZERO_EXTRACT:
4575 if (GET_CODE (op0) == CONST_INT
4576 && GET_CODE (op1) == CONST_INT
4577 && GET_CODE (op2) == CONST_INT
4578 && INTVAL (op1) + INTVAL (op2) <= GET_MODE_BITSIZE (op0_mode)
4579 && width <= HOST_BITS_PER_WIDE_INT)
4580 {
4581 /* Extracting a bit-field from a constant */
4582 HOST_WIDE_INT val = INTVAL (op0);
4583
4584 #if BITS_BIG_ENDIAN
4585 val >>= (GET_MODE_BITSIZE (op0_mode) - INTVAL (op2) - INTVAL (op1));
4586 #else
4587 val >>= INTVAL (op2);
4588 #endif
4589 if (HOST_BITS_PER_WIDE_INT != INTVAL (op1))
4590 {
4591 /* First zero-extend. */
4592 val &= ((HOST_WIDE_INT) 1 << INTVAL (op1)) - 1;
4593 /* If desired, propagate sign bit. */
4594 if (code == SIGN_EXTRACT
4595 && (val & ((HOST_WIDE_INT) 1 << (INTVAL (op1) - 1))))
4596 val |= ~ (((HOST_WIDE_INT) 1 << INTVAL (op1)) - 1);
4597 }
4598
4599 /* Clear the bits that don't belong in our mode,
4600 unless they and our sign bit are all one.
4601 So we get either a reasonable negative value or a reasonable
4602 unsigned value for this mode. */
4603 if (width < HOST_BITS_PER_WIDE_INT
4604 && ((val & ((HOST_WIDE_INT) (-1) << (width - 1)))
4605 != ((HOST_WIDE_INT) (-1) << (width - 1))))
4606 val &= ((HOST_WIDE_INT) 1 << width) - 1;
4607
4608 return GEN_INT (val);
4609 }
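/* Sketch of the extraction above, using little-endian bit numbering
   (hypothetical helper): pulling 3 bits at position 2 out of 0x1c
   yields 7 for ZERO_EXTRACT and -1 for SIGN_EXTRACT, since the field
   is all ones.  */
#if 0
static long
model_extract (unsigned long v, int len, int pos, int sign_p)
{
  unsigned long field = (v >> pos) & (((unsigned long) 1 << len) - 1);

  if (sign_p && (field & ((unsigned long) 1 << (len - 1))))
    return (long) (field | ~((((unsigned long) 1 << len) - 1)));
  return (long) field;
}
#endif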
4610 break;
4611
4612 case IF_THEN_ELSE:
4613 if (GET_CODE (op0) == CONST_INT)
4614 return op0 != const0_rtx ? op1 : op2;
4615 break;
4616
4617 default:
4618 abort ();
4619 }
4620
4621 return 0;
4622 }
4623 \f
4624 /* If X is a nontrivial arithmetic operation on an argument
4625 for which a constant value can be determined, return
4626 the result of operating on that value, as a constant.
4627 Otherwise, return X, possibly with one or more operands
4628 modified by recursive calls to this function.
4629
4630 If X is a register whose contents are known, we do NOT
4631 return those contents here. equiv_constant is called to
4632 perform that task.
4633
4634 INSN is the insn that we may be modifying. If it is 0, make a copy
4635 of X before modifying it. */
4636
4637 static rtx
4638 fold_rtx (x, insn)
4639 rtx x;
4640 rtx insn;
4641 {
4642 register enum rtx_code code;
4643 register enum machine_mode mode;
4644 register char *fmt;
4645 register int i;
4646 rtx new = 0;
4647 int copied = 0;
4648 int must_swap = 0;
4649
4650 /* Folded equivalents of first two operands of X. */
4651 rtx folded_arg0;
4652 rtx folded_arg1;
4653
4654 /* Constant equivalents of first three operands of X;
4655 0 when no such equivalent is known. */
4656 rtx const_arg0;
4657 rtx const_arg1;
4658 rtx const_arg2;
4659
4660 /* The mode of the first operand of X. We need this for sign and zero
4661 extends. */
4662 enum machine_mode mode_arg0;
4663
4664 if (x == 0)
4665 return x;
4666
4667 mode = GET_MODE (x);
4668 code = GET_CODE (x);
4669 switch (code)
4670 {
4671 case CONST:
4672 case CONST_INT:
4673 case CONST_DOUBLE:
4674 case SYMBOL_REF:
4675 case LABEL_REF:
4676 case REG:
4677 /* No use simplifying an EXPR_LIST
4678 since they are used only for lists of args
4679 in a function call's REG_EQUAL note. */
4680 case EXPR_LIST:
4681 return x;
4682
4683 #ifdef HAVE_cc0
4684 case CC0:
4685 return prev_insn_cc0;
4686 #endif
4687
4688 case PC:
4689 /* If the next insn is a CODE_LABEL followed by a jump table,
4690 PC's value is a LABEL_REF pointing to that label. That
4691 lets us fold switch statements on the Vax. */
4692 if (insn && GET_CODE (insn) == JUMP_INSN)
4693 {
4694 rtx next = next_nonnote_insn (insn);
4695
4696 if (next && GET_CODE (next) == CODE_LABEL
4697 && NEXT_INSN (next) != 0
4698 && GET_CODE (NEXT_INSN (next)) == JUMP_INSN
4699 && (GET_CODE (PATTERN (NEXT_INSN (next))) == ADDR_VEC
4700 || GET_CODE (PATTERN (NEXT_INSN (next))) == ADDR_DIFF_VEC))
4701 return gen_rtx (LABEL_REF, Pmode, next);
4702 }
4703 break;
4704
4705 case SUBREG:
4706 /* See if we previously assigned a constant value to this SUBREG. */
4707 if ((new = lookup_as_function (x, CONST_INT)) != 0
4708 || (new = lookup_as_function (x, CONST_DOUBLE)) != 0)
4709 return new;
4710
4711 /* If this is a paradoxical SUBREG, we have no idea what value the
4712 extra bits would have. However, if the operand is equivalent
4713 to a SUBREG whose operand is the same as our mode, and all the
4714 modes are within a word, we can just use the inner operand
4715 because these SUBREGs just say how to treat the register.
4716
4717 Similarly if we find an integer constant. */
4718
4719 if (GET_MODE_SIZE (mode) > GET_MODE_SIZE (GET_MODE (SUBREG_REG (x))))
4720 {
4721 enum machine_mode imode = GET_MODE (SUBREG_REG (x));
4722 struct table_elt *elt;
4723
4724 if (GET_MODE_SIZE (mode) <= UNITS_PER_WORD
4725 && GET_MODE_SIZE (imode) <= UNITS_PER_WORD
4726 && (elt = lookup (SUBREG_REG (x), HASH (SUBREG_REG (x), imode),
4727 imode)) != 0)
4728 for (elt = elt->first_same_value;
4729 elt; elt = elt->next_same_value)
4730 {
4731 if (CONSTANT_P (elt->exp)
4732 && GET_MODE (elt->exp) == VOIDmode)
4733 return elt->exp;
4734
4735 if (GET_CODE (elt->exp) == SUBREG
4736 && GET_MODE (SUBREG_REG (elt->exp)) == mode
4737 && exp_equiv_p (elt->exp, elt->exp, 1, 0))
4738 return copy_rtx (SUBREG_REG (elt->exp));
4739 }
4740
4741 return x;
4742 }
4743
4744 /* Fold SUBREG_REG. If it changed, see if we can simplify the SUBREG.
4745 We might be able to if the SUBREG is extracting a single word in an
4746 integral mode or extracting the low part. */
4747
4748 folded_arg0 = fold_rtx (SUBREG_REG (x), insn);
4749 const_arg0 = equiv_constant (folded_arg0);
4750 if (const_arg0)
4751 folded_arg0 = const_arg0;
4752
4753 if (folded_arg0 != SUBREG_REG (x))
4754 {
4755 new = 0;
4756
4757 if (GET_MODE_CLASS (mode) == MODE_INT
4758 && GET_MODE_SIZE (mode) == UNITS_PER_WORD
4759 && GET_MODE (SUBREG_REG (x)) != VOIDmode)
4760 new = operand_subword (folded_arg0, SUBREG_WORD (x), 0,
4761 GET_MODE (SUBREG_REG (x)));
4762 if (new == 0 && subreg_lowpart_p (x))
4763 new = gen_lowpart_if_possible (mode, folded_arg0);
4764 if (new)
4765 return new;
4766 }
4767
4768 /* If this is a narrowing SUBREG and our operand is a REG, see if
4769 we can find an equivalence for REG that is an arithmetic operation
4770 in a wider mode where both operands are paradoxical SUBREGs
4771 from objects of our result mode. In that case, we couldn't report
4772 an equivalent value for that operation, since we don't know what the
4773 extra bits will be. But we can find an equivalence for this SUBREG
4774 by folding that operation in the narrow mode. This allows us to
4775 fold arithmetic in narrow modes when the machine only supports
4776 word-sized arithmetic.
4777
4778 Also look for a case where we have a SUBREG whose operand is the
4779 same as our result. If both modes are smaller than a word, we
4780 are simply interpreting a register in different modes and we
4781 can use the inner value. */
4782
4783 if (GET_CODE (folded_arg0) == REG
4784 && GET_MODE_SIZE (mode) < GET_MODE_SIZE (GET_MODE (folded_arg0))
4785 && subreg_lowpart_p (x))
4786 {
4787 struct table_elt *elt;
4788
4789 /* We can use HASH here since we know that canon_hash won't be
4790 called. */
4791 elt = lookup (folded_arg0,
4792 HASH (folded_arg0, GET_MODE (folded_arg0)),
4793 GET_MODE (folded_arg0));
4794
4795 if (elt)
4796 elt = elt->first_same_value;
4797
4798 for (; elt; elt = elt->next_same_value)
4799 {
4800 enum rtx_code eltcode = GET_CODE (elt->exp);
4801
4802 /* Just check for unary and binary operations. */
4803 if (GET_RTX_CLASS (GET_CODE (elt->exp)) == '1'
4804 && GET_CODE (elt->exp) != SIGN_EXTEND
4805 && GET_CODE (elt->exp) != ZERO_EXTEND
4806 && GET_CODE (XEXP (elt->exp, 0)) == SUBREG
4807 && GET_MODE (SUBREG_REG (XEXP (elt->exp, 0))) == mode)
4808 {
4809 rtx op0 = SUBREG_REG (XEXP (elt->exp, 0));
4810
4811 if (GET_CODE (op0) != REG && ! CONSTANT_P (op0))
4812 op0 = fold_rtx (op0, NULL_RTX);
4813
4814 op0 = equiv_constant (op0);
4815 if (op0)
4816 new = simplify_unary_operation (GET_CODE (elt->exp), mode,
4817 op0, mode);
4818 }
4819 else if ((GET_RTX_CLASS (GET_CODE (elt->exp)) == '2'
4820 || GET_RTX_CLASS (GET_CODE (elt->exp)) == 'c')
4821 && eltcode != DIV && eltcode != MOD
4822 && eltcode != UDIV && eltcode != UMOD
4823 && eltcode != ASHIFTRT && eltcode != LSHIFTRT
4824 && eltcode != ROTATE && eltcode != ROTATERT
4825 && ((GET_CODE (XEXP (elt->exp, 0)) == SUBREG
4826 && (GET_MODE (SUBREG_REG (XEXP (elt->exp, 0)))
4827 == mode))
4828 || CONSTANT_P (XEXP (elt->exp, 0)))
4829 && ((GET_CODE (XEXP (elt->exp, 1)) == SUBREG
4830 && (GET_MODE (SUBREG_REG (XEXP (elt->exp, 1)))
4831 == mode))
4832 || CONSTANT_P (XEXP (elt->exp, 1))))
4833 {
4834 rtx op0 = gen_lowpart_common (mode, XEXP (elt->exp, 0));
4835 rtx op1 = gen_lowpart_common (mode, XEXP (elt->exp, 1));
4836
4837 if (op0 && GET_CODE (op0) != REG && ! CONSTANT_P (op0))
4838 op0 = fold_rtx (op0, NULL_RTX);
4839
4840 if (op0)
4841 op0 = equiv_constant (op0);
4842
4843 if (op1 && GET_CODE (op1) != REG && ! CONSTANT_P (op1))
4844 op1 = fold_rtx (op1, NULL_RTX);
4845
4846 if (op1)
4847 op1 = equiv_constant (op1);
4848
4849 /* If we are looking for the low SImode part of
4850 (ashift:DI c (const_int 32)), it doesn't work
4851 to compute that in SImode, because a 32-bit shift
4852 in SImode is unpredictable. We know the value is 0. */
4853 if (op0 && op1
4854 && GET_CODE (elt->exp) == ASHIFT
4855 && GET_CODE (op1) == CONST_INT
4856 && INTVAL (op1) >= GET_MODE_BITSIZE (mode))
4857 {
4858 if (INTVAL (op1) < GET_MODE_BITSIZE (GET_MODE (elt->exp)))
4859
4860 /* If the count fits in the inner mode's width,
4861 but exceeds the outer mode's width,
4862 the value will get truncated to 0
4863 by the subreg. */
4864 new = const0_rtx;
4865 else
4866 /* If the count exceeds even the inner mode's width,
4867 don't fold this expression. */
4868 new = 0;
4869 }
4870 else if (op0 && op1)
4871 new = simplify_binary_operation (GET_CODE (elt->exp), mode,
4872 op0, op1);
4873 }
4874
4875 else if (GET_CODE (elt->exp) == SUBREG
4876 && GET_MODE (SUBREG_REG (elt->exp)) == mode
4877 && (GET_MODE_SIZE (GET_MODE (folded_arg0))
4878 <= UNITS_PER_WORD)
4879 && exp_equiv_p (elt->exp, elt->exp, 1, 0))
4880 new = copy_rtx (SUBREG_REG (elt->exp));
4881
4882 if (new)
4883 return new;
4884 }
4885 }
4886
4887 return x;
4888
4889 case NOT:
4890 case NEG:
4891 /* If we have (NOT Y), see if Y is known to be (NOT Z).
4892 If so, (NOT Y) simplifies to Z. Similarly for NEG. */
4893 new = lookup_as_function (XEXP (x, 0), code);
4894 if (new)
4895 return fold_rtx (copy_rtx (XEXP (new, 0)), insn);
4896 break;
4897
4898 case MEM:
4899 /* If we are not actually processing an insn, don't try to find the
4900 best address. Not only don't we care, but we could modify the
4901 MEM in an invalid way since we have no insn to validate against. */
4902 if (insn != 0)
4903 find_best_addr (insn, &XEXP (x, 0));
4904
4905 {
4906 /* Even if we don't fold in the insn itself,
4907 we can safely do so here, in hopes of getting a constant. */
4908 rtx addr = fold_rtx (XEXP (x, 0), NULL_RTX);
4909 rtx base = 0;
4910 HOST_WIDE_INT offset = 0;
4911
4912 if (GET_CODE (addr) == REG
4913 && REGNO_QTY_VALID_P (REGNO (addr))
4914 && GET_MODE (addr) == qty_mode[reg_qty[REGNO (addr)]]
4915 && qty_const[reg_qty[REGNO (addr)]] != 0)
4916 addr = qty_const[reg_qty[REGNO (addr)]];
4917
4918 /* If address is constant, split it into a base and integer offset. */
4919 if (GET_CODE (addr) == SYMBOL_REF || GET_CODE (addr) == LABEL_REF)
4920 base = addr;
4921 else if (GET_CODE (addr) == CONST && GET_CODE (XEXP (addr, 0)) == PLUS
4922 && GET_CODE (XEXP (XEXP (addr, 0), 1)) == CONST_INT)
4923 {
4924 base = XEXP (XEXP (addr, 0), 0);
4925 offset = INTVAL (XEXP (XEXP (addr, 0), 1));
4926 }
4927 else if (GET_CODE (addr) == LO_SUM
4928 && GET_CODE (XEXP (addr, 1)) == SYMBOL_REF)
4929 base = XEXP (addr, 1);
4930
4931 /* If this is a constant pool reference, we can fold it into its
4932 constant to allow better value tracking. */
4933 if (base && GET_CODE (base) == SYMBOL_REF
4934 && CONSTANT_POOL_ADDRESS_P (base))
4935 {
4936 rtx constant = get_pool_constant (base);
4937 enum machine_mode const_mode = get_pool_mode (base);
4938 rtx new;
4939
4940 if (CONSTANT_P (constant) && GET_CODE (constant) != CONST_INT)
4941 constant_pool_entries_cost = COST (constant);
4942
4943 /* If we are loading the full constant, we have an equivalence. */
4944 if (offset == 0 && mode == const_mode)
4945 return constant;
4946
4947 /* If this actually isn't a constant (weird!), we can't do
4948 anything. Otherwise, handle the two most common cases:
4949 extracting a word from a multi-word constant, and extracting
4950 the low-order bits. Other cases don't seem common enough to
4951 worry about. */
4952 if (! CONSTANT_P (constant))
4953 return x;
4954
4955 if (GET_MODE_CLASS (mode) == MODE_INT
4956 && GET_MODE_SIZE (mode) == UNITS_PER_WORD
4957 && offset % UNITS_PER_WORD == 0
4958 && (new = operand_subword (constant,
4959 offset / UNITS_PER_WORD,
4960 0, const_mode)) != 0)
4961 return new;
4962
4963 if (((BYTES_BIG_ENDIAN
4964 && offset == GET_MODE_SIZE (GET_MODE (constant)) - 1)
4965 || (! BYTES_BIG_ENDIAN && offset == 0))
4966 && (new = gen_lowpart_if_possible (mode, constant)) != 0)
4967 return new;
4968 }
4969
4970 /* If this is a reference to a label at a known position in a jump
4971 table, we also know its value. */
4972 if (base && GET_CODE (base) == LABEL_REF)
4973 {
4974 rtx label = XEXP (base, 0);
4975 rtx table_insn = NEXT_INSN (label);
4976
4977 if (table_insn && GET_CODE (table_insn) == JUMP_INSN
4978 && GET_CODE (PATTERN (table_insn)) == ADDR_VEC)
4979 {
4980 rtx table = PATTERN (table_insn);
4981
4982 if (offset >= 0
4983 && (offset / GET_MODE_SIZE (GET_MODE (table))
4984 < XVECLEN (table, 0)))
4985 return XVECEXP (table, 0,
4986 offset / GET_MODE_SIZE (GET_MODE (table)));
4987 }
4988 if (table_insn && GET_CODE (table_insn) == JUMP_INSN
4989 && GET_CODE (PATTERN (table_insn)) == ADDR_DIFF_VEC)
4990 {
4991 rtx table = PATTERN (table_insn);
4992
4993 if (offset >= 0
4994 && (offset / GET_MODE_SIZE (GET_MODE (table))
4995 < XVECLEN (table, 1)))
4996 {
4997 offset /= GET_MODE_SIZE (GET_MODE (table));
4998 new = gen_rtx (MINUS, Pmode, XVECEXP (table, 1, offset),
4999 XEXP (table, 0));
5000
5001 if (GET_MODE (table) != Pmode)
5002 new = gen_rtx (TRUNCATE, GET_MODE (table), new);
5003
5004 /* Indicate this is a constant. This isn't a
5005 valid form of CONST, but it will only be used
5006 to fold the next insns and then discarded, so
5007 it should be safe. */
5008 return gen_rtx (CONST, GET_MODE (new), new);
5009 }
5010 }
5011 }
5012
5013 return x;
5014 }
5015 }
5016
5017 const_arg0 = 0;
5018 const_arg1 = 0;
5019 const_arg2 = 0;
5020 mode_arg0 = VOIDmode;
5021
5022 /* Try folding our operands.
5023 Then see which ones have constant values known. */
5024
5025 fmt = GET_RTX_FORMAT (code);
5026 for (i = GET_RTX_LENGTH (code) - 1; i >= 0; i--)
5027 if (fmt[i] == 'e')
5028 {
5029 rtx arg = XEXP (x, i);
5030 rtx folded_arg = arg, const_arg = 0;
5031 enum machine_mode mode_arg = GET_MODE (arg);
5032 rtx cheap_arg, expensive_arg;
5033 rtx replacements[2];
5034 int j;
5035
5036 /* Most arguments are cheap, so handle them specially. */
5037 switch (GET_CODE (arg))
5038 {
5039 case REG:
5040 /* This is the same as calling equiv_constant; it is duplicated
5041 here for speed. */
5042 if (REGNO_QTY_VALID_P (REGNO (arg))
5043 && qty_const[reg_qty[REGNO (arg)]] != 0
5044 && GET_CODE (qty_const[reg_qty[REGNO (arg)]]) != REG
5045 && GET_CODE (qty_const[reg_qty[REGNO (arg)]]) != PLUS)
5046 const_arg
5047 = gen_lowpart_if_possible (GET_MODE (arg),
5048 qty_const[reg_qty[REGNO (arg)]]);
5049 break;
5050
5051 case CONST:
5052 case CONST_INT:
5053 case SYMBOL_REF:
5054 case LABEL_REF:
5055 case CONST_DOUBLE:
5056 const_arg = arg;
5057 break;
5058
5059 #ifdef HAVE_cc0
5060 case CC0:
5061 folded_arg = prev_insn_cc0;
5062 mode_arg = prev_insn_cc0_mode;
5063 const_arg = equiv_constant (folded_arg);
5064 break;
5065 #endif
5066
5067 default:
5068 folded_arg = fold_rtx (arg, insn);
5069 const_arg = equiv_constant (folded_arg);
5070 }
5071
5072 /* For the first three operands, see if the operand
5073 is constant or equivalent to a constant. */
5074 switch (i)
5075 {
5076 case 0:
5077 folded_arg0 = folded_arg;
5078 const_arg0 = const_arg;
5079 mode_arg0 = mode_arg;
5080 break;
5081 case 1:
5082 folded_arg1 = folded_arg;
5083 const_arg1 = const_arg;
5084 break;
5085 case 2:
5086 const_arg2 = const_arg;
5087 break;
5088 }
5089
5090 /* Pick the least expensive of the folded argument and an
5091 equivalent constant argument. */
5092 if (const_arg == 0 || const_arg == folded_arg
5093 || COST (const_arg) > COST (folded_arg))
5094 cheap_arg = folded_arg, expensive_arg = const_arg;
5095 else
5096 cheap_arg = const_arg, expensive_arg = folded_arg;
5097
5098 /* Try to replace the operand with the cheapest of the two
5099 possibilities. If it doesn't work and this is either of the first
5100 two operands of a commutative operation, try swapping them.
5101 If THAT fails, try the more expensive one, provided it is cheaper
5102 than what is already there. */
5103
5104 if (cheap_arg == XEXP (x, i))
5105 continue;
5106
5107 if (insn == 0 && ! copied)
5108 {
5109 x = copy_rtx (x);
5110 copied = 1;
5111 }
5112
5113 replacements[0] = cheap_arg, replacements[1] = expensive_arg;
5114 for (j = 0;
5115 j < 2 && replacements[j]
5116 && COST (replacements[j]) < COST (XEXP (x, i));
5117 j++)
5118 {
5119 if (validate_change (insn, &XEXP (x, i), replacements[j], 0))
5120 break;
5121
5122 if (code == NE || code == EQ || GET_RTX_CLASS (code) == 'c')
5123 {
5124 validate_change (insn, &XEXP (x, i), XEXP (x, 1 - i), 1);
5125 validate_change (insn, &XEXP (x, 1 - i), replacements[j], 1);
5126
5127 if (apply_change_group ())
5128 {
5129 /* Swap them back to be invalid so that this loop can
5130 continue and flag them to be swapped back later. */
5131 rtx tem;
5132
5133 tem = XEXP (x, 0); XEXP (x, 0) = XEXP (x, 1);
5134 XEXP (x, 1) = tem;
5135 must_swap = 1;
5136 break;
5137 }
5138 }
5139 }
5140 }
5141
5142 else if (fmt[i] == 'E')
5143 /* Don't try to fold inside of a vector of expressions.
5144 Doing nothing is harmless. */
5145 ;
5146
5147 /* If a commutative operation, place a constant integer as the second
5148 operand unless the first operand is also a constant integer. Otherwise,
5149 place any constant second unless the first operand is also a constant. */
5150
5151 if (code == EQ || code == NE || GET_RTX_CLASS (code) == 'c')
5152 {
5153 if (must_swap || (const_arg0
5154 && (const_arg1 == 0
5155 || (GET_CODE (const_arg0) == CONST_INT
5156 && GET_CODE (const_arg1) != CONST_INT))))
5157 {
5158 register rtx tem = XEXP (x, 0);
5159
5160 if (insn == 0 && ! copied)
5161 {
5162 x = copy_rtx (x);
5163 copied = 1;
5164 }
5165
5166 validate_change (insn, &XEXP (x, 0), XEXP (x, 1), 1);
5167 validate_change (insn, &XEXP (x, 1), tem, 1);
5168 if (apply_change_group ())
5169 {
5170 tem = const_arg0, const_arg0 = const_arg1, const_arg1 = tem;
5171 tem = folded_arg0, folded_arg0 = folded_arg1, folded_arg1 = tem;
5172 }
5173 }
5174 }
5175
5176 /* If X is an arithmetic operation, see if we can simplify it. */
5177
5178 switch (GET_RTX_CLASS (code))
5179 {
5180 case '1':
5181 {
5182 int is_const = 0;
5183
5184 /* We can't simplify extension ops unless we know the
5185 original mode. */
5186 if ((code == ZERO_EXTEND || code == SIGN_EXTEND)
5187 && mode_arg0 == VOIDmode)
5188 break;
5189
5190 /* If we had a CONST, strip it off and put it back later if we
5191 fold. */
5192 if (const_arg0 != 0 && GET_CODE (const_arg0) == CONST)
5193 is_const = 1, const_arg0 = XEXP (const_arg0, 0);
5194
5195 new = simplify_unary_operation (code, mode,
5196 const_arg0 ? const_arg0 : folded_arg0,
5197 mode_arg0);
5198 if (new != 0 && is_const)
5199 new = gen_rtx (CONST, mode, new);
5200 }
5201 break;
5202
5203 case '<':
5204 /* See what items are actually being compared and set FOLDED_ARG[01]
5205 to those values and CODE to the actual comparison code. If any are
5206 constant, set CONST_ARG0 and CONST_ARG1 appropriately. We needn't
5207 do anything if both operands are already known to be constant. */
5208
5209 if (const_arg0 == 0 || const_arg1 == 0)
5210 {
5211 struct table_elt *p0, *p1;
5212 rtx true = const_true_rtx, false = const0_rtx;
5213 enum machine_mode mode_arg1;
5214
5215 #ifdef FLOAT_STORE_FLAG_VALUE
5216 if (GET_MODE_CLASS (mode) == MODE_FLOAT)
5217 {
5218 true = CONST_DOUBLE_FROM_REAL_VALUE (FLOAT_STORE_FLAG_VALUE,
5219 mode);
5220 false = CONST0_RTX (mode);
5221 }
5222 #endif
5223
5224 code = find_comparison_args (code, &folded_arg0, &folded_arg1,
5225 &mode_arg0, &mode_arg1);
5226 const_arg0 = equiv_constant (folded_arg0);
5227 const_arg1 = equiv_constant (folded_arg1);
5228
5229 /* If the mode is VOIDmode or a MODE_CC mode, we don't know
5230 what kinds of things are being compared, so we can't do
5231 anything with this comparison. */
5232
5233 if (mode_arg0 == VOIDmode || GET_MODE_CLASS (mode_arg0) == MODE_CC)
5234 break;
5235
5236 /* If we do not now have two constants being compared, see if we
5237 can nevertheless deduce some things about the comparison. */
5238 if (const_arg0 == 0 || const_arg1 == 0)
5239 {
5240 /* Is FOLDED_ARG0 frame-pointer plus a constant? Or non-explicit
5241 constant? These aren't zero, but we don't know their sign. */
5242 if (const_arg1 == const0_rtx
5243 && (NONZERO_BASE_PLUS_P (folded_arg0)
5244 #if 0 /* Sad to say, on sysvr4, #pragma weak can make a symbol address
5245 come out as 0. */
5246 || GET_CODE (folded_arg0) == SYMBOL_REF
5247 #endif
5248 || GET_CODE (folded_arg0) == LABEL_REF
5249 || GET_CODE (folded_arg0) == CONST))
5250 {
5251 if (code == EQ)
5252 return false;
5253 else if (code == NE)
5254 return true;
5255 }
5256
5257 /* See if the two operands are the same. We don't do this
5258 for IEEE floating-point since we can't assume x == x
5259 since x might be a NaN. */
5260
5261 if ((TARGET_FLOAT_FORMAT != IEEE_FLOAT_FORMAT
5262 || ! FLOAT_MODE_P (mode_arg0) || flag_fast_math)
5263 && (folded_arg0 == folded_arg1
5264 || (GET_CODE (folded_arg0) == REG
5265 && GET_CODE (folded_arg1) == REG
5266 && (reg_qty[REGNO (folded_arg0)]
5267 == reg_qty[REGNO (folded_arg1)]))
5268 || ((p0 = lookup (folded_arg0,
5269 (safe_hash (folded_arg0, mode_arg0)
5270 % NBUCKETS), mode_arg0))
5271 && (p1 = lookup (folded_arg1,
5272 (safe_hash (folded_arg1, mode_arg0)
5273 % NBUCKETS), mode_arg0))
5274 && p0->first_same_value == p1->first_same_value)))
5275 return ((code == EQ || code == LE || code == GE
5276 || code == LEU || code == GEU)
5277 ? true : false);
5278
5279 /* If FOLDED_ARG0 is a register, see if the comparison we are
5280 doing now is either the same as we did before or the reverse
5281 (we only check the reverse if not floating-point). */
5282 else if (GET_CODE (folded_arg0) == REG)
5283 {
5284 int qty = reg_qty[REGNO (folded_arg0)];
5285
5286 if (REGNO_QTY_VALID_P (REGNO (folded_arg0))
5287 && (comparison_dominates_p (qty_comparison_code[qty], code)
5288 || (comparison_dominates_p (qty_comparison_code[qty],
5289 reverse_condition (code))
5290 && ! FLOAT_MODE_P (mode_arg0)))
5291 && (rtx_equal_p (qty_comparison_const[qty], folded_arg1)
5292 || (const_arg1
5293 && rtx_equal_p (qty_comparison_const[qty],
5294 const_arg1))
5295 || (GET_CODE (folded_arg1) == REG
5296 && (reg_qty[REGNO (folded_arg1)]
5297 == qty_comparison_qty[qty]))))
5298 return (comparison_dominates_p (qty_comparison_code[qty],
5299 code)
5300 ? true : false);
5301 }
5302 }
5303 }
5304
5305 /* If we are comparing against zero, see if the first operand is
5306 equivalent to an IOR with a constant. If so, we may be able to
5307 determine the result of this comparison. */
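/* For instance, if FOLDED_ARG0 is known equivalent to
   (ior X (const_int 5)), it cannot be zero, so EQ folds to false and
   NE to true; if the constant also has the sign bit set, the value is
   known to be negative and LT/LE fold to true as well.  */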
5308
5309 if (const_arg1 == const0_rtx)
5310 {
5311 rtx y = lookup_as_function (folded_arg0, IOR);
5312 rtx inner_const;
5313
5314 if (y != 0
5315 && (inner_const = equiv_constant (XEXP (y, 1))) != 0
5316 && GET_CODE (inner_const) == CONST_INT
5317 && INTVAL (inner_const) != 0)
5318 {
5319 int sign_bitnum = GET_MODE_BITSIZE (mode_arg0) - 1;
5320 int has_sign = (HOST_BITS_PER_WIDE_INT >= sign_bitnum
5321 && (INTVAL (inner_const)
5322 & ((HOST_WIDE_INT) 1 << sign_bitnum)));
5323 rtx true = const_true_rtx, false = const0_rtx;
5324
5325 #ifdef FLOAT_STORE_FLAG_VALUE
5326 if (GET_MODE_CLASS (mode) == MODE_FLOAT)
5327 {
5328 true = CONST_DOUBLE_FROM_REAL_VALUE (FLOAT_STORE_FLAG_VALUE,
5329 mode);
5330 false = CONST0_RTX (mode);
5331 }
5332 #endif
5333
5334 switch (code)
5335 {
5336 case EQ:
5337 return false;
5338 case NE:
5339 return true;
5340 case LT: case LE:
5341 if (has_sign)
5342 return true;
5343 break;
5344 case GT: case GE:
5345 if (has_sign)
5346 return false;
5347 break;
5348 }
5349 }
5350 }
5351
5352 new = simplify_relational_operation (code, mode_arg0,
5353 const_arg0 ? const_arg0 : folded_arg0,
5354 const_arg1 ? const_arg1 : folded_arg1);
5355 #ifdef FLOAT_STORE_FLAG_VALUE
5356 if (new != 0 && GET_MODE_CLASS (mode) == MODE_FLOAT)
5357 new = ((new == const0_rtx) ? CONST0_RTX (mode)
5358 : CONST_DOUBLE_FROM_REAL_VALUE (FLOAT_STORE_FLAG_VALUE, mode));
5359 #endif
5360 break;
5361
5362 case '2':
5363 case 'c':
5364 switch (code)
5365 {
5366 case PLUS:
5367 /* If the second operand is a LABEL_REF, see if the first is a MINUS
5368 with that LABEL_REF as its second operand. If so, the result is
5369 the first operand of that MINUS. This handles switches with an
5370 ADDR_DIFF_VEC table. */
5371 if (const_arg1 && GET_CODE (const_arg1) == LABEL_REF)
5372 {
5373 rtx y = lookup_as_function (folded_arg0, MINUS);
5374
5375 if (y != 0 && GET_CODE (XEXP (y, 1)) == LABEL_REF
5376 && XEXP (XEXP (y, 1), 0) == XEXP (const_arg1, 0))
5377 return XEXP (y, 0);
5378
5379 /* Now try for a CONST of a MINUS like the above. */
5380 if ((y = lookup_as_function (folded_arg0, CONST)) != 0
5381 && GET_CODE (XEXP (y, 0)) == MINUS
5382 && GET_CODE (XEXP (XEXP (y, 0), 1)) == LABEL_REF
5383 && XEXP (XEXP (XEXP (y, 0), 1), 0) == XEXP (const_arg1, 0))
5384 return XEXP (XEXP (y, 0), 0);
5385 }
5386
5387 /* If the second operand is a register equivalent to a negative
5388 CONST_INT, see if we can find a register equivalent to the
5389 positive constant. Make a MINUS if so. Don't do this for
5390 a negative constant since we might then alternate between
5391 choosing positive and negative constants. Having the positive
5392 constant previously used is the more common case. */
5393 if (const_arg1 && GET_CODE (const_arg1) == CONST_INT
5394 && INTVAL (const_arg1) < 0 && GET_CODE (folded_arg1) == REG)
5395 {
5396 rtx new_const = GEN_INT (- INTVAL (const_arg1));
5397 struct table_elt *p
5398 = lookup (new_const, safe_hash (new_const, mode) % NBUCKETS,
5399 mode);
5400
5401 if (p)
5402 for (p = p->first_same_value; p; p = p->next_same_value)
5403 if (GET_CODE (p->exp) == REG)
5404 return cse_gen_binary (MINUS, mode, folded_arg0,
5405 canon_reg (p->exp, NULL_RTX));
5406 }
5407 goto from_plus;
5408
5409 case MINUS:
5410 /* If we have (MINUS Y C), see if Y is known to be (PLUS Z C2).
5411 If so, produce (PLUS Z C2-C). */
5412 if (const_arg1 != 0 && GET_CODE (const_arg1) == CONST_INT)
5413 {
5414 rtx y = lookup_as_function (XEXP (x, 0), PLUS);
5415 if (y && GET_CODE (XEXP (y, 1)) == CONST_INT)
5416 return fold_rtx (plus_constant (copy_rtx (y),
5417 -INTVAL (const_arg1)),
5418 NULL_RTX);
5419 }
5420
5421 /* ... fall through ... */
5422
5423 from_plus:
5424 case SMIN: case SMAX: case UMIN: case UMAX:
5425 case IOR: case AND: case XOR:
5426 case MULT: case DIV: case UDIV:
5427 case ASHIFT: case LSHIFTRT: case ASHIFTRT:
5428 /* If we have (<op> <reg> <const_int>) for an associative OP and REG
5429 is known to be of similar form, we may be able to replace the
5430 operation with a combined operation. This may eliminate the
5431 intermediate operation if every use is simplified in this way.
5432 Note that the similar optimization done by combine.c only works
5433 if the intermediate operation's result has only one reference. */
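/* For example, if FOLDED_ARG0 is known equivalent to
   (plus Z (const_int 4)) and X is (plus FOLDED_ARG0 (const_int 3)),
   the constants are composed with ASSOCIATE_CODE (PLUS here) and the
   whole expression is rewritten as (plus Z (const_int 7)).  */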
5434
5435 if (GET_CODE (folded_arg0) == REG
5436 && const_arg1 && GET_CODE (const_arg1) == CONST_INT)
5437 {
5438 int is_shift
5439 = (code == ASHIFT || code == ASHIFTRT || code == LSHIFTRT);
5440 rtx y = lookup_as_function (folded_arg0, code);
5441 rtx inner_const;
5442 enum rtx_code associate_code;
5443 rtx new_const;
5444
5445 if (y == 0
5446 || 0 == (inner_const
5447 = equiv_constant (fold_rtx (XEXP (y, 1), 0)))
5448 || GET_CODE (inner_const) != CONST_INT
5449 /* If we have compiled a statement like
5450 "if (x == (x & mask1))", and now are looking at
5451 "x & mask2", we will have a case where the first operand
5452 of Y is the same as our first operand. Unless we detect
5453 this case, an infinite loop will result. */
5454 || XEXP (y, 0) == folded_arg0)
5455 break;
5456
5457 /* Don't associate these operations if they are a PLUS with the
5458 same constant and it is a power of two. These might be doable
5459 with a pre- or post-increment. Similarly for two subtracts of
5460 identical powers of two with post-decrement. */
5461
5462 if (code == PLUS && INTVAL (const_arg1) == INTVAL (inner_const)
5463 && (0
5464 #if defined(HAVE_PRE_INCREMENT) || defined(HAVE_POST_INCREMENT)
5465 || exact_log2 (INTVAL (const_arg1)) >= 0
5466 #endif
5467 #if defined(HAVE_PRE_DECREMENT) || defined(HAVE_POST_DECREMENT)
5468 || exact_log2 (- INTVAL (const_arg1)) >= 0
5469 #endif
5470 ))
5471 break;
5472
5473 /* Compute the code used to compose the constants. For example,
5474 A/C1/C2 is A/(C1 * C2), so if CODE == DIV, we want MULT. */
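/* Illustrative sketch: A*C1*C2 composes with MULT into A*(C1*C2);
   (A >> C1) >> C2 composes with PLUS into A >> (C1+C2); and for the
   bitwise and min/max codes, e.g. A&C1&C2, the code composes with
   itself into A&(C1&C2).  */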
5475
5476 associate_code
5477 = (code == MULT || code == DIV || code == UDIV ? MULT
5478 : is_shift || code == PLUS || code == MINUS ? PLUS : code);
5479
5480 new_const = simplify_binary_operation (associate_code, mode,
5481 const_arg1, inner_const);
5482
5483 if (new_const == 0)
5484 break;
5485
5486 /* If we are associating shift operations, don't let this
5487 produce a shift of the size of the object or larger.
5488 This could occur when we follow a sign-extend by a right
5489 shift on a machine that does a sign-extend as a pair
5490 of shifts. */
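/* Illustrative sketch, assuming a 32-bit mode: composing
   (ashiftrt (ashiftrt X 16) 16) would yield a count of 32; for
   ASHIFTRT we clamp the count to 31, which still reproduces the
   sign bit, while any other shift code is left alone.  */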
5491
5492 if (is_shift && GET_CODE (new_const) == CONST_INT
5493 && INTVAL (new_const) >= GET_MODE_BITSIZE (mode))
5494 {
5495 /* As an exception, we can turn an ASHIFTRT of this
5496 form into a shift of the number of bits - 1. */
5497 if (code == ASHIFTRT)
5498 new_const = GEN_INT (GET_MODE_BITSIZE (mode) - 1);
5499 else
5500 break;
5501 }
5502
5503 y = copy_rtx (XEXP (y, 0));
5504
5505 /* If Y contains our first operand (the most common way this
5506 can happen is if Y is a MEM), we would go into an infinite
5507 loop if we tried to fold it. So don't in that case. */
5508
5509 if (! reg_mentioned_p (folded_arg0, y))
5510 y = fold_rtx (y, insn);
5511
5512 return cse_gen_binary (code, mode, y, new_const);
5513 }
5514 }
5515
5516 new = simplify_binary_operation (code, mode,
5517 const_arg0 ? const_arg0 : folded_arg0,
5518 const_arg1 ? const_arg1 : folded_arg1);
5519 break;
5520
5521 case 'o':
5522 /* (lo_sum (high X) X) is simply X. */
5523 if (code == LO_SUM && const_arg0 != 0
5524 && GET_CODE (const_arg0) == HIGH
5525 && rtx_equal_p (XEXP (const_arg0, 0), const_arg1))
5526 return const_arg1;
5527 break;
5528
5529 case '3':
5530 case 'b':
5531 new = simplify_ternary_operation (code, mode, mode_arg0,
5532 const_arg0 ? const_arg0 : folded_arg0,
5533 const_arg1 ? const_arg1 : folded_arg1,
5534 const_arg2 ? const_arg2 : XEXP (x, 2));
5535 break;
5536 }
5537
5538 return new ? new : x;
5539 }
5540 \f
5541 /* Return a constant value currently equivalent to X.
5542 Return 0 if we don't know one. */
5543
5544 static rtx
5545 equiv_constant (x)
5546 rtx x;
5547 {
5548 if (GET_CODE (x) == REG
5549 && REGNO_QTY_VALID_P (REGNO (x))
5550 && qty_const[reg_qty[REGNO (x)]])
5551 x = gen_lowpart_if_possible (GET_MODE (x), qty_const[reg_qty[REGNO (x)]]);
5552
5553 if (x != 0 && CONSTANT_P (x))
5554 return x;
5555
5556 /* If X is a MEM, try to fold it outside the context of any insn to see if
5557 it might be equivalent to a constant. That handles the case where it
5558 is a constant-pool reference. Then try to look it up in the hash table
5559 in case it is something whose value we have seen before. */
5560
5561 if (GET_CODE (x) == MEM)
5562 {
5563 struct table_elt *elt;
5564
5565 x = fold_rtx (x, NULL_RTX);
5566 if (CONSTANT_P (x))
5567 return x;
5568
5569 elt = lookup (x, safe_hash (x, GET_MODE (x)) % NBUCKETS, GET_MODE (x));
5570 if (elt == 0)
5571 return 0;
5572
5573 for (elt = elt->first_same_value; elt; elt = elt->next_same_value)
5574 if (elt->is_const && CONSTANT_P (elt->exp))
5575 return elt->exp;
5576 }
5577
5578 return 0;
5579 }
5580 \f
5581 /* Assuming that X is an rtx (e.g., MEM, REG or SUBREG) for a fixed-point
5582 number, return an rtx (MEM, SUBREG, or CONST_INT) that refers to the
5583 least-significant part of X.
5584 MODE specifies how big a part of X to return.
5585
5586 If the requested operation cannot be done, 0 is returned.
5587
5588 This is similar to gen_lowpart in emit-rtl.c. */
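/* Illustrative sketch, assuming 4-byte words: the QImode lowpart of an
   SImode MEM at address A is (mem:QI A) on a little-endian target but
   (mem:QI (plus A 3)) on a big-endian one, so the least significant
   byte is addressed either way.  */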
5589
5590 rtx
5591 gen_lowpart_if_possible (mode, x)
5592 enum machine_mode mode;
5593 register rtx x;
5594 {
5595 rtx result = gen_lowpart_common (mode, x);
5596
5597 if (result)
5598 return result;
5599 else if (GET_CODE (x) == MEM)
5600 {
5601 /* This is the only other case we handle. */
5602 register int offset = 0;
5603 rtx new;
5604
5605 #if WORDS_BIG_ENDIAN
5606 offset = (MAX (GET_MODE_SIZE (GET_MODE (x)), UNITS_PER_WORD)
5607 - MAX (GET_MODE_SIZE (mode), UNITS_PER_WORD));
5608 #endif
5609 #if BYTES_BIG_ENDIAN
5610 /* Adjust the address so that the address-after-the-data
5611 is unchanged. */
5612 offset -= (MIN (UNITS_PER_WORD, GET_MODE_SIZE (mode))
5613 - MIN (UNITS_PER_WORD, GET_MODE_SIZE (GET_MODE (x))));
5614 #endif
5615 new = gen_rtx (MEM, mode, plus_constant (XEXP (x, 0), offset));
5616 if (! memory_address_p (mode, XEXP (new, 0)))
5617 return 0;
5618 MEM_VOLATILE_P (new) = MEM_VOLATILE_P (x);
5619 RTX_UNCHANGING_P (new) = RTX_UNCHANGING_P (x);
5620 MEM_IN_STRUCT_P (new) = MEM_IN_STRUCT_P (x);
5621 return new;
5622 }
5623 else
5624 return 0;
5625 }
5626 \f
5627 /* Given INSN, a jump insn, TAKEN indicates if we are following the "taken"
5628 branch. It will be zero if not.
5629
5630 In certain cases, this can cause us to add an equivalence. For example,
5631 if we are following the taken case of
5632 if (i == 2)
5633 we can add the fact that `i' and `2' are now equivalent.
5634
5635 In any case, we can record that this comparison was passed. If the same
5636 comparison is seen later, we will know its value. */
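/* Illustrative sketch (hypothetical register numbers): following the
   taken arm of (set (pc) (if_then_else (eq (reg 5) (const_int 2))
   (label_ref L) (pc))) lets us record that (reg 5) and (const_int 2)
   are now equivalent.  */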
5637
5638 static void
5639 record_jump_equiv (insn, taken)
5640 rtx insn;
5641 int taken;
5642 {
5643 int cond_known_true;
5644 rtx op0, op1;
5645 enum machine_mode mode, mode0, mode1;
5646 int reversed_nonequality = 0;
5647 enum rtx_code code;
5648
5649 /* Ensure this is the right kind of insn. */
5650 if (! condjump_p (insn) || simplejump_p (insn))
5651 return;
5652
5653 /* See if this jump condition is known true or false. */
5654 if (taken)
5655 cond_known_true = (XEXP (SET_SRC (PATTERN (insn)), 2) == pc_rtx);
5656 else
5657 cond_known_true = (XEXP (SET_SRC (PATTERN (insn)), 1) == pc_rtx);
5658
5659 /* Get the type of comparison being done and the operands being compared.
5660 If we had to reverse a non-equality condition, record that fact so we
5661 know that it isn't valid for floating-point. */
5662 code = GET_CODE (XEXP (SET_SRC (PATTERN (insn)), 0));
5663 op0 = fold_rtx (XEXP (XEXP (SET_SRC (PATTERN (insn)), 0), 0), insn);
5664 op1 = fold_rtx (XEXP (XEXP (SET_SRC (PATTERN (insn)), 0), 1), insn);
5665
5666 code = find_comparison_args (code, &op0, &op1, &mode0, &mode1);
5667 if (! cond_known_true)
5668 {
5669 reversed_nonequality = (code != EQ && code != NE);
5670 code = reverse_condition (code);
5671 }
5672
5673 /* The mode is the mode of the non-constant. */
5674 mode = mode0;
5675 if (mode1 != VOIDmode)
5676 mode = mode1;
5677
5678 record_jump_cond (code, mode, op0, op1, reversed_nonequality);
5679 }
5680
5681 /* We know that comparison CODE applied to OP0 and OP1 in MODE is true.
5682 REVERSED_NONEQUALITY is nonzero if CODE had to be swapped.
5683 Make any useful entries we can with that information. Called from
5684 above function and called recursively. */
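/* Illustrative sketch (hypothetical register numbers): given
   (eq (subreg:SI (reg:HI 5) 0) (reg:SI 6)) with a paradoxical SUBREG,
   we also record that (reg:HI 5) equals the HImode lowpart of
   (reg:SI 6), by recursing in the narrower mode.  */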
5685
5686 static void
5687 record_jump_cond (code, mode, op0, op1, reversed_nonequality)
5688 enum rtx_code code;
5689 enum machine_mode mode;
5690 rtx op0, op1;
5691 int reversed_nonequality;
5692 {
5693 unsigned op0_hash, op1_hash;
5694 int op0_in_memory, op0_in_struct, op1_in_memory, op1_in_struct;
5695 struct table_elt *op0_elt, *op1_elt;
5696
5697 /* If OP0 and OP1 are known equal, and either is a paradoxical SUBREG,
5698 we know that they are also equal in the smaller mode (this is also
5699 true for all smaller modes whether or not there is a SUBREG, but
5700 is not worth testing for with no SUBREG). */
5701
5702 /* Note that GET_MODE (op0) may not equal MODE. */
5703 if (code == EQ && GET_CODE (op0) == SUBREG
5704 && (GET_MODE_SIZE (GET_MODE (op0))
5705 > GET_MODE_SIZE (GET_MODE (SUBREG_REG (op0)))))
5706 {
5707 enum machine_mode inner_mode = GET_MODE (SUBREG_REG (op0));
5708 rtx tem = gen_lowpart_if_possible (inner_mode, op1);
5709
5710 record_jump_cond (code, mode, SUBREG_REG (op0),
5711 tem ? tem : gen_rtx (SUBREG, inner_mode, op1, 0),
5712 reversed_nonequality);
5713 }
5714
5715 if (code == EQ && GET_CODE (op1) == SUBREG
5716 && (GET_MODE_SIZE (GET_MODE (op1))
5717 > GET_MODE_SIZE (GET_MODE (SUBREG_REG (op1)))))
5718 {
5719 enum machine_mode inner_mode = GET_MODE (SUBREG_REG (op1));
5720 rtx tem = gen_lowpart_if_possible (inner_mode, op0);
5721
5722 record_jump_cond (code, mode, SUBREG_REG (op1),
5723 tem ? tem : gen_rtx (SUBREG, inner_mode, op0, 0),
5724 reversed_nonequality);
5725 }
5726
5727 /* Similarly, if this is an NE comparison, and either is a SUBREG
5728 making a smaller mode, we know the whole thing is also NE. */
5729
5730 /* Note that GET_MODE (op0) may not equal MODE;
5731 if we test MODE instead, we can get an infinite recursion
5732 alternating between two modes each wider than MODE. */
5733
5734 if (code == NE && GET_CODE (op0) == SUBREG
5735 && subreg_lowpart_p (op0)
5736 && (GET_MODE_SIZE (GET_MODE (op0))
5737 < GET_MODE_SIZE (GET_MODE (SUBREG_REG (op0)))))
5738 {
5739 enum machine_mode inner_mode = GET_MODE (SUBREG_REG (op0));
5740 rtx tem = gen_lowpart_if_possible (inner_mode, op1);
5741
5742 record_jump_cond (code, mode, SUBREG_REG (op0),
5743 tem ? tem : gen_rtx (SUBREG, inner_mode, op1, 0),
5744 reversed_nonequality);
5745 }
5746
5747 if (code == NE && GET_CODE (op1) == SUBREG
5748 && subreg_lowpart_p (op1)
5749 && (GET_MODE_SIZE (GET_MODE (op1))
5750 < GET_MODE_SIZE (GET_MODE (SUBREG_REG (op1)))))
5751 {
5752 enum machine_mode inner_mode = GET_MODE (SUBREG_REG (op1));
5753 rtx tem = gen_lowpart_if_possible (inner_mode, op0);
5754
5755 record_jump_cond (code, mode, SUBREG_REG (op1),
5756 tem ? tem : gen_rtx (SUBREG, inner_mode, op0, 0),
5757 reversed_nonequality);
5758 }
5759
5760 /* Hash both operands. */
5761
5762 do_not_record = 0;
5763 hash_arg_in_memory = 0;
5764 hash_arg_in_struct = 0;
5765 op0_hash = HASH (op0, mode);
5766 op0_in_memory = hash_arg_in_memory;
5767 op0_in_struct = hash_arg_in_struct;
5768
5769 if (do_not_record)
5770 return;
5771
5772 do_not_record = 0;
5773 hash_arg_in_memory = 0;
5774 hash_arg_in_struct = 0;
5775 op1_hash = HASH (op1, mode);
5776 op1_in_memory = hash_arg_in_memory;
5777 op1_in_struct = hash_arg_in_struct;
5778
5779 if (do_not_record)
5780 return;
5781
5782 /* Look up both operands. */
5783 op0_elt = lookup (op0, op0_hash, mode);
5784 op1_elt = lookup (op1, op1_hash, mode);
5785
5786 /* If we aren't setting two things equal, all we can do is save this
5787 comparison. Similarly if this is floating-point. In the latter
5788 case, OP1 might be zero and both -0.0 and 0.0 are equal to it.
5789 If we record the equality, we might inadvertently delete code
5790 whose intent was to change -0 to +0. */
5791
5792 if (code != EQ || FLOAT_MODE_P (GET_MODE (op0)))
5793 {
5794 /* If we reversed a floating-point comparison, if OP0 is not a
5795 register, or if OP1 is neither a register nor a constant, we can't
5796 do anything. */
5797
5798 if (GET_CODE (op1) != REG)
5799 op1 = equiv_constant (op1);
5800
5801 if ((reversed_nonequality && FLOAT_MODE_P (mode))
5802 || GET_CODE (op0) != REG || op1 == 0)
5803 return;
5804
5805 /* Put OP0 in the hash table if it isn't already. This gives it a
5806 new quantity number. */
5807 if (op0_elt == 0)
5808 {
5809 if (insert_regs (op0, NULL_PTR, 0))
5810 {
5811 rehash_using_reg (op0);
5812 op0_hash = HASH (op0, mode);
5813
5814 /* If OP0 is contained in OP1, this changes its hash code
5815 as well. Faster to rehash than to check, except
5816 for the simple case of a constant. */
5817 if (! CONSTANT_P (op1))
5818 op1_hash = HASH (op1, mode);
5819 }
5820
5821 op0_elt = insert (op0, NULL_PTR, op0_hash, mode);
5822 op0_elt->in_memory = op0_in_memory;
5823 op0_elt->in_struct = op0_in_struct;
5824 }
5825
5826 qty_comparison_code[reg_qty[REGNO (op0)]] = code;
5827 if (GET_CODE (op1) == REG)
5828 {
5829 /* Look it up again--in case op0 and op1 are the same. */
5830 op1_elt = lookup (op1, op1_hash, mode);
5831
5832 /* Put OP1 in the hash table so it gets a new quantity number. */
5833 if (op1_elt == 0)
5834 {
5835 if (insert_regs (op1, NULL_PTR, 0))
5836 {
5837 rehash_using_reg (op1);
5838 op1_hash = HASH (op1, mode);
5839 }
5840
5841 op1_elt = insert (op1, NULL_PTR, op1_hash, mode);
5842 op1_elt->in_memory = op1_in_memory;
5843 op1_elt->in_struct = op1_in_struct;
5844 }
5845
5846 qty_comparison_qty[reg_qty[REGNO (op0)]] = reg_qty[REGNO (op1)];
5847 qty_comparison_const[reg_qty[REGNO (op0)]] = 0;
5848 }
5849 else
5850 {
5851 qty_comparison_qty[reg_qty[REGNO (op0)]] = -1;
5852 qty_comparison_const[reg_qty[REGNO (op0)]] = op1;
5853 }
5854
5855 return;
5856 }
5857
5858 /* If either side is still missing an equivalence, make it now,
5859 then merge the equivalences. */
5860
5861 if (op0_elt == 0)
5862 {
5863 if (insert_regs (op0, NULL_PTR, 0))
5864 {
5865 rehash_using_reg (op0);
5866 op0_hash = HASH (op0, mode);
5867 }
5868
5869 op0_elt = insert (op0, NULL_PTR, op0_hash, mode);
5870 op0_elt->in_memory = op0_in_memory;
5871 op0_elt->in_struct = op0_in_struct;
5872 }
5873
5874 if (op1_elt == 0)
5875 {
5876 if (insert_regs (op1, NULL_PTR, 0))
5877 {
5878 rehash_using_reg (op1);
5879 op1_hash = HASH (op1, mode);
5880 }
5881
5882 op1_elt = insert (op1, NULL_PTR, op1_hash, mode);
5883 op1_elt->in_memory = op1_in_memory;
5884 op1_elt->in_struct = op1_in_struct;
5885 }
5886
5887 merge_equiv_classes (op0_elt, op1_elt);
5888 last_jump_equiv_class = op0_elt;
5889 }
5890 \f
5891 /* CSE processing for one instruction.
5892 First simplify sources and addresses of all assignments
5893 in the instruction, using previously-computed equivalent values.
5894 Then install the new sources and destinations in the table
5895 of available values.
5896
5897 If IN_LIBCALL_BLOCK is nonzero, don't record any equivalence made in
5898 the insn. */
5899
5900 /* Data on one SET contained in the instruction. */
5901
5902 struct set
5903 {
5904 /* The SET rtx itself. */
5905 rtx rtl;
5906 /* The SET_SRC of the rtx (the original value, if it is changing). */
5907 rtx src;
5908 /* The hash-table element for the SET_SRC of the SET. */
5909 struct table_elt *src_elt;
5910 /* Hash value for the SET_SRC. */
5911 unsigned src_hash;
5912 /* Hash value for the SET_DEST. */
5913 unsigned dest_hash;
5914 /* The SET_DEST, with SUBREG, etc., stripped. */
5915 rtx inner_dest;
5916 /* Place where the pointer to the INNER_DEST was found. */
5917 rtx *inner_dest_loc;
5918 /* Nonzero if the SET_SRC is in memory. */
5919 char src_in_memory;
5920 /* Nonzero if the SET_SRC is in a structure. */
5921 char src_in_struct;
5922 /* Nonzero if the SET_SRC contains something
5923 whose value cannot be predicted and understood. */
5924 char src_volatile;
5925 /* Original machine mode, in case it becomes a CONST_INT. */
5926 enum machine_mode mode;
5927 /* A constant equivalent for SET_SRC, if any. */
5928 rtx src_const;
5929 /* Hash value of constant equivalent for SET_SRC. */
5930 unsigned src_const_hash;
5931 /* Table entry for constant equivalent for SET_SRC, if any. */
5932 struct table_elt *src_const_elt;
5933 };
5934
5935 static void
5936 cse_insn (insn, in_libcall_block)
5937 rtx insn;
5938 int in_libcall_block;
5939 {
5940 register rtx x = PATTERN (insn);
5941 register int i;
5942 rtx tem;
5943 register int n_sets = 0;
5944
5945 /* Records what this insn does to set CC0. */
5946 rtx this_insn_cc0 = 0;
5947 enum machine_mode this_insn_cc0_mode;
5948 struct write_data writes_memory;
5949 static struct write_data init = {0, 0, 0, 0};
5950
5951 rtx src_eqv = 0;
5952 struct table_elt *src_eqv_elt = 0;
5953 int src_eqv_volatile;
5954 int src_eqv_in_memory;
5955 int src_eqv_in_struct;
5956 unsigned src_eqv_hash;
5957
5958 struct set *sets;
5959
5960 this_insn = insn;
5961 writes_memory = init;
5962
5963 /* Find all the SETs and CLOBBERs in this instruction.
5964 Record all the SETs in the array `set' and count them.
5965 Also determine whether there is a CLOBBER that invalidates
5966 all memory references, or all references at varying addresses. */
5967
5968 if (GET_CODE (insn) == CALL_INSN)
5969 {
5970 for (tem = CALL_INSN_FUNCTION_USAGE (insn); tem; tem = XEXP (tem, 1))
5971 if (GET_CODE (XEXP (tem, 0)) == CLOBBER)
5972 invalidate (SET_DEST (XEXP (tem, 0)));
5973 }
5974
5975 if (GET_CODE (x) == SET)
5976 {
5977 sets = (struct set *) alloca (sizeof (struct set));
5978 sets[0].rtl = x;
5979
5980 /* Ignore SETs that are unconditional jumps.
5981 They never need cse processing, so this does not hurt.
5982 The reason is not efficiency but rather
5983 so that we can test at the end for instructions
5984 that have been simplified to unconditional jumps
5985 and not be misled by unchanged instructions
5986 that were unconditional jumps to begin with. */
5987 if (SET_DEST (x) == pc_rtx
5988 && GET_CODE (SET_SRC (x)) == LABEL_REF)
5989 ;
5990
5991 /* Don't count call-insns, (set (reg 0) (call ...)), as a set.
5992 The hard function value register is used only once, to copy to
5993 someplace else, so it isn't worth cse'ing (and on 80386 is unsafe)!
5994 Ensure we invalidate the destination register. On the 80386 no
5995 other code would invalidate it since it is a fixed_reg.
5996 We need not check the return of apply_change_group; see canon_reg. */
5997
5998 else if (GET_CODE (SET_SRC (x)) == CALL)
5999 {
6000 canon_reg (SET_SRC (x), insn);
6001 apply_change_group ();
6002 fold_rtx (SET_SRC (x), insn);
6003 invalidate (SET_DEST (x));
6004 }
6005 else
6006 n_sets = 1;
6007 }
6008 else if (GET_CODE (x) == PARALLEL)
6009 {
6010 register int lim = XVECLEN (x, 0);
6011
6012 sets = (struct set *) alloca (lim * sizeof (struct set));
6013
6014 /* Find all regs explicitly clobbered in this insn,
6015 and ensure they are not replaced with any other regs
6016 elsewhere in this insn.
6017 When a reg that is clobbered is also used for input,
6018 we should presume that that is for a reason,
6019 and we should not substitute some other register
6020 which is not supposed to be clobbered.
6021 Therefore, this loop cannot be merged into the one below
6022 because a CALL may precede a CLOBBER and refer to the
6023 value clobbered. We must not let a canonicalization do
6024 anything in that case. */
6025 for (i = 0; i < lim; i++)
6026 {
6027 register rtx y = XVECEXP (x, 0, i);
6028 if (GET_CODE (y) == CLOBBER)
6029 {
6030 rtx clobbered = XEXP (y, 0);
6031
6032 if (GET_CODE (clobbered) == REG
6033 || GET_CODE (clobbered) == SUBREG)
6034 invalidate (clobbered);
6035 else if (GET_CODE (clobbered) == STRICT_LOW_PART
6036 || GET_CODE (clobbered) == ZERO_EXTRACT)
6037 invalidate (XEXP (clobbered, 0));
6038 }
6039 }
6040
6041 for (i = 0; i < lim; i++)
6042 {
6043 register rtx y = XVECEXP (x, 0, i);
6044 if (GET_CODE (y) == SET)
6045 {
6046 /* As above, we ignore unconditional jumps and call-insns and
6047 ignore the result of apply_change_group. */
6048 if (GET_CODE (SET_SRC (y)) == CALL)
6049 {
6050 canon_reg (SET_SRC (y), insn);
6051 apply_change_group ();
6052 fold_rtx (SET_SRC (y), insn);
6053 invalidate (SET_DEST (y));
6054 }
6055 else if (SET_DEST (y) == pc_rtx
6056 && GET_CODE (SET_SRC (y)) == LABEL_REF)
6057 ;
6058 else
6059 sets[n_sets++].rtl = y;
6060 }
6061 else if (GET_CODE (y) == CLOBBER)
6062 {
6063 /* If we clobber memory, take note of that,
6064 and canon the address.
6065 This does nothing when a register is clobbered
6066 because we have already invalidated the reg. */
6067 if (GET_CODE (XEXP (y, 0)) == MEM)
6068 {
6069 canon_reg (XEXP (y, 0), NULL_RTX);
6070 note_mem_written (XEXP (y, 0), &writes_memory);
6071 }
6072 }
6073 else if (GET_CODE (y) == USE
6074 && ! (GET_CODE (XEXP (y, 0)) == REG
6075 && REGNO (XEXP (y, 0)) < FIRST_PSEUDO_REGISTER))
6076 canon_reg (y, NULL_RTX);
6077 else if (GET_CODE (y) == CALL)
6078 {
6079 /* The result of apply_change_group can be ignored; see
6080 canon_reg. */
6081 canon_reg (y, insn);
6082 apply_change_group ();
6083 fold_rtx (y, insn);
6084 }
6085 }
6086 }
6087 else if (GET_CODE (x) == CLOBBER)
6088 {
6089 if (GET_CODE (XEXP (x, 0)) == MEM)
6090 {
6091 canon_reg (XEXP (x, 0), NULL_RTX);
6092 note_mem_written (XEXP (x, 0), &writes_memory);
6093 }
6094 }
6095
6096 /* Canonicalize a USE of a pseudo register or memory location. */
6097 else if (GET_CODE (x) == USE
6098 && ! (GET_CODE (XEXP (x, 0)) == REG
6099 && REGNO (XEXP (x, 0)) < FIRST_PSEUDO_REGISTER))
6100 canon_reg (XEXP (x, 0), NULL_RTX);
6101 else if (GET_CODE (x) == CALL)
6102 {
6103 /* The result of apply_change_group can be ignored; see canon_reg. */
6104 canon_reg (x, insn);
6105 apply_change_group ();
6106 fold_rtx (x, insn);
6107 }
6108
6109 /* Store the equivalent value in SRC_EQV, if different, or if the DEST
6110 is a STRICT_LOW_PART. The latter condition is necessary because SRC_EQV
6111 is handled specially for this case, and if it isn't set, then there will
6112 be no equivalence for the destination. */
6113 if (n_sets == 1 && REG_NOTES (insn) != 0
6114 && (tem = find_reg_note (insn, REG_EQUAL, NULL_RTX)) != 0
6115 && (! rtx_equal_p (XEXP (tem, 0), SET_SRC (sets[0].rtl))
6116 || GET_CODE (SET_DEST (sets[0].rtl)) == STRICT_LOW_PART))
6117 src_eqv = canon_reg (XEXP (tem, 0), NULL_RTX);
6118
6119 /* Canonicalize sources and addresses of destinations.
6120 We do this in a separate pass to avoid problems when a MATCH_DUP is
6121 present in the insn pattern. In that case, we want to ensure that
6122 we don't break the duplicate nature of the pattern. So we will replace
6123 both operands at the same time. Otherwise, we would fail to find an
6124 equivalent substitution in the loop calling validate_change below.
6125
6126 We used to suppress canonicalization of DEST if it appears in SRC,
6127 but we don't do this any more. */
6128
6129 for (i = 0; i < n_sets; i++)
6130 {
6131 rtx dest = SET_DEST (sets[i].rtl);
6132 rtx src = SET_SRC (sets[i].rtl);
6133 rtx new = canon_reg (src, insn);
6134
6135 if ((GET_CODE (new) == REG && GET_CODE (src) == REG
6136 && ((REGNO (new) < FIRST_PSEUDO_REGISTER)
6137 != (REGNO (src) < FIRST_PSEUDO_REGISTER)))
6138 || insn_n_dups[recog_memoized (insn)] > 0)
6139 validate_change (insn, &SET_SRC (sets[i].rtl), new, 1);
6140 else
6141 SET_SRC (sets[i].rtl) = new;
6142
6143 if (GET_CODE (dest) == ZERO_EXTRACT || GET_CODE (dest) == SIGN_EXTRACT)
6144 {
6145 validate_change (insn, &XEXP (dest, 1),
6146 canon_reg (XEXP (dest, 1), insn), 1);
6147 validate_change (insn, &XEXP (dest, 2),
6148 canon_reg (XEXP (dest, 2), insn), 1);
6149 }
6150
6151 while (GET_CODE (dest) == SUBREG || GET_CODE (dest) == STRICT_LOW_PART
6152 || GET_CODE (dest) == ZERO_EXTRACT
6153 || GET_CODE (dest) == SIGN_EXTRACT)
6154 dest = XEXP (dest, 0);
6155
6156 if (GET_CODE (dest) == MEM)
6157 canon_reg (dest, insn);
6158 }
6159
6160 /* Now that we have done all the replacements, we can apply the change
6161 group and see if they all work. Note that this will cause some
6162 canonicalizations that would have worked individually not to be applied
6163 because some other canonicalization didn't work, but this should not
6164 occur often.
6165
6166 The result of apply_change_group can be ignored; see canon_reg. */
6167
6168 apply_change_group ();
6169
6170 /* Set sets[i].src_elt to the class each source belongs to.
6171 Detect assignments from or to volatile things
6172 and set sets[i] to zero so they will be ignored
6173 in the rest of this function.
6174
6175 Nothing in this loop changes the hash table or the register chains. */
6176
6177 for (i = 0; i < n_sets; i++)
6178 {
6179 register rtx src, dest;
6180 register rtx src_folded;
6181 register struct table_elt *elt = 0, *p;
6182 enum machine_mode mode;
6183 rtx src_eqv_here;
6184 rtx src_const = 0;
6185 rtx src_related = 0;
6186 struct table_elt *src_const_elt = 0;
6187 int src_cost = 10000, src_eqv_cost = 10000, src_folded_cost = 10000;
6188 int src_related_cost = 10000, src_elt_cost = 10000;
6189 /* Set non-zero if we need to call force_const_mem on the
6190 contents of src_folded before using it. */
6191 int src_folded_force_flag = 0;
6192
6193 dest = SET_DEST (sets[i].rtl);
6194 src = SET_SRC (sets[i].rtl);
6195
6196 /* If SRC is a constant that has no machine mode,
6197 hash it with the destination's machine mode.
6198 This way we can keep different modes separate. */
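/* Illustrative sketch: (const_int 1) itself has VOIDmode, so a copy of
   it into an SImode register hashes with SImode while a copy into a
   DImode register hashes with DImode, keeping the two equivalences
   apart.  */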
6199
6200 mode = GET_MODE (src) == VOIDmode ? GET_MODE (dest) : GET_MODE (src);
6201 sets[i].mode = mode;
6202
6203 if (src_eqv)
6204 {
6205 enum machine_mode eqvmode = mode;
6206 if (GET_CODE (dest) == STRICT_LOW_PART)
6207 eqvmode = GET_MODE (SUBREG_REG (XEXP (dest, 0)));
6208 do_not_record = 0;
6209 hash_arg_in_memory = 0;
6210 hash_arg_in_struct = 0;
6211 src_eqv = fold_rtx (src_eqv, insn);
6212 src_eqv_hash = HASH (src_eqv, eqvmode);
6213
6214 /* Find the equivalence class for the equivalent expression. */
6215
6216 if (!do_not_record)
6217 src_eqv_elt = lookup (src_eqv, src_eqv_hash, eqvmode);
6218
6219 src_eqv_volatile = do_not_record;
6220 src_eqv_in_memory = hash_arg_in_memory;
6221 src_eqv_in_struct = hash_arg_in_struct;
6222 }
6223
6224 /* If this is a STRICT_LOW_PART assignment, src_eqv corresponds to the
6225 value of the INNER register, not the destination. So it is not
6226 a legal substitution for the source. But save it for later. */
6227 if (GET_CODE (dest) == STRICT_LOW_PART)
6228 src_eqv_here = 0;
6229 else
6230 src_eqv_here = src_eqv;
6231
6232 /* Simplify any foldable subexpressions in SRC. Then get the fully-
6233 simplified result, which may not necessarily be valid. */
6234 src_folded = fold_rtx (src, insn);
6235
6236 /* If storing a constant in a bitfield, pre-truncate the constant
6237 so we will be able to record it later. */
6238 if (GET_CODE (SET_DEST (sets[i].rtl)) == ZERO_EXTRACT
6239 || GET_CODE (SET_DEST (sets[i].rtl)) == SIGN_EXTRACT)
6240 {
6241 rtx width = XEXP (SET_DEST (sets[i].rtl), 1);
6242
6243 if (GET_CODE (src) == CONST_INT
6244 && GET_CODE (width) == CONST_INT
6245 && INTVAL (width) < HOST_BITS_PER_WIDE_INT
6246 && (INTVAL (src) & ((HOST_WIDE_INT) (-1) << INTVAL (width))))
6247 src_folded
6248 = GEN_INT (INTVAL (src) & (((HOST_WIDE_INT) 1
6249 << INTVAL (width)) - 1));
6250 }
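/* Illustrative sketch: storing (const_int 0x1ff) into an 8-bit
   ZERO_EXTRACT keeps only the low eight bits, so SRC_FOLDED is
   pre-truncated above to (const_int 0xff), the value the field will
   actually hold.  */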
6251
6252 /* Compute SRC's hash code, and also notice if it
6253 should not be recorded at all. In that case,
6254 prevent any further processing of this assignment. */
6255 do_not_record = 0;
6256 hash_arg_in_memory = 0;
6257 hash_arg_in_struct = 0;
6258
6259 sets[i].src = src;
6260 sets[i].src_hash = HASH (src, mode);
6261 sets[i].src_volatile = do_not_record;
6262 sets[i].src_in_memory = hash_arg_in_memory;
6263 sets[i].src_in_struct = hash_arg_in_struct;
6264
6265 #if 0
6266 /* It is no longer clear why we used to do this, but it doesn't
6267 appear to still be needed. So let's try without it since this
6268 code hurts cse'ing widened ops. */
6269 /* If source is a perverse subreg (such as QI treated as an SI),
6270 treat it as volatile. It may do the work of an SI in one context
6271 where the extra bits are not being used, but cannot replace an SI
6272 in general. */
6273 if (GET_CODE (src) == SUBREG
6274 && (GET_MODE_SIZE (GET_MODE (src))
6275 > GET_MODE_SIZE (GET_MODE (SUBREG_REG (src)))))
6276 sets[i].src_volatile = 1;
6277 #endif
6278
6279 /* Locate all possible equivalent forms for SRC. Try to replace
6280 SRC in the insn with each cheaper equivalent.
6281
6282 We have the following types of equivalents: SRC itself, a folded
6283 version, a value given in a REG_EQUAL note, or a value related
6284 to a constant.
6285
6286 Each of these equivalents may be part of an additional class
6287 of equivalents (if more than one is in the table, they must be in
6288 the same class; we check for this).
6289
6290 If the source is volatile, we don't do any table lookups.
6291
6292 We note any constant equivalent for possible later use in a
6293 REG_NOTE. */
6294
6295 if (!sets[i].src_volatile)
6296 elt = lookup (src, sets[i].src_hash, mode);
6297
6298 sets[i].src_elt = elt;
6299
6300 if (elt && src_eqv_here && src_eqv_elt)
6301 {
6302 if (elt->first_same_value != src_eqv_elt->first_same_value)
6303 {
6304 /* The REG_EQUAL is indicating that two formerly distinct
6305 classes are now equivalent. So merge them. */
6306 merge_equiv_classes (elt, src_eqv_elt);
6307 src_eqv_hash = HASH (src_eqv, elt->mode);
6308 src_eqv_elt = lookup (src_eqv, src_eqv_hash, elt->mode);
6309 }
6310
6311 src_eqv_here = 0;
6312 }
6313
6314 else if (src_eqv_elt)
6315 elt = src_eqv_elt;
6316
6317 /* Try to find a constant somewhere and record it in `src_const'.
6318 Record its table element, if any, in `src_const_elt'. Look in
6319 any known equivalences first. (If the constant is not in the
6320 table, also set `sets[i].src_const_hash'). */
6321 if (elt)
6322 for (p = elt->first_same_value; p; p = p->next_same_value)
6323 if (p->is_const)
6324 {
6325 src_const = p->exp;
6326 src_const_elt = elt;
6327 break;
6328 }
6329
6330 if (src_const == 0
6331 && (CONSTANT_P (src_folded)
6332 /* Consider (minus (label_ref L1) (label_ref L2)) as
6333 "constant" here so we will record it. This allows us
6334 to fold switch statements when an ADDR_DIFF_VEC is used. */
6335 || (GET_CODE (src_folded) == MINUS
6336 && GET_CODE (XEXP (src_folded, 0)) == LABEL_REF
6337 && GET_CODE (XEXP (src_folded, 1)) == LABEL_REF)))
6338 src_const = src_folded, src_const_elt = elt;
6339 else if (src_const == 0 && src_eqv_here && CONSTANT_P (src_eqv_here))
6340 src_const = src_eqv_here, src_const_elt = src_eqv_elt;
6341
6342 /* If we don't know if the constant is in the table, get its
6343 hash code and look it up. */
6344 if (src_const && src_const_elt == 0)
6345 {
6346 sets[i].src_const_hash = HASH (src_const, mode);
6347 src_const_elt = lookup (src_const, sets[i].src_const_hash, mode);
6348 }
6349
6350 sets[i].src_const = src_const;
6351 sets[i].src_const_elt = src_const_elt;
6352
6353 /* If the constant and our source are both in the table, mark them as
6354 equivalent. Otherwise, if a constant is in the table but the source
6355 isn't, set ELT to it. */
6356 if (src_const_elt && elt
6357 && src_const_elt->first_same_value != elt->first_same_value)
6358 merge_equiv_classes (elt, src_const_elt);
6359 else if (src_const_elt && elt == 0)
6360 elt = src_const_elt;
6361
6362 /* See if there is a register linearly related to a constant
6363 equivalent of SRC. */
6364 if (src_const
6365 && (GET_CODE (src_const) == CONST
6366 || (src_const_elt && src_const_elt->related_value != 0)))
6367 {
6368 src_related = use_related_value (src_const, src_const_elt);
6369 if (src_related)
6370 {
6371 struct table_elt *src_related_elt
6372 = lookup (src_related, HASH (src_related, mode), mode);
6373 if (src_related_elt && elt)
6374 {
6375 if (elt->first_same_value
6376 != src_related_elt->first_same_value)
6377 /* This can occur when we previously saw a CONST
6378 involving a SYMBOL_REF and then see the SYMBOL_REF
6379 twice. Merge the involved classes. */
6380 merge_equiv_classes (elt, src_related_elt);
6381
6382 src_related = 0;
6383 src_related_elt = 0;
6384 }
6385 else if (src_related_elt && elt == 0)
6386 elt = src_related_elt;
6387 }
6388 }
6389
6390 /* See if we have a CONST_INT that is already in a register in a
6391 wider mode. */
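/* Illustrative sketch (hypothetical register number): if this insn
   needs (const_int 5) in HImode and (reg:SI 10) is already known to
   hold 5, we can use the HImode lowpart of that register instead of
   loading the constant again.  */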
6392
6393 if (src_const && src_related == 0 && GET_CODE (src_const) == CONST_INT
6394 && GET_MODE_CLASS (mode) == MODE_INT
6395 && GET_MODE_BITSIZE (mode) < BITS_PER_WORD)
6396 {
6397 enum machine_mode wider_mode;
6398
6399 for (wider_mode = GET_MODE_WIDER_MODE (mode);
6400 GET_MODE_BITSIZE (wider_mode) <= BITS_PER_WORD
6401 && src_related == 0;
6402 wider_mode = GET_MODE_WIDER_MODE (wider_mode))
6403 {
6404 struct table_elt *const_elt
6405 = lookup (src_const, HASH (src_const, wider_mode), wider_mode);
6406
6407 if (const_elt == 0)
6408 continue;
6409
6410 for (const_elt = const_elt->first_same_value;
6411 const_elt; const_elt = const_elt->next_same_value)
6412 if (GET_CODE (const_elt->exp) == REG)
6413 {
6414 src_related = gen_lowpart_if_possible (mode,
6415 const_elt->exp);
6416 break;
6417 }
6418 }
6419 }
6420
6421 /* Another possibility is that we have an AND with a constant in
6422 a mode narrower than a word. If so, it might have been generated
6423 as part of an "if" which would narrow the AND. If we already
6424 have done the AND in a wider mode, we can use a SUBREG of that
6425 value. */
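/* Illustrative sketch (hypothetical register number): if XEXP (SRC, 0)
   is the QImode lowpart of (reg:SI 7) and the table already holds a
   register equivalent for (and:SI (reg:SI 7) (const_int 15)), then
   the QImode AND can be taken as the QImode lowpart of that
   register.  */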
6426
6427 if (flag_expensive_optimizations && ! src_related
6428 && GET_CODE (src) == AND && GET_CODE (XEXP (src, 1)) == CONST_INT
6429 && GET_MODE_SIZE (mode) < UNITS_PER_WORD)
6430 {
6431 enum machine_mode tmode;
6432 rtx new_and = gen_rtx (AND, VOIDmode, NULL_RTX, XEXP (src, 1));
6433
6434 for (tmode = GET_MODE_WIDER_MODE (mode);
6435 GET_MODE_SIZE (tmode) <= UNITS_PER_WORD;
6436 tmode = GET_MODE_WIDER_MODE (tmode))
6437 {
6438 rtx inner = gen_lowpart_if_possible (tmode, XEXP (src, 0));
6439 struct table_elt *larger_elt;
6440
6441 if (inner)
6442 {
6443 PUT_MODE (new_and, tmode);
6444 XEXP (new_and, 0) = inner;
6445 larger_elt = lookup (new_and, HASH (new_and, tmode), tmode);
6446 if (larger_elt == 0)
6447 continue;
6448
6449 for (larger_elt = larger_elt->first_same_value;
6450 larger_elt; larger_elt = larger_elt->next_same_value)
6451 if (GET_CODE (larger_elt->exp) == REG)
6452 {
6453 src_related
6454 = gen_lowpart_if_possible (mode, larger_elt->exp);
6455 break;
6456 }
6457
6458 if (src_related)
6459 break;
6460 }
6461 }
6462 }
6463
6464 #ifdef LOAD_EXTEND_OP
6465 /* See if a MEM has already been loaded with a widening operation;
6466 if it has, we can use a subreg of that. Many CISC machines
6467 also have such operations, but this is only likely to be
6468 beneficial on these machines. */
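/* Illustrative sketch, assuming a target whose QImode loads
   zero-extend: if (zero_extend:SI (mem:QI A)) was loaded into
   (reg:SI 9) earlier, reading (mem:QI A) again can instead use the
   QImode lowpart of reg 9; the register number is hypothetical.  */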
6469
6470 if (flag_expensive_optimizations && src_related == 0
6471 && (GET_MODE_SIZE (mode) < UNITS_PER_WORD)
6472 && GET_MODE_CLASS (mode) == MODE_INT
6473 && GET_CODE (src) == MEM && ! do_not_record
6474 && LOAD_EXTEND_OP (mode) != NIL)
6475 {
6476 enum machine_mode tmode;
6477
6478 /* Set what we are trying to extend and the operation it might
6479 have been extended with. */
6480 PUT_CODE (memory_extend_rtx, LOAD_EXTEND_OP (mode));
6481 XEXP (memory_extend_rtx, 0) = src;
6482
6483 for (tmode = GET_MODE_WIDER_MODE (mode);
6484 GET_MODE_SIZE (tmode) <= UNITS_PER_WORD;
6485 tmode = GET_MODE_WIDER_MODE (tmode))
6486 {
6487 struct table_elt *larger_elt;
6488
6489 PUT_MODE (memory_extend_rtx, tmode);
6490 larger_elt = lookup (memory_extend_rtx,
6491 HASH (memory_extend_rtx, tmode), tmode);
6492 if (larger_elt == 0)
6493 continue;
6494
6495 for (larger_elt = larger_elt->first_same_value;
6496 larger_elt; larger_elt = larger_elt->next_same_value)
6497 if (GET_CODE (larger_elt->exp) == REG)
6498 {
6499 src_related = gen_lowpart_if_possible (mode,
6500 larger_elt->exp);
6501 break;
6502 }
6503
6504 if (src_related)
6505 break;
6506 }
6507 }
6508 #endif /* LOAD_EXTEND_OP */
6509
6510 if (src == src_folded)
6511 src_folded = 0;
6512
6513 /* At this point, ELT, if non-zero, points to a class of expressions
6514 equivalent to the source of this SET and SRC, SRC_EQV, SRC_FOLDED,
6515 and SRC_RELATED, if non-zero, each contain additional equivalent
6516 expressions. Prune these latter expressions by deleting expressions
6517 already in the equivalence class.
6518
6519 Check for an equivalent identical to the destination. If found,
6520 this is the preferred equivalent since it will likely lead to
6521 elimination of the insn. Indicate this by placing it in
6522 `src_related'. */
6523
6524 if (elt) elt = elt->first_same_value;
6525 for (p = elt; p; p = p->next_same_value)
6526 {
6527 enum rtx_code code = GET_CODE (p->exp);
6528
6529 /* If the expression is not valid, ignore it. Then we do not
6530 have to check for validity below. In most cases, we can use
6531 `rtx_equal_p', since canonicalization has already been done. */
6532 if (code != REG && ! exp_equiv_p (p->exp, p->exp, 1, 0))
6533 continue;
6534
6535 if (src && GET_CODE (src) == code && rtx_equal_p (src, p->exp))
6536 src = 0;
6537 else if (src_folded && GET_CODE (src_folded) == code
6538 && rtx_equal_p (src_folded, p->exp))
6539 src_folded = 0;
6540 else if (src_eqv_here && GET_CODE (src_eqv_here) == code
6541 && rtx_equal_p (src_eqv_here, p->exp))
6542 src_eqv_here = 0;
6543 else if (src_related && GET_CODE (src_related) == code
6544 && rtx_equal_p (src_related, p->exp))
6545 src_related = 0;
6546
6547 /* If this is the same as the destination of the insn, we want
6548 to prefer it. Copy it to src_related. The code below will
6549 then give it a negative cost. */
6550 if (GET_CODE (dest) == code && rtx_equal_p (p->exp, dest))
6551 src_related = dest;
6552
6553 }
6554
6555 /* Find the cheapest valid equivalent, trying all the available
6556 possibilities. Prefer items not in the hash table to ones
6557 that are when they are equal cost. Note that we can never
6558 worsen an insn as the current contents will also succeed.
6559 If we find an equivalent identical to the destination, use it as best,
6560 since this insn will probably be eliminated in that case. */
6561 if (src)
6562 {
6563 if (rtx_equal_p (src, dest))
6564 src_cost = -1;
6565 else
6566 src_cost = COST (src);
6567 }
6568
6569 if (src_eqv_here)
6570 {
6571 if (rtx_equal_p (src_eqv_here, dest))
6572 src_eqv_cost = -1;
6573 else
6574 src_eqv_cost = COST (src_eqv_here);
6575 }
6576
6577 if (src_folded)
6578 {
6579 if (rtx_equal_p (src_folded, dest))
6580 src_folded_cost = -1;
6581 else
6582 src_folded_cost = COST (src_folded);
6583 }
6584
6585 if (src_related)
6586 {
6587 if (rtx_equal_p (src_related, dest))
6588 src_related_cost = -1;
6589 else
6590 src_related_cost = COST (src_related);
6591 }
6592
6593 /* If this was an indirect jump insn, a known label will really be
6594 cheaper even though it looks more expensive. */
6595 if (dest == pc_rtx && src_const && GET_CODE (src_const) == LABEL_REF)
6596 src_folded = src_const, src_folded_cost = -1;
6597
6598 /* Terminate loop when replacement made. This must terminate since
6599 the current contents will be tested and will always be valid. */
6600 while (1)
6601 {
6602 rtx trial;
6603
6604 /* Skip invalid entries. */
6605 while (elt && GET_CODE (elt->exp) != REG
6606 && ! exp_equiv_p (elt->exp, elt->exp, 1, 0))
6607 elt = elt->next_same_value;
6608
6609 if (elt) src_elt_cost = elt->cost;
6610
6611 /* Find cheapest and skip it for the next time. For items
6612 of equal cost, use this order:
6613 src_folded, src, src_eqv, src_related and hash table entry. */
6614 if (src_folded_cost <= src_cost
6615 && src_folded_cost <= src_eqv_cost
6616 && src_folded_cost <= src_related_cost
6617 && src_folded_cost <= src_elt_cost)
6618 {
6619 trial = src_folded, src_folded_cost = 10000;
6620 if (src_folded_force_flag)
6621 trial = force_const_mem (mode, trial);
6622 }
6623 else if (src_cost <= src_eqv_cost
6624 && src_cost <= src_related_cost
6625 && src_cost <= src_elt_cost)
6626 trial = src, src_cost = 10000;
6627 else if (src_eqv_cost <= src_related_cost
6628 && src_eqv_cost <= src_elt_cost)
6629 trial = copy_rtx (src_eqv_here), src_eqv_cost = 10000;
6630 else if (src_related_cost <= src_elt_cost)
6631 trial = copy_rtx (src_related), src_related_cost = 10000;
6632 else
6633 {
6634 trial = copy_rtx (elt->exp);
6635 elt = elt->next_same_value;
6636 src_elt_cost = 10000;
6637 }
6638
6639 /* We don't normally have an insn matching (set (pc) (pc)), so
6640 check for this separately here. We will delete such an
6641 insn below.
6642
6643 Tablejump insns contain a USE of the table, so simply replacing
6644 the operand with the constant won't match. This is simply an
6645 unconditional branch, however, and is therefore valid. Just
6646 insert the substitution here and we will delete and re-emit
6647 the insn later. */
6648
6649 if (n_sets == 1 && dest == pc_rtx
6650 && (trial == pc_rtx
6651 || (GET_CODE (trial) == LABEL_REF
6652 && ! condjump_p (insn))))
6653 {
6654 /* If TRIAL is a label in front of a jump table, we are
6655 really falling through the switch (this is how casesi
6656 insns work), so we must branch around the table. */
6657 if (GET_CODE (trial) == CODE_LABEL
6658 && NEXT_INSN (trial) != 0
6659 && GET_CODE (NEXT_INSN (trial)) == JUMP_INSN
6660 && (GET_CODE (PATTERN (NEXT_INSN (trial))) == ADDR_DIFF_VEC
6661 || GET_CODE (PATTERN (NEXT_INSN (trial))) == ADDR_VEC))
6662
6663 trial = gen_rtx (LABEL_REF, Pmode, get_label_after (trial));
6664
6665 SET_SRC (sets[i].rtl) = trial;
6666 cse_jumps_altered = 1;
6667 break;
6668 }
6669
6670 /* Look for a substitution that makes a valid insn. */
6671 else if (validate_change (insn, &SET_SRC (sets[i].rtl), trial, 0))
6672 {
6673 /* The result of apply_change_group can be ignored; see
6674 canon_reg. */
6675
6676 validate_change (insn, &SET_SRC (sets[i].rtl),
6677 canon_reg (SET_SRC (sets[i].rtl), insn),
6678 1);
6679 apply_change_group ();
6680 break;
6681 }
6682
6683 /* If we previously found constant pool entries for
6684 constants and this is a constant, try making a
6685 pool entry. Put it in src_folded unless we already have done
6686 this since that is where it likely came from. */
6687
6688 else if (constant_pool_entries_cost
6689 && CONSTANT_P (trial)
6690 && (src_folded == 0 || GET_CODE (src_folded) != MEM)
6691 && GET_MODE_CLASS (mode) != MODE_CC)
6692 {
6693 src_folded_force_flag = 1;
6694 src_folded = trial;
6695 src_folded_cost = constant_pool_entries_cost;
6696 }
6697 }
6698
6699 src = SET_SRC (sets[i].rtl);
6700
6701 /* In general, it is good to have a SET with SET_SRC == SET_DEST.
6702 However, there is an important exception: If both are registers
6703 that are not the head of their equivalence class, replace SET_SRC
6704 with the head of the class. If we do not do this, we will have
6705 both registers live over a portion of the basic block. This way,
6706 their lifetimes will likely abut instead of overlapping. */
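/* Illustrative sketch (hypothetical register numbers): if regs 30 and
   55 are in one class with reg 30 at its head, then
   (set (reg 55) (reg 55)) is rewritten as (set (reg 55) (reg 30)), so
   the two lifetimes can abut rather than overlap.  */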
6707 if (GET_CODE (dest) == REG
6708 && REGNO_QTY_VALID_P (REGNO (dest))
6709 && qty_mode[reg_qty[REGNO (dest)]] == GET_MODE (dest)
6710 && qty_first_reg[reg_qty[REGNO (dest)]] != REGNO (dest)
6711 && GET_CODE (src) == REG && REGNO (src) == REGNO (dest)
6712 /* Don't do this if the original insn had a hard reg as
6713 SET_SRC. */
6714 && (GET_CODE (sets[i].src) != REG
6715 || REGNO (sets[i].src) >= FIRST_PSEUDO_REGISTER))
6716 /* We can't call canon_reg here because it won't do anything if
6717 SRC is a hard register. */
6718 {
6719 int first = qty_first_reg[reg_qty[REGNO (src)]];
6720
6721 src = SET_SRC (sets[i].rtl)
6722 = first >= FIRST_PSEUDO_REGISTER ? regno_reg_rtx[first]
6723 : gen_rtx (REG, GET_MODE (src), first);
6724
6725 /* If we had a constant that is cheaper than what we are now
6726 setting SRC to, use that constant. We ignored it when we
6727 thought we could make this into a no-op. */
6728 if (src_const && COST (src_const) < COST (src)
6729 && validate_change (insn, &SET_SRC (sets[i].rtl), src_const, 0))
6730 src = src_const;
6731 }
6732
6733 /* If we made a change, recompute SRC values. */
6734 if (src != sets[i].src)
6735 {
6736 do_not_record = 0;
6737 hash_arg_in_memory = 0;
6738 hash_arg_in_struct = 0;
6739 sets[i].src = src;
6740 sets[i].src_hash = HASH (src, mode);
6741 sets[i].src_volatile = do_not_record;
6742 sets[i].src_in_memory = hash_arg_in_memory;
6743 sets[i].src_in_struct = hash_arg_in_struct;
6744 sets[i].src_elt = lookup (src, sets[i].src_hash, mode);
6745 }
6746
6747 /* If this is a single SET, we are setting a register, and we have an
6748 equivalent constant, we want to add a REG_NOTE. We don't want
6749 to write a REG_EQUAL note for a constant pseudo since verifying that
6750 that pseudo hasn't been eliminated is a pain. Such a note also
6751 won't help anything. */
6752 if (n_sets == 1 && src_const && GET_CODE (dest) == REG
6753 && GET_CODE (src_const) != REG)
6754 {
6755 tem = find_reg_note (insn, REG_EQUAL, NULL_RTX);
6756
6757 /* Record the actual constant value in a REG_EQUAL note, making
6758 a new one if one does not already exist. */
6759 if (tem)
6760 XEXP (tem, 0) = src_const;
6761 else
6762 REG_NOTES (insn) = gen_rtx (EXPR_LIST, REG_EQUAL,
6763 src_const, REG_NOTES (insn));
6764
6765 /* If storing a constant value in a register that
6766 previously held the constant value 0,
6767 record this fact with a REG_WAS_0 note on this insn.
6768
6769 Note that the *register* is required to have previously held 0,
6770 not just any register in the quantity and we must point to the
6771 insn that set that register to zero.
6772
6773 Rather than track each register individually, we just see if
6774 the last set for this quantity was for this register. */
6775
6776 if (REGNO_QTY_VALID_P (REGNO (dest))
6777 && qty_const[reg_qty[REGNO (dest)]] == const0_rtx)
6778 {
6779 /* See if we previously had a REG_WAS_0 note. */
6780 rtx note = find_reg_note (insn, REG_WAS_0, NULL_RTX);
6781 rtx const_insn = qty_const_insn[reg_qty[REGNO (dest)]];
6782
6783 if ((tem = single_set (const_insn)) != 0
6784 && rtx_equal_p (SET_DEST (tem), dest))
6785 {
6786 if (note)
6787 XEXP (note, 0) = const_insn;
6788 else
6789 REG_NOTES (insn) = gen_rtx (INSN_LIST, REG_WAS_0,
6790 const_insn, REG_NOTES (insn));
6791 }
6792 }
6793 }
6794
6795 /* Now deal with the destination. */
6796 do_not_record = 0;
6797 sets[i].inner_dest_loc = &SET_DEST (sets[i].rtl);
6798
6799 /* Look within any SIGN_EXTRACT or ZERO_EXTRACT
6800 to the MEM or REG within it. */
6801 while (GET_CODE (dest) == SIGN_EXTRACT
6802 || GET_CODE (dest) == ZERO_EXTRACT
6803 || GET_CODE (dest) == SUBREG
6804 || GET_CODE (dest) == STRICT_LOW_PART)
6805 {
6806 sets[i].inner_dest_loc = &XEXP (dest, 0);
6807 dest = XEXP (dest, 0);
6808 }
6809
6810 sets[i].inner_dest = dest;
6811
6812 if (GET_CODE (dest) == MEM)
6813 {
6814 dest = fold_rtx (dest, insn);
6815
6816 /* Decide whether we invalidate everything in memory,
6817 or just things at non-fixed places.
6818 Writing a large aggregate must invalidate everything
6819 because we don't know how long it is. */
6820 note_mem_written (dest, &writes_memory);
6821 }
6822
6823 /* Compute the hash code of the destination now,
6824 before the effects of this instruction are recorded,
6825 since the register values used in the address computation
6826 are those before this instruction. */
6827 sets[i].dest_hash = HASH (dest, mode);
6828
6829 /* Don't enter a bit-field in the hash table
6830 because the value in it after the store
6831 may not equal what was stored, due to truncation. */
6832
6833 if (GET_CODE (SET_DEST (sets[i].rtl)) == ZERO_EXTRACT
6834 || GET_CODE (SET_DEST (sets[i].rtl)) == SIGN_EXTRACT)
6835 {
6836 rtx width = XEXP (SET_DEST (sets[i].rtl), 1);
6837
6838 if (src_const != 0 && GET_CODE (src_const) == CONST_INT
6839 && GET_CODE (width) == CONST_INT
6840 && INTVAL (width) < HOST_BITS_PER_WIDE_INT
6841 && ! (INTVAL (src_const)
6842 & ((HOST_WIDE_INT) (-1) << INTVAL (width))))
6843 /* Exception: if the value is constant,
6844 and it won't be truncated, record it. */
6845 ;
6846 else
6847 {
6848 /* This is chosen so that the destination will be invalidated
6849 but no new value will be recorded.
6850 We must invalidate because sometimes constant
6851 values can be recorded for bitfields. */
6852 sets[i].src_elt = 0;
6853 sets[i].src_volatile = 1;
6854 src_eqv = 0;
6855 src_eqv_elt = 0;
6856 }
6857 }
6858
6859 /* If only one set in a JUMP_INSN and it is now a no-op, we can delete
6860 the insn. */
6861 else if (n_sets == 1 && dest == pc_rtx && src == pc_rtx)
6862 {
6863 PUT_CODE (insn, NOTE);
6864 NOTE_LINE_NUMBER (insn) = NOTE_INSN_DELETED;
6865 NOTE_SOURCE_FILE (insn) = 0;
6866 cse_jumps_altered = 1;
6867 /* One less use of the label this insn used to jump to. */
6868 --LABEL_NUSES (JUMP_LABEL (insn));
6869 /* No more processing for this set. */
6870 sets[i].rtl = 0;
6871 }
6872
6873 /* If this SET is now setting PC to a label, we know it used to
6874 be a conditional or computed branch. So we see if we can follow
6875 it. If it was a computed branch, delete it and re-emit. */
6876 else if (dest == pc_rtx && GET_CODE (src) == LABEL_REF)
6877 {
6878 rtx p;
6879
6880 /* If this is not in the format for a simple branch and
6881 we are the only SET in it, re-emit it. */
6882 if (! simplejump_p (insn) && n_sets == 1)
6883 {
6884 rtx new = emit_jump_insn_before (gen_jump (XEXP (src, 0)), insn);
6885 JUMP_LABEL (new) = XEXP (src, 0);
6886 LABEL_NUSES (XEXP (src, 0))++;
6887 delete_insn (insn);
6888 insn = new;
6889 }
6890 else
6891 /* Otherwise, force rerecognition, since it probably had
6892 a different pattern before.
6893 This shouldn't really be necessary, since whatever
6894 changed the source value above should have done this.
6895 Until the right place is found, might as well do this here. */
6896 INSN_CODE (insn) = -1;
6897
6898 /* Now that we've converted this jump to an unconditional jump,
6899 there is dead code after it. Delete the dead code until we
6900 reach a BARRIER, the end of the function, or a label. Do
6901 not delete NOTEs except for NOTE_INSN_DELETED since later
6902 phases assume these notes are retained. */
6903
6904 p = insn;
6905
6906 while (NEXT_INSN (p) != 0
6907 && GET_CODE (NEXT_INSN (p)) != BARRIER
6908 && GET_CODE (NEXT_INSN (p)) != CODE_LABEL)
6909 {
6910 if (GET_CODE (NEXT_INSN (p)) != NOTE
6911 || NOTE_LINE_NUMBER (NEXT_INSN (p)) == NOTE_INSN_DELETED)
6912 delete_insn (NEXT_INSN (p));
6913 else
6914 p = NEXT_INSN (p);
6915 }
6916
6917 /* If we don't have a BARRIER immediately after INSN, put one there.
6918 Much code assumes that there are no NOTEs between a JUMP_INSN and
6919 BARRIER. */
6920
6921 if (NEXT_INSN (insn) == 0
6922 || GET_CODE (NEXT_INSN (insn)) != BARRIER)
6923 emit_barrier_after (insn);
6924
6925 /* We might have two BARRIERs separated by notes. Delete the second
6926 one if so. */
6927
6928 if (p != insn && NEXT_INSN (p) != 0
6929 && GET_CODE (NEXT_INSN (p)) == BARRIER)
6930 delete_insn (NEXT_INSN (p));
6931
6932 cse_jumps_altered = 1;
6933 sets[i].rtl = 0;
6934 }
6935
6936 /* If destination is volatile, invalidate it and then do no further
6937 processing for this assignment. */
6938
6939 else if (do_not_record)
6940 {
6941 if (GET_CODE (dest) == REG || GET_CODE (dest) == SUBREG
6942 || GET_CODE (dest) == MEM)
6943 invalidate (dest);
6944 else if (GET_CODE (dest) == STRICT_LOW_PART
6945 || GET_CODE (dest) == ZERO_EXTRACT)
6946 invalidate (XEXP (dest, 0));
6947 sets[i].rtl = 0;
6948 }
6949
6950 if (sets[i].rtl != 0 && dest != SET_DEST (sets[i].rtl))
6951 sets[i].dest_hash = HASH (SET_DEST (sets[i].rtl), mode);
6952
6953 #ifdef HAVE_cc0
6954 /* If setting CC0, record what it was set to, or a constant, if it
6955 is equivalent to a constant. If it is being set to a floating-point
6956 value, make a COMPARE with the appropriate constant of 0. If we
6957 don't do this, later code can interpret this as a test against
6958 const0_rtx, which can cause problems if we try to put it into an
6959 insn as a floating-point operand. */
6960 if (dest == cc0_rtx)
6961 {
6962 this_insn_cc0 = src_const && mode != VOIDmode ? src_const : src;
6963 this_insn_cc0_mode = mode;
6964 if (FLOAT_MODE_P (mode))
6965 this_insn_cc0 = gen_rtx (COMPARE, VOIDmode, this_insn_cc0,
6966 CONST0_RTX (mode));
6967 }
6968 #endif
6969 }
6970
6971 /* Now enter all non-volatile source expressions in the hash table
6972 if they are not already present.
6973 Record their equivalence classes in src_elt.
6974 This way we can insert the corresponding destinations into
6975 the same classes even if the actual sources are no longer in them
6976 (having been invalidated). */
6977
6978 if (src_eqv && src_eqv_elt == 0 && sets[0].rtl != 0 && ! src_eqv_volatile
6979 && ! rtx_equal_p (src_eqv, SET_DEST (sets[0].rtl)))
6980 {
6981 register struct table_elt *elt;
6982 register struct table_elt *classp = sets[0].src_elt;
6983 rtx dest = SET_DEST (sets[0].rtl);
6984 enum machine_mode eqvmode = GET_MODE (dest);
6985
6986 if (GET_CODE (dest) == STRICT_LOW_PART)
6987 {
6988 eqvmode = GET_MODE (SUBREG_REG (XEXP (dest, 0)));
6989 classp = 0;
6990 }
6991 if (insert_regs (src_eqv, classp, 0))
6992 src_eqv_hash = HASH (src_eqv, eqvmode);
6993 elt = insert (src_eqv, classp, src_eqv_hash, eqvmode);
6994 elt->in_memory = src_eqv_in_memory;
6995 elt->in_struct = src_eqv_in_struct;
6996 src_eqv_elt = elt;
6997
6998 /* Check to see if src_eqv_elt is the same as a set source which
6999 does not yet have an elt, and if so set the elt of the set source
7000 to src_eqv_elt. */
7001 for (i = 0; i < n_sets; i++)
7002 if (sets[i].rtl && sets[i].src_elt == 0
7003 && rtx_equal_p (SET_SRC (sets[i].rtl), src_eqv))
7004 sets[i].src_elt = src_eqv_elt;
7005 }
7006
7007 for (i = 0; i < n_sets; i++)
7008 if (sets[i].rtl && ! sets[i].src_volatile
7009 && ! rtx_equal_p (SET_SRC (sets[i].rtl), SET_DEST (sets[i].rtl)))
7010 {
7011 if (GET_CODE (SET_DEST (sets[i].rtl)) == STRICT_LOW_PART)
7012 {
7013 /* REG_EQUAL in setting a STRICT_LOW_PART
7014 gives an equivalent for the entire destination register,
7015 not just for the subreg being stored in now.
7016 This is a more interesting equivalence, so we arrange later
7017 to treat the entire reg as the destination. */
7018 sets[i].src_elt = src_eqv_elt;
7019 sets[i].src_hash = src_eqv_hash;
7020 }
7021 else
7022 {
7023 /* Insert source and constant equivalent into hash table, if not
7024 already present. */
7025 register struct table_elt *classp = src_eqv_elt;
7026 register rtx src = sets[i].src;
7027 register rtx dest = SET_DEST (sets[i].rtl);
7028 enum machine_mode mode
7029 = GET_MODE (src) == VOIDmode ? GET_MODE (dest) : GET_MODE (src);
7030
7031 if (sets[i].src_elt == 0)
7032 {
7033 register struct table_elt *elt;
7034
7035 /* Note that these insert_regs calls cannot remove
7036 any of the src_elt's, because they would have failed to
7037 match if not still valid. */
7038 if (insert_regs (src, classp, 0))
7039 sets[i].src_hash = HASH (src, mode);
7040 elt = insert (src, classp, sets[i].src_hash, mode);
7041 elt->in_memory = sets[i].src_in_memory;
7042 elt->in_struct = sets[i].src_in_struct;
7043 sets[i].src_elt = classp = elt;
7044 }
7045
7046 if (sets[i].src_const && sets[i].src_const_elt == 0
7047 && src != sets[i].src_const
7048 && ! rtx_equal_p (sets[i].src_const, src))
7049 sets[i].src_elt = insert (sets[i].src_const, classp,
7050 sets[i].src_const_hash, mode);
7051 }
7052 }
7053 else if (sets[i].src_elt == 0)
7054 /* If we did not insert the source into the hash table (e.g., it was
7055 volatile), note the equivalence class for the REG_EQUAL value, if any,
7056 so that the destination goes into that class. */
7057 sets[i].src_elt = src_eqv_elt;
7058
7059 invalidate_from_clobbers (&writes_memory, x);
7060
7061 /* Some registers are invalidated by subroutine calls. Memory is
7062 invalidated by non-constant calls. */
7063
7064 if (GET_CODE (insn) == CALL_INSN)
7065 {
7066 static struct write_data everything = {0, 1, 1, 1};
7067
7068 if (! CONST_CALL_P (insn))
7069 invalidate_memory (&everything);
7070 invalidate_for_call ();
7071 }
7072
7073 /* Now invalidate everything set by this instruction.
7074 If a SUBREG or other funny destination is being set,
7075 sets[i].rtl is still nonzero, so here we invalidate the reg
7076 a part of which is being set. */
7077
7078 for (i = 0; i < n_sets; i++)
7079 if (sets[i].rtl)
7080 {
7081 register rtx dest = sets[i].inner_dest;
7082
7083 /* Needed for registers to remove the register from its
7084 previous quantity's chain.
7085 Needed for memory if this is a nonvarying address, unless
7086 we have just done an invalidate_memory that covers even those. */
7087 if (GET_CODE (dest) == REG || GET_CODE (dest) == SUBREG
7088 || (! writes_memory.all && ! cse_rtx_addr_varies_p (dest)))
7089 invalidate (dest);
7090 else if (GET_CODE (dest) == STRICT_LOW_PART
7091 || GET_CODE (dest) == ZERO_EXTRACT)
7092 invalidate (XEXP (dest, 0));
7093 }
7094
7095 /* Make sure registers mentioned in destinations
7096 are safe for use in an expression to be inserted.
7097 This removes from the hash table
7098 any invalid entry that refers to one of these registers.
7099
7100 We don't care about the return value from mention_regs because
7101 we are going to hash the SET_DEST values unconditionally. */
7102
7103 for (i = 0; i < n_sets; i++)
7104 if (sets[i].rtl && GET_CODE (SET_DEST (sets[i].rtl)) != REG)
7105 mention_regs (SET_DEST (sets[i].rtl));
7106
7107 /* We may have just removed some of the src_elt's from the hash table.
7108 So replace each one with the current head of the same class. */
7109
7110 for (i = 0; i < n_sets; i++)
7111 if (sets[i].rtl)
7112 {
7113 if (sets[i].src_elt && sets[i].src_elt->first_same_value == 0)
7114 /* If elt was removed, find current head of same class,
7115 or 0 if nothing remains of that class. */
7116 {
7117 register struct table_elt *elt = sets[i].src_elt;
7118
7119 while (elt && elt->prev_same_value)
7120 elt = elt->prev_same_value;
7121
7122 while (elt && elt->first_same_value == 0)
7123 elt = elt->next_same_value;
7124 sets[i].src_elt = elt ? elt->first_same_value : 0;
7125 }
7126 }
7127
7128 /* Now insert the destinations into their equivalence classes. */
7129
7130 for (i = 0; i < n_sets; i++)
7131 if (sets[i].rtl)
7132 {
7133 register rtx dest = SET_DEST (sets[i].rtl);
7134 register struct table_elt *elt;
7135
7136 /* Don't record value if we are not supposed to risk allocating
7137 floating-point values in registers that might be wider than
7138 memory. */
7139 if ((flag_float_store
7140 && GET_CODE (dest) == MEM
7141 && FLOAT_MODE_P (GET_MODE (dest)))
7142 /* Don't record values of destinations set inside a libcall block
7143 since we might delete the libcall. Things should have been set
7144 up so we won't want to reuse such a value, but we play it safe
7145 here. */
7146 || in_libcall_block
7147 /* If we didn't put a REG_EQUAL value or a source into the hash
7148 table, there is no point in recording DEST. */
7149 || sets[i].src_elt == 0)
7150 continue;
7151
7152 /* STRICT_LOW_PART isn't part of the value BEING set,
7153 and neither is the SUBREG inside it.
7154 Note that in this case SETS[I].SRC_ELT is really SRC_EQV_ELT. */
7155 if (GET_CODE (dest) == STRICT_LOW_PART)
7156 dest = SUBREG_REG (XEXP (dest, 0));
7157
7158 if (GET_CODE (dest) == REG || GET_CODE (dest) == SUBREG)
7159 /* Registers must also be inserted into chains for quantities. */
7160 if (insert_regs (dest, sets[i].src_elt, 1))
7161 /* If `insert_regs' changes something, the hash code must be
7162 recalculated. */
7163 sets[i].dest_hash = HASH (dest, GET_MODE (dest));
7164
7165 elt = insert (dest, sets[i].src_elt,
7166 sets[i].dest_hash, GET_MODE (dest));
7167 elt->in_memory = GET_CODE (sets[i].inner_dest) == MEM;
7168 if (elt->in_memory)
7169 {
7170 /* This implicitly assumes a whole struct
7171 need not have MEM_IN_STRUCT_P.
7172 But a whole struct is *supposed* to have MEM_IN_STRUCT_P. */
7173 elt->in_struct = (MEM_IN_STRUCT_P (sets[i].inner_dest)
7174 || sets[i].inner_dest != SET_DEST (sets[i].rtl));
7175 }
7176
7177 /* If we have (set (subreg:m1 (reg:m2 foo) 0) (bar:m1)), M1 is no
7178 narrower than M2, and both M1 and M2 are the same number of words,
7179 we are also doing (set (reg:m2 foo) (subreg:m2 (bar:m1) 0)) so
7180 make that equivalence as well.
7181
7182 However, BAR may have equivalences for which gen_lowpart_if_possible
7183 produces a simpler value than it produces for BAR itself (e.g., if
7184 BAR was ZERO_EXTENDed from M2), so we will scan all of BAR's
7185 equivalences. If we don't get a simplified form, make
7186 the SUBREG. It will not be used in an equivalence, but will
7187 cause two similar assignments to be detected.
7188
7189 Note the loop below will find SUBREG_REG (DEST) since we have
7190 already entered SRC and DEST of the SET in the table. */
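	/* Concrete instance (modes and register numbers are invented for
	   illustration): on a 32-bit-word target,

	     (set (subreg:SI (reg:HI 70) 0) (reg:SI 71))

	   passes the tests below, so we also record the equivalence

	     (set (reg:HI 70) (subreg:HI (reg:SI 71) 0))

	   by entering an HImode lowpart of each of (reg:SI 71)'s
	   equivalents.  */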
7191
7192 if (GET_CODE (dest) == SUBREG
7193 && (((GET_MODE_SIZE (GET_MODE (SUBREG_REG (dest))) - 1)
7194 / UNITS_PER_WORD)
7195 == (GET_MODE_SIZE (GET_MODE (dest)) - 1) / UNITS_PER_WORD)
7196 && (GET_MODE_SIZE (GET_MODE (dest))
7197 >= GET_MODE_SIZE (GET_MODE (SUBREG_REG (dest))))
7198 && sets[i].src_elt != 0)
7199 {
7200 enum machine_mode new_mode = GET_MODE (SUBREG_REG (dest));
7201 struct table_elt *elt, *classp = 0;
7202
7203 for (elt = sets[i].src_elt->first_same_value; elt;
7204 elt = elt->next_same_value)
7205 {
7206 rtx new_src = 0;
7207 unsigned src_hash;
7208 struct table_elt *src_elt;
7209
7210 /* Ignore invalid entries. */
7211 if (GET_CODE (elt->exp) != REG
7212 && ! exp_equiv_p (elt->exp, elt->exp, 1, 0))
7213 continue;
7214
7215 new_src = gen_lowpart_if_possible (new_mode, elt->exp);
7216 if (new_src == 0)
7217 new_src = gen_rtx (SUBREG, new_mode, elt->exp, 0);
7218
7219 src_hash = HASH (new_src, new_mode);
7220 src_elt = lookup (new_src, src_hash, new_mode);
7221
7222 /* Put the new source in the hash table if it isn't
7223 there already. */
7224 if (src_elt == 0)
7225 {
7226 if (insert_regs (new_src, classp, 0))
7227 src_hash = HASH (new_src, new_mode);
7228 src_elt = insert (new_src, classp, src_hash, new_mode);
7229 src_elt->in_memory = elt->in_memory;
7230 src_elt->in_struct = elt->in_struct;
7231 }
7232 else if (classp && classp != src_elt->first_same_value)
7233 /* Show that two things that we've seen before are
7234 actually the same. */
7235 merge_equiv_classes (src_elt, classp);
7236
7237 classp = src_elt->first_same_value;
7238 }
7239 }
7240 }
7241
7242 /* Special handling for (set REG0 REG1)
7243 where REG0 is the "cheapest", cheaper than REG1.
7244 After cse, REG1 will probably not be used in the sequel,
7245 so (if easily done) change this insn to (set REG1 REG0) and
7246 replace REG1 with REG0 in the previous insn that computed their value.
7247 Then REG1 will become a dead store and won't cloud the situation
7248 for later optimizations.
7249
7250 Do not make this change if REG1 is a hard register, because it will
7251 then be used in the sequel and we may be changing a two-operand insn
7252 into a three-operand insn.
7253
7254 Also do not do this if we are operating on a copy of INSN. */
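
   A minimal sketch of the rewrite (register numbers invented):

     before:  insn1: (set (reg 101) (expr))
              insn2: (set (reg 100) (reg 101))   ; reg 100 is cheaper

     after:   insn1: (set (reg 100) (expr))
              insn2: (set (reg 101) (reg 100))   ; likely a dead store

   If reg 101 is never used again, insn2 can later be removed by
   delete_dead_from_cse.  */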
7255
7256 if (n_sets == 1 && sets[0].rtl && GET_CODE (SET_DEST (sets[0].rtl)) == REG
7257 && NEXT_INSN (PREV_INSN (insn)) == insn
7258 && GET_CODE (SET_SRC (sets[0].rtl)) == REG
7259 && REGNO (SET_SRC (sets[0].rtl)) >= FIRST_PSEUDO_REGISTER
7260 && REGNO_QTY_VALID_P (REGNO (SET_SRC (sets[0].rtl)))
7261 && (qty_first_reg[reg_qty[REGNO (SET_SRC (sets[0].rtl))]]
7262 == REGNO (SET_DEST (sets[0].rtl))))
7263 {
7264 rtx prev = PREV_INSN (insn);
7265 while (prev && GET_CODE (prev) == NOTE)
7266 prev = PREV_INSN (prev);
7267
7268 if (prev && GET_CODE (prev) == INSN && GET_CODE (PATTERN (prev)) == SET
7269 && SET_DEST (PATTERN (prev)) == SET_SRC (sets[0].rtl))
7270 {
7271 rtx dest = SET_DEST (sets[0].rtl);
7272 rtx note = find_reg_note (prev, REG_EQUIV, NULL_RTX);
7273
7274 validate_change (prev, & SET_DEST (PATTERN (prev)), dest, 1);
7275 validate_change (insn, & SET_DEST (sets[0].rtl),
7276 SET_SRC (sets[0].rtl), 1);
7277 validate_change (insn, & SET_SRC (sets[0].rtl), dest, 1);
7278 apply_change_group ();
7279
7280 /* If REG1 was equivalent to a constant, REG0 is not. */
7281 if (note)
7282 PUT_REG_NOTE_KIND (note, REG_EQUAL);
7283
7284 /* If there was a REG_WAS_0 note on PREV, remove it. Move
7285 any REG_WAS_0 note on INSN to PREV. */
7286 note = find_reg_note (prev, REG_WAS_0, NULL_RTX);
7287 if (note)
7288 remove_note (prev, note);
7289
7290 note = find_reg_note (insn, REG_WAS_0, NULL_RTX);
7291 if (note)
7292 {
7293 remove_note (insn, note);
7294 XEXP (note, 1) = REG_NOTES (prev);
7295 REG_NOTES (prev) = note;
7296 }
7297 }
7298 }
7299
7300 /* If this is a conditional jump insn, record any known equivalences due to
7301 the condition being tested. */
7302
7303 last_jump_equiv_class = 0;
7304 if (GET_CODE (insn) == JUMP_INSN
7305 && n_sets == 1 && GET_CODE (x) == SET
7306 && GET_CODE (SET_SRC (x)) == IF_THEN_ELSE)
7307 record_jump_equiv (insn, 0);
7308
7309 #ifdef HAVE_cc0
7310 /* If the previous insn set CC0 and this insn no longer references CC0,
7311 delete the previous insn. Here we use the fact that nothing expects CC0
7312 to be valid over an insn, which is true until the final pass. */
7313 if (prev_insn && GET_CODE (prev_insn) == INSN
7314 && (tem = single_set (prev_insn)) != 0
7315 && SET_DEST (tem) == cc0_rtx
7316 && ! reg_mentioned_p (cc0_rtx, x))
7317 {
7318 PUT_CODE (prev_insn, NOTE);
7319 NOTE_LINE_NUMBER (prev_insn) = NOTE_INSN_DELETED;
7320 NOTE_SOURCE_FILE (prev_insn) = 0;
7321 }
7322
7323 prev_insn_cc0 = this_insn_cc0;
7324 prev_insn_cc0_mode = this_insn_cc0_mode;
7325 #endif
7326
7327 prev_insn = insn;
7328 }
7329 \f
7330 /* Store 1 in *WRITES_PTR for those categories of memory ref
7331 that must be invalidated when the expression WRITTEN is stored in.
7332 If WRITTEN is null, say everything must be invalidated. */
7333
7334 static void
7335 note_mem_written (written, writes_ptr)
7336 rtx written;
7337 struct write_data *writes_ptr;
7338 {
7339 static struct write_data everything = {0, 1, 1, 1};
7340
7341 if (written == 0)
7342 *writes_ptr = everything;
7343 else if (GET_CODE (written) == MEM)
7344 {
7345 /* Pushing or popping the stack invalidates just the stack pointer. */
7346 rtx addr = XEXP (written, 0);
7347 if ((GET_CODE (addr) == PRE_DEC || GET_CODE (addr) == PRE_INC
7348 || GET_CODE (addr) == POST_DEC || GET_CODE (addr) == POST_INC)
7349 && GET_CODE (XEXP (addr, 0)) == REG
7350 && REGNO (XEXP (addr, 0)) == STACK_POINTER_REGNUM)
7351 {
7352 writes_ptr->sp = 1;
7353 return;
7354 }
7355 else if (GET_MODE (written) == BLKmode)
7356 *writes_ptr = everything;
7357 /* (mem (scratch)) means clobber everything. */
7358 else if (GET_CODE (addr) == SCRATCH)
7359 *writes_ptr = everything;
7360 else if (cse_rtx_addr_varies_p (written))
7361 {
7362 /* A varying address that is a sum indicates an array element,
7363 and that's just as good as a structure element
7364 in implying that we need not invalidate scalar variables.
7365 However, we must allow QImode aliasing of scalars, because the
7366 ANSI C standard allows character pointers to alias anything. */
7367 if (! ((MEM_IN_STRUCT_P (written)
7368 || GET_CODE (XEXP (written, 0)) == PLUS)
7369 && GET_MODE (written) != QImode))
7370 writes_ptr->all = 1;
7371 writes_ptr->nonscalar = 1;
7372 }
7373 writes_ptr->var = 1;
7374 }
7375 }
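
/* Some illustrative classifications (assumed examples, not an
   exhaustive list): a stack push such as

     (mem:SI (pre_dec:SI (reg:SI sp)))

   sets only WRITES_PTR->sp; a BLKmode store or (mem (scratch))
   invalidates everything; a varying non-QImode address that looks
   like an array or structure reference sets just `nonscalar' and
   `var', leaving scalar variables alone.  */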
7376
7377 /* Perform invalidation on the basis of everything about an insn
7378 except for invalidating the actual places that are SET in it.
7379 This includes the places CLOBBERed, and anything that might
7380 alias with something that is SET or CLOBBERed.
7381
7382 W points to the writes_memory for this insn, a struct write_data
7383 saying which kinds of memory references must be invalidated.
7384 X is the pattern of the insn. */
7385
7386 static void
7387 invalidate_from_clobbers (w, x)
7388 struct write_data *w;
7389 rtx x;
7390 {
7391 /* If W->var is not set, W specifies no action.
7392 If W->all is set, this step gets all memory refs
7393 so they can be ignored in the rest of this function. */
7394 if (w->var)
7395 invalidate_memory (w);
7396
7397 if (w->sp)
7398 {
7399 if (reg_tick[STACK_POINTER_REGNUM] >= 0)
7400 reg_tick[STACK_POINTER_REGNUM]++;
7401
7402 /* This should be *very* rare. */
7403 if (TEST_HARD_REG_BIT (hard_regs_in_table, STACK_POINTER_REGNUM))
7404 invalidate (stack_pointer_rtx);
7405 }
7406
7407 if (GET_CODE (x) == CLOBBER)
7408 {
7409 rtx ref = XEXP (x, 0);
7410 if (ref)
7411 {
7412 if (GET_CODE (ref) == REG || GET_CODE (ref) == SUBREG
7413 || (GET_CODE (ref) == MEM && ! w->all))
7414 invalidate (ref);
7415 else if (GET_CODE (ref) == STRICT_LOW_PART
7416 || GET_CODE (ref) == ZERO_EXTRACT)
7417 invalidate (XEXP (ref, 0));
7418 }
7419 }
7420 else if (GET_CODE (x) == PARALLEL)
7421 {
7422 register int i;
7423 for (i = XVECLEN (x, 0) - 1; i >= 0; i--)
7424 {
7425 register rtx y = XVECEXP (x, 0, i);
7426 if (GET_CODE (y) == CLOBBER)
7427 {
7428 rtx ref = XEXP (y, 0);
7429 if (ref)
7430 {
7431 if (GET_CODE (ref) == REG || GET_CODE (ref) == SUBREG
7432 || (GET_CODE (ref) == MEM && ! w->all))
7433 invalidate (ref);
7434 else if (GET_CODE (ref) == STRICT_LOW_PART
7435 || GET_CODE (ref) == ZERO_EXTRACT)
7436 invalidate (XEXP (ref, 0));
7437 }
7438 }
7439 }
7440 }
7441 }
7442 \f
7443 /* Process X, part of the REG_NOTES of an insn. Look at any REG_EQUAL notes
7444 and replace any registers in them with either an equivalent constant
7445 or the canonical form of the register. If we are inside an address,
7446 only do this if the address remains valid.
7447
7448 OBJECT is 0 except when within a MEM in which case it is the MEM.
7449
7450 Return the replacement for X. */
7451
7452 static rtx
7453 cse_process_notes (x, object)
7454 rtx x;
7455 rtx object;
7456 {
7457 enum rtx_code code = GET_CODE (x);
7458 char *fmt = GET_RTX_FORMAT (code);
7459 int i;
7460
7461 switch (code)
7462 {
7463 case CONST_INT:
7464 case CONST:
7465 case SYMBOL_REF:
7466 case LABEL_REF:
7467 case CONST_DOUBLE:
7468 case PC:
7469 case CC0:
7470 case LO_SUM:
7471 return x;
7472
7473 case MEM:
7474 XEXP (x, 0) = cse_process_notes (XEXP (x, 0), x);
7475 return x;
7476
7477 case EXPR_LIST:
7478 case INSN_LIST:
7479 if (REG_NOTE_KIND (x) == REG_EQUAL)
7480 XEXP (x, 0) = cse_process_notes (XEXP (x, 0), NULL_RTX);
7481 if (XEXP (x, 1))
7482 XEXP (x, 1) = cse_process_notes (XEXP (x, 1), NULL_RTX);
7483 return x;
7484
7485 case SIGN_EXTEND:
7486 case ZERO_EXTEND:
7487 {
7488 rtx new = cse_process_notes (XEXP (x, 0), object);
7489 /* We don't substitute VOIDmode constants into these rtx,
7490 since they would impede folding. */
7491 if (GET_MODE (new) != VOIDmode)
7492 validate_change (object, &XEXP (x, 0), new, 0);
7493 return x;
7494 }
7495
7496 case REG:
7497 i = reg_qty[REGNO (x)];
7498
7499 /* Return a constant or a constant register. */
7500 if (REGNO_QTY_VALID_P (REGNO (x))
7501 && qty_const[i] != 0
7502 && (CONSTANT_P (qty_const[i])
7503 || GET_CODE (qty_const[i]) == REG))
7504 {
7505 rtx new = gen_lowpart_if_possible (GET_MODE (x), qty_const[i]);
7506 if (new)
7507 return new;
7508 }
7509
7510 /* Otherwise, canonicalize this register. */
7511 return canon_reg (x, NULL_RTX);
7512 }
7513
7514 for (i = 0; i < GET_RTX_LENGTH (code); i++)
7515 if (fmt[i] == 'e')
7516 validate_change (object, &XEXP (x, i),
7517 cse_process_notes (XEXP (x, i), object), 0);
7518
7519 return x;
7520 }
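
/* Example of the effect (illustrative register numbers): if reg 66's
   quantity currently holds (const_int 4), a note

     (expr_list:REG_EQUAL (plus:SI (reg:SI 66) (reg:SI 67)) ...)

   is rewritten so that the PLUS reads

     (plus:SI (const_int 4) (reg:SI 67'))

   where 67' stands for the canonical register of reg 67's quantity.  */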
7521 \f
7522 /* Find common subexpressions between the end test of a loop and the beginning
7523 of the loop. LOOP_START is the CODE_LABEL at the start of a loop.
7524
7525 Often we have a loop where an expression in the exit test is used
7526 in the body of the loop. For example "while (*p) *q++ = *p++;".
7527 Because of the way we duplicate the loop exit test in front of the loop,
7528 however, we don't detect that common subexpression. This will be caught
7529 when global cse is implemented, but this is quite a common case.
7530
7531 This function handles the most common cases of these common expressions.
7532 It is called after we have processed the basic block ending with the
7533 NOTE_INSN_LOOP_END note that ends a loop and the previous JUMP_INSN
7534 jumps to a label used only once. */
7535
7536 static void
7537 cse_around_loop (loop_start)
7538 rtx loop_start;
7539 {
7540 rtx insn;
7541 int i;
7542 struct table_elt *p;
7543
7544 /* If the jump at the end of the loop doesn't go to the start, we don't
7545 do anything. */
7546 for (insn = PREV_INSN (loop_start);
7547 insn && (GET_CODE (insn) == NOTE && NOTE_LINE_NUMBER (insn) >= 0);
7548 insn = PREV_INSN (insn))
7549 ;
7550
7551 if (insn == 0
7552 || GET_CODE (insn) != NOTE
7553 || NOTE_LINE_NUMBER (insn) != NOTE_INSN_LOOP_BEG)
7554 return;
7555
7556 /* If the last insn of the loop (the end test) was an NE comparison,
7557 we will interpret it as an EQ comparison, since we fell through
7558 the loop. Any equivalences resulting from that comparison are
7559 therefore not valid and must be invalidated. */
7560 if (last_jump_equiv_class)
7561 for (p = last_jump_equiv_class->first_same_value; p;
7562 p = p->next_same_value)
7563 if (GET_CODE (p->exp) == MEM || GET_CODE (p->exp) == REG
7564 || GET_CODE (p->exp) == SUBREG)
7565 invalidate (p->exp);
7566 else if (GET_CODE (p->exp) == STRICT_LOW_PART
7567 || GET_CODE (p->exp) == ZERO_EXTRACT)
7568 invalidate (XEXP (p->exp, 0));
7569
7570 /* Process insns starting after LOOP_START until we hit a CALL_INSN or
7571 a CODE_LABEL (we could handle a CALL_INSN, but it isn't worth it).
7572
7573 The only thing we do with SET_DEST is invalidate entries, so we
7574 can safely process each SET in order. It is slightly less efficient
7575 to do so, but we only want to handle the most common cases. */
7576
7577 for (insn = NEXT_INSN (loop_start);
7578 GET_CODE (insn) != CALL_INSN && GET_CODE (insn) != CODE_LABEL
7579 && ! (GET_CODE (insn) == NOTE
7580 && NOTE_LINE_NUMBER (insn) == NOTE_INSN_LOOP_END);
7581 insn = NEXT_INSN (insn))
7582 {
7583 if (GET_RTX_CLASS (GET_CODE (insn)) == 'i'
7584 && (GET_CODE (PATTERN (insn)) == SET
7585 || GET_CODE (PATTERN (insn)) == CLOBBER))
7586 cse_set_around_loop (PATTERN (insn), insn, loop_start);
7587 else if (GET_RTX_CLASS (GET_CODE (insn)) == 'i'
7588 && GET_CODE (PATTERN (insn)) == PARALLEL)
7589 for (i = XVECLEN (PATTERN (insn), 0) - 1; i >= 0; i--)
7590 if (GET_CODE (XVECEXP (PATTERN (insn), 0, i)) == SET
7591 || GET_CODE (XVECEXP (PATTERN (insn), 0, i)) == CLOBBER)
7592 cse_set_around_loop (XVECEXP (PATTERN (insn), 0, i), insn,
7593 loop_start);
7594 }
7595 }
7596 \f
7597 /* Variable used for communications between the next two routines. */
7598
7599 static struct write_data skipped_writes_memory;
7600
7601 /* Process one SET of an insn that was skipped. We ignore CLOBBERs
7602 since they are done elsewhere. This function is called via note_stores. */
7603
7604 static void
7605 invalidate_skipped_set (dest, set)
7606 rtx dest;
7607 rtx set;
7608 {
7609 if (GET_CODE (set) == CLOBBER
7610 #ifdef HAVE_cc0
7611 || dest == cc0_rtx
7612 #endif
7613 || dest == pc_rtx)
7614 return;
7615
7616 if (GET_CODE (dest) == MEM)
7617 note_mem_written (dest, &skipped_writes_memory);
7618
7619 /* There are times when an address can appear varying and be a PLUS
7620 during this scan when it would be a fixed address were we to know
7621 the proper equivalences. So promote "nonscalar" to be "all". */
7622 if (skipped_writes_memory.nonscalar)
7623 skipped_writes_memory.all = 1;
7624
7625 if (GET_CODE (dest) == REG || GET_CODE (dest) == SUBREG
7626 || (! skipped_writes_memory.all && ! cse_rtx_addr_varies_p (dest)))
7627 invalidate (dest);
7628 else if (GET_CODE (dest) == STRICT_LOW_PART
7629 || GET_CODE (dest) == ZERO_EXTRACT)
7630 invalidate (XEXP (dest, 0));
7631 }
7632
7633 /* Invalidate all insns from START up to the end of the function or the
7634 next label. This is called when we wish to CSE around a block that is
7635 conditionally executed. */
7636
7637 static void
7638 invalidate_skipped_block (start)
7639 rtx start;
7640 {
7641 rtx insn;
7642 static struct write_data init = {0, 0, 0, 0};
7643 static struct write_data everything = {0, 1, 1, 1};
7644
7645 for (insn = start; insn && GET_CODE (insn) != CODE_LABEL;
7646 insn = NEXT_INSN (insn))
7647 {
7648 if (GET_RTX_CLASS (GET_CODE (insn)) != 'i')
7649 continue;
7650
7651 skipped_writes_memory = init;
7652
7653 if (GET_CODE (insn) == CALL_INSN)
7654 {
7655 invalidate_for_call ();
7656 skipped_writes_memory = everything;
7657 }
7658
7659 note_stores (PATTERN (insn), invalidate_skipped_set);
7660 invalidate_from_clobbers (&skipped_writes_memory, PATTERN (insn));
7661 }
7662 }
7663 \f
7664 /* Used for communication between the following two routines; contains a
7665 value to be checked for modification. */
7666
7667 static rtx cse_check_loop_start_value;
7668
7669 /* If modifying X will modify the value in CSE_CHECK_LOOP_START_VALUE,
7670 indicate that fact by setting CSE_CHECK_LOOP_START_VALUE to 0. */
7671
7672 static void
7673 cse_check_loop_start (x, set)
7674 rtx x;
7675 rtx set;
7676 {
7677 if (cse_check_loop_start_value == 0
7678 || GET_CODE (x) == CC0 || GET_CODE (x) == PC)
7679 return;
7680
7681 if ((GET_CODE (x) == MEM && GET_CODE (cse_check_loop_start_value) == MEM)
7682 || reg_overlap_mentioned_p (x, cse_check_loop_start_value))
7683 cse_check_loop_start_value = 0;
7684 }
7685
7686 /* X is a SET or CLOBBER contained in INSN that was found near the start of
7687 a loop that starts with the label at LOOP_START.
7688
7689 If X is a SET, we see if its SET_SRC is currently in our hash table.
7690 If so, we see if it has a value equal to some register used only in the
7691 loop exit code (as marked by jump.c).
7692
7693 If those two conditions are true, we search backwards from the start of
7694 the loop to see if that same value was loaded into a register that still
7695 retains its value at the start of the loop.
7696
7697 If so, we insert an insn after the load to copy the destination of that
7698 load into the equivalent register and (try to) replace our SET_SRC with that
7699 register.
7700
7701 In any event, we invalidate whatever this SET or CLOBBER modifies. */
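
/* Illustrative scenario (register numbers invented):

     (set (reg 80) (mem:SI (reg 70)))   ; before the loop
     L:                                 ; loop start
     (set (reg 90) (mem:SI (reg 70)))   ; X, inside the loop

   If (mem:SI (reg 70)) is equivalent to some cheaper register used
   only in the loop exit test, we emit a copy of (reg 80) into that
   register just after the first load and make X read from it.  */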
7702
7703 static void
7704 cse_set_around_loop (x, insn, loop_start)
7705 rtx x;
7706 rtx insn;
7707 rtx loop_start;
7708 {
7709 struct table_elt *src_elt;
7710 static struct write_data init = {0, 0, 0, 0};
7711 struct write_data writes_memory;
7712
7713 writes_memory = init;
7714
7715 /* If this is a SET, see if we can replace SET_SRC, but ignore SETs that
7716 are setting PC or CC0 or whose SET_SRC is already a register. */
7717 if (GET_CODE (x) == SET
7718 && GET_CODE (SET_DEST (x)) != PC && GET_CODE (SET_DEST (x)) != CC0
7719 && GET_CODE (SET_SRC (x)) != REG)
7720 {
7721 src_elt = lookup (SET_SRC (x),
7722 HASH (SET_SRC (x), GET_MODE (SET_DEST (x))),
7723 GET_MODE (SET_DEST (x)));
7724
7725 if (src_elt)
7726 for (src_elt = src_elt->first_same_value; src_elt;
7727 src_elt = src_elt->next_same_value)
7728 if (GET_CODE (src_elt->exp) == REG && REG_LOOP_TEST_P (src_elt->exp)
7729 && COST (src_elt->exp) < COST (SET_SRC (x)))
7730 {
7731 rtx p, set;
7732
7733 /* Look for an insn in front of LOOP_START that sets
7734 something in the desired mode to SET_SRC (x) before we hit
7735 a label or CALL_INSN. */
7736
7737 for (p = prev_nonnote_insn (loop_start);
7738 p && GET_CODE (p) != CALL_INSN
7739 && GET_CODE (p) != CODE_LABEL;
7740 p = prev_nonnote_insn (p))
7741 if ((set = single_set (p)) != 0
7742 && GET_CODE (SET_DEST (set)) == REG
7743 && GET_MODE (SET_DEST (set)) == src_elt->mode
7744 && rtx_equal_p (SET_SRC (set), SET_SRC (x)))
7745 {
7746 /* We now have to ensure that nothing between P
7747 and LOOP_START modified anything referenced in
7748 SET_SRC (x). We know that nothing within the loop
7749 can modify it, or we would have invalidated it in
7750 the hash table. */
7751 rtx q;
7752
7753 cse_check_loop_start_value = SET_SRC (x);
7754 for (q = p; q != loop_start; q = NEXT_INSN (q))
7755 if (GET_RTX_CLASS (GET_CODE (q)) == 'i')
7756 note_stores (PATTERN (q), cse_check_loop_start);
7757
7758 /* If nothing was changed and we can replace our
7759 SET_SRC, add an insn after P to copy its destination
7760 to what we will be replacing SET_SRC with. */
7761 if (cse_check_loop_start_value
7762 && validate_change (insn, &SET_SRC (x),
7763 src_elt->exp, 0))
7764 emit_insn_after (gen_move_insn (src_elt->exp,
7765 SET_DEST (set)),
7766 p);
7767 break;
7768 }
7769 }
7770 }
7771
7772 /* Now invalidate anything modified by X. */
7773 note_mem_written (SET_DEST (x), &writes_memory);
7774
7775 if (writes_memory.var)
7776 invalidate_memory (&writes_memory);
7777
7778 /* See comment on similar code in cse_insn for explanation of these tests. */
7779 if (GET_CODE (SET_DEST (x)) == REG || GET_CODE (SET_DEST (x)) == SUBREG
7780 || (GET_CODE (SET_DEST (x)) == MEM && ! writes_memory.all
7781 && ! cse_rtx_addr_varies_p (SET_DEST (x))))
7782 invalidate (SET_DEST (x));
7783 else if (GET_CODE (SET_DEST (x)) == STRICT_LOW_PART
7784 || GET_CODE (SET_DEST (x)) == ZERO_EXTRACT)
7785 invalidate (XEXP (SET_DEST (x), 0));
7786 }
7787 \f
7788 /* Find the end of INSN's basic block and record in DATA its range,
7789 the total number of SETs in all the insns of the block, the last insn of the
7790 block, and the branch path.
7791
7792 The branch path indicates which branches should be followed. If a non-zero
7793 path size is specified, the block should be rescanned and a different set
7794 of branches will be taken. The branch path is only used if
7795 FLAG_CSE_FOLLOW_JUMPS or FLAG_CSE_SKIP_BLOCKS is non-zero.
7796
7797 DATA is a pointer to a struct cse_basic_block_data, defined below, that is
7798 used to describe the block. It is filled in with the information about
7799 the current block. The incoming structure's branch path, if any, is used
7800 to construct the output branch path. */
7801
7802 void
7803 cse_end_of_basic_block (insn, data, follow_jumps, after_loop, skip_blocks)
7804 rtx insn;
7805 struct cse_basic_block_data *data;
7806 int follow_jumps;
7807 int after_loop;
7808 int skip_blocks;
7809 {
7810 rtx p = insn, q;
7811 int nsets = 0;
7812 int low_cuid = INSN_CUID (insn), high_cuid = INSN_CUID (insn);
7813 rtx next = GET_RTX_CLASS (GET_CODE (insn)) == 'i' ? insn : next_real_insn (insn);
7814 int path_size = data->path_size;
7815 int path_entry = 0;
7816 int i;
7817
7818 /* Update the previous branch path, if any. If the last branch was
7819 previously TAKEN, mark it NOT_TAKEN. If it was previously NOT_TAKEN,
7820 shorten the path by one and look at the previous branch. We know that
7821 at least one branch must have been taken if PATH_SIZE is non-zero. */
7822 while (path_size > 0)
7823 {
7824 if (data->path[path_size - 1].status != NOT_TAKEN)
7825 {
7826 data->path[path_size - 1].status = NOT_TAKEN;
7827 break;
7828 }
7829 else
7830 path_size--;
7831 }
7832
7833 /* Scan to end of this basic block. */
7834 while (p && GET_CODE (p) != CODE_LABEL)
7835 {
7836 /* Don't cse out the end of a loop. This makes a difference
7837 only for the unusual loops that always execute at least once;
7838 all other loops have labels there so we will stop in any case.
7839 Cse'ing out the end of the loop is dangerous because it
7840 might cause an invariant expression inside the loop
7841 to be reused after the end of the loop. This would make it
7842 hard to move the expression out of the loop in loop.c,
7843 especially if it is one of several equivalent expressions
7844 and loop.c would like to eliminate it.
7845
7846 If we are running after loop.c has finished, we can ignore
7847 the NOTE_INSN_LOOP_END. */
7848
7849 if (! after_loop && GET_CODE (p) == NOTE
7850 && NOTE_LINE_NUMBER (p) == NOTE_INSN_LOOP_END)
7851 break;
7852
7853 /* Don't cse over a call to setjmp; on some machines (e.g. the VAX)
7854 the regs restored by the longjmp come from
7855 a later time than the setjmp. */
7856 if (GET_CODE (p) == NOTE
7857 && NOTE_LINE_NUMBER (p) == NOTE_INSN_SETJMP)
7858 break;
7859
7860 /* A PARALLEL can have lots of SETs in it,
7861 especially if it is really an ASM_OPERANDS. */
7862 if (GET_RTX_CLASS (GET_CODE (p)) == 'i'
7863 && GET_CODE (PATTERN (p)) == PARALLEL)
7864 nsets += XVECLEN (PATTERN (p), 0);
7865 else if (GET_CODE (p) != NOTE)
7866 nsets += 1;
7867
7868 /* Ignore insns made by CSE; they cannot affect the boundaries of
7869 the basic block. */
7870
7871 if (INSN_UID (p) <= max_uid && INSN_CUID (p) > high_cuid)
7872 high_cuid = INSN_CUID (p);
7873 if (INSN_UID (p) <= max_uid && INSN_CUID (p) < low_cuid)
7874 low_cuid = INSN_CUID (p);
7875
7876 /* See if this insn is in our branch path. If it is and we are to
7877 take it, do so. */
7878 if (path_entry < path_size && data->path[path_entry].branch == p)
7879 {
7880 if (data->path[path_entry].status != NOT_TAKEN)
7881 p = JUMP_LABEL (p);
7882
7883 /* Point to next entry in path, if any. */
7884 path_entry++;
7885 }
7886
7887 /* If this is a conditional jump, we can follow it if -fcse-follow-jumps
7888 was specified, we haven't reached our maximum path length, there are
7889 insns following the target of the jump, this is the only use of the
7890 jump label, and the target label is preceded by a BARRIER.
7891
7892 Alternatively, we can follow the jump if it branches around a
7893 block of code and there are no other branches into the block.
7894 In this case invalidate_skipped_block will be called to invalidate any
7895 registers set in the block when following the jump. */
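
      /* Sketch of the two cases (labels invented for illustration):

	   follow_jumps:  (jump L1) ... (barrier) ... L1:
	     the code after L1 extends this block along a TAKEN path;

	   skip_blocks:   (jump L2) <block with no incoming labels> L2:
	     the block is marked AROUND in the path and everything it
	     sets is invalidated via invalidate_skipped_block.  */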
7896
7897 else if ((follow_jumps || skip_blocks) && path_size < PATHLENGTH - 1
7898 && GET_CODE (p) == JUMP_INSN
7899 && GET_CODE (PATTERN (p)) == SET
7900 && GET_CODE (SET_SRC (PATTERN (p))) == IF_THEN_ELSE
7901 && LABEL_NUSES (JUMP_LABEL (p)) == 1
7902 && NEXT_INSN (JUMP_LABEL (p)) != 0)
7903 {
7904 for (q = PREV_INSN (JUMP_LABEL (p)); q; q = PREV_INSN (q))
7905 if ((GET_CODE (q) != NOTE
7906 || NOTE_LINE_NUMBER (q) == NOTE_INSN_LOOP_END
7907 || NOTE_LINE_NUMBER (q) == NOTE_INSN_SETJMP)
7908 && (GET_CODE (q) != CODE_LABEL || LABEL_NUSES (q) != 0))
7909 break;
7910
7911 /* If we ran into a BARRIER, this code is an extension of the
7912 basic block when the branch is taken. */
7913 if (follow_jumps && q != 0 && GET_CODE (q) == BARRIER)
7914 {
7915 /* Don't allow ourselves to keep walking around an
7916 always-executed loop. */
7917 if (next_real_insn (q) == next)
7918 {
7919 p = NEXT_INSN (p);
7920 continue;
7921 }
7922
7923 /* Similarly, don't put a branch in our path more than once. */
7924 for (i = 0; i < path_entry; i++)
7925 if (data->path[i].branch == p)
7926 break;
7927
7928 if (i != path_entry)
7929 break;
7930
7931 data->path[path_entry].branch = p;
7932 data->path[path_entry++].status = TAKEN;
7933
7934 /* This branch now ends our path. It was possible that we
7935 didn't see this branch the last time around (when the
7936 insn in front of the target was a JUMP_INSN that was
7937 turned into a no-op). */
7938 path_size = path_entry;
7939
7940 p = JUMP_LABEL (p);
7941 /* Mark block so we won't scan it again later. */
7942 PUT_MODE (NEXT_INSN (p), QImode);
7943 }
7944 /* Detect a branch around a block of code. */
7945 else if (skip_blocks && q != 0 && GET_CODE (q) != CODE_LABEL)
7946 {
7947 register rtx tmp;
7948
7949 if (next_real_insn (q) == next)
7950 {
7951 p = NEXT_INSN (p);
7952 continue;
7953 }
7954
7955 for (i = 0; i < path_entry; i++)
7956 if (data->path[i].branch == p)
7957 break;
7958
7959 if (i != path_entry)
7960 break;
7961
7962 /* This is no_labels_between_p (p, q) with an added check for
7963 reaching the end of a function (in case Q precedes P). */
7964 for (tmp = NEXT_INSN (p); tmp && tmp != q; tmp = NEXT_INSN (tmp))
7965 if (GET_CODE (tmp) == CODE_LABEL)
7966 break;
7967
7968 if (tmp == q)
7969 {
7970 data->path[path_entry].branch = p;
7971 data->path[path_entry++].status = AROUND;
7972
7973 path_size = path_entry;
7974
7975 p = JUMP_LABEL (p);
7976 /* Mark block so we won't scan it again later. */
7977 PUT_MODE (NEXT_INSN (p), QImode);
7978 }
7979 }
7980 }
7981 p = NEXT_INSN (p);
7982 }
7983
7984 data->low_cuid = low_cuid;
7985 data->high_cuid = high_cuid;
7986 data->nsets = nsets;
7987 data->last = p;
7988
7989 /* If no jump in the path was taken, set our path length to zero
7990 so a rescan won't be done. */
7991 for (i = path_size - 1; i >= 0; i--)
7992 if (data->path[i].status != NOT_TAKEN)
7993 break;
7994
7995 if (i == -1)
7996 data->path_size = 0;
7997 else
7998 data->path_size = path_size;
7999
8000 /* End the current branch path. */
8001 data->path[path_size].branch = 0;
8002 }
8003 \f
8004 /* Perform cse on the instructions of a function.
8005 F is the first instruction.
8006 NREGS is one plus the highest pseudo-reg number used in the instructions.
8007
8008 AFTER_LOOP is 1 if this is the cse call done after loop optimization
8009 (only if -frerun-cse-after-loop).
8010
8011 Returns 1 if jump_optimize should be redone due to simplifications
8012 in conditional jump instructions. */
8013
8014 int
8015 cse_main (f, nregs, after_loop, file)
8016 rtx f;
8017 int nregs;
8018 int after_loop;
8019 FILE *file;
8020 {
8021 struct cse_basic_block_data val;
8022 register rtx insn = f;
8023 register int i;
8024
8025 cse_jumps_altered = 0;
8026 constant_pool_entries_cost = 0;
8027 val.path_size = 0;
8028
8029 init_recog ();
8030
8031 max_reg = nregs;
8032
8033 all_minus_one = (int *) alloca (nregs * sizeof (int));
8034 consec_ints = (int *) alloca (nregs * sizeof (int));
8035
8036 for (i = 0; i < nregs; i++)
8037 {
8038 all_minus_one[i] = -1;
8039 consec_ints[i] = i;
8040 }
8041
8042 reg_next_eqv = (int *) alloca (nregs * sizeof (int));
8043 reg_prev_eqv = (int *) alloca (nregs * sizeof (int));
8044 reg_qty = (int *) alloca (nregs * sizeof (int));
8045 reg_in_table = (int *) alloca (nregs * sizeof (int));
8046 reg_tick = (int *) alloca (nregs * sizeof (int));
8047
8048 #ifdef LOAD_EXTEND_OP
8049
8050 /* Allocate scratch rtl here. cse_insn will fill in the memory reference
8051 and change the code and mode as appropriate. */
8052 memory_extend_rtx = gen_rtx (ZERO_EXTEND, VOIDmode, 0);
8053 #endif
8054
8055 /* Discard all the free elements of the previous function
8056 since they are allocated in the temporary obstack. */
8057 bzero ((char *) table, sizeof table);
8058 free_element_chain = 0;
8059 n_elements_made = 0;
8060
8061 /* Find the largest uid. */
8062
8063 max_uid = get_max_uid ();
8064 uid_cuid = (int *) alloca ((max_uid + 1) * sizeof (int));
8065 bzero ((char *) uid_cuid, (max_uid + 1) * sizeof (int));
8066
8067 /* Compute the mapping from uids to cuids.
8068 CUIDs are numbers assigned to insns, like uids,
8069 except that cuids increase monotonically through the code.
8070 Don't assign cuids to line-number NOTEs, so that the distance in cuids
8071 between two insns is not affected by -g. */
8072
8073 for (insn = f, i = 0; insn; insn = NEXT_INSN (insn))
8074 {
8075 if (GET_CODE (insn) != NOTE
8076 || NOTE_LINE_NUMBER (insn) < 0)
8077 INSN_CUID (insn) = ++i;
8078 else
8079 /* Give a line number note the same cuid as preceding insn. */
8080 INSN_CUID (insn) = i;
8081 }
8082
8083 /* Initialize which registers are clobbered by calls. */
8084
8085 CLEAR_HARD_REG_SET (regs_invalidated_by_call);
8086
8087 for (i = 0; i < FIRST_PSEUDO_REGISTER; i++)
8088 if ((call_used_regs[i]
8089 /* Used to check !fixed_regs[i] here, but that isn't safe;
8090 fixed regs are still call-clobbered, and sched can get
8091 confused if they can "live across calls".
8092
8093 The frame pointer is always preserved across calls. The arg
8094 pointer is if it is fixed. The stack pointer usually is, unless
8095 RETURN_POPS_ARGS, in which case an explicit CLOBBER
8096 will be present. If we are generating PIC code, the PIC offset
8097 table register is preserved across calls. */
8098
8099 && i != STACK_POINTER_REGNUM
8100 && i != FRAME_POINTER_REGNUM
8101 #if HARD_FRAME_POINTER_REGNUM != FRAME_POINTER_REGNUM
8102 && i != HARD_FRAME_POINTER_REGNUM
8103 #endif
8104 #if ARG_POINTER_REGNUM != FRAME_POINTER_REGNUM
8105 && ! (i == ARG_POINTER_REGNUM && fixed_regs[i])
8106 #endif
8107 #if defined (PIC_OFFSET_TABLE_REGNUM) && !defined (PIC_OFFSET_TABLE_REG_CALL_CLOBBERED)
8108 && ! (i == PIC_OFFSET_TABLE_REGNUM && flag_pic)
8109 #endif
8110 )
8111 || global_regs[i])
8112 SET_HARD_REG_BIT (regs_invalidated_by_call, i);
8113
8114 /* Loop over basic blocks.
8115 Compute the maximum number of qty's needed for each basic block
8116 (which is 2 for each SET). */
8117 insn = f;
8118 while (insn)
8119 {
8120 cse_end_of_basic_block (insn, &val, flag_cse_follow_jumps, after_loop,
8121 flag_cse_skip_blocks);
8122
8123 /* If this basic block was already processed or has no sets, skip it. */
8124 if (val.nsets == 0 || GET_MODE (insn) == QImode)
8125 {
8126 PUT_MODE (insn, VOIDmode);
8127 insn = (val.last ? NEXT_INSN (val.last) : 0);
8128 val.path_size = 0;
8129 continue;
8130 }
8131
8132 cse_basic_block_start = val.low_cuid;
8133 cse_basic_block_end = val.high_cuid;
8134 max_qty = val.nsets * 2;
8135
8136 if (file)
8137 fprintf (file, ";; Processing block from %d to %d, %d sets.\n",
8138 INSN_UID (insn), val.last ? INSN_UID (val.last) : 0,
8139 val.nsets);
8140
8141 /* Make MAX_QTY bigger to give us room to optimize
8142 past the end of this basic block, if that should prove useful. */
8143 if (max_qty < 500)
8144 max_qty = 500;
8145
8146 max_qty += max_reg;
8147
8148 /* If this basic block is being extended by following certain jumps,
8149 (see `cse_end_of_basic_block'), we reprocess the code from the start.
8150 Otherwise, we start after this basic block. */
8151 if (val.path_size > 0)
8152 cse_basic_block (insn, val.last, val.path, 0);
8153 else
8154 {
8155 int old_cse_jumps_altered = cse_jumps_altered;
8156 rtx temp;
8157
8158 /* When cse changes a conditional jump to an unconditional
8159 jump, we want to reprocess the block, since it will give
8160 us a new branch path to investigate. */
8161 cse_jumps_altered = 0;
8162 temp = cse_basic_block (insn, val.last, val.path, ! after_loop);
8163 if (cse_jumps_altered == 0
8164 || (flag_cse_follow_jumps == 0 && flag_cse_skip_blocks == 0))
8165 insn = temp;
8166
8167 cse_jumps_altered |= old_cse_jumps_altered;
8168 }
8169
8170 #ifdef USE_C_ALLOCA
8171 alloca (0);
8172 #endif
8173 }
8174
8175 /* Tell refers_to_mem_p that qty_const info is not available. */
8176 qty_const = 0;
8177
8178 if (max_elements_made < n_elements_made)
8179 max_elements_made = n_elements_made;
8180
8181 return cse_jumps_altered;
8182 }
8183
8184 /* Process a single basic block. FROM and TO are the limits of the basic
8185 block. NEXT_BRANCH points to the branch path when following jumps or
8186 a null path when not following jumps.
8187
8188 AROUND_LOOP is non-zero if we are to try to cse around to the start of a
8189 loop. This is true when we are being called for the last time on a
8190 block and this CSE pass is before loop.c. */
8191
8192 static rtx
8193 cse_basic_block (from, to, next_branch, around_loop)
8194 register rtx from, to;
8195 struct branch_path *next_branch;
8196 int around_loop;
8197 {
8198 register rtx insn;
8199 int to_usage = 0;
8200 int in_libcall_block = 0;
8201
8202 /* Each of these arrays is undefined before max_reg, so only allocate
8203 the space actually needed and adjust the start below. */
8204
8205 qty_first_reg = (int *) alloca ((max_qty - max_reg) * sizeof (int));
8206 qty_last_reg = (int *) alloca ((max_qty - max_reg) * sizeof (int));
8207 qty_mode = (enum machine_mode *) alloca ((max_qty - max_reg) * sizeof (enum machine_mode));
8208 qty_const = (rtx *) alloca ((max_qty - max_reg) * sizeof (rtx));
8209 qty_const_insn = (rtx *) alloca ((max_qty - max_reg) * sizeof (rtx));
8210 qty_comparison_code
8211 = (enum rtx_code *) alloca ((max_qty - max_reg) * sizeof (enum rtx_code));
8212 qty_comparison_qty = (int *) alloca ((max_qty - max_reg) * sizeof (int));
8213 qty_comparison_const = (rtx *) alloca ((max_qty - max_reg) * sizeof (rtx));
8214
8215 qty_first_reg -= max_reg;
8216 qty_last_reg -= max_reg;
8217 qty_mode -= max_reg;
8218 qty_const -= max_reg;
8219 qty_const_insn -= max_reg;
8220 qty_comparison_code -= max_reg;
8221 qty_comparison_qty -= max_reg;
8222 qty_comparison_const -= max_reg;
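
  /* After the adjustments above, each array is validly indexed by a
     quantity number in the range [max_reg, max_qty).  E.g.
     (illustrative), with max_reg == 100, qty_mode[100] refers to
     element 0 of the block just alloca'd for qty_mode.  */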
8223
8224 new_basic_block ();
8225
8226 /* TO might be a label. If so, protect it from being deleted. */
8227 if (to != 0 && GET_CODE (to) == CODE_LABEL)
8228 ++LABEL_NUSES (to);
8229
8230 for (insn = from; insn != to; insn = NEXT_INSN (insn))
8231 {
8232 register enum rtx_code code;
8233
8234 /* See if this is a branch that is part of the path. If so, and it is
8235 to be taken, do so. */
8236 if (next_branch->branch == insn)
8237 {
8238 enum taken status = next_branch++->status;
8239 if (status != NOT_TAKEN)
8240 {
8241 if (status == TAKEN)
8242 record_jump_equiv (insn, 1);
8243 else
8244 invalidate_skipped_block (NEXT_INSN (insn));
8245
8246 /* Set the last insn as the jump insn; it doesn't affect cc0.
8247 Then follow this branch. */
8248 #ifdef HAVE_cc0
8249 prev_insn_cc0 = 0;
8250 #endif
8251 prev_insn = insn;
8252 insn = JUMP_LABEL (insn);
8253 continue;
8254 }
8255 }
8256
8257 code = GET_CODE (insn);
8258 if (GET_MODE (insn) == QImode)
8259 PUT_MODE (insn, VOIDmode);
8260
8261 if (GET_RTX_CLASS (code) == 'i')
8262 {
8263 /* Process notes first so we have all notes in canonical forms when
8264 looking for duplicate operations. */
8265
8266 if (REG_NOTES (insn))
8267 REG_NOTES (insn) = cse_process_notes (REG_NOTES (insn), NULL_RTX);
8268
8269 /* Track when we are inside a LIBCALL block. Inside such a block,
8270 we do not want to record destinations. The last insn of a
8271 LIBCALL block is not considered to be part of the block, since
8272 its destination is the result of the block and hence should be
8273 recorded. */
8274
8275 if (find_reg_note (insn, REG_LIBCALL, NULL_RTX))
8276 in_libcall_block = 1;
8277 else if (find_reg_note (insn, REG_RETVAL, NULL_RTX))
8278 in_libcall_block = 0;
8279
8280 cse_insn (insn, in_libcall_block);
8281 }
8282
8283 /* If INSN is now an unconditional jump, skip to the end of our
8284 basic block by pretending that we just did the last insn in the
8285 basic block. If we are jumping to the end of our block, show
8286 that we can have one usage of TO. */
8287
8288 if (simplejump_p (insn))
8289 {
8290 if (to == 0)
8291 return 0;
8292
8293 if (JUMP_LABEL (insn) == to)
8294 to_usage = 1;
8295
8296 /* Maybe TO was deleted because the jump is unconditional.
8297 If so, there is nothing left in this basic block. */
8298 /* ??? Perhaps it would be smarter to set TO
8299 to whatever follows this insn,
8300 and pretend the basic block had always ended here. */
8301 if (INSN_DELETED_P (to))
8302 break;
8303
8304 insn = PREV_INSN (to);
8305 }
8306
8307 /* See if it is ok to keep on going past the label
8308 which used to end our basic block. Remember that we incremented
8309 the count of that label, so we decrement it here. If we made
8310 a jump unconditional, TO_USAGE will be one; in that case, we don't
8311 want to count the use in that jump. */
8312
8313 if (to != 0 && NEXT_INSN (insn) == to
8314 && GET_CODE (to) == CODE_LABEL && --LABEL_NUSES (to) == to_usage)
8315 {
8316 struct cse_basic_block_data val;
8317
8318 insn = NEXT_INSN (to);
8319
8320 if (LABEL_NUSES (to) == 0)
8321 delete_insn (to);
8322
8323 /* Find the end of the following block. Note that we won't be
8324 following branches in this case. If TO was the last insn
8325 in the function, we are done. Similarly, if we deleted the
8326 insn after TO, it must have been because it was preceded by
8327 a BARRIER. In that case, we are done with this block because it
8328 has no continuation. */
8329
8330 if (insn == 0 || INSN_DELETED_P (insn))
8331 return 0;
8332
8333 to_usage = 0;
8334 val.path_size = 0;
8335 cse_end_of_basic_block (insn, &val, 0, 0, 0);
8336
8337 /* If the tables we allocated have enough space left
8338 to handle all the SETs in the next basic block,
8339 continue through it. Otherwise, return,
8340 and that block will be scanned individually. */
8341 if (val.nsets * 2 + next_qty > max_qty)
8342 break;
8343
8344 cse_basic_block_start = val.low_cuid;
8345 cse_basic_block_end = val.high_cuid;
8346 to = val.last;
8347
8348 /* Prevent TO from being deleted if it is a label. */
8349 if (to != 0 && GET_CODE (to) == CODE_LABEL)
8350 ++LABEL_NUSES (to);
8351
8352 /* Back up so we process the first insn in the extension. */
8353 insn = PREV_INSN (insn);
8354 }
8355 }
8356
8357 if (next_qty > max_qty)
8358 abort ();
8359
8360 /* If we are running before loop.c, we stopped on a NOTE_INSN_LOOP_END, and
8361 the previous insn is the only insn that branches to the head of a loop,
8362 we can cse into the loop. Don't do this if we changed the jump
8363 structure of a loop unless we aren't going to be following jumps. */
8364
8365 if ((cse_jumps_altered == 0
8366 || (flag_cse_follow_jumps == 0 && flag_cse_skip_blocks == 0))
8367 && around_loop && to != 0
8368 && GET_CODE (to) == NOTE && NOTE_LINE_NUMBER (to) == NOTE_INSN_LOOP_END
8369 && GET_CODE (PREV_INSN (to)) == JUMP_INSN
8370 && JUMP_LABEL (PREV_INSN (to)) != 0
8371 && LABEL_NUSES (JUMP_LABEL (PREV_INSN (to))) == 1)
8372 cse_around_loop (JUMP_LABEL (PREV_INSN (to)));
8373
8374 return to ? NEXT_INSN (to) : 0;
8375 }
8376 \f
8377 /* Count the number of times registers are used (not set) in X.
8378 COUNTS is an array in which we accumulate the count, INCR is how much
8379 we count each register usage.
8380
8381 Don't count a usage of DEST, which is the SET_DEST of a SET which
8382 contains X in its SET_SRC. This is because such a SET does not
8383 modify the liveness of DEST. */
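
   Example (illustrative register number): in

     (set (reg:SI 60) (plus:SI (reg:SI 60) (const_int 1)))

   the (reg 60) inside the source is not counted because the PLUS has
   no side-effects, so an increment of an otherwise unused register
   leaves counts[60] at zero and the insn can be deleted as dead.  */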
8384
8385 static void
8386 count_reg_usage (x, counts, dest, incr)
8387 rtx x;
8388 int *counts;
8389 rtx dest;
8390 int incr;
8391 {
8392 enum rtx_code code;
8393 char *fmt;
8394 int i, j;
8395
8396 if (x == 0)
8397 return;
8398
8399 switch (code = GET_CODE (x))
8400 {
8401 case REG:
8402 if (x != dest)
8403 counts[REGNO (x)] += incr;
8404 return;
8405
8406 case PC:
8407 case CC0:
8408 case CONST:
8409 case CONST_INT:
8410 case CONST_DOUBLE:
8411 case SYMBOL_REF:
8412 case LABEL_REF:
8413 case CLOBBER:
8414 return;
8415
8416 case SET:
8417 /* Unless we are setting a REG, count everything in SET_DEST. */
8418 if (GET_CODE (SET_DEST (x)) != REG)
8419 count_reg_usage (SET_DEST (x), counts, NULL_RTX, incr);
8420
8421 /* If SRC has side-effects, then we can't delete this insn, so the
8422 usage of SET_DEST inside SRC counts.
8423
8424 ??? Strictly-speaking, we might be preserving this insn
8425 because some other SET has side-effects, but that's hard
8426 to do and can't happen now. */
8427 count_reg_usage (SET_SRC (x), counts,
8428 side_effects_p (SET_SRC (x)) ? NULL_RTX : SET_DEST (x),
8429 incr);
8430 return;
8431
8432 case CALL_INSN:
8433 count_reg_usage (CALL_INSN_FUNCTION_USAGE (x), counts, NULL_RTX, incr);
8434
8435 /* ... falls through ... */
8436 case INSN:
8437 case JUMP_INSN:
8438 count_reg_usage (PATTERN (x), counts, NULL_RTX, incr);
8439
8440 /* Things used in a REG_EQUAL note aren't dead since loop may try to
8441 use them. */
8442
8443 count_reg_usage (REG_NOTES (x), counts, NULL_RTX, incr);
8444 return;
8445
8446 case EXPR_LIST:
8447 case INSN_LIST:
8448 if (REG_NOTE_KIND (x) == REG_EQUAL
8449 || GET_CODE (XEXP (x, 0)) == USE)
8450 count_reg_usage (XEXP (x, 0), counts, NULL_RTX, incr);
8451 count_reg_usage (XEXP (x, 1), counts, NULL_RTX, incr);
8452 return;
8453 }
8454
8455 fmt = GET_RTX_FORMAT (code);
8456 for (i = GET_RTX_LENGTH (code) - 1; i >= 0; i--)
8457 {
8458 if (fmt[i] == 'e')
8459 count_reg_usage (XEXP (x, i), counts, dest, incr);
8460 else if (fmt[i] == 'E')
8461 for (j = XVECLEN (x, i) - 1; j >= 0; j--)
8462 count_reg_usage (XVECEXP (x, i, j), counts, dest, incr);
8463 }
8464 }
8465 \f
8466 /* Scan all the insns and delete any that are dead; i.e., they store a register
8467 that is never used or they copy a register to itself.
8468
8469 This is used to remove insns made obviously dead by cse. It improves the
8470 heuristics in loop since it won't try to move dead invariants out of loops
8471 or make givs for dead quantities. The remaining passes of the compilation
8472 are also sped up. */
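
/* E.g. (illustrative): once cse has replaced every later use of
   (reg 75), the copy

     (set (reg 75) (reg 70))

   has counts[75] == 0 and no side-effects, so it is deleted; the
   deletion also decrements the count for (reg 70), which may in turn
   make the insn that sets reg 70 dead on this same backward scan.  */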
8473
8474 void
8475 delete_dead_from_cse (insns, nreg)
8476 rtx insns;
8477 int nreg;
8478 {
8479 int *counts = (int *) alloca (nreg * sizeof (int));
8480 rtx insn, prev;
8481 rtx tem;
8482 int i;
8483 int in_libcall = 0;
8484
8485 /* First count the number of times each register is used. */
8486 bzero ((char *) counts, sizeof (int) * nreg);
8487 for (insn = next_real_insn (insns); insn; insn = next_real_insn (insn))
8488 count_reg_usage (insn, counts, NULL_RTX, 1);
8489
8490 /* Go from the last insn to the first and delete insns that only set unused
8491 registers or copy a register to itself. As we delete an insn, remove
8492 usage counts for registers it uses. */
8493 for (insn = prev_real_insn (get_last_insn ()); insn; insn = prev)
8494 {
8495 int live_insn = 0;
8496
8497 prev = prev_real_insn (insn);
8498
8499 /* Don't delete any insns that are part of a libcall block.
8500 Flow or loop might get confused if we did that. Remember
8501 that we are scanning backwards. */
8502 if (find_reg_note (insn, REG_RETVAL, NULL_RTX))
8503 in_libcall = 1;
8504
8505 if (in_libcall)
8506 live_insn = 1;
8507 else if (GET_CODE (PATTERN (insn)) == SET)
8508 {
8509 if (GET_CODE (SET_DEST (PATTERN (insn))) == REG
8510 && SET_DEST (PATTERN (insn)) == SET_SRC (PATTERN (insn)))
8511 ;
8512
8513 #ifdef HAVE_cc0
8514 else if (GET_CODE (SET_DEST (PATTERN (insn))) == CC0
8515 && ! side_effects_p (SET_SRC (PATTERN (insn)))
8516 && ((tem = next_nonnote_insn (insn)) == 0
8517 || GET_RTX_CLASS (GET_CODE (tem)) != 'i'
8518 || ! reg_referenced_p (cc0_rtx, PATTERN (tem))))
8519 ;
8520 #endif
8521 else if (GET_CODE (SET_DEST (PATTERN (insn))) != REG
8522 || REGNO (SET_DEST (PATTERN (insn))) < FIRST_PSEUDO_REGISTER
8523 || counts[REGNO (SET_DEST (PATTERN (insn)))] != 0
8524 || side_effects_p (SET_SRC (PATTERN (insn))))
8525 live_insn = 1;
8526 }
8527 else if (GET_CODE (PATTERN (insn)) == PARALLEL)
8528 for (i = XVECLEN (PATTERN (insn), 0) - 1; i >= 0; i--)
8529 {
8530 rtx elt = XVECEXP (PATTERN (insn), 0, i);
8531
8532 if (GET_CODE (elt) == SET)
8533 {
8534 if (GET_CODE (SET_DEST (elt)) == REG
8535 && SET_DEST (elt) == SET_SRC (elt))
8536 ;
8537
8538 #ifdef HAVE_cc0
8539 else if (GET_CODE (SET_DEST (elt)) == CC0
8540 && ! side_effects_p (SET_SRC (elt))
8541 && ((tem = next_nonnote_insn (insn)) == 0
8542 || GET_RTX_CLASS (GET_CODE (tem)) != 'i'
8543 || ! reg_referenced_p (cc0_rtx, PATTERN (tem))))
8544 ;
8545 #endif
8546 else if (GET_CODE (SET_DEST (elt)) != REG
8547 || REGNO (SET_DEST (elt)) < FIRST_PSEUDO_REGISTER
8548 || counts[REGNO (SET_DEST (elt))] != 0
8549 || side_effects_p (SET_SRC (elt)))
8550 live_insn = 1;
8551 }
8552 else if (GET_CODE (elt) != CLOBBER && GET_CODE (elt) != USE)
8553 live_insn = 1;
8554 }
8555 else
8556 live_insn = 1;
8557
8558 /* If this is a dead insn, delete it and show registers in it aren't
8559 being used. */
8560
8561 if (! live_insn)
8562 {
8563 count_reg_usage (insn, counts, NULL_RTX, -1);
8564 delete_insn (insn);
8565 }
8566
8567 if (find_reg_note (insn, REG_LIBCALL, NULL_RTX))
8568 in_libcall = 0;
8569 }
8570 }