gcc/optabs.c

   1 /* Expand the basic unary and binary arithmetic operations, for GNU compiler.
   2    Copyright (C) 1987-2014 Free Software Foundation, Inc.
   3
   4 This file is part of GCC.
   5
   6 GCC is free software; you can redistribute it and/or modify it under
   7 the terms of the GNU General Public License as published by the Free
   8 Software Foundation; either version 3, or (at your option) any later
   9 version.
  10
  11 GCC is distributed in the hope that it will be useful, but WITHOUT ANY
  12 WARRANTY; without even the implied warranty of MERCHANTABILITY or
  13 FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
  14 for more details.
  15
  16 You should have received a copy of the GNU General Public License
  17 along with GCC; see the file COPYING3.  If not see
  18 <http://www.gnu.org/licenses/>.  */
  19
  20
  21 #include "config.h"
  22 #include "system.h"
  23 #include "coretypes.h"
  24 #include "tm.h"
  25 #include "diagnostic-core.h"
  26
  27 /* Include insn-config.h before expr.h so that HAVE_conditional_move
  28    is properly defined.  */
  29 #include "insn-config.h"
  30 #include "rtl.h"
  31 #include "tree.h"
  32 #include "stor-layout.h"
  33 #include "stringpool.h"
  34 #include "varasm.h"
  35 #include "tm_p.h"
  36 #include "flags.h"
  37 #include "function.h"
  38 #include "except.h"
  39 #include "expr.h"
  40 #include "optabs.h"
  41 #include "libfuncs.h"
  42 #include "recog.h"
  43 #include "reload.h"
  44 #include "ggc.h"
  45 #include "basic-block.h"
  46 #include "target.h"
  47
  48 struct target_optabs default_target_optabs;
  49 struct target_libfuncs default_target_libfuncs;
  50 struct target_optabs *this_fn_optabs = &default_target_optabs;
  51 #if SWITCHABLE_TARGET
  52 struct target_optabs *this_target_optabs = &default_target_optabs;
  53 struct target_libfuncs *this_target_libfuncs = &default_target_libfuncs;
  54 #endif
  55
  56 #define libfunc_hash \
  57   (this_target_libfuncs->x_libfunc_hash)
  58
  59 static void prepare_float_lib_cmp (rtx, rtx, enum rtx_code, rtx *,
  60                                    enum machine_mode *);
  61 static rtx expand_unop_direct (enum machine_mode, optab, rtx, rtx, int);
  62 static void emit_libcall_block_1 (rtx, rtx, rtx, rtx, bool);
  63
  64 /* Debug facility for use in GDB.  */
  65 void debug_optab_libfuncs (void);
  66
  67 /* Prefixes for the current version of decimal floating point (BID vs. DPD) */
  68 #if ENABLE_DECIMAL_BID_FORMAT
  69 #define DECIMAL_PREFIX "bid_"
  70 #else
  71 #define DECIMAL_PREFIX "dpd_"
  72 #endif
  73 \f
  74 /* Used for libfunc_hash.  */
  75
  76 static hashval_t
  77 hash_libfunc (const void *p)
  78 {
  79   const struct libfunc_entry *const e = (const struct libfunc_entry *) p;
  80   return ((e->mode1 + e->mode2 * NUM_MACHINE_MODES) ^ e->op);
  81 }
  82
  83 /* Used for libfunc_hash.  */
  84
  85 static int
  86 eq_libfunc (const void *p, const void *q)
  87 {
  88   const struct libfunc_entry *const e1 = (const struct libfunc_entry *) p;
  89   const struct libfunc_entry *const e2 = (const struct libfunc_entry *) q;
  90   return e1->op == e2->op && e1->mode1 == e2->mode1 && e1->mode2 == e2->mode2;
  91 }
  92
  93 /* Return libfunc corresponding operation defined by OPTAB converting
  94    from MODE2 to MODE1.  Trigger lazy initialization if needed, return NULL
  95    if no libfunc is available.  */
  96 rtx
  97 convert_optab_libfunc (convert_optab optab, enum machine_mode mode1,
  98                        enum machine_mode mode2)
  99 {
 100   struct libfunc_entry e;
 101   struct libfunc_entry **slot;
 102
 103   /* ??? This ought to be an assert, but not all of the places
 104      that we expand optabs know about the optabs that got moved
 105      to being direct.  */
 106   if (!(optab >= FIRST_CONV_OPTAB && optab <= LAST_CONVLIB_OPTAB))
 107     return NULL_RTX;
 108
 109   e.op = optab;
 110   e.mode1 = mode1;
 111   e.mode2 = mode2;
 112   slot = (struct libfunc_entry **)
 113     htab_find_slot (libfunc_hash, &e, NO_INSERT);
 114   if (!slot)
 115     {
 116       const struct convert_optab_libcall_d *d
 117         = &convlib_def[optab - FIRST_CONV_OPTAB];
 118
 119       if (d->libcall_gen == NULL)
 120         return NULL;
 121
 122       d->libcall_gen (optab, d->libcall_basename, mode1, mode2);
 123       slot = (struct libfunc_entry **)
 124         htab_find_slot (libfunc_hash, &e, NO_INSERT);
 125       if (!slot)
 126         return NULL;
 127     }
 128   return (*slot)->libfunc;
 129 }
 130
 131 /* Return libfunc corresponding operation defined by OPTAB in MODE.
 132    Trigger lazy initialization if needed, return NULL if no libfunc is
 133    available.  */
 134 rtx
 135 optab_libfunc (optab optab, enum machine_mode mode)
 136 {
 137   struct libfunc_entry e;
 138   struct libfunc_entry **slot;
 139
 140   /* ??? This ought to be an assert, but not all of the places
 141      that we expand optabs know about the optabs that got moved
 142      to being direct.  */
 143   if (!(optab >= FIRST_NORM_OPTAB && optab <= LAST_NORMLIB_OPTAB))
 144     return NULL_RTX;
 145
 146   e.op = optab;
 147   e.mode1 = mode;
 148   e.mode2 = VOIDmode;
 149   slot = (struct libfunc_entry **)
 150     htab_find_slot (libfunc_hash, &e, NO_INSERT);
 151   if (!slot)
 152     {
 153       const struct optab_libcall_d *d
 154         = &normlib_def[optab - FIRST_NORM_OPTAB];
 155
 156       if (d->libcall_gen == NULL)
 157         return NULL;
 158
 159       d->libcall_gen (optab, d->libcall_basename, d->libcall_suffix, mode);
 160       slot = (struct libfunc_entry **)
 161         htab_find_slot (libfunc_hash, &e, NO_INSERT);
 162       if (!slot)
 163         return NULL;
 164     }
 165   return (*slot)->libfunc;
 166 }
 167
 168 \f
 169 /* Add a REG_EQUAL note to the last insn in INSNS.  TARGET is being set to
 170    the result of operation CODE applied to OP0 (and OP1 if it is a binary
 171    operation).
 172
 173    If the last insn does not set TARGET, don't do anything, but return 1.
 174
 175    If the last insn or a previous insn sets TARGET and TARGET is one of OP0
 176    or OP1, don't add the REG_EQUAL note but return 0.  Our caller can then
 177    try again, ensuring that TARGET is not one of the operands.  */
 178
 179 static int
 180 add_equal_note (rtx insns, rtx target, enum rtx_code code, rtx op0, rtx op1)
 181 {
 182   rtx last_insn, set;
 183   rtx note;
 184
 185   gcc_assert (insns && INSN_P (insns) && NEXT_INSN (insns));
 186
 187   if (GET_RTX_CLASS (code) != RTX_COMM_ARITH
 188       && GET_RTX_CLASS (code) != RTX_BIN_ARITH
 189       && GET_RTX_CLASS (code) != RTX_COMM_COMPARE
 190       && GET_RTX_CLASS (code) != RTX_COMPARE
 191       && GET_RTX_CLASS (code) != RTX_UNARY)
 192     return 1;
 193
 194   if (GET_CODE (target) == ZERO_EXTRACT)
 195     return 1;
 196
 197   for (last_insn = insns;
 198        NEXT_INSN (last_insn) != NULL_RTX;
 199        last_insn = NEXT_INSN (last_insn))
 200     ;
 201
 202   /* If TARGET is in OP0 or OP1, punt.  We'd end up with a note referencing
 203      a value changing in the insn, so the note would be invalid for CSE.  */
 204   if (reg_overlap_mentioned_p (target, op0)
 205       || (op1 && reg_overlap_mentioned_p (target, op1)))
 206     {
 207       if (MEM_P (target)
 208           && (rtx_equal_p (target, op0)
 209               || (op1 && rtx_equal_p (target, op1))))
 210         {
 211           /* For MEM target, with MEM = MEM op X, prefer no REG_EQUAL note
 212              over expanding it as temp = MEM op X, MEM = temp.  If the target
 213              supports MEM = MEM op X instructions, it is sometimes too hard
 214              to reconstruct that form later, especially if X is also a memory,
 215              and due to multiple occurrences of addresses the address might
 216              be forced into register unnecessarily.
 217              Note that not emitting the REG_EQUIV note might inhibit
 218              CSE in some cases.  */
 219           set = single_set (last_insn);
 220           if (set
 221               && GET_CODE (SET_SRC (set)) == code
 222               && MEM_P (SET_DEST (set))
 223               && (rtx_equal_p (SET_DEST (set), XEXP (SET_SRC (set), 0))
 224                   || (op1 && rtx_equal_p (SET_DEST (set),
 225                                           XEXP (SET_SRC (set), 1)))))
 226             return 1;
 227         }
 228       return 0;
 229     }
 230
 231   set = single_set (last_insn);
 232   if (set == NULL_RTX)
 233     return 1;
 234
 235   if (! rtx_equal_p (SET_DEST (set), target)
 236       /* For a STRICT_LOW_PART, the REG_NOTE applies to what is inside it.  */
 237       && (GET_CODE (SET_DEST (set)) != STRICT_LOW_PART
 238           || ! rtx_equal_p (XEXP (SET_DEST (set), 0), target)))
 239     return 1;
 240
 241   if (GET_RTX_CLASS (code) == RTX_UNARY)
 242     switch (code)
 243       {
 244       case FFS:
 245       case CLZ:
 246       case CTZ:
 247       case CLRSB:
 248       case POPCOUNT:
 249       case PARITY:
 250       case BSWAP:
 251         if (GET_MODE (op0) != VOIDmode && GET_MODE (target) != GET_MODE (op0))
 252           {
 253             note = gen_rtx_fmt_e (code, GET_MODE (op0), copy_rtx (op0));
 254             if (GET_MODE_SIZE (GET_MODE (op0))
 255                 > GET_MODE_SIZE (GET_MODE (target)))
 256               note = simplify_gen_unary (TRUNCATE, GET_MODE (target),
 257                                          note, GET_MODE (op0));
 258             else
 259               note = simplify_gen_unary (ZERO_EXTEND, GET_MODE (target),
 260                                          note, GET_MODE (op0));
 261             break;
 262           }
 263         /* FALLTHRU */
 264       default:
 265         note = gen_rtx_fmt_e (code, GET_MODE (target), copy_rtx (op0));
 266         break;
 267       }
 268   else
 269     note = gen_rtx_fmt_ee (code, GET_MODE (target), copy_rtx (op0), copy_rtx (op1));
 270
 271   set_unique_reg_note (last_insn, REG_EQUAL, note);
 272
 273   return 1;
 274 }
 275 \f
 276 /* Given two input operands, OP0 and OP1, determine what the correct from_mode
 277    for a widening operation would be.  In most cases this would be OP0, but if
 278    that's a constant it'll be VOIDmode, which isn't useful.  */
 279
 280 static enum machine_mode
 281 widened_mode (enum machine_mode to_mode, rtx op0, rtx op1)
 282 {
 283   enum machine_mode m0 = GET_MODE (op0);
 284   enum machine_mode m1 = GET_MODE (op1);
 285   enum machine_mode result;
 286
 287   if (m0 == VOIDmode && m1 == VOIDmode)
 288     return to_mode;
 289   else if (m0 == VOIDmode || GET_MODE_SIZE (m0) < GET_MODE_SIZE (m1))
 290     result = m1;
 291   else
 292     result = m0;
 293
 294   if (GET_MODE_SIZE (result) > GET_MODE_SIZE (to_mode))
 295     return to_mode;
 296
 297   return result;
 298 }
 299 \f
 300 /* Find a widening optab even if it doesn't widen as much as we want.
 301    E.g. if from_mode is HImode, and to_mode is DImode, and there is no
 302    direct HI->SI insn, then return SI->DI, if that exists.
 303    If PERMIT_NON_WIDENING is non-zero then this can be used with
 304    non-widening optabs also.  */
 305
 306 enum insn_code
 307 find_widening_optab_handler_and_mode (optab op, enum machine_mode to_mode,
 308                                       enum machine_mode from_mode,
 309                                       int permit_non_widening,
 310                                       enum machine_mode *found_mode)
 311 {
 312   for (; (permit_non_widening || from_mode != to_mode)
 313          && GET_MODE_SIZE (from_mode) <= GET_MODE_SIZE (to_mode)
 314          && from_mode != VOIDmode;
 315        from_mode = GET_MODE_WIDER_MODE (from_mode))
 316     {
 317       enum insn_code handler = widening_optab_handler (op, to_mode,
 318                                                        from_mode);
 319
 320       if (handler != CODE_FOR_nothing)
 321         {
 322           if (found_mode)
 323             *found_mode = from_mode;
 324           return handler;
 325         }
 326     }
 327
 328   return CODE_FOR_nothing;
 329 }
 330 \f
 331 /* Widen OP to MODE and return the rtx for the widened operand.  UNSIGNEDP
 332    says whether OP is signed or unsigned.  NO_EXTEND is nonzero if we need
 333    not actually do a sign-extend or zero-extend, but can leave the
 334    higher-order bits of the result rtx undefined, for example, in the case
 335    of logical operations, but not right shifts.  */
 336
 337 static rtx
 338 widen_operand (rtx op, enum machine_mode mode, enum machine_mode oldmode,
 339                int unsignedp, int no_extend)
 340 {
 341   rtx result;
 342
 343   /* If we don't have to extend and this is a constant, return it.  */
 344   if (no_extend && GET_MODE (op) == VOIDmode)
 345     return op;
 346
 347   /* If we must extend do so.  If OP is a SUBREG for a promoted object, also
 348      extend since it will be more efficient to do so unless the signedness of
 349      a promoted object differs from our extension.  */
 350   if (! no_extend
 351       || (GET_CODE (op) == SUBREG && SUBREG_PROMOTED_VAR_P (op)
 352           && SUBREG_PROMOTED_UNSIGNED_P (op) == unsignedp))
 353     return convert_modes (mode, oldmode, op, unsignedp);
 354
 355   /* If MODE is no wider than a single word, we return a lowpart or paradoxical
 356      SUBREG.  */
 357   if (GET_MODE_SIZE (mode) <= UNITS_PER_WORD)
 358     return gen_lowpart (mode, force_reg (GET_MODE (op), op));
 359
 360   /* Otherwise, get an object of MODE, clobber it, and set the low-order
 361      part to OP.  */
 362
 363   result = gen_reg_rtx (mode);
 364   emit_clobber (result);
 365   emit_move_insn (gen_lowpart (GET_MODE (op), result), op);
 366   return result;
 367 }
 368 \f
 369 /* Return the optab used for computing the operation given by the tree code,
 370    CODE and the tree EXP.  This function is not always usable (for example, it
 371    cannot give complete results for multiplication or division) but probably
 372    ought to be relied on more widely throughout the expander.  */
 373 optab
 374 optab_for_tree_code (enum tree_code code, const_tree type,
 375                      enum optab_subtype subtype)
 376 {
 377   bool trapv;
 378   switch (code)
 379     {
 380     case BIT_AND_EXPR:
 381       return and_optab;
 382
 383     case BIT_IOR_EXPR:
 384       return ior_optab;
 385
 386     case BIT_NOT_EXPR:
 387       return one_cmpl_optab;
 388
 389     case BIT_XOR_EXPR:
 390       return xor_optab;
 391
 392     case MULT_HIGHPART_EXPR:
 393       return TYPE_UNSIGNED (type) ? umul_highpart_optab : smul_highpart_optab;
 394
 395     case TRUNC_MOD_EXPR:
 396     case CEIL_MOD_EXPR:
 397     case FLOOR_MOD_EXPR:
 398     case ROUND_MOD_EXPR:
 399       return TYPE_UNSIGNED (type) ? umod_optab : smod_optab;
 400
 401     case RDIV_EXPR:
 402     case TRUNC_DIV_EXPR:
 403     case CEIL_DIV_EXPR:
 404     case FLOOR_DIV_EXPR:
 405     case ROUND_DIV_EXPR:
 406     case EXACT_DIV_EXPR:
 407       if (TYPE_SATURATING (type))
 408         return TYPE_UNSIGNED (type) ? usdiv_optab : ssdiv_optab;
 409       return TYPE_UNSIGNED (type) ? udiv_optab : sdiv_optab;
 410
 411     case LSHIFT_EXPR:
 412       if (TREE_CODE (type) == VECTOR_TYPE)
 413         {
 414           if (subtype == optab_vector)
 415             return TYPE_SATURATING (type) ? unknown_optab : vashl_optab;
 416
 417           gcc_assert (subtype == optab_scalar);
 418         }
 419       if (TYPE_SATURATING (type))
 420         return TYPE_UNSIGNED (type) ? usashl_optab : ssashl_optab;
 421       return ashl_optab;
 422
 423     case RSHIFT_EXPR:
 424       if (TREE_CODE (type) == VECTOR_TYPE)
 425         {
 426           if (subtype == optab_vector)
 427             return TYPE_UNSIGNED (type) ? vlshr_optab : vashr_optab;
 428
 429           gcc_assert (subtype == optab_scalar);
 430         }
 431       return TYPE_UNSIGNED (type) ? lshr_optab : ashr_optab;
 432
 433     case LROTATE_EXPR:
 434       if (TREE_CODE (type) == VECTOR_TYPE)
 435         {
 436           if (subtype == optab_vector)
 437             return vrotl_optab;
 438
 439           gcc_assert (subtype == optab_scalar);
 440         }
 441       return rotl_optab;
 442
 443     case RROTATE_EXPR:
 444       if (TREE_CODE (type) == VECTOR_TYPE)
 445         {
 446           if (subtype == optab_vector)
 447             return vrotr_optab;
 448
 449           gcc_assert (subtype == optab_scalar);
 450         }
 451       return rotr_optab;
 452
 453     case MAX_EXPR:
 454       return TYPE_UNSIGNED (type) ? umax_optab : smax_optab;
 455
 456     case MIN_EXPR:
 457       return TYPE_UNSIGNED (type) ? umin_optab : smin_optab;
 458
 459     case REALIGN_LOAD_EXPR:
 460       return vec_realign_load_optab;
 461
 462     case WIDEN_SUM_EXPR:
 463       return TYPE_UNSIGNED (type) ? usum_widen_optab : ssum_widen_optab;
 464
 465     case DOT_PROD_EXPR:
 466       return TYPE_UNSIGNED (type) ? udot_prod_optab : sdot_prod_optab;
 467
 468     case WIDEN_MULT_PLUS_EXPR:
 469       return (TYPE_UNSIGNED (type)
 470               ? (TYPE_SATURATING (type)
 471                  ? usmadd_widen_optab : umadd_widen_optab)
 472               : (TYPE_SATURATING (type)
 473                  ? ssmadd_widen_optab : smadd_widen_optab));
 474
 475     case WIDEN_MULT_MINUS_EXPR:
 476       return (TYPE_UNSIGNED (type)
 477               ? (TYPE_SATURATING (type)
 478                  ? usmsub_widen_optab : umsub_widen_optab)
 479               : (TYPE_SATURATING (type)
 480                  ? ssmsub_widen_optab : smsub_widen_optab));
 481
 482     case FMA_EXPR:
 483       return fma_optab;
 484
 485     case REDUC_MAX_EXPR:
 486       return TYPE_UNSIGNED (type) ? reduc_umax_optab : reduc_smax_optab;
 487
 488     case REDUC_MIN_EXPR:
 489       return TYPE_UNSIGNED (type) ? reduc_umin_optab : reduc_smin_optab;
 490
 491     case REDUC_PLUS_EXPR:
 492       return TYPE_UNSIGNED (type) ? reduc_uplus_optab : reduc_splus_optab;
 493
 494     case VEC_LSHIFT_EXPR:
 495       return vec_shl_optab;
 496
 497     case VEC_RSHIFT_EXPR:
 498       return vec_shr_optab;
 499
 500     case VEC_WIDEN_MULT_HI_EXPR:
 501       return TYPE_UNSIGNED (type) ?
 502         vec_widen_umult_hi_optab : vec_widen_smult_hi_optab;
 503
 504     case VEC_WIDEN_MULT_LO_EXPR:
 505       return TYPE_UNSIGNED (type) ?
 506         vec_widen_umult_lo_optab : vec_widen_smult_lo_optab;
 507
 508     case VEC_WIDEN_MULT_EVEN_EXPR:
 509       return TYPE_UNSIGNED (type) ?
 510         vec_widen_umult_even_optab : vec_widen_smult_even_optab;
 511
 512     case VEC_WIDEN_MULT_ODD_EXPR:
 513       return TYPE_UNSIGNED (type) ?
 514         vec_widen_umult_odd_optab : vec_widen_smult_odd_optab;
 515
 516     case VEC_WIDEN_LSHIFT_HI_EXPR:
 517       return TYPE_UNSIGNED (type) ?
 518         vec_widen_ushiftl_hi_optab : vec_widen_sshiftl_hi_optab;
 519
 520     case VEC_WIDEN_LSHIFT_LO_EXPR:
 521       return TYPE_UNSIGNED (type) ?
 522         vec_widen_ushiftl_lo_optab : vec_widen_sshiftl_lo_optab;
 523
 524     case VEC_UNPACK_HI_EXPR:
 525       return TYPE_UNSIGNED (type) ?
 526         vec_unpacku_hi_optab : vec_unpacks_hi_optab;
 527
 528     case VEC_UNPACK_LO_EXPR:
 529       return TYPE_UNSIGNED (type) ?
 530         vec_unpacku_lo_optab : vec_unpacks_lo_optab;
 531
 532     case VEC_UNPACK_FLOAT_HI_EXPR:
 533       /* The signedness is determined from input operand.  */
 534       return TYPE_UNSIGNED (type) ?
 535         vec_unpacku_float_hi_optab : vec_unpacks_float_hi_optab;
 536
 537     case VEC_UNPACK_FLOAT_LO_EXPR:
 538       /* The signedness is determined from input operand.  */
 539       return TYPE_UNSIGNED (type) ?
 540         vec_unpacku_float_lo_optab : vec_unpacks_float_lo_optab;
 541
 542     case VEC_PACK_TRUNC_EXPR:
 543       return vec_pack_trunc_optab;
 544
 545     case VEC_PACK_SAT_EXPR:
 546       return TYPE_UNSIGNED (type) ? vec_pack_usat_optab : vec_pack_ssat_optab;
 547
 548     case VEC_PACK_FIX_TRUNC_EXPR:
 549       /* The signedness is determined from output operand.  */
 550       return TYPE_UNSIGNED (type) ?
 551         vec_pack_ufix_trunc_optab : vec_pack_sfix_trunc_optab;
 552
 553     default:
 554       break;
 555     }
 556
 557   trapv = INTEGRAL_TYPE_P (type) && TYPE_OVERFLOW_TRAPS (type);
 558   switch (code)
 559     {
 560     case POINTER_PLUS_EXPR:
 561     case PLUS_EXPR:
 562       if (TYPE_SATURATING (type))
 563         return TYPE_UNSIGNED (type) ? usadd_optab : ssadd_optab;
 564       return trapv ? addv_optab : add_optab;
 565
 566     case MINUS_EXPR:
 567       if (TYPE_SATURATING (type))
 568         return TYPE_UNSIGNED (type) ? ussub_optab : sssub_optab;
 569       return trapv ? subv_optab : sub_optab;
 570
 571     case MULT_EXPR:
 572       if (TYPE_SATURATING (type))
 573         return TYPE_UNSIGNED (type) ? usmul_optab : ssmul_optab;
 574       return trapv ? smulv_optab : smul_optab;
 575
 576     case NEGATE_EXPR:
 577       if (TYPE_SATURATING (type))
 578         return TYPE_UNSIGNED (type) ? usneg_optab : ssneg_optab;
 579       return trapv ? negv_optab : neg_optab;
 580
 581     case ABS_EXPR:
 582       return trapv ? absv_optab : abs_optab;
 583
 584     default:
 585       return unknown_optab;
 586     }
 587 }
 588 \f
 589
 590 /* Expand vector widening operations.
 591
 592    There are two different classes of operations handled here:
 593    1) Operations whose result is wider than all the arguments to the operation.
 594       Examples: VEC_UNPACK_HI/LO_EXPR, VEC_WIDEN_MULT_HI/LO_EXPR
 595       In this case OP0 and optionally OP1 would be initialized,
 596       but WIDE_OP wouldn't (not relevant for this case).
 597    2) Operations whose result is of the same size as the last argument to the
 598       operation, but wider than all the other arguments to the operation.
 599       Examples: WIDEN_SUM_EXPR, VEC_DOT_PROD_EXPR.
 600       In the case WIDE_OP, OP0 and optionally OP1 would be initialized.
 601
 602    E.g, when called to expand the following operations, this is how
 603    the arguments will be initialized:
 604                                 nops    OP0     OP1     WIDE_OP
 605    widening-sum                 2       oprnd0  -       oprnd1
 606    widening-dot-product         3       oprnd0  oprnd1  oprnd2
 607    widening-mult                2       oprnd0  oprnd1  -
 608    type-promotion (vec-unpack)  1       oprnd0  -       -  */
 609
 610 rtx
 611 expand_widen_pattern_expr (sepops ops, rtx op0, rtx op1, rtx wide_op,
 612                            rtx target, int unsignedp)
 613 {
 614   struct expand_operand eops[4];
 615   tree oprnd0, oprnd1, oprnd2;
 616   enum machine_mode wmode = VOIDmode, tmode0, tmode1 = VOIDmode;
 617   optab widen_pattern_optab;
 618   enum insn_code icode;
 619   int nops = TREE_CODE_LENGTH (ops->code);
 620   int op;
 621
 622   oprnd0 = ops->op0;
 623   tmode0 = TYPE_MODE (TREE_TYPE (oprnd0));
 624   widen_pattern_optab =
 625     optab_for_tree_code (ops->code, TREE_TYPE (oprnd0), optab_default);
 626   if (ops->code == WIDEN_MULT_PLUS_EXPR
 627       || ops->code == WIDEN_MULT_MINUS_EXPR)
 628     icode = find_widening_optab_handler (widen_pattern_optab,
 629                                          TYPE_MODE (TREE_TYPE (ops->op2)),
 630                                          tmode0, 0);
 631   else
 632     icode = optab_handler (widen_pattern_optab, tmode0);
 633   gcc_assert (icode != CODE_FOR_nothing);
 634
 635   if (nops >= 2)
 636     {
 637       oprnd1 = ops->op1;
 638       tmode1 = TYPE_MODE (TREE_TYPE (oprnd1));
 639     }
 640
 641   /* The last operand is of a wider mode than the rest of the operands.  */
 642   if (nops == 2)
 643     wmode = tmode1;
 644   else if (nops == 3)
 645     {
 646       gcc_assert (tmode1 == tmode0);
 647       gcc_assert (op1);
 648       oprnd2 = ops->op2;
 649       wmode = TYPE_MODE (TREE_TYPE (oprnd2));
 650     }
 651
 652   op = 0;
 653   create_output_operand (&eops[op++], target, TYPE_MODE (ops->type));
 654   create_convert_operand_from (&eops[op++], op0, tmode0, unsignedp);
 655   if (op1)
 656     create_convert_operand_from (&eops[op++], op1, tmode1, unsignedp);
 657   if (wide_op)
 658     create_convert_operand_from (&eops[op++], wide_op, wmode, unsignedp);
 659   expand_insn (icode, op, eops);
 660   return eops[0].value;
 661 }
 662
 663 /* Generate code to perform an operation specified by TERNARY_OPTAB
 664    on operands OP0, OP1 and OP2, with result having machine-mode MODE.
 665
 666    UNSIGNEDP is for the case where we have to widen the operands
 667    to perform the operation.  It says to use zero-extension.
 668
 669    If TARGET is nonzero, the value
 670    is generated there, if it is convenient to do so.
 671    In all cases an rtx is returned for the locus of the value;
 672    this may or may not be TARGET.  */
 673
 674 rtx
 675 expand_ternary_op (enum machine_mode mode, optab ternary_optab, rtx op0,
 676                    rtx op1, rtx op2, rtx target, int unsignedp)
 677 {
 678   struct expand_operand ops[4];
 679   enum insn_code icode = optab_handler (ternary_optab, mode);
 680
 681   gcc_assert (optab_handler (ternary_optab, mode) != CODE_FOR_nothing);
 682
 683   create_output_operand (&ops[0], target, mode);
 684   create_convert_operand_from (&ops[1], op0, mode, unsignedp);
 685   create_convert_operand_from (&ops[2], op1, mode, unsignedp);
 686   create_convert_operand_from (&ops[3], op2, mode, unsignedp);
 687   expand_insn (icode, 4, ops);
 688   return ops[0].value;
 689 }
 690
 691
 692 /* Like expand_binop, but return a constant rtx if the result can be
 693    calculated at compile time.  The arguments and return value are
 694    otherwise the same as for expand_binop.  */
 695
 696 rtx
 697 simplify_expand_binop (enum machine_mode mode, optab binoptab,
 698                        rtx op0, rtx op1, rtx target, int unsignedp,
 699                        enum optab_methods methods)
 700 {
 701   if (CONSTANT_P (op0) && CONSTANT_P (op1))
 702     {
 703       rtx x = simplify_binary_operation (optab_to_code (binoptab),
 704                                          mode, op0, op1);
 705       if (x)
 706         return x;
 707     }
 708
 709   return expand_binop (mode, binoptab, op0, op1, target, unsignedp, methods);
 710 }
 711
 712 /* Like simplify_expand_binop, but always put the result in TARGET.
 713    Return true if the expansion succeeded.  */
 714
 715 bool
 716 force_expand_binop (enum machine_mode mode, optab binoptab,
 717                     rtx op0, rtx op1, rtx target, int unsignedp,
 718                     enum optab_methods methods)
 719 {
 720   rtx x = simplify_expand_binop (mode, binoptab, op0, op1,
 721                                  target, unsignedp, methods);
 722   if (x == 0)
 723     return false;
 724   if (x != target)
 725     emit_move_insn (target, x);
 726   return true;
 727 }
 728
 729 /* Generate insns for VEC_LSHIFT_EXPR, VEC_RSHIFT_EXPR.  */
 730
 731 rtx
 732 expand_vec_shift_expr (sepops ops, rtx target)
 733 {
 734   struct expand_operand eops[3];
 735   enum insn_code icode;
 736   rtx rtx_op1, rtx_op2;
 737   enum machine_mode mode = TYPE_MODE (ops->type);
 738   tree vec_oprnd = ops->op0;
 739   tree shift_oprnd = ops->op1;
 740   optab shift_optab;
 741
 742   switch (ops->code)
 743     {
 744       case VEC_RSHIFT_EXPR:
 745         shift_optab = vec_shr_optab;
 746         break;
 747       case VEC_LSHIFT_EXPR:
 748         shift_optab = vec_shl_optab;
 749         break;
 750       default:
 751         gcc_unreachable ();
 752     }
 753
 754   icode = optab_handler (shift_optab, mode);
 755   gcc_assert (icode != CODE_FOR_nothing);
 756
 757   rtx_op1 = expand_normal (vec_oprnd);
 758   rtx_op2 = expand_normal (shift_oprnd);
 759
 760   create_output_operand (&eops[0], target, mode);
 761   create_input_operand (&eops[1], rtx_op1, GET_MODE (rtx_op1));
 762   create_convert_operand_from_type (&eops[2], rtx_op2, TREE_TYPE (shift_oprnd));
 763   expand_insn (icode, 3, eops);
 764
 765   return eops[0].value;
 766 }
 767
 768 /* Create a new vector value in VMODE with all elements set to OP.  The
 769    mode of OP must be the element mode of VMODE.  If OP is a constant,
 770    then the return value will be a constant.  */
 771
 772 static rtx
 773 expand_vector_broadcast (enum machine_mode vmode, rtx op)
 774 {
 775   enum insn_code icode;
 776   rtvec vec;
 777   rtx ret;
 778   int i, n;
 779
 780   gcc_checking_assert (VECTOR_MODE_P (vmode));
 781
 782   n = GET_MODE_NUNITS (vmode);
 783   vec = rtvec_alloc (n);
 784   for (i = 0; i < n; ++i)
 785     RTVEC_ELT (vec, i) = op;
 786
 787   if (CONSTANT_P (op))
 788     return gen_rtx_CONST_VECTOR (vmode, vec);
 789
 790   /* ??? If the target doesn't have a vec_init, then we have no easy way
 791      of performing this operation.  Most of this sort of generic support
 792      is hidden away in the vector lowering support in gimple.  */
 793   icode = optab_handler (vec_init_optab, vmode);
 794   if (icode == CODE_FOR_nothing)
 795     return NULL;
 796
 797   ret = gen_reg_rtx (vmode);
 798   emit_insn (GEN_FCN (icode) (ret, gen_rtx_PARALLEL (vmode, vec)));
 799
 800   return ret;
 801 }
 802
 803 /* This subroutine of expand_doubleword_shift handles the cases in which
 804    the effective shift value is >= BITS_PER_WORD.  The arguments and return
 805    value are the same as for the parent routine, except that SUPERWORD_OP1
 806    is the shift count to use when shifting OUTOF_INPUT into INTO_TARGET.
 807    INTO_TARGET may be null if the caller has decided to calculate it.  */
 808
 809 static bool
 810 expand_superword_shift (optab binoptab, rtx outof_input, rtx superword_op1,
 811                         rtx outof_target, rtx into_target,
 812                         int unsignedp, enum optab_methods methods)
 813 {
 814   if (into_target != 0)
 815     if (!force_expand_binop (word_mode, binoptab, outof_input, superword_op1,
 816                              into_target, unsignedp, methods))
 817       return false;
 818
 819   if (outof_target != 0)
 820     {
 821       /* For a signed right shift, we must fill OUTOF_TARGET with copies
 822          of the sign bit, otherwise we must fill it with zeros.  */
 823       if (binoptab != ashr_optab)
 824         emit_move_insn (outof_target, CONST0_RTX (word_mode));
 825       else
 826         if (!force_expand_binop (word_mode, binoptab,
 827                                  outof_input, GEN_INT (BITS_PER_WORD - 1),
 828                                  outof_target, unsignedp, methods))
 829           return false;
 830     }
 831   return true;
 832 }
 833
 834 /* This subroutine of expand_doubleword_shift handles the cases in which
 835    the effective shift value is < BITS_PER_WORD.  The arguments and return
 836    value are the same as for the parent routine.  */
 837
 838 static bool
 839 expand_subword_shift (enum machine_mode op1_mode, optab binoptab,
 840                       rtx outof_input, rtx into_input, rtx op1,
 841                       rtx outof_target, rtx into_target,
 842                       int unsignedp, enum optab_methods methods,
 843                       unsigned HOST_WIDE_INT shift_mask)
 844 {
 845   optab reverse_unsigned_shift, unsigned_shift;
 846   rtx tmp, carries;
 847
 848   reverse_unsigned_shift = (binoptab == ashl_optab ? lshr_optab : ashl_optab);
 849   unsigned_shift = (binoptab == ashl_optab ? ashl_optab : lshr_optab);
 850
 851   /* The low OP1 bits of INTO_TARGET come from the high bits of OUTOF_INPUT.
 852      We therefore need to shift OUTOF_INPUT by (BITS_PER_WORD - OP1) bits in
 853      the opposite direction to BINOPTAB.  */
 854   if (CONSTANT_P (op1) || shift_mask >= BITS_PER_WORD)
 855     {
 856       carries = outof_input;
 857       tmp = immed_wide_int_const (wi::shwi (BITS_PER_WORD,
 858                                             op1_mode), op1_mode);
 859       tmp = simplify_expand_binop (op1_mode, sub_optab, tmp, op1,
 860                                    0, true, methods);
 861     }
 862   else
 863     {
 864       /* We must avoid shifting by BITS_PER_WORD bits since that is either
 865          the same as a zero shift (if shift_mask == BITS_PER_WORD - 1) or
 866          has unknown behavior.  Do a single shift first, then shift by the
 867          remainder.  It's OK to use ~OP1 as the remainder if shift counts
 868          are truncated to the mode size.  */
 869       carries = expand_binop (word_mode, reverse_unsigned_shift,
 870                               outof_input, const1_rtx, 0, unsignedp, methods);
 871       if (shift_mask == BITS_PER_WORD - 1)
 872         {
 873           tmp = immed_wide_int_const
 874             (wi::minus_one (GET_MODE_PRECISION (op1_mode)), op1_mode);
 875           tmp = simplify_expand_binop (op1_mode, xor_optab, op1, tmp,
 876                                        0, true, methods);
 877         }
 878       else
 879         {
 880           tmp = immed_wide_int_const (wi::shwi (BITS_PER_WORD - 1,
 881                                                 op1_mode), op1_mode);
 882           tmp = simplify_expand_binop (op1_mode, sub_optab, tmp, op1,
 883                                        0, true, methods);
 884         }
 885     }
 886   if (tmp == 0 || carries == 0)
 887     return false;
 888   carries = expand_binop (word_mode, reverse_unsigned_shift,
 889                           carries, tmp, 0, unsignedp, methods);
 890   if (carries == 0)
 891     return false;
 892
 893   /* Shift INTO_INPUT logically by OP1.  This is the last use of INTO_INPUT
 894      so the result can go directly into INTO_TARGET if convenient.  */
 895   tmp = expand_binop (word_mode, unsigned_shift, into_input, op1,
 896                       into_target, unsignedp, methods);
 897   if (tmp == 0)
 898     return false;
 899
 900   /* Now OR in the bits carried over from OUTOF_INPUT.  */
 901   if (!force_expand_binop (word_mode, ior_optab, tmp, carries,
 902                            into_target, unsignedp, methods))
 903     return false;
 904
 905   /* Use a standard word_mode shift for the out-of half.  */
 906   if (outof_target != 0)
 907     if (!force_expand_binop (word_mode, binoptab, outof_input, op1,
 908                              outof_target, unsignedp, methods))
 909       return false;
 910
 911   return true;
 912 }
 913
 914
 915 #ifdef HAVE_conditional_move
 916 /* Try implementing expand_doubleword_shift using conditional moves.
 917    The shift is by < BITS_PER_WORD if (CMP_CODE CMP1 CMP2) is true,
 918    otherwise it is by >= BITS_PER_WORD.  SUBWORD_OP1 and SUPERWORD_OP1
 919    are the shift counts to use in the former and latter case.  All other
 920    arguments are the same as the parent routine.  */
 921
 922 static bool
 923 expand_doubleword_shift_condmove (enum machine_mode op1_mode, optab binoptab,
 924                                   enum rtx_code cmp_code, rtx cmp1, rtx cmp2,
 925                                   rtx outof_input, rtx into_input,
 926                                   rtx subword_op1, rtx superword_op1,
 927                                   rtx outof_target, rtx into_target,
 928                                   int unsignedp, enum optab_methods methods,
 929                                   unsigned HOST_WIDE_INT shift_mask)
 930 {
 931   rtx outof_superword, into_superword;
 932
 933   /* Put the superword version of the output into OUTOF_SUPERWORD and
 934      INTO_SUPERWORD.  */
 935   outof_superword = outof_target != 0 ? gen_reg_rtx (word_mode) : 0;
 936   if (outof_target != 0 && subword_op1 == superword_op1)
 937     {
 938       /* The value INTO_TARGET >> SUBWORD_OP1, which we later store in
 939          OUTOF_TARGET, is the same as the value of INTO_SUPERWORD.  */
 940       into_superword = outof_target;
 941       if (!expand_superword_shift (binoptab, outof_input, superword_op1,
 942                                    outof_superword, 0, unsignedp, methods))
 943         return false;
 944     }
 945   else
 946     {
 947       into_superword = gen_reg_rtx (word_mode);
 948       if (!expand_superword_shift (binoptab, outof_input, superword_op1,
 949                                    outof_superword, into_superword,
 950                                    unsignedp, methods))
 951         return false;
 952     }
 953
 954   /* Put the subword version directly in OUTOF_TARGET and INTO_TARGET.  */
 955   if (!expand_subword_shift (op1_mode, binoptab,
 956                              outof_input, into_input, subword_op1,
 957                              outof_target, into_target,
 958                              unsignedp, methods, shift_mask))
 959     return false;
 960
 961   /* Select between them.  Do the INTO half first because INTO_SUPERWORD
 962      might be the current value of OUTOF_TARGET.  */
 963   if (!emit_conditional_move (into_target, cmp_code, cmp1, cmp2, op1_mode,
 964                               into_target, into_superword, word_mode, false))
 965     return false;
 966
 967   if (outof_target != 0)
 968     if (!emit_conditional_move (outof_target, cmp_code, cmp1, cmp2, op1_mode,
 969                                 outof_target, outof_superword,
 970                                 word_mode, false))
 971       return false;
 972
 973   return true;
 974 }
 975 #endif
 976
 977 /* Expand a doubleword shift (ashl, ashr or lshr) using word-mode shifts.
 978    OUTOF_INPUT and INTO_INPUT are the two word-sized halves of the first
 979    input operand; the shift moves bits in the direction OUTOF_INPUT->
 980    INTO_TARGET.  OUTOF_TARGET and INTO_TARGET are the equivalent words
 981    of the target.  OP1 is the shift count and OP1_MODE is its mode.
 982    If OP1 is constant, it will have been truncated as appropriate
 983    and is known to be nonzero.
 984
 985    If SHIFT_MASK is zero, the result of word shifts is undefined when the
 986    shift count is outside the range [0, BITS_PER_WORD).  This routine must
 987    avoid generating such shifts for OP1s in the range [0, BITS_PER_WORD * 2).
 988
 989    If SHIFT_MASK is nonzero, all word-mode shift counts are effectively
 990    masked by it and shifts in the range [BITS_PER_WORD, SHIFT_MASK) will
 991    fill with zeros or sign bits as appropriate.
 992
 993    If SHIFT_MASK is BITS_PER_WORD - 1, this routine will synthesize
 994    a doubleword shift whose equivalent mask is BITS_PER_WORD * 2 - 1.
 995    Doing this preserves semantics required by SHIFT_COUNT_TRUNCATED.
 996    In all other cases, shifts by values outside [0, BITS_PER_UNIT * 2)
 997    are undefined.
 998
 999    BINOPTAB, UNSIGNEDP and METHODS are as for expand_binop.  This function
1000    may not use INTO_INPUT after modifying INTO_TARGET, and similarly for
1001    OUTOF_INPUT and OUTOF_TARGET.  OUTOF_TARGET can be null if the parent
1002    function wants to calculate it itself.
1003
1004    Return true if the shift could be successfully synthesized.  */
1005
1006 static bool
1007 expand_doubleword_shift (enum machine_mode op1_mode, optab binoptab,
1008                          rtx outof_input, rtx into_input, rtx op1,
1009                          rtx outof_target, rtx into_target,
1010                          int unsignedp, enum optab_methods methods,
1011                          unsigned HOST_WIDE_INT shift_mask)
1012 {
1013   rtx superword_op1, tmp, cmp1, cmp2;
1014   rtx subword_label, done_label;
1015   enum rtx_code cmp_code;
1016
1017   /* See if word-mode shifts by BITS_PER_WORD...BITS_PER_WORD * 2 - 1 will
1018      fill the result with sign or zero bits as appropriate.  If so, the value
1019      of OUTOF_TARGET will always be (SHIFT OUTOF_INPUT OP1).   Recursively call
1020      this routine to calculate INTO_TARGET (which depends on both OUTOF_INPUT
1021      and INTO_INPUT), then emit code to set up OUTOF_TARGET.
1022
1023      This isn't worthwhile for constant shifts since the optimizers will
1024      cope better with in-range shift counts.  */
1025   if (shift_mask >= BITS_PER_WORD
1026       && outof_target != 0
1027       && !CONSTANT_P (op1))
1028     {
1029       if (!expand_doubleword_shift (op1_mode, binoptab,
1030                                     outof_input, into_input, op1,
1031                                     0, into_target,
1032                                     unsignedp, methods, shift_mask))
1033         return false;
1034       if (!force_expand_binop (word_mode, binoptab, outof_input, op1,
1035                                outof_target, unsignedp, methods))
1036         return false;
1037       return true;
1038     }
1039
1040   /* Set CMP_CODE, CMP1 and CMP2 so that the rtx (CMP_CODE CMP1 CMP2)
1041      is true when the effective shift value is less than BITS_PER_WORD.
1042      Set SUPERWORD_OP1 to the shift count that should be used to shift
1043      OUTOF_INPUT into INTO_TARGET when the condition is false.  */
1044   tmp = immed_wide_int_const (wi::shwi (BITS_PER_WORD, op1_mode), op1_mode);
1045   if (!CONSTANT_P (op1) && shift_mask == BITS_PER_WORD - 1)
1046     {
1047       /* Set CMP1 to OP1 & BITS_PER_WORD.  The result is zero iff OP1
1048          is a subword shift count.  */
1049       cmp1 = simplify_expand_binop (op1_mode, and_optab, op1, tmp,
1050                                     0, true, methods);
1051       cmp2 = CONST0_RTX (op1_mode);
1052       cmp_code = EQ;
1053       superword_op1 = op1;
1054     }
1055   else
1056     {
1057       /* Set CMP1 to OP1 - BITS_PER_WORD.  */
1058       cmp1 = simplify_expand_binop (op1_mode, sub_optab, op1, tmp,
1059                                     0, true, methods);
1060       cmp2 = CONST0_RTX (op1_mode);
1061       cmp_code = LT;
1062       superword_op1 = cmp1;
1063     }
1064   if (cmp1 == 0)
1065     return false;
1066
1067   /* If we can compute the condition at compile time, pick the
1068      appropriate subroutine.  */
1069   tmp = simplify_relational_operation (cmp_code, SImode, op1_mode, cmp1, cmp2);
1070   if (tmp != 0 && CONST_INT_P (tmp))
1071     {
1072       if (tmp == const0_rtx)
1073         return expand_superword_shift (binoptab, outof_input, superword_op1,
1074                                        outof_target, into_target,
1075                                        unsignedp, methods);
1076       else
1077         return expand_subword_shift (op1_mode, binoptab,
1078                                      outof_input, into_input, op1,
1079                                      outof_target, into_target,
1080                                      unsignedp, methods, shift_mask);
1081     }
1082
1083 #ifdef HAVE_conditional_move
1084   /* Try using conditional moves to generate straight-line code.  */
1085   {
1086     rtx start = get_last_insn ();
1087     if (expand_doubleword_shift_condmove (op1_mode, binoptab,
1088                                           cmp_code, cmp1, cmp2,
1089                                           outof_input, into_input,
1090                                           op1, superword_op1,
1091                                           outof_target, into_target,
1092                                           unsignedp, methods, shift_mask))
1093       return true;
1094     delete_insns_since (start);
1095   }
1096 #endif
1097
1098   /* As a last resort, use branches to select the correct alternative.  */
1099   subword_label = gen_label_rtx ();
1100   done_label = gen_label_rtx ();
1101
1102   NO_DEFER_POP;
1103   do_compare_rtx_and_jump (cmp1, cmp2, cmp_code, false, op1_mode,
1104                            0, 0, subword_label, -1);
1105   OK_DEFER_POP;
1106
1107   if (!expand_superword_shift (binoptab, outof_input, superword_op1,
1108                                outof_target, into_target,
1109                                unsignedp, methods))
1110     return false;
1111
1112   emit_jump_insn (gen_jump (done_label));
1113   emit_barrier ();
1114   emit_label (subword_label);
1115
1116   if (!expand_subword_shift (op1_mode, binoptab,
1117                              outof_input, into_input, op1,
1118                              outof_target, into_target,
1119                              unsignedp, methods, shift_mask))
1120     return false;
1121
1122   emit_label (done_label);
1123   return true;
1124 }
1125 \f
1126 /* Subroutine of expand_binop.  Perform a double word multiplication of
1127    operands OP0 and OP1 both of mode MODE, which is exactly twice as wide
1128    as the target's word_mode.  This function return NULL_RTX if anything
1129    goes wrong, in which case it may have already emitted instructions
1130    which need to be deleted.
1131
1132    If we want to multiply two two-word values and have normal and widening
1133    multiplies of single-word values, we can do this with three smaller
1134    multiplications.
1135
1136    The multiplication proceeds as follows:
1137                                  _______________________
1138                                 [__op0_high_|__op0_low__]
1139                                  _______________________
1140         *                       [__op1_high_|__op1_low__]
1141         _______________________________________________
1142                                  _______________________
1143     (1)                         [__op0_low__*__op1_low__]
1144                      _______________________
1145     (2a)            [__op0_low__*__op1_high_]
1146                      _______________________
1147     (2b)            [__op0_high_*__op1_low__]
1148          _______________________
1149     (3) [__op0_high_*__op1_high_]
1150
1151
1152   This gives a 4-word result.  Since we are only interested in the
1153   lower 2 words, partial result (3) and the upper words of (2a) and
1154   (2b) don't need to be calculated.  Hence (2a) and (2b) can be
1155   calculated using non-widening multiplication.
1156
1157   (1), however, needs to be calculated with an unsigned widening
1158   multiplication.  If this operation is not directly supported we
1159   try using a signed widening multiplication and adjust the result.
1160   This adjustment works as follows:
1161
1162       If both operands are positive then no adjustment is needed.
1163
1164       If the operands have different signs, for example op0_low < 0 and
1165       op1_low >= 0, the instruction treats the most significant bit of
1166       op0_low as a sign bit instead of a bit with significance
1167       2**(BITS_PER_WORD-1), i.e. the instruction multiplies op1_low
1168       with 2**BITS_PER_WORD - op0_low, and two's complements the
1169       result.  Conclusion: We need to add op1_low * 2**BITS_PER_WORD to
1170       the result.
1171
1172       Similarly, if both operands are negative, we need to add
1173       (op0_low + op1_low) * 2**BITS_PER_WORD.
1174
1175       We use a trick to adjust quickly.  We logically shift op0_low right
1176       (op1_low) BITS_PER_WORD-1 steps to get 0 or 1, and add this to
1177       op0_high (op1_high) before it is used to calculate 2b (2a).  If no
1178       logical shift exists, we do an arithmetic right shift and subtract
1179       the 0 or -1.  */
1180
1181 static rtx
1182 expand_doubleword_mult (enum machine_mode mode, rtx op0, rtx op1, rtx target,
1183                        bool umulp, enum optab_methods methods)
1184 {
1185   int low = (WORDS_BIG_ENDIAN ? 1 : 0);
1186   int high = (WORDS_BIG_ENDIAN ? 0 : 1);
1187   rtx wordm1 = umulp ? NULL_RTX : GEN_INT (BITS_PER_WORD - 1);
1188   rtx product, adjust, product_high, temp;
1189
1190   rtx op0_high = operand_subword_force (op0, high, mode);
1191   rtx op0_low = operand_subword_force (op0, low, mode);
1192   rtx op1_high = operand_subword_force (op1, high, mode);
1193   rtx op1_low = operand_subword_force (op1, low, mode);
1194
1195   /* If we're using an unsigned multiply to directly compute the product
1196      of the low-order words of the operands and perform any required
1197      adjustments of the operands, we begin by trying two more multiplications
1198      and then computing the appropriate sum.
1199
1200      We have checked above that the required addition is provided.
1201      Full-word addition will normally always succeed, especially if
1202      it is provided at all, so we don't worry about its failure.  The
1203      multiplication may well fail, however, so we do handle that.  */
1204
1205   if (!umulp)
1206     {
1207       /* ??? This could be done with emit_store_flag where available.  */
1208       temp = expand_binop (word_mode, lshr_optab, op0_low, wordm1,
1209                            NULL_RTX, 1, methods);
1210       if (temp)
1211         op0_high = expand_binop (word_mode, add_optab, op0_high, temp,
1212                                  NULL_RTX, 0, OPTAB_DIRECT);
1213       else
1214         {
1215           temp = expand_binop (word_mode, ashr_optab, op0_low, wordm1,
1216                                NULL_RTX, 0, methods);
1217           if (!temp)
1218             return NULL_RTX;
1219           op0_high = expand_binop (word_mode, sub_optab, op0_high, temp,
1220                                    NULL_RTX, 0, OPTAB_DIRECT);
1221         }
1222
1223       if (!op0_high)
1224         return NULL_RTX;
1225     }
1226
1227   adjust = expand_binop (word_mode, smul_optab, op0_high, op1_low,
1228                          NULL_RTX, 0, OPTAB_DIRECT);
1229   if (!adjust)
1230     return NULL_RTX;
1231
1232   /* OP0_HIGH should now be dead.  */
1233
1234   if (!umulp)
1235     {
1236       /* ??? This could be done with emit_store_flag where available.  */
1237       temp = expand_binop (word_mode, lshr_optab, op1_low, wordm1,
1238                            NULL_RTX, 1, methods);
1239       if (temp)
1240         op1_high = expand_binop (word_mode, add_optab, op1_high, temp,
1241                                  NULL_RTX, 0, OPTAB_DIRECT);
1242       else
1243         {
1244           temp = expand_binop (word_mode, ashr_optab, op1_low, wordm1,
1245                                NULL_RTX, 0, methods);
1246           if (!temp)
1247             return NULL_RTX;
1248           op1_high = expand_binop (word_mode, sub_optab, op1_high, temp,
1249                                    NULL_RTX, 0, OPTAB_DIRECT);
1250         }
1251
1252       if (!op1_high)
1253         return NULL_RTX;
1254     }
1255
1256   temp = expand_binop (word_mode, smul_optab, op1_high, op0_low,
1257                        NULL_RTX, 0, OPTAB_DIRECT);
1258   if (!temp)
1259     return NULL_RTX;
1260
1261   /* OP1_HIGH should now be dead.  */
1262
1263   adjust = expand_binop (word_mode, add_optab, adjust, temp,
1264                          NULL_RTX, 0, OPTAB_DIRECT);
1265
1266   if (target && !REG_P (target))
1267     target = NULL_RTX;
1268
1269   if (umulp)
1270     product = expand_binop (mode, umul_widen_optab, op0_low, op1_low,
1271                             target, 1, OPTAB_DIRECT);
1272   else
1273     product = expand_binop (mode, smul_widen_optab, op0_low, op1_low,
1274                             target, 1, OPTAB_DIRECT);
1275
1276   if (!product)
1277     return NULL_RTX;
1278
1279   product_high = operand_subword (product, high, 1, mode);
1280   adjust = expand_binop (word_mode, add_optab, product_high, adjust,
1281                          NULL_RTX, 0, OPTAB_DIRECT);
1282   emit_move_insn (product_high, adjust);
1283   return product;
1284 }
1285 \f
1286 /* Wrapper around expand_binop which takes an rtx code to specify
1287    the operation to perform, not an optab pointer.  All other
1288    arguments are the same.  */
1289 rtx
1290 expand_simple_binop (enum machine_mode mode, enum rtx_code code, rtx op0,
1291                      rtx op1, rtx target, int unsignedp,
1292                      enum optab_methods methods)
1293 {
1294   optab binop = code_to_optab (code);
1295   gcc_assert (binop);
1296
1297   return expand_binop (mode, binop, op0, op1, target, unsignedp, methods);
1298 }
1299
1300 /* Return whether OP0 and OP1 should be swapped when expanding a commutative
1301    binop.  Order them according to commutative_operand_precedence and, if
1302    possible, try to put TARGET or a pseudo first.  */
1303 static bool
1304 swap_commutative_operands_with_target (rtx target, rtx op0, rtx op1)
1305 {
1306   int op0_prec = commutative_operand_precedence (op0);
1307   int op1_prec = commutative_operand_precedence (op1);
1308
1309   if (op0_prec < op1_prec)
1310     return true;
1311
1312   if (op0_prec > op1_prec)
1313     return false;
1314
1315   /* With equal precedence, both orders are ok, but it is better if the
1316      first operand is TARGET, or if both TARGET and OP0 are pseudos.  */
1317   if (target == 0 || REG_P (target))
1318     return (REG_P (op1) && !REG_P (op0)) || target == op1;
1319   else
1320     return rtx_equal_p (op1, target);
1321 }
1322
1323 /* Return true if BINOPTAB implements a shift operation.  */
1324
1325 static bool
1326 shift_optab_p (optab binoptab)
1327 {
1328   switch (optab_to_code (binoptab))
1329     {
1330     case ASHIFT:
1331     case SS_ASHIFT:
1332     case US_ASHIFT:
1333     case ASHIFTRT:
1334     case LSHIFTRT:
1335     case ROTATE:
1336     case ROTATERT:
1337       return true;
1338
1339     default:
1340       return false;
1341     }
1342 }
1343
1344 /* Return true if BINOPTAB implements a commutative binary operation.  */
1345
1346 static bool
1347 commutative_optab_p (optab binoptab)
1348 {
1349   return (GET_RTX_CLASS (optab_to_code (binoptab)) == RTX_COMM_ARITH
1350           || binoptab == smul_widen_optab
1351           || binoptab == umul_widen_optab
1352           || binoptab == smul_highpart_optab
1353           || binoptab == umul_highpart_optab);
1354 }
1355
1356 /* X is to be used in mode MODE as operand OPN to BINOPTAB.  If we're
1357    optimizing, and if the operand is a constant that costs more than
1358    1 instruction, force the constant into a register and return that
1359    register.  Return X otherwise.  UNSIGNEDP says whether X is unsigned.  */
1360
1361 static rtx
1362 avoid_expensive_constant (enum machine_mode mode, optab binoptab,
1363                           int opn, rtx x, bool unsignedp)
1364 {
1365   bool speed = optimize_insn_for_speed_p ();
1366
1367   if (mode != VOIDmode
1368       && optimize
1369       && CONSTANT_P (x)
1370       && (rtx_cost (x, optab_to_code (binoptab), opn, speed)
1371           > set_src_cost (x, speed)))
1372     {
1373       if (CONST_INT_P (x))
1374         {
1375           HOST_WIDE_INT intval = trunc_int_for_mode (INTVAL (x), mode);
1376           if (intval != INTVAL (x))
1377             x = GEN_INT (intval);
1378         }
1379       else
1380         x = convert_modes (mode, VOIDmode, x, unsignedp);
1381       x = force_reg (mode, x);
1382     }
1383   return x;
1384 }
1385
1386 /* Helper function for expand_binop: handle the case where there
1387    is an insn that directly implements the indicated operation.
1388    Returns null if this is not possible.  */
1389 static rtx
1390 expand_binop_directly (enum machine_mode mode, optab binoptab,
1391                        rtx op0, rtx op1,
1392                        rtx target, int unsignedp, enum optab_methods methods,
1393                        rtx last)
1394 {
1395   enum machine_mode from_mode = widened_mode (mode, op0, op1);
1396   enum insn_code icode = find_widening_optab_handler (binoptab, mode,
1397                                                       from_mode, 1);
1398   enum machine_mode xmode0 = insn_data[(int) icode].operand[1].mode;
1399   enum machine_mode xmode1 = insn_data[(int) icode].operand[2].mode;
1400   enum machine_mode mode0, mode1, tmp_mode;
1401   struct expand_operand ops[3];
1402   bool commutative_p;
1403   rtx pat;
1404   rtx xop0 = op0, xop1 = op1;
1405   rtx swap;
1406
1407   /* If it is a commutative operator and the modes would match
1408      if we would swap the operands, we can save the conversions.  */
1409   commutative_p = commutative_optab_p (binoptab);
1410   if (commutative_p
1411       && GET_MODE (xop0) != xmode0 && GET_MODE (xop1) != xmode1
1412       && GET_MODE (xop0) == xmode1 && GET_MODE (xop1) == xmode1)
1413     {
1414       swap = xop0;
1415       xop0 = xop1;
1416       xop1 = swap;
1417     }
1418
1419   /* If we are optimizing, force expensive constants into a register.  */
1420   xop0 = avoid_expensive_constant (xmode0, binoptab, 0, xop0, unsignedp);
1421   if (!shift_optab_p (binoptab))
1422     xop1 = avoid_expensive_constant (xmode1, binoptab, 1, xop1, unsignedp);
1423
1424   /* In case the insn wants input operands in modes different from
1425      those of the actual operands, convert the operands.  It would
1426      seem that we don't need to convert CONST_INTs, but we do, so
1427      that they're properly zero-extended, sign-extended or truncated
1428      for their mode.  */
1429
1430   mode0 = GET_MODE (xop0) != VOIDmode ? GET_MODE (xop0) : mode;
1431   if (xmode0 != VOIDmode && xmode0 != mode0)
1432     {
1433       xop0 = convert_modes (xmode0, mode0, xop0, unsignedp);
1434       mode0 = xmode0;
1435     }
1436
1437   mode1 = GET_MODE (xop1) != VOIDmode ? GET_MODE (xop1) : mode;
1438   if (xmode1 != VOIDmode && xmode1 != mode1)
1439     {
1440       xop1 = convert_modes (xmode1, mode1, xop1, unsignedp);
1441       mode1 = xmode1;
1442     }
1443
1444   /* If operation is commutative,
1445      try to make the first operand a register.
1446      Even better, try to make it the same as the target.
1447      Also try to make the last operand a constant.  */
1448   if (commutative_p
1449       && swap_commutative_operands_with_target (target, xop0, xop1))
1450     {
1451       swap = xop1;
1452       xop1 = xop0;
1453       xop0 = swap;
1454     }
1455
1456   /* Now, if insn's predicates don't allow our operands, put them into
1457      pseudo regs.  */
1458
1459   if (binoptab == vec_pack_trunc_optab
1460       || binoptab == vec_pack_usat_optab
1461       || binoptab == vec_pack_ssat_optab
1462       || binoptab == vec_pack_ufix_trunc_optab
1463       || binoptab == vec_pack_sfix_trunc_optab)
1464     {
1465       /* The mode of the result is different then the mode of the
1466          arguments.  */
1467       tmp_mode = insn_data[(int) icode].operand[0].mode;
1468       if (GET_MODE_NUNITS (tmp_mode) != 2 * GET_MODE_NUNITS (mode))
1469         {
1470           delete_insns_since (last);
1471           return NULL_RTX;
1472         }
1473     }
1474   else
1475     tmp_mode = mode;
1476
1477   create_output_operand (&ops[0], target, tmp_mode);
1478   create_input_operand (&ops[1], xop0, mode0);
1479   create_input_operand (&ops[2], xop1, mode1);
1480   pat = maybe_gen_insn (icode, 3, ops);
1481   if (pat)
1482     {
1483       /* If PAT is composed of more than one insn, try to add an appropriate
1484          REG_EQUAL note to it.  If we can't because TEMP conflicts with an
1485          operand, call expand_binop again, this time without a target.  */
1486       if (INSN_P (pat) && NEXT_INSN (pat) != NULL_RTX
1487           && ! add_equal_note (pat, ops[0].value, optab_to_code (binoptab),
1488                                ops[1].value, ops[2].value))
1489         {
1490           delete_insns_since (last);
1491           return expand_binop (mode, binoptab, op0, op1, NULL_RTX,
1492                                unsignedp, methods);
1493         }
1494
1495       emit_insn (pat);
1496       return ops[0].value;
1497     }
1498   delete_insns_since (last);
1499   return NULL_RTX;
1500 }
1501
1502 /* Generate code to perform an operation specified by BINOPTAB
1503    on operands OP0 and OP1, with result having machine-mode MODE.
1504
1505    UNSIGNEDP is for the case where we have to widen the operands
1506    to perform the operation.  It says to use zero-extension.
1507
1508    If TARGET is nonzero, the value
1509    is generated there, if it is convenient to do so.
1510    In all cases an rtx is returned for the locus of the value;
1511    this may or may not be TARGET.  */
1512
1513 rtx
1514 expand_binop (enum machine_mode mode, optab binoptab, rtx op0, rtx op1,
1515               rtx target, int unsignedp, enum optab_methods methods)
1516 {
1517   enum optab_methods next_methods
1518     = (methods == OPTAB_LIB || methods == OPTAB_LIB_WIDEN
1519        ? OPTAB_WIDEN : methods);
1520   enum mode_class mclass;
1521   enum machine_mode wider_mode;
1522   rtx libfunc;
1523   rtx temp;
1524   rtx entry_last = get_last_insn ();
1525   rtx last;
1526
1527   mclass = GET_MODE_CLASS (mode);
1528
1529   /* If subtracting an integer constant, convert this into an addition of
1530      the negated constant.  */
1531
1532   if (binoptab == sub_optab && CONST_INT_P (op1))
1533     {
1534       op1 = negate_rtx (mode, op1);
1535       binoptab = add_optab;
1536     }
1537
1538   /* Record where to delete back to if we backtrack.  */
1539   last = get_last_insn ();
1540
1541   /* If we can do it with a three-operand insn, do so.  */
1542
1543   if (methods != OPTAB_MUST_WIDEN
1544       && find_widening_optab_handler (binoptab, mode,
1545                                       widened_mode (mode, op0, op1), 1)
1546             != CODE_FOR_nothing)
1547     {
1548       temp = expand_binop_directly (mode, binoptab, op0, op1, target,
1549                                     unsignedp, methods, last);
1550       if (temp)
1551         return temp;
1552     }
1553
1554   /* If we were trying to rotate, and that didn't work, try rotating
1555      the other direction before falling back to shifts and bitwise-or.  */
1556   if (((binoptab == rotl_optab
1557         && optab_handler (rotr_optab, mode) != CODE_FOR_nothing)
1558        || (binoptab == rotr_optab
1559            && optab_handler (rotl_optab, mode) != CODE_FOR_nothing))
1560       && mclass == MODE_INT)
1561     {
1562       optab otheroptab = (binoptab == rotl_optab ? rotr_optab : rotl_optab);
1563       rtx newop1;
1564       unsigned int bits = GET_MODE_PRECISION (mode);
1565
1566       if (CONST_INT_P (op1))
1567         newop1 = GEN_INT (bits - INTVAL (op1));
1568       else if (targetm.shift_truncation_mask (mode) == bits - 1)
1569         newop1 = negate_rtx (GET_MODE (op1), op1);
1570       else
1571         newop1 = expand_binop (GET_MODE (op1), sub_optab,
1572                                gen_int_mode (bits, GET_MODE (op1)), op1,
1573                                NULL_RTX, unsignedp, OPTAB_DIRECT);
1574
1575       temp = expand_binop_directly (mode, otheroptab, op0, newop1,
1576                                     target, unsignedp, methods, last);
1577       if (temp)
1578         return temp;
1579     }
1580
1581   /* If this is a multiply, see if we can do a widening operation that
1582      takes operands of this mode and makes a wider mode.  */
1583
1584   if (binoptab == smul_optab
1585       && GET_MODE_2XWIDER_MODE (mode) != VOIDmode
1586       && (widening_optab_handler ((unsignedp ? umul_widen_optab
1587                                              : smul_widen_optab),
1588                                   GET_MODE_2XWIDER_MODE (mode), mode)
1589           != CODE_FOR_nothing))
1590     {
1591       temp = expand_binop (GET_MODE_2XWIDER_MODE (mode),
1592                            unsignedp ? umul_widen_optab : smul_widen_optab,
1593                            op0, op1, NULL_RTX, unsignedp, OPTAB_DIRECT);
1594
1595       if (temp != 0)
1596         {
1597           if (GET_MODE_CLASS (mode) == MODE_INT
1598               && TRULY_NOOP_TRUNCATION_MODES_P (mode, GET_MODE (temp)))
1599             return gen_lowpart (mode, temp);
1600           else
1601             return convert_to_mode (mode, temp, unsignedp);
1602         }
1603     }
1604
1605   /* If this is a vector shift by a scalar, see if we can do a vector
1606      shift by a vector.  If so, broadcast the scalar into a vector.  */
1607   if (mclass == MODE_VECTOR_INT)
1608     {
1609       optab otheroptab = unknown_optab;
1610
1611       if (binoptab == ashl_optab)
1612         otheroptab = vashl_optab;
1613       else if (binoptab == ashr_optab)
1614         otheroptab = vashr_optab;
1615       else if (binoptab == lshr_optab)
1616         otheroptab = vlshr_optab;
1617       else if (binoptab == rotl_optab)
1618         otheroptab = vrotl_optab;
1619       else if (binoptab == rotr_optab)
1620         otheroptab = vrotr_optab;
1621
1622       if (otheroptab && optab_handler (otheroptab, mode) != CODE_FOR_nothing)
1623         {
1624           rtx vop1 = expand_vector_broadcast (mode, op1);
1625           if (vop1)
1626             {
1627               temp = expand_binop_directly (mode, otheroptab, op0, vop1,
1628                                             target, unsignedp, methods, last);
1629               if (temp)
1630                 return temp;
1631             }
1632         }
1633     }
1634
1635   /* Look for a wider mode of the same class for which we think we
1636      can open-code the operation.  Check for a widening multiply at the
1637      wider mode as well.  */
1638
1639   if (CLASS_HAS_WIDER_MODES_P (mclass)
1640       && methods != OPTAB_DIRECT && methods != OPTAB_LIB)
1641     for (wider_mode = GET_MODE_WIDER_MODE (mode);
1642          wider_mode != VOIDmode;
1643          wider_mode = GET_MODE_WIDER_MODE (wider_mode))
1644       {
1645         if (optab_handler (binoptab, wider_mode) != CODE_FOR_nothing
1646             || (binoptab == smul_optab
1647                 && GET_MODE_WIDER_MODE (wider_mode) != VOIDmode
1648                 && (find_widening_optab_handler ((unsignedp
1649                                                   ? umul_widen_optab
1650                                                   : smul_widen_optab),
1651                                                  GET_MODE_WIDER_MODE (wider_mode),
1652                                                  mode, 0)
1653                     != CODE_FOR_nothing)))
1654           {
1655             rtx xop0 = op0, xop1 = op1;
1656             int no_extend = 0;
1657
1658             /* For certain integer operations, we need not actually extend
1659                the narrow operands, as long as we will truncate
1660                the results to the same narrowness.  */
1661
1662             if ((binoptab == ior_optab || binoptab == and_optab
1663                  || binoptab == xor_optab
1664                  || binoptab == add_optab || binoptab == sub_optab
1665                  || binoptab == smul_optab || binoptab == ashl_optab)
1666                 && mclass == MODE_INT)
1667               {
1668                 no_extend = 1;
1669                 xop0 = avoid_expensive_constant (mode, binoptab, 0,
1670                                                  xop0, unsignedp);
1671                 if (binoptab != ashl_optab)
1672                   xop1 = avoid_expensive_constant (mode, binoptab, 1,
1673                                                    xop1, unsignedp);
1674               }
1675
1676             xop0 = widen_operand (xop0, wider_mode, mode, unsignedp, no_extend);
1677
1678             /* The second operand of a shift must always be extended.  */
1679             xop1 = widen_operand (xop1, wider_mode, mode, unsignedp,
1680                                   no_extend && binoptab != ashl_optab);
1681
1682             temp = expand_binop (wider_mode, binoptab, xop0, xop1, NULL_RTX,
1683                                  unsignedp, OPTAB_DIRECT);
1684             if (temp)
1685               {
1686                 if (mclass != MODE_INT
1687                     || !TRULY_NOOP_TRUNCATION_MODES_P (mode, wider_mode))
1688                   {
1689                     if (target == 0)
1690                       target = gen_reg_rtx (mode);
1691                     convert_move (target, temp, 0);
1692                     return target;
1693                   }
1694                 else
1695                   return gen_lowpart (mode, temp);
1696               }
1697             else
1698               delete_insns_since (last);
1699           }
1700       }
1701
1702   /* If operation is commutative,
1703      try to make the first operand a register.
1704      Even better, try to make it the same as the target.
1705      Also try to make the last operand a constant.  */
1706   if (commutative_optab_p (binoptab)
1707       && swap_commutative_operands_with_target (target, op0, op1))
1708     {
1709       temp = op1;
1710       op1 = op0;
1711       op0 = temp;
1712     }
1713
1714   /* These can be done a word at a time.  */
1715   if ((binoptab == and_optab || binoptab == ior_optab || binoptab == xor_optab)
1716       && mclass == MODE_INT
1717       && GET_MODE_SIZE (mode) > UNITS_PER_WORD
1718       && optab_handler (binoptab, word_mode) != CODE_FOR_nothing)
1719     {
1720       int i;
1721       rtx insns;
1722
1723       /* If TARGET is the same as one of the operands, the REG_EQUAL note
1724          won't be accurate, so use a new target.  */
1725       if (target == 0
1726           || target == op0
1727           || target == op1
1728           || !valid_multiword_target_p (target))
1729         target = gen_reg_rtx (mode);
1730
1731       start_sequence ();
1732
1733       /* Do the actual arithmetic.  */
1734       for (i = 0; i < GET_MODE_BITSIZE (mode) / BITS_PER_WORD; i++)
1735         {
1736           rtx target_piece = operand_subword (target, i, 1, mode);
1737           rtx x = expand_binop (word_mode, binoptab,
1738                                 operand_subword_force (op0, i, mode),
1739                                 operand_subword_force (op1, i, mode),
1740                                 target_piece, unsignedp, next_methods);
1741
1742           if (x == 0)
1743             break;
1744
1745           if (target_piece != x)
1746             emit_move_insn (target_piece, x);
1747         }
1748
1749       insns = get_insns ();
1750       end_sequence ();
1751
1752       if (i == GET_MODE_BITSIZE (mode) / BITS_PER_WORD)
1753         {
1754           emit_insn (insns);
1755           return target;
1756         }
1757     }
1758
1759   /* Synthesize double word shifts from single word shifts.  */
1760   if ((binoptab == lshr_optab || binoptab == ashl_optab
1761        || binoptab == ashr_optab)
1762       && mclass == MODE_INT
1763       && (CONST_INT_P (op1) || optimize_insn_for_speed_p ())
1764       && GET_MODE_SIZE (mode) == 2 * UNITS_PER_WORD
1765       && GET_MODE_PRECISION (mode) == GET_MODE_BITSIZE (mode)
1766       && optab_handler (binoptab, word_mode) != CODE_FOR_nothing
1767       && optab_handler (ashl_optab, word_mode) != CODE_FOR_nothing
1768       && optab_handler (lshr_optab, word_mode) != CODE_FOR_nothing)
1769     {
1770       unsigned HOST_WIDE_INT shift_mask, double_shift_mask;
1771       enum machine_mode op1_mode;
1772
1773       double_shift_mask = targetm.shift_truncation_mask (mode);
1774       shift_mask = targetm.shift_truncation_mask (word_mode);
1775       op1_mode = GET_MODE (op1) != VOIDmode ? GET_MODE (op1) : word_mode;
1776
1777       /* Apply the truncation to constant shifts.  */
1778       if (double_shift_mask > 0 && CONST_INT_P (op1))
1779         op1 = GEN_INT (INTVAL (op1) & double_shift_mask);
1780
1781       if (op1 == CONST0_RTX (op1_mode))
1782         return op0;
1783
1784       /* Make sure that this is a combination that expand_doubleword_shift
1785          can handle.  See the comments there for details.  */
1786       if (double_shift_mask == 0
1787           || (shift_mask == BITS_PER_WORD - 1
1788               && double_shift_mask == BITS_PER_WORD * 2 - 1))
1789         {
1790           rtx insns;
1791           rtx into_target, outof_target;
1792           rtx into_input, outof_input;
1793           int left_shift, outof_word;
1794
1795           /* If TARGET is the same as one of the operands, the REG_EQUAL note
1796              won't be accurate, so use a new target.  */
1797           if (target == 0
1798               || target == op0
1799               || target == op1
1800               || !valid_multiword_target_p (target))
1801             target = gen_reg_rtx (mode);
1802
1803           start_sequence ();
1804
1805           /* OUTOF_* is the word we are shifting bits away from, and
1806              INTO_* is the word that we are shifting bits towards, thus
1807              they differ depending on the direction of the shift and
1808              WORDS_BIG_ENDIAN.  */
1809
1810           left_shift = binoptab == ashl_optab;
1811           outof_word = left_shift ^ ! WORDS_BIG_ENDIAN;
1812
1813           outof_target = operand_subword (target, outof_word, 1, mode);
1814           into_target = operand_subword (target, 1 - outof_word, 1, mode);
1815
1816           outof_input = operand_subword_force (op0, outof_word, mode);
1817           into_input = operand_subword_force (op0, 1 - outof_word, mode);
1818
1819           if (expand_doubleword_shift (op1_mode, binoptab,
1820                                        outof_input, into_input, op1,
1821                                        outof_target, into_target,
1822                                        unsignedp, next_methods, shift_mask))
1823             {
1824               insns = get_insns ();
1825               end_sequence ();
1826
1827               emit_insn (insns);
1828               return target;
1829             }
1830           end_sequence ();
1831         }
1832     }
1833
1834   /* Synthesize double word rotates from single word shifts.  */
1835   if ((binoptab == rotl_optab || binoptab == rotr_optab)
1836       && mclass == MODE_INT
1837       && CONST_INT_P (op1)
1838       && GET_MODE_PRECISION (mode) == 2 * BITS_PER_WORD
1839       && optab_handler (ashl_optab, word_mode) != CODE_FOR_nothing
1840       && optab_handler (lshr_optab, word_mode) != CODE_FOR_nothing)
1841     {
1842       rtx insns;
1843       rtx into_target, outof_target;
1844       rtx into_input, outof_input;
1845       rtx inter;
1846       int shift_count, left_shift, outof_word;
1847
1848       /* If TARGET is the same as one of the operands, the REG_EQUAL note
1849          won't be accurate, so use a new target. Do this also if target is not
1850          a REG, first because having a register instead may open optimization
1851          opportunities, and second because if target and op0 happen to be MEMs
1852          designating the same location, we would risk clobbering it too early
1853          in the code sequence we generate below.  */
1854       if (target == 0
1855           || target == op0
1856           || target == op1
1857           || !REG_P (target)
1858           || !valid_multiword_target_p (target))
1859         target = gen_reg_rtx (mode);
1860
1861       start_sequence ();
1862
1863       shift_count = INTVAL (op1);
1864
1865       /* OUTOF_* is the word we are shifting bits away from, and
1866          INTO_* is the word that we are shifting bits towards, thus
1867          they differ depending on the direction of the shift and
1868          WORDS_BIG_ENDIAN.  */
1869
1870       left_shift = (binoptab == rotl_optab);
1871       outof_word = left_shift ^ ! WORDS_BIG_ENDIAN;
1872
1873       outof_target = operand_subword (target, outof_word, 1, mode);
1874       into_target = operand_subword (target, 1 - outof_word, 1, mode);
1875
1876       outof_input = operand_subword_force (op0, outof_word, mode);
1877       into_input = operand_subword_force (op0, 1 - outof_word, mode);
1878
1879       if (shift_count == BITS_PER_WORD)
1880         {
1881           /* This is just a word swap.  */
1882           emit_move_insn (outof_target, into_input);
1883           emit_move_insn (into_target, outof_input);
1884           inter = const0_rtx;
1885         }
1886       else
1887         {
1888           rtx into_temp1, into_temp2, outof_temp1, outof_temp2;
1889           rtx first_shift_count, second_shift_count;
1890           optab reverse_unsigned_shift, unsigned_shift;
1891
1892           reverse_unsigned_shift = (left_shift ^ (shift_count < BITS_PER_WORD)
1893                                     ? lshr_optab : ashl_optab);
1894
1895           unsigned_shift = (left_shift ^ (shift_count < BITS_PER_WORD)
1896                             ? ashl_optab : lshr_optab);
1897
1898           if (shift_count > BITS_PER_WORD)
1899             {
1900               first_shift_count = GEN_INT (shift_count - BITS_PER_WORD);
1901               second_shift_count = GEN_INT (2 * BITS_PER_WORD - shift_count);
1902             }
1903           else
1904             {
1905               first_shift_count = GEN_INT (BITS_PER_WORD - shift_count);
1906               second_shift_count = GEN_INT (shift_count);
1907             }
1908
1909           into_temp1 = expand_binop (word_mode, unsigned_shift,
1910                                      outof_input, first_shift_count,
1911                                      NULL_RTX, unsignedp, next_methods);
1912           into_temp2 = expand_binop (word_mode, reverse_unsigned_shift,
1913                                      into_input, second_shift_count,
1914                                      NULL_RTX, unsignedp, next_methods);
1915
1916           if (into_temp1 != 0 && into_temp2 != 0)
1917             inter = expand_binop (word_mode, ior_optab, into_temp1, into_temp2,
1918                                   into_target, unsignedp, next_methods);
1919           else
1920             inter = 0;
1921
1922           if (inter != 0 && inter != into_target)
1923             emit_move_insn (into_target, inter);
1924
1925           outof_temp1 = expand_binop (word_mode, unsigned_shift,
1926                                       into_input, first_shift_count,
1927                                       NULL_RTX, unsignedp, next_methods);
1928           outof_temp2 = expand_binop (word_mode, reverse_unsigned_shift,
1929                                       outof_input, second_shift_count,
1930                                       NULL_RTX, unsignedp, next_methods);
1931
1932           if (inter != 0 && outof_temp1 != 0 && outof_temp2 != 0)
1933             inter = expand_binop (word_mode, ior_optab,
1934                                   outof_temp1, outof_temp2,
1935                                   outof_target, unsignedp, next_methods);
1936
1937           if (inter != 0 && inter != outof_target)
1938             emit_move_insn (outof_target, inter);
1939         }
1940
1941       insns = get_insns ();
1942       end_sequence ();
1943
1944       if (inter != 0)
1945         {
1946           emit_insn (insns);
1947           return target;
1948         }
1949     }
1950
1951   /* These can be done a word at a time by propagating carries.  */
1952   if ((binoptab == add_optab || binoptab == sub_optab)
1953       && mclass == MODE_INT
1954       && GET_MODE_SIZE (mode) >= 2 * UNITS_PER_WORD
1955       && optab_handler (binoptab, word_mode) != CODE_FOR_nothing)
1956     {
1957       unsigned int i;
1958       optab otheroptab = binoptab == add_optab ? sub_optab : add_optab;
1959       const unsigned int nwords = GET_MODE_BITSIZE (mode) / BITS_PER_WORD;
1960       rtx carry_in = NULL_RTX, carry_out = NULL_RTX;
1961       rtx xop0, xop1, xtarget;
1962
1963       /* We can handle either a 1 or -1 value for the carry.  If STORE_FLAG
1964          value is one of those, use it.  Otherwise, use 1 since it is the
1965          one easiest to get.  */
1966 #if STORE_FLAG_VALUE == 1 || STORE_FLAG_VALUE == -1
1967       int normalizep = STORE_FLAG_VALUE;
1968 #else
1969       int normalizep = 1;
1970 #endif
1971
1972       /* Prepare the operands.  */
1973       xop0 = force_reg (mode, op0);
1974       xop1 = force_reg (mode, op1);
1975
1976       xtarget = gen_reg_rtx (mode);
1977
1978       if (target == 0 || !REG_P (target) || !valid_multiword_target_p (target))
1979         target = xtarget;
1980
1981       /* Indicate for flow that the entire target reg is being set.  */
1982       if (REG_P (target))
1983         emit_clobber (xtarget);
1984
1985       /* Do the actual arithmetic.  */
1986       for (i = 0; i < nwords; i++)
1987         {
1988           int index = (WORDS_BIG_ENDIAN ? nwords - i - 1 : i);
1989           rtx target_piece = operand_subword (xtarget, index, 1, mode);
1990           rtx op0_piece = operand_subword_force (xop0, index, mode);
1991           rtx op1_piece = operand_subword_force (xop1, index, mode);
1992           rtx x;
1993
1994           /* Main add/subtract of the input operands.  */
1995           x = expand_binop (word_mode, binoptab,
1996                             op0_piece, op1_piece,
1997                             target_piece, unsignedp, next_methods);
1998           if (x == 0)
1999             break;
2000
2001           if (i + 1 < nwords)
2002             {
2003               /* Store carry from main add/subtract.  */
2004               carry_out = gen_reg_rtx (word_mode);
2005               carry_out = emit_store_flag_force (carry_out,
2006                                                  (binoptab == add_optab
2007                                                   ? LT : GT),
2008                                                  x, op0_piece,
2009                                                  word_mode, 1, normalizep);
2010             }
2011
2012           if (i > 0)
2013             {
2014               rtx newx;
2015
2016               /* Add/subtract previous carry to main result.  */
2017               newx = expand_binop (word_mode,
2018                                    normalizep == 1 ? binoptab : otheroptab,
2019                                    x, carry_in,
2020                                    NULL_RTX, 1, next_methods);
2021
2022               if (i + 1 < nwords)
2023                 {
2024                   /* Get out carry from adding/subtracting carry in.  */
2025                   rtx carry_tmp = gen_reg_rtx (word_mode);
2026                   carry_tmp = emit_store_flag_force (carry_tmp,
2027                                                      (binoptab == add_optab
2028                                                       ? LT : GT),
2029                                                      newx, x,
2030                                                      word_mode, 1, normalizep);
2031
2032                   /* Logical-ior the two poss. carry together.  */
2033                   carry_out = expand_binop (word_mode, ior_optab,
2034                                             carry_out, carry_tmp,
2035                                             carry_out, 0, next_methods);
2036                   if (carry_out == 0)
2037                     break;
2038                 }
2039               emit_move_insn (target_piece, newx);
2040             }
2041           else
2042             {
2043               if (x != target_piece)
2044                 emit_move_insn (target_piece, x);
2045             }
2046
2047           carry_in = carry_out;
2048         }
2049
2050       if (i == GET_MODE_BITSIZE (mode) / (unsigned) BITS_PER_WORD)
2051         {
2052           if (optab_handler (mov_optab, mode) != CODE_FOR_nothing
2053               || ! rtx_equal_p (target, xtarget))
2054             {
2055               rtx temp = emit_move_insn (target, xtarget);
2056
2057               set_dst_reg_note (temp, REG_EQUAL,
2058                                 gen_rtx_fmt_ee (optab_to_code (binoptab),
2059                                                 mode, copy_rtx (xop0),
2060                                                 copy_rtx (xop1)),
2061                                 target);
2062             }
2063           else
2064             target = xtarget;
2065
2066           return target;
2067         }
2068
2069       else
2070         delete_insns_since (last);
2071     }
2072
2073   /* Attempt to synthesize double word multiplies using a sequence of word
2074      mode multiplications.  We first attempt to generate a sequence using a
2075      more efficient unsigned widening multiply, and if that fails we then
2076      try using a signed widening multiply.  */
2077
2078   if (binoptab == smul_optab
2079       && mclass == MODE_INT
2080       && GET_MODE_SIZE (mode) == 2 * UNITS_PER_WORD
2081       && optab_handler (smul_optab, word_mode) != CODE_FOR_nothing
2082       && optab_handler (add_optab, word_mode) != CODE_FOR_nothing)
2083     {
2084       rtx product = NULL_RTX;
2085       if (widening_optab_handler (umul_widen_optab, mode, word_mode)
2086             != CODE_FOR_nothing)
2087         {
2088           product = expand_doubleword_mult (mode, op0, op1, target,
2089                                             true, methods);
2090           if (!product)
2091             delete_insns_since (last);
2092         }
2093
2094       if (product == NULL_RTX
2095           && widening_optab_handler (smul_widen_optab, mode, word_mode)
2096                 != CODE_FOR_nothing)
2097         {
2098           product = expand_doubleword_mult (mode, op0, op1, target,
2099                                             false, methods);
2100           if (!product)
2101             delete_insns_since (last);
2102         }
2103
2104       if (product != NULL_RTX)
2105         {
2106           if (optab_handler (mov_optab, mode) != CODE_FOR_nothing)
2107             {
2108               temp = emit_move_insn (target ? target : product, product);
2109               set_dst_reg_note (temp,
2110                                 REG_EQUAL,
2111                                 gen_rtx_fmt_ee (MULT, mode,
2112                                                 copy_rtx (op0),
2113                                                 copy_rtx (op1)),
2114                                 target ? target : product);
2115             }
2116           return product;
2117         }
2118     }
2119
2120   /* It can't be open-coded in this mode.
2121      Use a library call if one is available and caller says that's ok.  */
2122
2123   libfunc = optab_libfunc (binoptab, mode);
2124   if (libfunc
2125       && (methods == OPTAB_LIB || methods == OPTAB_LIB_WIDEN))
2126     {
2127       rtx insns;
2128       rtx op1x = op1;
2129       enum machine_mode op1_mode = mode;
2130       rtx value;
2131
2132       start_sequence ();
2133
2134       if (shift_optab_p (binoptab))
2135         {
2136           op1_mode = targetm.libgcc_shift_count_mode ();
2137           /* Specify unsigned here,
2138              since negative shift counts are meaningless.  */
2139           op1x = convert_to_mode (op1_mode, op1, 1);
2140         }
2141
2142       if (GET_MODE (op0) != VOIDmode
2143           && GET_MODE (op0) != mode)
2144         op0 = convert_to_mode (mode, op0, unsignedp);
2145
2146       /* Pass 1 for NO_QUEUE so we don't lose any increments
2147          if the libcall is cse'd or moved.  */
2148       value = emit_library_call_value (libfunc,
2149                                        NULL_RTX, LCT_CONST, mode, 2,
2150                                        op0, mode, op1x, op1_mode);
2151
2152       insns = get_insns ();
2153       end_sequence ();
2154
2155       target = gen_reg_rtx (mode);
2156       emit_libcall_block_1 (insns, target, value,
2157                             gen_rtx_fmt_ee (optab_to_code (binoptab),
2158                                             mode, op0, op1),
2159                             trapv_binoptab_p (binoptab));
2160
2161       return target;
2162     }
2163
2164   delete_insns_since (last);
2165
2166   /* It can't be done in this mode.  Can we do it in a wider mode?  */
2167
2168   if (! (methods == OPTAB_WIDEN || methods == OPTAB_LIB_WIDEN
2169          || methods == OPTAB_MUST_WIDEN))
2170     {
2171       /* Caller says, don't even try.  */
2172       delete_insns_since (entry_last);
2173       return 0;
2174     }
2175
2176   /* Compute the value of METHODS to pass to recursive calls.
2177      Don't allow widening to be tried recursively.  */
2178
2179   methods = (methods == OPTAB_LIB_WIDEN ? OPTAB_LIB : OPTAB_DIRECT);
2180
2181   /* Look for a wider mode of the same class for which it appears we can do
2182      the operation.  */
2183
2184   if (CLASS_HAS_WIDER_MODES_P (mclass))
2185     {
2186       for (wider_mode = GET_MODE_WIDER_MODE (mode);
2187            wider_mode != VOIDmode;
2188            wider_mode = GET_MODE_WIDER_MODE (wider_mode))
2189         {
2190           if (find_widening_optab_handler (binoptab, wider_mode, mode, 1)
2191                   != CODE_FOR_nothing
2192               || (methods == OPTAB_LIB
2193                   && optab_libfunc (binoptab, wider_mode)))
2194             {
2195               rtx xop0 = op0, xop1 = op1;
2196               int no_extend = 0;
2197
2198               /* For certain integer operations, we need not actually extend
2199                  the narrow operands, as long as we will truncate
2200                  the results to the same narrowness.  */
2201
2202               if ((binoptab == ior_optab || binoptab == and_optab
2203                    || binoptab == xor_optab
2204                    || binoptab == add_optab || binoptab == sub_optab
2205                    || binoptab == smul_optab || binoptab == ashl_optab)
2206                   && mclass == MODE_INT)
2207                 no_extend = 1;
2208
2209               xop0 = widen_operand (xop0, wider_mode, mode,
2210                                     unsignedp, no_extend);
2211
2212               /* The second operand of a shift must always be extended.  */
2213               xop1 = widen_operand (xop1, wider_mode, mode, unsignedp,
2214                                     no_extend && binoptab != ashl_optab);
2215
2216               temp = expand_binop (wider_mode, binoptab, xop0, xop1, NULL_RTX,
2217                                    unsignedp, methods);
2218               if (temp)
2219                 {
2220                   if (mclass != MODE_INT
2221                       || !TRULY_NOOP_TRUNCATION_MODES_P (mode, wider_mode))
2222                     {
2223                       if (target == 0)
2224                         target = gen_reg_rtx (mode);
2225                       convert_move (target, temp, 0);
2226                       return target;
2227                     }
2228                   else
2229                     return gen_lowpart (mode, temp);
2230                 }
2231               else
2232                 delete_insns_since (last);
2233             }
2234         }
2235     }
2236
2237   delete_insns_since (entry_last);
2238   return 0;
2239 }
2240 \f
2241 /* Expand a binary operator which has both signed and unsigned forms.
2242    UOPTAB is the optab for unsigned operations, and SOPTAB is for
2243    signed operations.
2244
2245    If we widen unsigned operands, we may use a signed wider operation instead
2246    of an unsigned wider operation, since the result would be the same.  */
2247
2248 rtx
2249 sign_expand_binop (enum machine_mode mode, optab uoptab, optab soptab,
2250                    rtx op0, rtx op1, rtx target, int unsignedp,
2251                    enum optab_methods methods)
2252 {
2253   rtx temp;
2254   optab direct_optab = unsignedp ? uoptab : soptab;
2255   bool save_enable;
2256
2257   /* Do it without widening, if possible.  */
2258   temp = expand_binop (mode, direct_optab, op0, op1, target,
2259                        unsignedp, OPTAB_DIRECT);
2260   if (temp || methods == OPTAB_DIRECT)
2261     return temp;
2262
2263   /* Try widening to a signed int.  Disable any direct use of any
2264      signed insn in the current mode.  */
2265   save_enable = swap_optab_enable (soptab, mode, false);
2266
2267   temp = expand_binop (mode, soptab, op0, op1, target,
2268                        unsignedp, OPTAB_WIDEN);
2269
2270   /* For unsigned operands, try widening to an unsigned int.  */
2271   if (!temp && unsignedp)
2272     temp = expand_binop (mode, uoptab, op0, op1, target,
2273                          unsignedp, OPTAB_WIDEN);
2274   if (temp || methods == OPTAB_WIDEN)
2275     goto egress;
2276
2277   /* Use the right width libcall if that exists.  */
2278   temp = expand_binop (mode, direct_optab, op0, op1, target,
2279                        unsignedp, OPTAB_LIB);
2280   if (temp || methods == OPTAB_LIB)
2281     goto egress;
2282
2283   /* Must widen and use a libcall, use either signed or unsigned.  */
2284   temp = expand_binop (mode, soptab, op0, op1, target,
2285                        unsignedp, methods);
2286   if (!temp && unsignedp)
2287     temp = expand_binop (mode, uoptab, op0, op1, target,
2288                          unsignedp, methods);
2289
2290  egress:
2291   /* Undo the fiddling above.  */
2292   if (save_enable)
2293     swap_optab_enable (soptab, mode, true);
2294   return temp;
2295 }
2296 \f
2297 /* Generate code to perform an operation specified by UNOPPTAB
2298    on operand OP0, with two results to TARG0 and TARG1.
2299    We assume that the order of the operands for the instruction
2300    is TARG0, TARG1, OP0.
2301
2302    Either TARG0 or TARG1 may be zero, but what that means is that
2303    the result is not actually wanted.  We will generate it into
2304    a dummy pseudo-reg and discard it.  They may not both be zero.
2305
2306    Returns 1 if this operation can be performed; 0 if not.  */
2307
2308 int
2309 expand_twoval_unop (optab unoptab, rtx op0, rtx targ0, rtx targ1,
2310                     int unsignedp)
2311 {
2312   enum machine_mode mode = GET_MODE (targ0 ? targ0 : targ1);
2313   enum mode_class mclass;
2314   enum machine_mode wider_mode;
2315   rtx entry_last = get_last_insn ();
2316   rtx last;
2317
2318   mclass = GET_MODE_CLASS (mode);
2319
2320   if (!targ0)
2321     targ0 = gen_reg_rtx (mode);
2322   if (!targ1)
2323     targ1 = gen_reg_rtx (mode);
2324
2325   /* Record where to go back to if we fail.  */
2326   last = get_last_insn ();
2327
2328   if (optab_handler (unoptab, mode) != CODE_FOR_nothing)
2329     {
2330       struct expand_operand ops[3];
2331       enum insn_code icode = optab_handler (unoptab, mode);
2332
2333       create_fixed_operand (&ops[0], targ0);
2334       create_fixed_operand (&ops[1], targ1);
2335       create_convert_operand_from (&ops[2], op0, mode, unsignedp);
2336       if (maybe_expand_insn (icode, 3, ops))
2337         return 1;
2338     }
2339
2340   /* It can't be done in this mode.  Can we do it in a wider mode?  */
2341
2342   if (CLASS_HAS_WIDER_MODES_P (mclass))
2343     {
2344       for (wider_mode = GET_MODE_WIDER_MODE (mode);
2345            wider_mode != VOIDmode;
2346            wider_mode = GET_MODE_WIDER_MODE (wider_mode))
2347         {
2348           if (optab_handler (unoptab, wider_mode) != CODE_FOR_nothing)
2349             {
2350               rtx t0 = gen_reg_rtx (wider_mode);
2351               rtx t1 = gen_reg_rtx (wider_mode);
2352               rtx cop0 = convert_modes (wider_mode, mode, op0, unsignedp);
2353
2354               if (expand_twoval_unop (unoptab, cop0, t0, t1, unsignedp))
2355                 {
2356                   convert_move (targ0, t0, unsignedp);
2357                   convert_move (targ1, t1, unsignedp);
2358                   return 1;
2359                 }
2360               else
2361                 delete_insns_since (last);
2362             }
2363         }
2364     }
2365
2366   delete_insns_since (entry_last);
2367   return 0;
2368 }
2369 \f
2370 /* Generate code to perform an operation specified by BINOPTAB
2371    on operands OP0 and OP1, with two results to TARG1 and TARG2.
2372    We assume that the order of the operands for the instruction
2373    is TARG0, OP0, OP1, TARG1, which would fit a pattern like
2374    [(set TARG0 (operate OP0 OP1)) (set TARG1 (operate ...))].
2375
2376    Either TARG0 or TARG1 may be zero, but what that means is that
2377    the result is not actually wanted.  We will generate it into
2378    a dummy pseudo-reg and discard it.  They may not both be zero.
2379
2380    Returns 1 if this operation can be performed; 0 if not.  */
2381
2382 int
2383 expand_twoval_binop (optab binoptab, rtx op0, rtx op1, rtx targ0, rtx targ1,
2384                      int unsignedp)
2385 {
2386   enum machine_mode mode = GET_MODE (targ0 ? targ0 : targ1);
2387   enum mode_class mclass;
2388   enum machine_mode wider_mode;
2389   rtx entry_last = get_last_insn ();
2390   rtx last;
2391
2392   mclass = GET_MODE_CLASS (mode);
2393
2394   if (!targ0)
2395     targ0 = gen_reg_rtx (mode);
2396   if (!targ1)
2397     targ1 = gen_reg_rtx (mode);
2398
2399   /* Record where to go back to if we fail.  */
2400   last = get_last_insn ();
2401
2402   if (optab_handler (binoptab, mode) != CODE_FOR_nothing)
2403     {
2404       struct expand_operand ops[4];
2405       enum insn_code icode = optab_handler (binoptab, mode);
2406       enum machine_mode mode0 = insn_data[icode].operand[1].mode;
2407       enum machine_mode mode1 = insn_data[icode].operand[2].mode;
2408       rtx xop0 = op0, xop1 = op1;
2409
2410       /* If we are optimizing, force expensive constants into a register.  */
2411       xop0 = avoid_expensive_constant (mode0, binoptab, 0, xop0, unsignedp);
2412       xop1 = avoid_expensive_constant (mode1, binoptab, 1, xop1, unsignedp);
2413
2414       create_fixed_operand (&ops[0], targ0);
2415       create_convert_operand_from (&ops[1], op0, mode, unsignedp);
2416       create_convert_operand_from (&ops[2], op1, mode, unsignedp);
2417       create_fixed_operand (&ops[3], targ1);
2418       if (maybe_expand_insn (icode, 4, ops))
2419         return 1;
2420       delete_insns_since (last);
2421     }
2422
2423   /* It can't be done in this mode.  Can we do it in a wider mode?  */
2424
2425   if (CLASS_HAS_WIDER_MODES_P (mclass))
2426     {
2427       for (wider_mode = GET_MODE_WIDER_MODE (mode);
2428            wider_mode != VOIDmode;
2429            wider_mode = GET_MODE_WIDER_MODE (wider_mode))
2430         {
2431           if (optab_handler (binoptab, wider_mode) != CODE_FOR_nothing)
2432             {
2433               rtx t0 = gen_reg_rtx (wider_mode);
2434               rtx t1 = gen_reg_rtx (wider_mode);
2435               rtx cop0 = convert_modes (wider_mode, mode, op0, unsignedp);
2436               rtx cop1 = convert_modes (wider_mode, mode, op1, unsignedp);
2437
2438               if (expand_twoval_binop (binoptab, cop0, cop1,
2439                                        t0, t1, unsignedp))
2440                 {
2441                   convert_move (targ0, t0, unsignedp);
2442                   convert_move (targ1, t1, unsignedp);
2443                   return 1;
2444                 }
2445               else
2446                 delete_insns_since (last);
2447             }
2448         }
2449     }
2450
2451   delete_insns_since (entry_last);
2452   return 0;
2453 }
2454
2455 /* Expand the two-valued library call indicated by BINOPTAB, but
2456    preserve only one of the values.  If TARG0 is non-NULL, the first
2457    value is placed into TARG0; otherwise the second value is placed
2458    into TARG1.  Exactly one of TARG0 and TARG1 must be non-NULL.  The
2459    value stored into TARG0 or TARG1 is equivalent to (CODE OP0 OP1).
2460    This routine assumes that the value returned by the library call is
2461    as if the return value was of an integral mode twice as wide as the
2462    mode of OP0.  Returns 1 if the call was successful.  */
2463
2464 bool
2465 expand_twoval_binop_libfunc (optab binoptab, rtx op0, rtx op1,
2466                              rtx targ0, rtx targ1, enum rtx_code code)
2467 {
2468   enum machine_mode mode;
2469   enum machine_mode libval_mode;
2470   rtx libval;
2471   rtx insns;
2472   rtx libfunc;
2473
2474   /* Exactly one of TARG0 or TARG1 should be non-NULL.  */
2475   gcc_assert (!targ0 != !targ1);
2476
2477   mode = GET_MODE (op0);
2478   libfunc = optab_libfunc (binoptab, mode);
2479   if (!libfunc)
2480     return false;
2481
2482   /* The value returned by the library function will have twice as
2483      many bits as the nominal MODE.  */
2484   libval_mode = smallest_mode_for_size (2 * GET_MODE_BITSIZE (mode),
2485                                         MODE_INT);
2486   start_sequence ();
2487   libval = emit_library_call_value (libfunc, NULL_RTX, LCT_CONST,
2488                                     libval_mode, 2,
2489                                     op0, mode,
2490                                     op1, mode);
2491   /* Get the part of VAL containing the value that we want.  */
2492   libval = simplify_gen_subreg (mode, libval, libval_mode,
2493                                 targ0 ? 0 : GET_MODE_SIZE (mode));
2494   insns = get_insns ();
2495   end_sequence ();
2496   /* Move the into the desired location.  */
2497   emit_libcall_block (insns, targ0 ? targ0 : targ1, libval,
2498                       gen_rtx_fmt_ee (code, mode, op0, op1));
2499
2500   return true;
2501 }
2502
2503 \f
2504 /* Wrapper around expand_unop which takes an rtx code to specify
2505    the operation to perform, not an optab pointer.  All other
2506    arguments are the same.  */
2507 rtx
2508 expand_simple_unop (enum machine_mode mode, enum rtx_code code, rtx op0,
2509                     rtx target, int unsignedp)
2510 {
2511   optab unop = code_to_optab (code);
2512   gcc_assert (unop);
2513
2514   return expand_unop (mode, unop, op0, target, unsignedp);
2515 }
2516
2517 /* Try calculating
2518         (clz:narrow x)
2519    as
2520         (clz:wide (zero_extend:wide x)) - ((width wide) - (width narrow)).
2521
2522    A similar operation can be used for clrsb.  UNOPTAB says which operation
2523    we are trying to expand.  */
2524 static rtx
2525 widen_leading (enum machine_mode mode, rtx op0, rtx target, optab unoptab)
2526 {
2527   enum mode_class mclass = GET_MODE_CLASS (mode);
2528   if (CLASS_HAS_WIDER_MODES_P (mclass))
2529     {
2530       enum machine_mode wider_mode;
2531       for (wider_mode = GET_MODE_WIDER_MODE (mode);
2532            wider_mode != VOIDmode;
2533            wider_mode = GET_MODE_WIDER_MODE (wider_mode))
2534         {
2535           if (optab_handler (unoptab, wider_mode) != CODE_FOR_nothing)
2536             {
2537               rtx xop0, temp, last;
2538
2539               last = get_last_insn ();
2540
2541               if (target == 0)
2542                 target = gen_reg_rtx (mode);
2543               xop0 = widen_operand (op0, wider_mode, mode,
2544                                     unoptab != clrsb_optab, false);
2545               temp = expand_unop (wider_mode, unoptab, xop0, NULL_RTX,
2546                                   unoptab != clrsb_optab);
2547               if (temp != 0)
2548                 temp = expand_binop
2549                   (wider_mode, sub_optab, temp,
2550                    gen_int_mode (GET_MODE_PRECISION (wider_mode)
2551                                  - GET_MODE_PRECISION (mode),
2552                                  wider_mode),
2553                    target, true, OPTAB_DIRECT);
2554               if (temp == 0)
2555                 delete_insns_since (last);
2556
2557               return temp;
2558             }
2559         }
2560     }
2561   return 0;
2562 }
2563
2564 /* Try calculating clz of a double-word quantity as two clz's of word-sized
2565    quantities, choosing which based on whether the high word is nonzero.  */
2566 static rtx
2567 expand_doubleword_clz (enum machine_mode mode, rtx op0, rtx target)
2568 {
2569   rtx xop0 = force_reg (mode, op0);
2570   rtx subhi = gen_highpart (word_mode, xop0);
2571   rtx sublo = gen_lowpart (word_mode, xop0);
2572   rtx hi0_label = gen_label_rtx ();
2573   rtx after_label = gen_label_rtx ();
2574   rtx seq, temp, result;
2575
2576   /* If we were not given a target, use a word_mode register, not a
2577      'mode' register.  The result will fit, and nobody is expecting
2578      anything bigger (the return type of __builtin_clz* is int).  */
2579   if (!target)
2580     target = gen_reg_rtx (word_mode);
2581
2582   /* In any case, write to a word_mode scratch in both branches of the
2583      conditional, so we can ensure there is a single move insn setting
2584      'target' to tag a REG_EQUAL note on.  */
2585   result = gen_reg_rtx (word_mode);
2586
2587   start_sequence ();
2588
2589   /* If the high word is not equal to zero,
2590      then clz of the full value is clz of the high word.  */
2591   emit_cmp_and_jump_insns (subhi, CONST0_RTX (word_mode), EQ, 0,
2592                            word_mode, true, hi0_label);
2593
2594   temp = expand_unop_direct (word_mode, clz_optab, subhi, result, true);
2595   if (!temp)
2596     goto fail;
2597
2598   if (temp != result)
2599     convert_move (result, temp, true);
2600
2601   emit_jump_insn (gen_jump (after_label));
2602   emit_barrier ();
2603
2604   /* Else clz of the full value is clz of the low word plus the number
2605      of bits in the high word.  */
2606   emit_label (hi0_label);
2607
2608   temp = expand_unop_direct (word_mode, clz_optab, sublo, 0, true);
2609   if (!temp)
2610     goto fail;
2611   temp = expand_binop (word_mode, add_optab, temp,
2612                        gen_int_mode (GET_MODE_BITSIZE (word_mode), word_mode),
2613                        result, true, OPTAB_DIRECT);
2614   if (!temp)
2615     goto fail;
2616   if (temp != result)
2617     convert_move (result, temp, true);
2618
2619   emit_label (after_label);
2620   convert_move (target, result, true);
2621
2622   seq = get_insns ();
2623   end_sequence ();
2624
2625   add_equal_note (seq, target, CLZ, xop0, 0);
2626   emit_insn (seq);
2627   return target;
2628
2629  fail:
2630   end_sequence ();
2631   return 0;
2632 }
2633
2634 /* Try calculating
2635         (bswap:narrow x)
2636    as
2637         (lshiftrt:wide (bswap:wide x) ((width wide) - (width narrow))).  */
2638 static rtx
2639 widen_bswap (enum machine_mode mode, rtx op0, rtx target)
2640 {
2641   enum mode_class mclass = GET_MODE_CLASS (mode);
2642   enum machine_mode wider_mode;
2643   rtx x, last;
2644
2645   if (!CLASS_HAS_WIDER_MODES_P (mclass))
2646     return NULL_RTX;
2647
2648   for (wider_mode = GET_MODE_WIDER_MODE (mode);
2649        wider_mode != VOIDmode;
2650        wider_mode = GET_MODE_WIDER_MODE (wider_mode))
2651     if (optab_handler (bswap_optab, wider_mode) != CODE_FOR_nothing)
2652       goto found;
2653   return NULL_RTX;
2654
2655  found:
2656   last = get_last_insn ();
2657
2658   x = widen_operand (op0, wider_mode, mode, true, true);
2659   x = expand_unop (wider_mode, bswap_optab, x, NULL_RTX, true);
2660
2661   gcc_assert (GET_MODE_PRECISION (wider_mode) == GET_MODE_BITSIZE (wider_mode)
2662               && GET_MODE_PRECISION (mode) == GET_MODE_BITSIZE (mode));
2663   if (x != 0)
2664     x = expand_shift (RSHIFT_EXPR, wider_mode, x,
2665                       GET_MODE_BITSIZE (wider_mode)
2666                       - GET_MODE_BITSIZE (mode),
2667                       NULL_RTX, true);
2668
2669   if (x != 0)
2670     {
2671       if (target == 0)
2672         target = gen_reg_rtx (mode);
2673       emit_move_insn (target, gen_lowpart (mode, x));
2674     }
2675   else
2676     delete_insns_since (last);
2677
2678   return target;
2679 }
2680
2681 /* Try calculating bswap as two bswaps of two word-sized operands.  */
2682
2683 static rtx
2684 expand_doubleword_bswap (enum machine_mode mode, rtx op, rtx target)
2685 {
2686   rtx t0, t1;
2687
2688   t1 = expand_unop (word_mode, bswap_optab,
2689                     operand_subword_force (op, 0, mode), NULL_RTX, true);
2690   t0 = expand_unop (word_mode, bswap_optab,
2691                     operand_subword_force (op, 1, mode), NULL_RTX, true);
2692
2693   if (target == 0 || !valid_multiword_target_p (target))
2694     target = gen_reg_rtx (mode);
2695   if (REG_P (target))
2696     emit_clobber (target);
2697   emit_move_insn (operand_subword (target, 0, 1, mode), t0);
2698   emit_move_insn (operand_subword (target, 1, 1, mode), t1);
2699
2700   return target;
2701 }
2702
2703 /* Try calculating (parity x) as (and (popcount x) 1), where
2704    popcount can also be done in a wider mode.  */
2705 static rtx
2706 expand_parity (enum machine_mode mode, rtx op0, rtx target)
2707 {
2708   enum mode_class mclass = GET_MODE_CLASS (mode);
2709   if (CLASS_HAS_WIDER_MODES_P (mclass))
2710     {
2711       enum machine_mode wider_mode;
2712       for (wider_mode = mode; wider_mode != VOIDmode;
2713            wider_mode = GET_MODE_WIDER_MODE (wider_mode))
2714         {
2715           if (optab_handler (popcount_optab, wider_mode) != CODE_FOR_nothing)
2716             {
2717               rtx xop0, temp, last;
2718
2719               last = get_last_insn ();
2720
2721               if (target == 0)
2722                 target = gen_reg_rtx (mode);
2723               xop0 = widen_operand (op0, wider_mode, mode, true, false);
2724               temp = expand_unop (wider_mode, popcount_optab, xop0, NULL_RTX,
2725                                   true);
2726               if (temp != 0)
2727                 temp = expand_binop (wider_mode, and_optab, temp, const1_rtx,
2728                                      target, true, OPTAB_DIRECT);
2729               if (temp == 0)
2730                 delete_insns_since (last);
2731
2732               return temp;
2733             }
2734         }
2735     }
2736   return 0;
2737 }
2738
2739 /* Try calculating ctz(x) as K - clz(x & -x) ,
2740    where K is GET_MODE_PRECISION(mode) - 1.
2741
2742    Both __builtin_ctz and __builtin_clz are undefined at zero, so we
2743    don't have to worry about what the hardware does in that case.  (If
2744    the clz instruction produces the usual value at 0, which is K, the
2745    result of this code sequence will be -1; expand_ffs, below, relies
2746    on this.  It might be nice to have it be K instead, for consistency
2747    with the (very few) processors that provide a ctz with a defined
2748    value, but that would take one more instruction, and it would be
2749    less convenient for expand_ffs anyway.  */
2750
2751 static rtx
2752 expand_ctz (enum machine_mode mode, rtx op0, rtx target)
2753 {
2754   rtx seq, temp;
2755
2756   if (optab_handler (clz_optab, mode) == CODE_FOR_nothing)
2757     return 0;
2758
2759   start_sequence ();
2760
2761   temp = expand_unop_direct (mode, neg_optab, op0, NULL_RTX, true);
2762   if (temp)
2763     temp = expand_binop (mode, and_optab, op0, temp, NULL_RTX,
2764                          true, OPTAB_DIRECT);
2765   if (temp)
2766     temp = expand_unop_direct (mode, clz_optab, temp, NULL_RTX, true);
2767   if (temp)
2768     temp = expand_binop (mode, sub_optab,
2769                          gen_int_mode (GET_MODE_PRECISION (mode) - 1, mode),
2770                          temp, target,
2771                          true, OPTAB_DIRECT);
2772   if (temp == 0)
2773     {
2774       end_sequence ();
2775       return 0;
2776     }
2777
2778   seq = get_insns ();
2779   end_sequence ();
2780
2781   add_equal_note (seq, temp, CTZ, op0, 0);
2782   emit_insn (seq);
2783   return temp;
2784 }
2785
2786
2787 /* Try calculating ffs(x) using ctz(x) if we have that instruction, or
2788    else with the sequence used by expand_clz.
2789
2790    The ffs builtin promises to return zero for a zero value and ctz/clz
2791    may have an undefined value in that case.  If they do not give us a
2792    convenient value, we have to generate a test and branch.  */
2793 static rtx
2794 expand_ffs (enum machine_mode mode, rtx op0, rtx target)
2795 {
2796   HOST_WIDE_INT val = 0;
2797   bool defined_at_zero = false;
2798   rtx temp, seq;
2799
2800   if (optab_handler (ctz_optab, mode) != CODE_FOR_nothing)
2801     {
2802       start_sequence ();
2803
2804       temp = expand_unop_direct (mode, ctz_optab, op0, 0, true);
2805       if (!temp)
2806         goto fail;
2807
2808       defined_at_zero = (CTZ_DEFINED_VALUE_AT_ZERO (mode, val) == 2);
2809     }
2810   else if (optab_handler (clz_optab, mode) != CODE_FOR_nothing)
2811     {
2812       start_sequence ();
2813       temp = expand_ctz (mode, op0, 0);
2814       if (!temp)
2815         goto fail;
2816
2817       if (CLZ_DEFINED_VALUE_AT_ZERO (mode, val) == 2)
2818         {
2819           defined_at_zero = true;
2820           val = (GET_MODE_PRECISION (mode) - 1) - val;
2821         }
2822     }
2823   else
2824     return 0;
2825
2826   if (defined_at_zero && val == -1)
2827     /* No correction needed at zero.  */;
2828   else
2829     {
2830       /* We don't try to do anything clever with the situation found
2831          on some processors (eg Alpha) where ctz(0:mode) ==
2832          bitsize(mode).  If someone can think of a way to send N to -1
2833          and leave alone all values in the range 0..N-1 (where N is a
2834          power of two), cheaper than this test-and-branch, please add it.
2835
2836          The test-and-branch is done after the operation itself, in case
2837          the operation sets condition codes that can be recycled for this.
2838          (This is true on i386, for instance.)  */
2839
2840       rtx nonzero_label = gen_label_rtx ();
2841       emit_cmp_and_jump_insns (op0, CONST0_RTX (mode), NE, 0,
2842                                mode, true, nonzero_label);
2843
2844       convert_move (temp, GEN_INT (-1), false);
2845       emit_label (nonzero_label);
2846     }
2847
2848   /* temp now has a value in the range -1..bitsize-1.  ffs is supposed
2849      to produce a value in the range 0..bitsize.  */
2850   temp = expand_binop (mode, add_optab, temp, gen_int_mode (1, mode),
2851                        target, false, OPTAB_DIRECT);
2852   if (!temp)
2853     goto fail;
2854
2855   seq = get_insns ();
2856   end_sequence ();
2857
2858   add_equal_note (seq, temp, FFS, op0, 0);
2859   emit_insn (seq);
2860   return temp;
2861
2862  fail:
2863   end_sequence ();
2864   return 0;
2865 }
2866
2867 /* Extract the OMODE lowpart from VAL, which has IMODE.  Under certain
2868    conditions, VAL may already be a SUBREG against which we cannot generate
2869    a further SUBREG.  In this case, we expect forcing the value into a
2870    register will work around the situation.  */
2871
2872 static rtx
2873 lowpart_subreg_maybe_copy (enum machine_mode omode, rtx val,
2874                            enum machine_mode imode)
2875 {
2876   rtx ret;
2877   ret = lowpart_subreg (omode, val, imode);
2878   if (ret == NULL)
2879     {
2880       val = force_reg (imode, val);
2881       ret = lowpart_subreg (omode, val, imode);
2882       gcc_assert (ret != NULL);
2883     }
2884   return ret;
2885 }
2886
2887 /* Expand a floating point absolute value or negation operation via a
2888    logical operation on the sign bit.  */
2889
2890 static rtx
2891 expand_absneg_bit (enum rtx_code code, enum machine_mode mode,
2892                    rtx op0, rtx target)
2893 {
2894   const struct real_format *fmt;
2895   int bitpos, word, nwords, i;
2896   enum machine_mode imode;
2897   rtx temp, insns;
2898
2899   /* The format has to have a simple sign bit.  */
2900   fmt = REAL_MODE_FORMAT (mode);
2901   if (fmt == NULL)
2902     return NULL_RTX;
2903
2904   bitpos = fmt->signbit_rw;
2905   if (bitpos < 0)
2906     return NULL_RTX;
2907
2908   /* Don't create negative zeros if the format doesn't support them.  */
2909   if (code == NEG && !fmt->has_signed_zero)
2910     return NULL_RTX;
2911
2912   if (GET_MODE_SIZE (mode) <= UNITS_PER_WORD)
2913     {
2914       imode = int_mode_for_mode (mode);
2915       if (imode == BLKmode)
2916         return NULL_RTX;
2917       word = 0;
2918       nwords = 1;
2919     }
2920   else
2921     {
2922       imode = word_mode;
2923
2924       if (FLOAT_WORDS_BIG_ENDIAN)
2925         word = (GET_MODE_BITSIZE (mode) - bitpos) / BITS_PER_WORD;
2926       else
2927         word = bitpos / BITS_PER_WORD;
2928       bitpos = bitpos % BITS_PER_WORD;
2929       nwords = (GET_MODE_BITSIZE (mode) + BITS_PER_WORD - 1) / BITS_PER_WORD;
2930     }
2931
2932   wide_int mask = wi::set_bit_in_zero (bitpos, GET_MODE_PRECISION (imode));
2933   if (code == ABS)
2934     mask = ~mask;
2935
2936   if (target == 0
2937       || target == op0
2938       || (nwords > 1 && !valid_multiword_target_p (target)))
2939     target = gen_reg_rtx (mode);
2940
2941   if (nwords > 1)
2942     {
2943       start_sequence ();
2944
2945       for (i = 0; i < nwords; ++i)
2946         {
2947           rtx targ_piece = operand_subword (target, i, 1, mode);
2948           rtx op0_piece = operand_subword_force (op0, i, mode);
2949
2950           if (i == word)
2951             {
2952               temp = expand_binop (imode, code == ABS ? and_optab : xor_optab,
2953                                    op0_piece,
2954                                    immed_wide_int_const (mask, imode),
2955                                    targ_piece, 1, OPTAB_LIB_WIDEN);
2956               if (temp != targ_piece)
2957                 emit_move_insn (targ_piece, temp);
2958             }
2959           else
2960             emit_move_insn (targ_piece, op0_piece);
2961         }
2962
2963       insns = get_insns ();
2964       end_sequence ();
2965
2966       emit_insn (insns);
2967     }
2968   else
2969     {
2970       temp = expand_binop (imode, code == ABS ? and_optab : xor_optab,
2971                            gen_lowpart (imode, op0),
2972                            immed_wide_int_const (mask, imode),
2973                            gen_lowpart (imode, target), 1, OPTAB_LIB_WIDEN);
2974       target = lowpart_subreg_maybe_copy (mode, temp, imode);
2975
2976       set_dst_reg_note (get_last_insn (), REG_EQUAL,
2977                         gen_rtx_fmt_e (code, mode, copy_rtx (op0)),
2978                         target);
2979     }
2980
2981   return target;
2982 }
2983
2984 /* As expand_unop, but will fail rather than attempt the operation in a
2985    different mode or with a libcall.  */
2986 static rtx
2987 expand_unop_direct (enum machine_mode mode, optab unoptab, rtx op0, rtx target,
2988              int unsignedp)
2989 {
2990   if (optab_handler (unoptab, mode) != CODE_FOR_nothing)
2991     {
2992       struct expand_operand ops[2];
2993       enum insn_code icode = optab_handler (unoptab, mode);
2994       rtx last = get_last_insn ();
2995       rtx pat;
2996
2997       create_output_operand (&ops[0], target, mode);
2998       create_convert_operand_from (&ops[1], op0, mode, unsignedp);
2999       pat = maybe_gen_insn (icode, 2, ops);
3000       if (pat)
3001         {
3002           if (INSN_P (pat) && NEXT_INSN (pat) != NULL_RTX
3003               && ! add_equal_note (pat, ops[0].value, optab_to_code (unoptab),
3004                                    ops[1].value, NULL_RTX))
3005             {
3006               delete_insns_since (last);
3007               return expand_unop (mode, unoptab, op0, NULL_RTX, unsignedp);
3008             }
3009
3010           emit_insn (pat);
3011
3012           return ops[0].value;
3013         }
3014     }
3015   return 0;
3016 }
3017
3018 /* Generate code to perform an operation specified by UNOPTAB
3019    on operand OP0, with result having machine-mode MODE.
3020
3021    UNSIGNEDP is for the case where we have to widen the operands
3022    to perform the operation.  It says to use zero-extension.
3023
3024    If TARGET is nonzero, the value
3025    is generated there, if it is convenient to do so.
3026    In all cases an rtx is returned for the locus of the value;
3027    this may or may not be TARGET.  */
3028
3029 rtx
3030 expand_unop (enum machine_mode mode, optab unoptab, rtx op0, rtx target,
3031              int unsignedp)
3032 {
3033   enum mode_class mclass = GET_MODE_CLASS (mode);
3034   enum machine_mode wider_mode;
3035   rtx temp;
3036   rtx libfunc;
3037
3038   temp = expand_unop_direct (mode, unoptab, op0, target, unsignedp);
3039   if (temp)
3040     return temp;
3041
3042   /* It can't be done in this mode.  Can we open-code it in a wider mode?  */
3043
3044   /* Widening (or narrowing) clz needs special treatment.  */
3045   if (unoptab == clz_optab)
3046     {
3047       temp = widen_leading (mode, op0, target, unoptab);
3048       if (temp)
3049         return temp;
3050
3051       if (GET_MODE_SIZE (mode) == 2 * UNITS_PER_WORD
3052           && optab_handler (unoptab, word_mode) != CODE_FOR_nothing)
3053         {
3054           temp = expand_doubleword_clz (mode, op0, target);
3055           if (temp)
3056             return temp;
3057         }
3058
3059       goto try_libcall;
3060     }
3061
3062   if (unoptab == clrsb_optab)
3063     {
3064       temp = widen_leading (mode, op0, target, unoptab);
3065       if (temp)
3066         return temp;
3067       goto try_libcall;
3068     }
3069
3070   /* Widening (or narrowing) bswap needs special treatment.  */
3071   if (unoptab == bswap_optab)
3072     {
3073       /* HImode is special because in this mode BSWAP is equivalent to ROTATE
3074          or ROTATERT.  First try these directly; if this fails, then try the
3075          obvious pair of shifts with allowed widening, as this will probably
3076          be always more efficient than the other fallback methods.  */
3077       if (mode == HImode)
3078         {
3079           rtx last, temp1, temp2;
3080
3081           if (optab_handler (rotl_optab, mode) != CODE_FOR_nothing)
3082             {
3083               temp = expand_binop (mode, rotl_optab, op0, GEN_INT (8), target,
3084                                    unsignedp, OPTAB_DIRECT);
3085               if (temp)
3086                 return temp;
3087              }
3088
3089           if (optab_handler (rotr_optab, mode) != CODE_FOR_nothing)
3090             {
3091               temp = expand_binop (mode, rotr_optab, op0, GEN_INT (8), target,
3092                                    unsignedp, OPTAB_DIRECT);
3093               if (temp)
3094                 return temp;
3095             }
3096
3097           last = get_last_insn ();
3098
3099           temp1 = expand_binop (mode, ashl_optab, op0, GEN_INT (8), NULL_RTX,
3100                                 unsignedp, OPTAB_WIDEN);
3101           temp2 = expand_binop (mode, lshr_optab, op0, GEN_INT (8), NULL_RTX,
3102                                 unsignedp, OPTAB_WIDEN);
3103           if (temp1 && temp2)
3104             {
3105               temp = expand_binop (mode, ior_optab, temp1, temp2, target,
3106                                    unsignedp, OPTAB_WIDEN);
3107               if (temp)
3108                 return temp;
3109             }
3110
3111           delete_insns_since (last);
3112         }
3113
3114       temp = widen_bswap (mode, op0, target);
3115       if (temp)
3116         return temp;
3117
3118       if (GET_MODE_SIZE (mode) == 2 * UNITS_PER_WORD
3119           && optab_handler (unoptab, word_mode) != CODE_FOR_nothing)
3120         {
3121           temp = expand_doubleword_bswap (mode, op0, target);
3122           if (temp)
3123             return temp;
3124         }
3125
3126       goto try_libcall;
3127     }
3128
3129   if (CLASS_HAS_WIDER_MODES_P (mclass))
3130     for (wider_mode = GET_MODE_WIDER_MODE (mode);
3131          wider_mode != VOIDmode;
3132          wider_mode = GET_MODE_WIDER_MODE (wider_mode))
3133       {
3134         if (optab_handler (unoptab, wider_mode) != CODE_FOR_nothing)
3135           {
3136             rtx xop0 = op0;
3137             rtx last = get_last_insn ();
3138
3139             /* For certain operations, we need not actually extend
3140                the narrow operand, as long as we will truncate the
3141                results to the same narrowness.  */
3142
3143             xop0 = widen_operand (xop0, wider_mode, mode, unsignedp,
3144                                   (unoptab == neg_optab
3145                                    || unoptab == one_cmpl_optab)
3146                                   && mclass == MODE_INT);
3147
3148             temp = expand_unop (wider_mode, unoptab, xop0, NULL_RTX,
3149                                 unsignedp);
3150
3151             if (temp)
3152               {
3153                 if (mclass != MODE_INT
3154                     || !TRULY_NOOP_TRUNCATION_MODES_P (mode, wider_mode))
3155                   {
3156                     if (target == 0)
3157                       target = gen_reg_rtx (mode);
3158                     convert_move (target, temp, 0);
3159                     return target;
3160                   }
3161                 else
3162                   return gen_lowpart (mode, temp);
3163               }
3164             else
3165               delete_insns_since (last);
3166           }
3167       }
3168
3169   /* These can be done a word at a time.  */
3170   if (unoptab == one_cmpl_optab
3171       && mclass == MODE_INT
3172       && GET_MODE_SIZE (mode) > UNITS_PER_WORD
3173       && optab_handler (unoptab, word_mode) != CODE_FOR_nothing)
3174     {
3175       int i;
3176       rtx insns;
3177
3178       if (target == 0 || target == op0 || !valid_multiword_target_p (target))
3179         target = gen_reg_rtx (mode);
3180
3181       start_sequence ();
3182
3183       /* Do the actual arithmetic.  */
3184       for (i = 0; i < GET_MODE_BITSIZE (mode) / BITS_PER_WORD; i++)
3185         {
3186           rtx target_piece = operand_subword (target, i, 1, mode);
3187           rtx x = expand_unop (word_mode, unoptab,
3188                                operand_subword_force (op0, i, mode),
3189                                target_piece, unsignedp);
3190
3191           if (target_piece != x)
3192             emit_move_insn (target_piece, x);
3193         }
3194
3195       insns = get_insns ();
3196       end_sequence ();
3197
3198       emit_insn (insns);
3199       return target;
3200     }
3201
3202   if (optab_to_code (unoptab) == NEG)
3203     {
3204       /* Try negating floating point values by flipping the sign bit.  */
3205       if (SCALAR_FLOAT_MODE_P (mode))
3206         {
3207           temp = expand_absneg_bit (NEG, mode, op0, target);
3208           if (temp)
3209             return temp;
3210         }
3211
3212       /* If there is no negation pattern, and we have no negative zero,
3213          try subtracting from zero.  */
3214       if (!HONOR_SIGNED_ZEROS (mode))
3215         {
3216           temp = expand_binop (mode, (unoptab == negv_optab
3217                                       ? subv_optab : sub_optab),
3218                                CONST0_RTX (mode), op0, target,
3219                                unsignedp, OPTAB_DIRECT);
3220           if (temp)
3221             return temp;
3222         }
3223     }
3224
3225   /* Try calculating parity (x) as popcount (x) % 2.  */
3226   if (unoptab == parity_optab)
3227     {
3228       temp = expand_parity (mode, op0, target);
3229       if (temp)
3230         return temp;
3231     }
3232
3233   /* Try implementing ffs (x) in terms of clz (x).  */
3234   if (unoptab == ffs_optab)
3235     {
3236       temp = expand_ffs (mode, op0, target);
3237       if (temp)
3238         return temp;
3239     }
3240
3241   /* Try implementing ctz (x) in terms of clz (x).  */
3242   if (unoptab == ctz_optab)
3243     {
3244       temp = expand_ctz (mode, op0, target);
3245       if (temp)
3246         return temp;
3247     }
3248
3249  try_libcall:
3250   /* Now try a library call in this mode.  */
3251   libfunc = optab_libfunc (unoptab, mode);
3252   if (libfunc)
3253     {
3254       rtx insns;
3255       rtx value;
3256       rtx eq_value;
3257       enum machine_mode outmode = mode;
3258
3259       /* All of these functions return small values.  Thus we choose to
3260          have them return something that isn't a double-word.  */
3261       if (unoptab == ffs_optab || unoptab == clz_optab || unoptab == ctz_optab
3262           || unoptab == clrsb_optab || unoptab == popcount_optab
3263           || unoptab == parity_optab)
3264         outmode
3265           = GET_MODE (hard_libcall_value (TYPE_MODE (integer_type_node),
3266                                           optab_libfunc (unoptab, mode)));
3267
3268       start_sequence ();
3269
3270       /* Pass 1 for NO_QUEUE so we don't lose any increments
3271          if the libcall is cse'd or moved.  */
3272       value = emit_library_call_value (libfunc, NULL_RTX, LCT_CONST, outmode,
3273                                        1, op0, mode);
3274       insns = get_insns ();
3275       end_sequence ();
3276
3277       target = gen_reg_rtx (outmode);
3278       eq_value = gen_rtx_fmt_e (optab_to_code (unoptab), mode, op0);
3279       if (GET_MODE_SIZE (outmode) < GET_MODE_SIZE (mode))
3280         eq_value = simplify_gen_unary (TRUNCATE, outmode, eq_value, mode);
3281       else if (GET_MODE_SIZE (outmode) > GET_MODE_SIZE (mode))
3282         eq_value = simplify_gen_unary (ZERO_EXTEND, outmode, eq_value, mode);
3283       emit_libcall_block_1 (insns, target, value, eq_value,
3284                             trapv_unoptab_p (unoptab));
3285
3286       return target;
3287     }
3288
3289   /* It can't be done in this mode.  Can we do it in a wider mode?  */
3290
3291   if (CLASS_HAS_WIDER_MODES_P (mclass))
3292     {
3293       for (wider_mode = GET_MODE_WIDER_MODE (mode);
3294            wider_mode != VOIDmode;
3295            wider_mode = GET_MODE_WIDER_MODE (wider_mode))
3296         {
3297           if (optab_handler (unoptab, wider_mode) != CODE_FOR_nothing
3298               || optab_libfunc (unoptab, wider_mode))
3299             {
3300               rtx xop0 = op0;
3301               rtx last = get_last_insn ();
3302
3303               /* For certain operations, we need not actually extend
3304                  the narrow operand, as long as we will truncate the
3305                  results to the same narrowness.  */
3306               xop0 = widen_operand (xop0, wider_mode, mode, unsignedp,
3307                                     (unoptab == neg_optab
3308                                      || unoptab == one_cmpl_optab
3309                                      || unoptab == bswap_optab)
3310                                     && mclass == MODE_INT);
3311
3312               temp = expand_unop (wider_mode, unoptab, xop0, NULL_RTX,
3313                                   unsignedp);
3314
3315               /* If we are generating clz using wider mode, adjust the
3316                  result.  Similarly for clrsb.  */
3317               if ((unoptab == clz_optab || unoptab == clrsb_optab)
3318                   && temp != 0)
3319                 temp = expand_binop
3320                   (wider_mode, sub_optab, temp,
3321                    gen_int_mode (GET_MODE_PRECISION (wider_mode)
3322                                  - GET_MODE_PRECISION (mode),
3323                                  wider_mode),
3324                    target, true, OPTAB_DIRECT);
3325
3326               /* Likewise for bswap.  */
3327               if (unoptab == bswap_optab && temp != 0)
3328                 {
3329                   gcc_assert (GET_MODE_PRECISION (wider_mode)
3330                               == GET_MODE_BITSIZE (wider_mode)
3331                               && GET_MODE_PRECISION (mode)
3332                                  == GET_MODE_BITSIZE (mode));
3333
3334                   temp = expand_shift (RSHIFT_EXPR, wider_mode, temp,
3335                                        GET_MODE_BITSIZE (wider_mode)
3336                                        - GET_MODE_BITSIZE (mode),
3337                                        NULL_RTX, true);
3338                 }
3339
3340               if (temp)
3341                 {
3342                   if (mclass != MODE_INT)
3343                     {
3344                       if (target == 0)
3345                         target = gen_reg_rtx (mode);
3346                       convert_move (target, temp, 0);
3347                       return target;
3348                     }
3349                   else
3350                     return gen_lowpart (mode, temp);
3351                 }
3352               else
3353                 delete_insns_since (last);
3354             }
3355         }
3356     }
3357
3358   /* One final attempt at implementing negation via subtraction,
3359      this time allowing widening of the operand.  */
3360   if (optab_to_code (unoptab) == NEG && !HONOR_SIGNED_ZEROS (mode))
3361     {
3362       rtx temp;
3363       temp = expand_binop (mode,
3364                            unoptab == negv_optab ? subv_optab : sub_optab,
3365                            CONST0_RTX (mode), op0,
3366                            target, unsignedp, OPTAB_LIB_WIDEN);
3367       if (temp)
3368         return temp;
3369     }
3370
3371   return 0;
3372 }
3373 \f
3374 /* Emit code to compute the absolute value of OP0, with result to
3375    TARGET if convenient.  (TARGET may be 0.)  The return value says
3376    where the result actually is to be found.
3377
3378    MODE is the mode of the operand; the mode of the result is
3379    different but can be deduced from MODE.
3380
3381  */
3382
3383 rtx
3384 expand_abs_nojump (enum machine_mode mode, rtx op0, rtx target,
3385                    int result_unsignedp)
3386 {
3387   rtx temp;
3388
3389   if (GET_MODE_CLASS (mode) != MODE_INT
3390       || ! flag_trapv)
3391     result_unsignedp = 1;
3392
3393   /* First try to do it with a special abs instruction.  */
3394   temp = expand_unop (mode, result_unsignedp ? abs_optab : absv_optab,
3395                       op0, target, 0);
3396   if (temp != 0)
3397     return temp;
3398
3399   /* For floating point modes, try clearing the sign bit.  */
3400   if (SCALAR_FLOAT_MODE_P (mode))
3401     {
3402       temp = expand_absneg_bit (ABS, mode, op0, target);
3403       if (temp)
3404         return temp;
3405     }
3406
3407   /* If we have a MAX insn, we can do this as MAX (x, -x).  */
3408   if (optab_handler (smax_optab, mode) != CODE_FOR_nothing
3409       && !HONOR_SIGNED_ZEROS (mode))
3410     {
3411       rtx last = get_last_insn ();
3412
3413       temp = expand_unop (mode, result_unsignedp ? neg_optab : negv_optab,
3414                           op0, NULL_RTX, 0);
3415       if (temp != 0)
3416         temp = expand_binop (mode, smax_optab, op0, temp, target, 0,
3417                              OPTAB_WIDEN);
3418
3419       if (temp != 0)
3420         return temp;
3421
3422       delete_insns_since (last);
3423     }
3424
3425   /* If this machine has expensive jumps, we can do integer absolute
3426      value of X as (((signed) x >> (W-1)) ^ x) - ((signed) x >> (W-1)),
3427      where W is the width of MODE.  */
3428
3429   if (GET_MODE_CLASS (mode) == MODE_INT
3430       && BRANCH_COST (optimize_insn_for_speed_p (),
3431                       false) >= 2)
3432     {
3433       rtx extended = expand_shift (RSHIFT_EXPR, mode, op0,
3434                                    GET_MODE_PRECISION (mode) - 1,
3435                                    NULL_RTX, 0);
3436
3437       temp = expand_binop (mode, xor_optab, extended, op0, target, 0,
3438                            OPTAB_LIB_WIDEN);
3439       if (temp != 0)
3440         temp = expand_binop (mode, result_unsignedp ? sub_optab : subv_optab,
3441                              temp, extended, target, 0, OPTAB_LIB_WIDEN);
3442
3443       if (temp != 0)
3444         return temp;
3445     }
3446
3447   return NULL_RTX;
3448 }
3449
3450 rtx
3451 expand_abs (enum machine_mode mode, rtx op0, rtx target,
3452             int result_unsignedp, int safe)
3453 {
3454   rtx temp, op1;
3455
3456   if (GET_MODE_CLASS (mode) != MODE_INT
3457       || ! flag_trapv)
3458     result_unsignedp = 1;
3459
3460   temp = expand_abs_nojump (mode, op0, target, result_unsignedp);
3461   if (temp != 0)
3462     return temp;
3463
3464   /* If that does not win, use conditional jump and negate.  */
3465
3466   /* It is safe to use the target if it is the same
3467      as the source if this is also a pseudo register */
3468   if (op0 == target && REG_P (op0)
3469       && REGNO (op0) >= FIRST_PSEUDO_REGISTER)
3470     safe = 1;
3471
3472   op1 = gen_label_rtx ();
3473   if (target == 0 || ! safe
3474       || GET_MODE (target) != mode
3475       || (MEM_P (target) && MEM_VOLATILE_P (target))
3476       || (REG_P (target)
3477           && REGNO (target) < FIRST_PSEUDO_REGISTER))
3478     target = gen_reg_rtx (mode);
3479
3480   emit_move_insn (target, op0);
3481   NO_DEFER_POP;
3482
3483   do_compare_rtx_and_jump (target, CONST0_RTX (mode), GE, 0, mode,
3484                            NULL_RTX, NULL_RTX, op1, -1);
3485
3486   op0 = expand_unop (mode, result_unsignedp ? neg_optab : negv_optab,
3487                      target, target, 0);
3488   if (op0 != target)
3489     emit_move_insn (target, op0);
3490   emit_label (op1);
3491   OK_DEFER_POP;
3492   return target;
3493 }
3494
3495 /* Emit code to compute the one's complement absolute value of OP0
3496    (if (OP0 < 0) OP0 = ~OP0), with result to TARGET if convenient.
3497    (TARGET may be NULL_RTX.)  The return value says where the result
3498    actually is to be found.
3499
3500    MODE is the mode of the operand; the mode of the result is
3501    different but can be deduced from MODE.  */
3502
3503 rtx
3504 expand_one_cmpl_abs_nojump (enum machine_mode mode, rtx op0, rtx target)
3505 {
3506   rtx temp;
3507
3508   /* Not applicable for floating point modes.  */
3509   if (FLOAT_MODE_P (mode))
3510     return NULL_RTX;
3511
3512   /* If we have a MAX insn, we can do this as MAX (x, ~x).  */
3513   if (optab_handler (smax_optab, mode) != CODE_FOR_nothing)
3514     {
3515       rtx last = get_last_insn ();
3516
3517       temp = expand_unop (mode, one_cmpl_optab, op0, NULL_RTX, 0);
3518       if (temp != 0)
3519         temp = expand_binop (mode, smax_optab, op0, temp, target, 0,
3520                              OPTAB_WIDEN);
3521
3522       if (temp != 0)
3523         return temp;
3524
3525       delete_insns_since (last);
3526     }
3527
3528   /* If this machine has expensive jumps, we can do one's complement
3529      absolute value of X as (((signed) x >> (W-1)) ^ x).  */
3530
3531   if (GET_MODE_CLASS (mode) == MODE_INT
3532       && BRANCH_COST (optimize_insn_for_speed_p (),
3533                      false) >= 2)
3534     {
3535       rtx extended = expand_shift (RSHIFT_EXPR, mode, op0,
3536                                    GET_MODE_PRECISION (mode) - 1,
3537                                    NULL_RTX, 0);
3538
3539       temp = expand_binop (mode, xor_optab, extended, op0, target, 0,
3540                            OPTAB_LIB_WIDEN);
3541
3542       if (temp != 0)
3543         return temp;
3544     }
3545
3546   return NULL_RTX;
3547 }
3548
3549 /* A subroutine of expand_copysign, perform the copysign operation using the
3550    abs and neg primitives advertised to exist on the target.  The assumption
3551    is that we have a split register file, and leaving op0 in fp registers,
3552    and not playing with subregs so much, will help the register allocator.  */
3553
3554 static rtx
3555 expand_copysign_absneg (enum machine_mode mode, rtx op0, rtx op1, rtx target,
3556                         int bitpos, bool op0_is_abs)
3557 {
3558   enum machine_mode imode;
3559   enum insn_code icode;
3560   rtx sign, label;
3561
3562   if (target == op1)
3563     target = NULL_RTX;
3564
3565   /* Check if the back end provides an insn that handles signbit for the
3566      argument's mode. */
3567   icode = optab_handler (signbit_optab, mode);
3568   if (icode != CODE_FOR_nothing)
3569     {
3570       imode = insn_data[(int) icode].operand[0].mode;
3571       sign = gen_reg_rtx (imode);
3572       emit_unop_insn (icode, sign, op1, UNKNOWN);
3573     }
3574   else
3575     {
3576       if (GET_MODE_SIZE (mode) <= UNITS_PER_WORD)
3577         {
3578           imode = int_mode_for_mode (mode);
3579           if (imode == BLKmode)
3580             return NULL_RTX;
3581           op1 = gen_lowpart (imode, op1);
3582         }
3583       else
3584         {
3585           int word;
3586
3587           imode = word_mode;
3588           if (FLOAT_WORDS_BIG_ENDIAN)
3589             word = (GET_MODE_BITSIZE (mode) - bitpos) / BITS_PER_WORD;
3590           else
3591             word = bitpos / BITS_PER_WORD;
3592           bitpos = bitpos % BITS_PER_WORD;
3593           op1 = operand_subword_force (op1, word, mode);
3594         }
3595
3596       wide_int mask = wi::set_bit_in_zero (bitpos, GET_MODE_PRECISION (imode));
3597       sign = expand_binop (imode, and_optab, op1,
3598                            immed_wide_int_const (mask, imode),
3599                            NULL_RTX, 1, OPTAB_LIB_WIDEN);
3600     }
3601
3602   if (!op0_is_abs)
3603     {
3604       op0 = expand_unop (mode, abs_optab, op0, target, 0);
3605       if (op0 == NULL)
3606         return NULL_RTX;
3607       target = op0;
3608     }
3609   else
3610     {
3611       if (target == NULL_RTX)
3612         target = copy_to_reg (op0);
3613       else
3614         emit_move_insn (target, op0);
3615     }
3616
3617   label = gen_label_rtx ();
3618   emit_cmp_and_jump_insns (sign, const0_rtx, EQ, NULL_RTX, imode, 1, label);
3619
3620   if (CONST_DOUBLE_AS_FLOAT_P (op0))
3621     op0 = simplify_unary_operation (NEG, mode, op0, mode);
3622   else
3623     op0 = expand_unop (mode, neg_optab, op0, target, 0);
3624   if (op0 != target)
3625     emit_move_insn (target, op0);
3626
3627   emit_label (label);
3628
3629   return target;
3630 }
3631
3632
3633 /* A subroutine of expand_copysign, perform the entire copysign operation
3634    with integer bitmasks.  BITPOS is the position of the sign bit; OP0_IS_ABS
3635    is true if op0 is known to have its sign bit clear.  */
3636
3637 static rtx
3638 expand_copysign_bit (enum machine_mode mode, rtx op0, rtx op1, rtx target,
3639                      int bitpos, bool op0_is_abs)
3640 {
3641   enum machine_mode imode;
3642   int word, nwords, i;
3643   rtx temp, insns;
3644
3645   if (GET_MODE_SIZE (mode) <= UNITS_PER_WORD)
3646     {
3647       imode = int_mode_for_mode (mode);
3648       if (imode == BLKmode)
3649         return NULL_RTX;
3650       word = 0;
3651       nwords = 1;
3652     }
3653   else
3654     {
3655       imode = word_mode;
3656
3657       if (FLOAT_WORDS_BIG_ENDIAN)
3658         word = (GET_MODE_BITSIZE (mode) - bitpos) / BITS_PER_WORD;
3659       else
3660         word = bitpos / BITS_PER_WORD;
3661       bitpos = bitpos % BITS_PER_WORD;
3662       nwords = (GET_MODE_BITSIZE (mode) + BITS_PER_WORD - 1) / BITS_PER_WORD;
3663     }
3664
3665   wide_int mask = wi::set_bit_in_zero (bitpos, GET_MODE_PRECISION (imode));
3666
3667   if (target == 0
3668       || target == op0
3669       || target == op1
3670       || (nwords > 1 && !valid_multiword_target_p (target)))
3671     target = gen_reg_rtx (mode);
3672
3673   if (nwords > 1)
3674     {
3675       start_sequence ();
3676
3677       for (i = 0; i < nwords; ++i)
3678         {
3679           rtx targ_piece = operand_subword (target, i, 1, mode);
3680           rtx op0_piece = operand_subword_force (op0, i, mode);
3681
3682           if (i == word)
3683             {
3684               if (!op0_is_abs)
3685                 op0_piece
3686                   = expand_binop (imode, and_optab, op0_piece,
3687                                   immed_wide_int_const (~mask, imode),
3688                                   NULL_RTX, 1, OPTAB_LIB_WIDEN);
3689               op1 = expand_binop (imode, and_optab,
3690                                   operand_subword_force (op1, i, mode),
3691                                   immed_wide_int_const (mask, imode),
3692                                   NULL_RTX, 1, OPTAB_LIB_WIDEN);
3693
3694               temp = expand_binop (imode, ior_optab, op0_piece, op1,
3695                                    targ_piece, 1, OPTAB_LIB_WIDEN);
3696               if (temp != targ_piece)
3697                 emit_move_insn (targ_piece, temp);
3698             }
3699           else
3700             emit_move_insn (targ_piece, op0_piece);
3701         }
3702
3703       insns = get_insns ();
3704       end_sequence ();
3705
3706       emit_insn (insns);
3707     }
3708   else
3709     {
3710       op1 = expand_binop (imode, and_optab, gen_lowpart (imode, op1),
3711                           immed_wide_int_const (mask, imode),
3712                           NULL_RTX, 1, OPTAB_LIB_WIDEN);
3713
3714       op0 = gen_lowpart (imode, op0);
3715       if (!op0_is_abs)
3716         op0 = expand_binop (imode, and_optab, op0,
3717                             immed_wide_int_const (~mask, imode),
3718                             NULL_RTX, 1, OPTAB_LIB_WIDEN);
3719
3720       temp = expand_binop (imode, ior_optab, op0, op1,
3721                            gen_lowpart (imode, target), 1, OPTAB_LIB_WIDEN);
3722       target = lowpart_subreg_maybe_copy (mode, temp, imode);
3723     }
3724
3725   return target;
3726 }
3727
3728 /* Expand the C99 copysign operation.  OP0 and OP1 must be the same
3729    scalar floating point mode.  Return NULL if we do not know how to
3730    expand the operation inline.  */
3731
3732 rtx
3733 expand_copysign (rtx op0, rtx op1, rtx target)
3734 {
3735   enum machine_mode mode = GET_MODE (op0);
3736   const struct real_format *fmt;
3737   bool op0_is_abs;
3738   rtx temp;
3739
3740   gcc_assert (SCALAR_FLOAT_MODE_P (mode));
3741   gcc_assert (GET_MODE (op1) == mode);
3742
3743   /* First try to do it with a special instruction.  */
3744   temp = expand_binop (mode, copysign_optab, op0, op1,
3745                        target, 0, OPTAB_DIRECT);
3746   if (temp)
3747     return temp;
3748
3749   fmt = REAL_MODE_FORMAT (mode);
3750   if (fmt == NULL || !fmt->has_signed_zero)
3751     return NULL_RTX;
3752
3753   op0_is_abs = false;
3754   if (CONST_DOUBLE_AS_FLOAT_P (op0))
3755     {
3756       if (real_isneg (CONST_DOUBLE_REAL_VALUE (op0)))
3757         op0 = simplify_unary_operation (ABS, mode, op0, mode);
3758       op0_is_abs = true;
3759     }
3760
3761   if (fmt->signbit_ro >= 0
3762       && (CONST_DOUBLE_AS_FLOAT_P (op0)
3763           || (optab_handler (neg_optab, mode) != CODE_FOR_nothing
3764               && optab_handler (abs_optab, mode) != CODE_FOR_nothing)))
3765     {
3766       temp = expand_copysign_absneg (mode, op0, op1, target,
3767                                      fmt->signbit_ro, op0_is_abs);
3768       if (temp)
3769         return temp;
3770     }
3771
3772   if (fmt->signbit_rw < 0)
3773     return NULL_RTX;
3774   return expand_copysign_bit (mode, op0, op1, target,
3775                               fmt->signbit_rw, op0_is_abs);
3776 }
3777 \f
3778 /* Generate an instruction whose insn-code is INSN_CODE,
3779    with two operands: an output TARGET and an input OP0.
3780    TARGET *must* be nonzero, and the output is always stored there.
3781    CODE is an rtx code such that (CODE OP0) is an rtx that describes
3782    the value that is stored into TARGET.
3783
3784    Return false if expansion failed.  */
3785
3786 bool
3787 maybe_emit_unop_insn (enum insn_code icode, rtx target, rtx op0,
3788                       enum rtx_code code)
3789 {
3790   struct expand_operand ops[2];
3791   rtx pat;
3792
3793   create_output_operand (&ops[0], target, GET_MODE (target));
3794   create_input_operand (&ops[1], op0, GET_MODE (op0));
3795   pat = maybe_gen_insn (icode, 2, ops);
3796   if (!pat)
3797     return false;
3798
3799   if (INSN_P (pat) && NEXT_INSN (pat) != NULL_RTX && code != UNKNOWN)
3800     add_equal_note (pat, ops[0].value, code, ops[1].value, NULL_RTX);
3801
3802   emit_insn (pat);
3803
3804   if (ops[0].value != target)
3805     emit_move_insn (target, ops[0].value);
3806   return true;
3807 }
3808 /* Generate an instruction whose insn-code is INSN_CODE,
3809    with two operands: an output TARGET and an input OP0.
3810    TARGET *must* be nonzero, and the output is always stored there.
3811    CODE is an rtx code such that (CODE OP0) is an rtx that describes
3812    the value that is stored into TARGET.  */
3813
3814 void
3815 emit_unop_insn (enum insn_code icode, rtx target, rtx op0, enum rtx_code code)
3816 {
3817   bool ok = maybe_emit_unop_insn (icode, target, op0, code);
3818   gcc_assert (ok);
3819 }
3820 \f
3821 struct no_conflict_data
3822 {
3823   rtx target, first, insn;
3824   bool must_stay;
3825 };
3826
3827 /* Called via note_stores by emit_libcall_block.  Set P->must_stay if
3828    the currently examined clobber / store has to stay in the list of
3829    insns that constitute the actual libcall block.  */
3830 static void
3831 no_conflict_move_test (rtx dest, const_rtx set, void *p0)
3832 {
3833   struct no_conflict_data *p= (struct no_conflict_data *) p0;
3834
3835   /* If this inns directly contributes to setting the target, it must stay.  */
3836   if (reg_overlap_mentioned_p (p->target, dest))
3837     p->must_stay = true;
3838   /* If we haven't committed to keeping any other insns in the list yet,
3839      there is nothing more to check.  */
3840   else if (p->insn == p->first)
3841     return;
3842   /* If this insn sets / clobbers a register that feeds one of the insns
3843      already in the list, this insn has to stay too.  */
3844   else if (reg_overlap_mentioned_p (dest, PATTERN (p->first))
3845            || (CALL_P (p->first) && (find_reg_fusage (p->first, USE, dest)))
3846            || reg_used_between_p (dest, p->first, p->insn)
3847            /* Likewise if this insn depends on a register set by a previous
3848               insn in the list, or if it sets a result (presumably a hard
3849               register) that is set or clobbered by a previous insn.
3850               N.B. the modified_*_p (SET_DEST...) tests applied to a MEM
3851               SET_DEST perform the former check on the address, and the latter
3852               check on the MEM.  */
3853            || (GET_CODE (set) == SET
3854                && (modified_in_p (SET_SRC (set), p->first)
3855                    || modified_in_p (SET_DEST (set), p->first)
3856                    || modified_between_p (SET_SRC (set), p->first, p->insn)
3857                    || modified_between_p (SET_DEST (set), p->first, p->insn))))
3858     p->must_stay = true;
3859 }
3860
3861 \f
3862 /* Emit code to make a call to a constant function or a library call.
3863
3864    INSNS is a list containing all insns emitted in the call.
3865    These insns leave the result in RESULT.  Our block is to copy RESULT
3866    to TARGET, which is logically equivalent to EQUIV.
3867
3868    We first emit any insns that set a pseudo on the assumption that these are
3869    loading constants into registers; doing so allows them to be safely cse'ed
3870    between blocks.  Then we emit all the other insns in the block, followed by
3871    an insn to move RESULT to TARGET.  This last insn will have a REQ_EQUAL
3872    note with an operand of EQUIV.  */
3873
3874 static void
3875 emit_libcall_block_1 (rtx insns, rtx target, rtx result, rtx equiv,
3876                       bool equiv_may_trap)
3877 {
3878   rtx final_dest = target;
3879   rtx next, last, insn;
3880
3881   /* If this is a reg with REG_USERVAR_P set, then it could possibly turn
3882      into a MEM later.  Protect the libcall block from this change.  */
3883   if (! REG_P (target) || REG_USERVAR_P (target))
3884     target = gen_reg_rtx (GET_MODE (target));
3885
3886   /* If we're using non-call exceptions, a libcall corresponding to an
3887      operation that may trap may also trap.  */
3888   /* ??? See the comment in front of make_reg_eh_region_note.  */
3889   if (cfun->can_throw_non_call_exceptions
3890       && (equiv_may_trap || may_trap_p (equiv)))
3891     {
3892       for (insn = insns; insn; insn = NEXT_INSN (insn))
3893         if (CALL_P (insn))
3894           {
3895             rtx note = find_reg_note (insn, REG_EH_REGION, NULL_RTX);
3896             if (note)
3897               {
3898                 int lp_nr = INTVAL (XEXP (note, 0));
3899                 if (lp_nr == 0 || lp_nr == INT_MIN)
3900                   remove_note (insn, note);
3901               }
3902           }
3903     }
3904   else
3905     {
3906       /* Look for any CALL_INSNs in this sequence, and attach a REG_EH_REGION
3907          reg note to indicate that this call cannot throw or execute a nonlocal
3908          goto (unless there is already a REG_EH_REGION note, in which case
3909          we update it).  */
3910       for (insn = insns; insn; insn = NEXT_INSN (insn))
3911         if (CALL_P (insn))
3912           make_reg_eh_region_note_nothrow_nononlocal (insn);
3913     }
3914
3915   /* First emit all insns that set pseudos.  Remove them from the list as
3916      we go.  Avoid insns that set pseudos which were referenced in previous
3917      insns.  These can be generated by move_by_pieces, for example,
3918      to update an address.  Similarly, avoid insns that reference things
3919      set in previous insns.  */
3920
3921   for (insn = insns; insn; insn = next)
3922     {
3923       rtx set = single_set (insn);
3924
3925       next = NEXT_INSN (insn);
3926
3927       if (set != 0 && REG_P (SET_DEST (set))
3928           && REGNO (SET_DEST (set)) >= FIRST_PSEUDO_REGISTER)
3929         {
3930           struct no_conflict_data data;
3931
3932           data.target = const0_rtx;
3933           data.first = insns;
3934           data.insn = insn;
3935           data.must_stay = 0;
3936           note_stores (PATTERN (insn), no_conflict_move_test, &data);
3937           if (! data.must_stay)
3938             {
3939               if (PREV_INSN (insn))
3940                 NEXT_INSN (PREV_INSN (insn)) = next;
3941               else
3942                 insns = next;
3943
3944               if (next)
3945                 PREV_INSN (next) = PREV_INSN (insn);
3946
3947               add_insn (insn);
3948             }
3949         }
3950
3951       /* Some ports use a loop to copy large arguments onto the stack.
3952          Don't move anything outside such a loop.  */
3953       if (LABEL_P (insn))
3954         break;
3955     }
3956
3957   /* Write the remaining insns followed by the final copy.  */
3958   for (insn = insns; insn; insn = next)
3959     {
3960       next = NEXT_INSN (insn);
3961
3962       add_insn (insn);
3963     }
3964
3965   last = emit_move_insn (target, result);
3966   set_dst_reg_note (last, REG_EQUAL, copy_rtx (equiv), target);
3967
3968   if (final_dest != target)
3969     emit_move_insn (final_dest, target);
3970 }
3971
3972 void
3973 emit_libcall_block (rtx insns, rtx target, rtx result, rtx equiv)
3974 {
3975   emit_libcall_block_1 (insns, target, result, equiv, false);
3976 }
3977 \f
3978 /* Nonzero if we can perform a comparison of mode MODE straightforwardly.
3979    PURPOSE describes how this comparison will be used.  CODE is the rtx
3980    comparison code we will be using.
3981
3982    ??? Actually, CODE is slightly weaker than that.  A target is still
3983    required to implement all of the normal bcc operations, but not
3984    required to implement all (or any) of the unordered bcc operations.  */
3985
3986 int
3987 can_compare_p (enum rtx_code code, enum machine_mode mode,
3988                enum can_compare_purpose purpose)
3989 {
3990   rtx test;
3991   test = gen_rtx_fmt_ee (code, mode, const0_rtx, const0_rtx);
3992   do
3993     {
3994       enum insn_code icode;
3995
3996       if (purpose == ccp_jump
3997           && (icode = optab_handler (cbranch_optab, mode)) != CODE_FOR_nothing
3998           && insn_operand_matches (icode, 0, test))
3999         return 1;
4000       if (purpose == ccp_store_flag
4001           && (icode = optab_handler (cstore_optab, mode)) != CODE_FOR_nothing
4002           && insn_operand_matches (icode, 1, test))
4003         return 1;
4004       if (purpose == ccp_cmov
4005           && optab_handler (cmov_optab, mode) != CODE_FOR_nothing)
4006         return 1;
4007
4008       mode = GET_MODE_WIDER_MODE (mode);
4009       PUT_MODE (test, mode);
4010     }
4011   while (mode != VOIDmode);
4012
4013   return 0;
4014 }
4015
4016 /* This function is called when we are going to emit a compare instruction that
4017    compares the values found in *PX and *PY, using the rtl operator COMPARISON.
4018
4019    *PMODE is the mode of the inputs (in case they are const_int).
4020    *PUNSIGNEDP nonzero says that the operands are unsigned;
4021    this matters if they need to be widened (as given by METHODS).
4022
4023    If they have mode BLKmode, then SIZE specifies the size of both operands.
4024
4025    This function performs all the setup necessary so that the caller only has
4026    to emit a single comparison insn.  This setup can involve doing a BLKmode
4027    comparison or emitting a library call to perform the comparison if no insn
4028    is available to handle it.
4029    The values which are passed in through pointers can be modified; the caller
4030    should perform the comparison on the modified values.  Constant
4031    comparisons must have already been folded.  */
4032
4033 static void
4034 prepare_cmp_insn (rtx x, rtx y, enum rtx_code comparison, rtx size,
4035                   int unsignedp, enum optab_methods methods,
4036                   rtx *ptest, enum machine_mode *pmode)
4037 {
4038   enum machine_mode mode = *pmode;
4039   rtx libfunc, test;
4040   enum machine_mode cmp_mode;
4041   enum mode_class mclass;
4042
4043   /* The other methods are not needed.  */
4044   gcc_assert (methods == OPTAB_DIRECT || methods == OPTAB_WIDEN
4045               || methods == OPTAB_LIB_WIDEN);
4046
4047   /* If we are optimizing, force expensive constants into a register.  */
4048   if (CONSTANT_P (x) && optimize
4049       && (rtx_cost (x, COMPARE, 0, optimize_insn_for_speed_p ())
4050           > COSTS_N_INSNS (1)))
4051     x = force_reg (mode, x);
4052
4053   if (CONSTANT_P (y) && optimize
4054       && (rtx_cost (y, COMPARE, 1, optimize_insn_for_speed_p ())
4055           > COSTS_N_INSNS (1)))
4056     y = force_reg (mode, y);
4057
4058 #ifdef HAVE_cc0
4059   /* Make sure if we have a canonical comparison.  The RTL
4060      documentation states that canonical comparisons are required only
4061      for targets which have cc0.  */
4062   gcc_assert (!CONSTANT_P (x) || CONSTANT_P (y));
4063 #endif
4064
4065   /* Don't let both operands fail to indicate the mode.  */
4066   if (GET_MODE (x) == VOIDmode && GET_MODE (y) == VOIDmode)
4067     x = force_reg (mode, x);
4068   if (mode == VOIDmode)
4069     mode = GET_MODE (x) != VOIDmode ? GET_MODE (x) : GET_MODE (y);
4070
4071   /* Handle all BLKmode compares.  */
4072
4073   if (mode == BLKmode)
4074     {
4075       enum machine_mode result_mode;
4076       enum insn_code cmp_code;
4077       tree length_type;
4078       rtx libfunc;
4079       rtx result;
4080       rtx opalign
4081         = GEN_INT (MIN (MEM_ALIGN (x), MEM_ALIGN (y)) / BITS_PER_UNIT);
4082
4083       gcc_assert (size);
4084
4085       /* Try to use a memory block compare insn - either cmpstr
4086          or cmpmem will do.  */
4087       for (cmp_mode = GET_CLASS_NARROWEST_MODE (MODE_INT);
4088            cmp_mode != VOIDmode;
4089            cmp_mode = GET_MODE_WIDER_MODE (cmp_mode))
4090         {
4091           cmp_code = direct_optab_handler (cmpmem_optab, cmp_mode);
4092           if (cmp_code == CODE_FOR_nothing)
4093             cmp_code = direct_optab_handler (cmpstr_optab, cmp_mode);
4094           if (cmp_code == CODE_FOR_nothing)
4095             cmp_code = direct_optab_handler (cmpstrn_optab, cmp_mode);
4096           if (cmp_code == CODE_FOR_nothing)
4097             continue;
4098
4099           /* Must make sure the size fits the insn's mode.  */
4100           if ((CONST_INT_P (size)
4101                && INTVAL (size) >= (1 << GET_MODE_BITSIZE (cmp_mode)))
4102               || (GET_MODE_BITSIZE (GET_MODE (size))
4103                   > GET_MODE_BITSIZE (cmp_mode)))
4104             continue;
4105
4106           result_mode = insn_data[cmp_code].operand[0].mode;
4107           result = gen_reg_rtx (result_mode);
4108           size = convert_to_mode (cmp_mode, size, 1);
4109           emit_insn (GEN_FCN (cmp_code) (result, x, y, size, opalign));
4110
4111           *ptest = gen_rtx_fmt_ee (comparison, VOIDmode, result, const0_rtx);
4112           *pmode = result_mode;
4113           return;
4114         }
4115
4116       if (methods != OPTAB_LIB && methods != OPTAB_LIB_WIDEN)
4117         goto fail;
4118
4119       /* Otherwise call a library function, memcmp.  */
4120       libfunc = memcmp_libfunc;
4121       length_type = sizetype;
4122       result_mode = TYPE_MODE (integer_type_node);
4123       cmp_mode = TYPE_MODE (length_type);
4124       size = convert_to_mode (TYPE_MODE (length_type), size,
4125                               TYPE_UNSIGNED (length_type));
4126
4127       result = emit_library_call_value (libfunc, 0, LCT_PURE,
4128                                         result_mode, 3,
4129                                         XEXP (x, 0), Pmode,
4130                                         XEXP (y, 0), Pmode,
4131                                         size, cmp_mode);
4132       x = result;
4133       y = const0_rtx;
4134       mode = result_mode;
4135       methods = OPTAB_LIB_WIDEN;
4136       unsignedp = false;
4137     }
4138
4139   /* Don't allow operands to the compare to trap, as that can put the
4140      compare and branch in different basic blocks.  */
4141   if (cfun->can_throw_non_call_exceptions)
4142     {
4143       if (may_trap_p (x))
4144         x = force_reg (mode, x);
4145       if (may_trap_p (y))
4146         y = force_reg (mode, y);
4147     }
4148
4149   if (GET_MODE_CLASS (mode) == MODE_CC)
4150     {
4151       gcc_assert (can_compare_p (comparison, CCmode, ccp_jump));
4152       *ptest = gen_rtx_fmt_ee (comparison, VOIDmode, x, y);
4153       return;
4154     }
4155
4156   mclass = GET_MODE_CLASS (mode);
4157   test = gen_rtx_fmt_ee (comparison, VOIDmode, x, y);
4158   cmp_mode = mode;
4159   do
4160    {
4161       enum insn_code icode;
4162       icode = optab_handler (cbranch_optab, cmp_mode);
4163       if (icode != CODE_FOR_nothing
4164           && insn_operand_matches (icode, 0, test))
4165         {
4166           rtx last = get_last_insn ();
4167           rtx op0 = prepare_operand (icode, x, 1, mode, cmp_mode, unsignedp);
4168           rtx op1 = prepare_operand (icode, y, 2, mode, cmp_mode, unsignedp);
4169           if (op0 && op1
4170               && insn_operand_matches (icode, 1, op0)
4171               && insn_operand_matches (icode, 2, op1))
4172             {
4173               XEXP (test, 0) = op0;
4174               XEXP (test, 1) = op1;
4175               *ptest = test;
4176               *pmode = cmp_mode;
4177               return;
4178             }
4179           delete_insns_since (last);
4180         }
4181
4182       if (methods == OPTAB_DIRECT || !CLASS_HAS_WIDER_MODES_P (mclass))
4183         break;
4184       cmp_mode = GET_MODE_WIDER_MODE (cmp_mode);
4185     }
4186   while (cmp_mode != VOIDmode);
4187
4188   if (methods != OPTAB_LIB_WIDEN)
4189     goto fail;
4190
4191   if (!SCALAR_FLOAT_MODE_P (mode))
4192     {
4193       rtx result;
4194       enum machine_mode ret_mode;
4195
4196       /* Handle a libcall just for the mode we are using.  */
4197       libfunc = optab_libfunc (cmp_optab, mode);
4198       gcc_assert (libfunc);
4199
4200       /* If we want unsigned, and this mode has a distinct unsigned
4201          comparison routine, use that.  */
4202       if (unsignedp)
4203         {
4204           rtx ulibfunc = optab_libfunc (ucmp_optab, mode);
4205           if (ulibfunc)
4206             libfunc = ulibfunc;
4207         }
4208
4209       ret_mode = targetm.libgcc_cmp_return_mode ();
4210       result = emit_library_call_value (libfunc, NULL_RTX, LCT_CONST,
4211                                         ret_mode, 2, x, mode, y, mode);
4212
4213       /* There are two kinds of comparison routines. Biased routines
4214          return 0/1/2, and unbiased routines return -1/0/1. Other parts
4215          of gcc expect that the comparison operation is equivalent
4216          to the modified comparison. For signed comparisons compare the
4217          result against 1 in the biased case, and zero in the unbiased
4218          case. For unsigned comparisons always compare against 1 after
4219          biasing the unbiased result by adding 1. This gives us a way to
4220          represent LTU.
4221          The comparisons in the fixed-point helper library are always
4222          biased.  */
4223       x = result;
4224       y = const1_rtx;
4225
4226       if (!TARGET_LIB_INT_CMP_BIASED && !ALL_FIXED_POINT_MODE_P (mode))
4227         {
4228           if (unsignedp)
4229             x = plus_constant (ret_mode, result, 1);
4230           else
4231             y = const0_rtx;
4232         }
4233
4234       *pmode = word_mode;
4235       prepare_cmp_insn (x, y, comparison, NULL_RTX, unsignedp, methods,
4236                         ptest, pmode);
4237     }
4238   else
4239     prepare_float_lib_cmp (x, y, comparison, ptest, pmode);
4240
4241   return;
4242
4243  fail:
4244   *ptest = NULL_RTX;
4245 }
4246
4247 /* Before emitting an insn with code ICODE, make sure that X, which is going
4248    to be used for operand OPNUM of the insn, is converted from mode MODE to
4249    WIDER_MODE (UNSIGNEDP determines whether it is an unsigned conversion), and
4250    that it is accepted by the operand predicate.  Return the new value.  */
4251
4252 rtx
4253 prepare_operand (enum insn_code icode, rtx x, int opnum, enum machine_mode mode,
4254                  enum machine_mode wider_mode, int unsignedp)
4255 {
4256   if (mode != wider_mode)
4257     x = convert_modes (wider_mode, mode, x, unsignedp);
4258
4259   if (!insn_operand_matches (icode, opnum, x))
4260     {
4261       if (reload_completed)
4262         return NULL_RTX;
4263       x = copy_to_mode_reg (insn_data[(int) icode].operand[opnum].mode, x);
4264     }
4265
4266   return x;
4267 }
4268
4269 /* Subroutine of emit_cmp_and_jump_insns; this function is called when we know
4270    we can do the branch.  */
4271
4272 static void
4273 emit_cmp_and_jump_insn_1 (rtx test, enum machine_mode mode, rtx label, int prob)
4274 {
4275   enum machine_mode optab_mode;
4276   enum mode_class mclass;
4277   enum insn_code icode;
4278   rtx insn;
4279
4280   mclass = GET_MODE_CLASS (mode);
4281   optab_mode = (mclass == MODE_CC) ? CCmode : mode;
4282   icode = optab_handler (cbranch_optab, optab_mode);
4283
4284   gcc_assert (icode != CODE_FOR_nothing);
4285   gcc_assert (insn_operand_matches (icode, 0, test));
4286   insn = emit_jump_insn (GEN_FCN (icode) (test, XEXP (test, 0),
4287                                           XEXP (test, 1), label));
4288   if (prob != -1
4289       && profile_status_for_fn (cfun) != PROFILE_ABSENT
4290       && insn
4291       && JUMP_P (insn)
4292       && any_condjump_p (insn)
4293       && !find_reg_note (insn, REG_BR_PROB, 0))
4294     add_int_reg_note (insn, REG_BR_PROB, prob);
4295 }
4296
4297 /* Generate code to compare X with Y so that the condition codes are
4298    set and to jump to LABEL if the condition is true.  If X is a
4299    constant and Y is not a constant, then the comparison is swapped to
4300    ensure that the comparison RTL has the canonical form.
4301
4302    UNSIGNEDP nonzero says that X and Y are unsigned; this matters if they
4303    need to be widened.  UNSIGNEDP is also used to select the proper
4304    branch condition code.
4305
4306    If X and Y have mode BLKmode, then SIZE specifies the size of both X and Y.
4307
4308    MODE is the mode of the inputs (in case they are const_int).
4309
4310    COMPARISON is the rtl operator to compare with (EQ, NE, GT, etc.).
4311    It will be potentially converted into an unsigned variant based on
4312    UNSIGNEDP to select a proper jump instruction.
4313
4314    PROB is the probability of jumping to LABEL.  */
4315
4316 void
4317 emit_cmp_and_jump_insns (rtx x, rtx y, enum rtx_code comparison, rtx size,
4318                          enum machine_mode mode, int unsignedp, rtx label,
4319                          int prob)
4320 {
4321   rtx op0 = x, op1 = y;
4322   rtx test;
4323
4324   /* Swap operands and condition to ensure canonical RTL.  */
4325   if (swap_commutative_operands_p (x, y)
4326       && can_compare_p (swap_condition (comparison), mode, ccp_jump))
4327     {
4328       op0 = y, op1 = x;
4329       comparison = swap_condition (comparison);
4330     }
4331
4332   /* If OP0 is still a constant, then both X and Y must be constants
4333      or the opposite comparison is not supported.  Force X into a register
4334      to create canonical RTL.  */
4335   if (CONSTANT_P (op0))
4336     op0 = force_reg (mode, op0);
4337
4338   if (unsignedp)
4339     comparison = unsigned_condition (comparison);
4340
4341   prepare_cmp_insn (op0, op1, comparison, size, unsignedp, OPTAB_LIB_WIDEN,
4342                     &test, &mode);
4343   emit_cmp_and_jump_insn_1 (test, mode, label, prob);
4344 }
4345
4346 \f
4347 /* Emit a library call comparison between floating point X and Y.
4348    COMPARISON is the rtl operator to compare with (EQ, NE, GT, etc.).  */
4349
4350 static void
4351 prepare_float_lib_cmp (rtx x, rtx y, enum rtx_code comparison,
4352                        rtx *ptest, enum machine_mode *pmode)
4353 {
4354   enum rtx_code swapped = swap_condition (comparison);
4355   enum rtx_code reversed = reverse_condition_maybe_unordered (comparison);
4356   enum machine_mode orig_mode = GET_MODE (x);
4357   enum machine_mode mode, cmp_mode;
4358   rtx true_rtx, false_rtx;
4359   rtx value, target, insns, equiv;
4360   rtx libfunc = 0;
4361   bool reversed_p = false;
4362   cmp_mode = targetm.libgcc_cmp_return_mode ();
4363
4364   for (mode = orig_mode;
4365        mode != VOIDmode;
4366        mode = GET_MODE_WIDER_MODE (mode))
4367     {
4368       if (code_to_optab (comparison)
4369           && (libfunc = optab_libfunc (code_to_optab (comparison), mode)))
4370         break;
4371
4372       if (code_to_optab (swapped)
4373           && (libfunc = optab_libfunc (code_to_optab (swapped), mode)))
4374         {
4375           rtx tmp;
4376           tmp = x; x = y; y = tmp;
4377           comparison = swapped;
4378           break;
4379         }
4380
4381       if (code_to_optab (reversed)
4382           && (libfunc = optab_libfunc (code_to_optab (reversed), mode)))
4383         {
4384           comparison = reversed;
4385           reversed_p = true;
4386           break;
4387         }
4388     }
4389
4390   gcc_assert (mode != VOIDmode);
4391
4392   if (mode != orig_mode)
4393     {
4394       x = convert_to_mode (mode, x, 0);
4395       y = convert_to_mode (mode, y, 0);
4396     }
4397
4398   /* Attach a REG_EQUAL note describing the semantics of the libcall to
4399      the RTL.  The allows the RTL optimizers to delete the libcall if the
4400      condition can be determined at compile-time.  */
4401   if (comparison == UNORDERED
4402       || FLOAT_LIB_COMPARE_RETURNS_BOOL (mode, comparison))
4403     {
4404       true_rtx = const_true_rtx;
4405       false_rtx = const0_rtx;
4406     }
4407   else
4408     {
4409       switch (comparison)
4410         {
4411         case EQ:
4412           true_rtx = const0_rtx;
4413           false_rtx = const_true_rtx;
4414           break;
4415
4416         case NE:
4417           true_rtx = const_true_rtx;
4418           false_rtx = const0_rtx;
4419           break;
4420
4421         case GT:
4422           true_rtx = const1_rtx;
4423           false_rtx = const0_rtx;
4424           break;
4425
4426         case GE:
4427           true_rtx = const0_rtx;
4428           false_rtx = constm1_rtx;
4429           break;
4430
4431         case LT:
4432           true_rtx = constm1_rtx;
4433           false_rtx = const0_rtx;
4434           break;
4435
4436         case LE:
4437           true_rtx = const0_rtx;
4438           false_rtx = const1_rtx;
4439           break;
4440
4441         default:
4442           gcc_unreachable ();
4443         }
4444     }
4445
4446   if (comparison == UNORDERED)
4447     {
4448       rtx temp = simplify_gen_relational (NE, cmp_mode, mode, x, x);
4449       equiv = simplify_gen_relational (NE, cmp_mode, mode, y, y);
4450       equiv = simplify_gen_ternary (IF_THEN_ELSE, cmp_mode, cmp_mode,
4451                                     temp, const_true_rtx, equiv);
4452     }
4453   else
4454     {
4455       equiv = simplify_gen_relational (comparison, cmp_mode, mode, x, y);
4456       if (! FLOAT_LIB_COMPARE_RETURNS_BOOL (mode, comparison))
4457         equiv = simplify_gen_ternary (IF_THEN_ELSE, cmp_mode, cmp_mode,
4458                                       equiv, true_rtx, false_rtx);
4459     }
4460
4461   start_sequence ();
4462   value = emit_library_call_value (libfunc, NULL_RTX, LCT_CONST,
4463                                    cmp_mode, 2, x, mode, y, mode);
4464   insns = get_insns ();
4465   end_sequence ();
4466
4467   target = gen_reg_rtx (cmp_mode);
4468   emit_libcall_block (insns, target, value, equiv);
4469
4470   if (comparison == UNORDERED
4471       || FLOAT_LIB_COMPARE_RETURNS_BOOL (mode, comparison)
4472       || reversed_p)
4473     *ptest = gen_rtx_fmt_ee (reversed_p ? EQ : NE, VOIDmode, target, false_rtx);
4474   else
4475     *ptest = gen_rtx_fmt_ee (comparison, VOIDmode, target, const0_rtx);
4476
4477   *pmode = cmp_mode;
4478 }
4479 \f
4480 /* Generate code to indirectly jump to a location given in the rtx LOC.  */
4481
4482 void
4483 emit_indirect_jump (rtx loc)
4484 {
4485   struct expand_operand ops[1];
4486
4487   create_address_operand (&ops[0], loc);
4488   expand_jump_insn (CODE_FOR_indirect_jump, 1, ops);
4489   emit_barrier ();
4490 }
4491 \f
4492 #ifdef HAVE_conditional_move
4493
4494 /* Emit a conditional move instruction if the machine supports one for that
4495    condition and machine mode.
4496
4497    OP0 and OP1 are the operands that should be compared using CODE.  CMODE is
4498    the mode to use should they be constants.  If it is VOIDmode, they cannot
4499    both be constants.
4500
4501    OP2 should be stored in TARGET if the comparison is true, otherwise OP3
4502    should be stored there.  MODE is the mode to use should they be constants.
4503    If it is VOIDmode, they cannot both be constants.
4504
4505    The result is either TARGET (perhaps modified) or NULL_RTX if the operation
4506    is not supported.  */
4507
4508 rtx
4509 emit_conditional_move (rtx target, enum rtx_code code, rtx op0, rtx op1,
4510                        enum machine_mode cmode, rtx op2, rtx op3,
4511                        enum machine_mode mode, int unsignedp)
4512 {
4513   rtx tem, comparison, last;
4514   enum insn_code icode;
4515   enum rtx_code reversed;
4516
4517   /* If one operand is constant, make it the second one.  Only do this
4518      if the other operand is not constant as well.  */
4519
4520   if (swap_commutative_operands_p (op0, op1))
4521     {
4522       tem = op0;
4523       op0 = op1;
4524       op1 = tem;
4525       code = swap_condition (code);
4526     }
4527
4528   /* get_condition will prefer to generate LT and GT even if the old
4529      comparison was against zero, so undo that canonicalization here since
4530      comparisons against zero are cheaper.  */
4531   if (code == LT && op1 == const1_rtx)
4532     code = LE, op1 = const0_rtx;
4533   else if (code == GT && op1 == constm1_rtx)
4534     code = GE, op1 = const0_rtx;
4535
4536   if (cmode == VOIDmode)
4537     cmode = GET_MODE (op0);
4538
4539   if (swap_commutative_operands_p (op2, op3)
4540       && ((reversed = reversed_comparison_code_parts (code, op0, op1, NULL))
4541           != UNKNOWN))
4542     {
4543       tem = op2;
4544       op2 = op3;
4545       op3 = tem;
4546       code = reversed;
4547     }
4548
4549   if (mode == VOIDmode)
4550     mode = GET_MODE (op2);
4551
4552   icode = direct_optab_handler (movcc_optab, mode);
4553
4554   if (icode == CODE_FOR_nothing)
4555     return 0;
4556
4557   if (!target)
4558     target = gen_reg_rtx (mode);
4559
4560   code = unsignedp ? unsigned_condition (code) : code;
4561   comparison = simplify_gen_relational (code, VOIDmode, cmode, op0, op1);
4562
4563   /* We can get const0_rtx or const_true_rtx in some circumstances.  Just
4564      return NULL and let the caller figure out how best to deal with this
4565      situation.  */
4566   if (!COMPARISON_P (comparison))
4567     return NULL_RTX;
4568
4569   saved_pending_stack_adjust save;
4570   save_pending_stack_adjust (&save);
4571   last = get_last_insn ();
4572   do_pending_stack_adjust ();
4573   prepare_cmp_insn (XEXP (comparison, 0), XEXP (comparison, 1),
4574                     GET_CODE (comparison), NULL_RTX, unsignedp, OPTAB_WIDEN,
4575                     &comparison, &cmode);
4576   if (comparison)
4577     {
4578       struct expand_operand ops[4];
4579
4580       create_output_operand (&ops[0], target, mode);
4581       create_fixed_operand (&ops[1], comparison);
4582       create_input_operand (&ops[2], op2, mode);
4583       create_input_operand (&ops[3], op3, mode);
4584       if (maybe_expand_insn (icode, 4, ops))
4585         {
4586           if (ops[0].value != target)
4587             convert_move (target, ops[0].value, false);
4588           return target;
4589         }
4590     }
4591   delete_insns_since (last);
4592   restore_pending_stack_adjust (&save);
4593   return NULL_RTX;
4594 }
4595
4596 /* Return nonzero if a conditional move of mode MODE is supported.
4597
4598    This function is for combine so it can tell whether an insn that looks
4599    like a conditional move is actually supported by the hardware.  If we
4600    guess wrong we lose a bit on optimization, but that's it.  */
4601 /* ??? sparc64 supports conditionally moving integers values based on fp
4602    comparisons, and vice versa.  How do we handle them?  */
4603
4604 int
4605 can_conditionally_move_p (enum machine_mode mode)
4606 {
4607   if (direct_optab_handler (movcc_optab, mode) != CODE_FOR_nothing)
4608     return 1;
4609
4610   return 0;
4611 }
4612
4613 #endif /* HAVE_conditional_move */
4614
4615 /* Emit a conditional addition instruction if the machine supports one for that
4616    condition and machine mode.
4617
4618    OP0 and OP1 are the operands that should be compared using CODE.  CMODE is
4619    the mode to use should they be constants.  If it is VOIDmode, they cannot
4620    both be constants.
4621
4622    OP2 should be stored in TARGET if the comparison is false, otherwise OP2+OP3
4623    should be stored there.  MODE is the mode to use should they be constants.
4624    If it is VOIDmode, they cannot both be constants.
4625
4626    The result is either TARGET (perhaps modified) or NULL_RTX if the operation
4627    is not supported.  */
4628
4629 rtx
4630 emit_conditional_add (rtx target, enum rtx_code code, rtx op0, rtx op1,
4631                       enum machine_mode cmode, rtx op2, rtx op3,
4632                       enum machine_mode mode, int unsignedp)
4633 {
4634   rtx tem, comparison, last;
4635   enum insn_code icode;
4636
4637   /* If one operand is constant, make it the second one.  Only do this
4638      if the other operand is not constant as well.  */
4639
4640   if (swap_commutative_operands_p (op0, op1))
4641     {
4642       tem = op0;
4643       op0 = op1;
4644       op1 = tem;
4645       code = swap_condition (code);
4646     }
4647
4648   /* get_condition will prefer to generate LT and GT even if the old
4649      comparison was against zero, so undo that canonicalization here since
4650      comparisons against zero are cheaper.  */
4651   if (code == LT && op1 == const1_rtx)
4652     code = LE, op1 = const0_rtx;
4653   else if (code == GT && op1 == constm1_rtx)
4654     code = GE, op1 = const0_rtx;
4655
4656   if (cmode == VOIDmode)
4657     cmode = GET_MODE (op0);
4658
4659   if (mode == VOIDmode)
4660     mode = GET_MODE (op2);
4661
4662   icode = optab_handler (addcc_optab, mode);
4663
4664   if (icode == CODE_FOR_nothing)
4665     return 0;
4666
4667   if (!target)
4668     target = gen_reg_rtx (mode);
4669
4670   code = unsignedp ? unsigned_condition (code) : code;
4671   comparison = simplify_gen_relational (code, VOIDmode, cmode, op0, op1);
4672
4673   /* We can get const0_rtx or const_true_rtx in some circumstances.  Just
4674      return NULL and let the caller figure out how best to deal with this
4675      situation.  */
4676   if (!COMPARISON_P (comparison))
4677     return NULL_RTX;
4678
4679   do_pending_stack_adjust ();
4680   last = get_last_insn ();
4681   prepare_cmp_insn (XEXP (comparison, 0), XEXP (comparison, 1),
4682                     GET_CODE (comparison), NULL_RTX, unsignedp, OPTAB_WIDEN,
4683                     &comparison, &cmode);
4684   if (comparison)
4685     {
4686       struct expand_operand ops[4];
4687
4688       create_output_operand (&ops[0], target, mode);
4689       create_fixed_operand (&ops[1], comparison);
4690       create_input_operand (&ops[2], op2, mode);
4691       create_input_operand (&ops[3], op3, mode);
4692       if (maybe_expand_insn (icode, 4, ops))
4693         {
4694           if (ops[0].value != target)
4695             convert_move (target, ops[0].value, false);
4696           return target;
4697         }
4698     }
4699   delete_insns_since (last);
4700   return NULL_RTX;
4701 }
4702 \f
4703 /* These functions attempt to generate an insn body, rather than
4704    emitting the insn, but if the gen function already emits them, we
4705    make no attempt to turn them back into naked patterns.  */
4706
4707 /* Generate and return an insn body to add Y to X.  */
4708
4709 rtx
4710 gen_add2_insn (rtx x, rtx y)
4711 {
4712   enum insn_code icode = optab_handler (add_optab, GET_MODE (x));
4713
4714   gcc_assert (insn_operand_matches (icode, 0, x));
4715   gcc_assert (insn_operand_matches (icode, 1, x));
4716   gcc_assert (insn_operand_matches (icode, 2, y));
4717
4718   return GEN_FCN (icode) (x, x, y);
4719 }
4720
4721 /* Generate and return an insn body to add r1 and c,
4722    storing the result in r0.  */
4723
4724 rtx
4725 gen_add3_insn (rtx r0, rtx r1, rtx c)
4726 {
4727   enum insn_code icode = optab_handler (add_optab, GET_MODE (r0));
4728
4729   if (icode == CODE_FOR_nothing
4730       || !insn_operand_matches (icode, 0, r0)
4731       || !insn_operand_matches (icode, 1, r1)
4732       || !insn_operand_matches (icode, 2, c))
4733     return NULL_RTX;
4734
4735   return GEN_FCN (icode) (r0, r1, c);
4736 }
4737
4738 int
4739 have_add2_insn (rtx x, rtx y)
4740 {
4741   enum insn_code icode;
4742
4743   gcc_assert (GET_MODE (x) != VOIDmode);
4744
4745   icode = optab_handler (add_optab, GET_MODE (x));
4746
4747   if (icode == CODE_FOR_nothing)
4748     return 0;
4749
4750   if (!insn_operand_matches (icode, 0, x)
4751       || !insn_operand_matches (icode, 1, x)
4752       || !insn_operand_matches (icode, 2, y))
4753     return 0;
4754
4755   return 1;
4756 }
4757
4758 /* Generate and return an insn body to add Y to X.  */
4759
4760 rtx
4761 gen_addptr3_insn (rtx x, rtx y, rtx z)
4762 {
4763   enum insn_code icode = optab_handler (addptr3_optab, GET_MODE (x));
4764
4765   gcc_assert (insn_operand_matches (icode, 0, x));
4766   gcc_assert (insn_operand_matches (icode, 1, y));
4767   gcc_assert (insn_operand_matches (icode, 2, z));
4768
4769   return GEN_FCN (icode) (x, y, z);
4770 }
4771
4772 /* Return true if the target implements an addptr pattern and X, Y,
4773    and Z are valid for the pattern predicates.  */
4774
4775 int
4776 have_addptr3_insn (rtx x, rtx y, rtx z)
4777 {
4778   enum insn_code icode;
4779
4780   gcc_assert (GET_MODE (x) != VOIDmode);
4781
4782   icode = optab_handler (addptr3_optab, GET_MODE (x));
4783
4784   if (icode == CODE_FOR_nothing)
4785     return 0;
4786
4787   if (!insn_operand_matches (icode, 0, x)
4788       || !insn_operand_matches (icode, 1, y)
4789       || !insn_operand_matches (icode, 2, z))
4790     return 0;
4791
4792   return 1;
4793 }
4794
4795 /* Generate and return an insn body to subtract Y from X.  */
4796
4797 rtx
4798 gen_sub2_insn (rtx x, rtx y)
4799 {
4800   enum insn_code icode = optab_handler (sub_optab, GET_MODE (x));
4801
4802   gcc_assert (insn_operand_matches (icode, 0, x));
4803   gcc_assert (insn_operand_matches (icode, 1, x));
4804   gcc_assert (insn_operand_matches (icode, 2, y));
4805
4806   return GEN_FCN (icode) (x, x, y);
4807 }
4808
4809 /* Generate and return an insn body to subtract r1 and c,
4810    storing the result in r0.  */
4811
4812 rtx
4813 gen_sub3_insn (rtx r0, rtx r1, rtx c)
4814 {
4815   enum insn_code icode = optab_handler (sub_optab, GET_MODE (r0));
4816
4817   if (icode == CODE_FOR_nothing
4818       || !insn_operand_matches (icode, 0, r0)
4819       || !insn_operand_matches (icode, 1, r1)
4820       || !insn_operand_matches (icode, 2, c))
4821     return NULL_RTX;
4822
4823   return GEN_FCN (icode) (r0, r1, c);
4824 }
4825
4826 int
4827 have_sub2_insn (rtx x, rtx y)
4828 {
4829   enum insn_code icode;
4830
4831   gcc_assert (GET_MODE (x) != VOIDmode);
4832
4833   icode = optab_handler (sub_optab, GET_MODE (x));
4834
4835   if (icode == CODE_FOR_nothing)
4836     return 0;
4837
4838   if (!insn_operand_matches (icode, 0, x)
4839       || !insn_operand_matches (icode, 1, x)
4840       || !insn_operand_matches (icode, 2, y))
4841     return 0;
4842
4843   return 1;
4844 }
4845
4846 /* Generate the body of an instruction to copy Y into X.
4847    It may be a list of insns, if one insn isn't enough.  */
4848
4849 rtx
4850 gen_move_insn (rtx x, rtx y)
4851 {
4852   rtx seq;
4853
4854   start_sequence ();
4855   emit_move_insn_1 (x, y);
4856   seq = get_insns ();
4857   end_sequence ();
4858   return seq;
4859 }
4860 \f
4861 /* Return the insn code used to extend FROM_MODE to TO_MODE.
4862    UNSIGNEDP specifies zero-extension instead of sign-extension.  If
4863    no such operation exists, CODE_FOR_nothing will be returned.  */
4864
4865 enum insn_code
4866 can_extend_p (enum machine_mode to_mode, enum machine_mode from_mode,
4867               int unsignedp)
4868 {
4869   convert_optab tab;
4870 #ifdef HAVE_ptr_extend
4871   if (unsignedp < 0)
4872     return CODE_FOR_ptr_extend;
4873 #endif
4874
4875   tab = unsignedp ? zext_optab : sext_optab;
4876   return convert_optab_handler (tab, to_mode, from_mode);
4877 }
4878
4879 /* Generate the body of an insn to extend Y (with mode MFROM)
4880    into X (with mode MTO).  Do zero-extension if UNSIGNEDP is nonzero.  */
4881
4882 rtx
4883 gen_extend_insn (rtx x, rtx y, enum machine_mode mto,
4884                  enum machine_mode mfrom, int unsignedp)
4885 {
4886   enum insn_code icode = can_extend_p (mto, mfrom, unsignedp);
4887   return GEN_FCN (icode) (x, y);
4888 }
4889 \f
4890 /* can_fix_p and can_float_p say whether the target machine
4891    can directly convert a given fixed point type to
4892    a given floating point type, or vice versa.
4893    The returned value is the CODE_FOR_... value to use,
4894    or CODE_FOR_nothing if these modes cannot be directly converted.
4895
4896    *TRUNCP_PTR is set to 1 if it is necessary to output
4897    an explicit FTRUNC insn before the fix insn; otherwise 0.  */
4898
4899 static enum insn_code
4900 can_fix_p (enum machine_mode fixmode, enum machine_mode fltmode,
4901            int unsignedp, int *truncp_ptr)
4902 {
4903   convert_optab tab;
4904   enum insn_code icode;
4905
4906   tab = unsignedp ? ufixtrunc_optab : sfixtrunc_optab;
4907   icode = convert_optab_handler (tab, fixmode, fltmode);
4908   if (icode != CODE_FOR_nothing)
4909     {
4910       *truncp_ptr = 0;
4911       return icode;
4912     }
4913
4914   /* FIXME: This requires a port to define both FIX and FTRUNC pattern
4915      for this to work. We need to rework the fix* and ftrunc* patterns
4916      and documentation.  */
4917   tab = unsignedp ? ufix_optab : sfix_optab;
4918   icode = convert_optab_handler (tab, fixmode, fltmode);
4919   if (icode != CODE_FOR_nothing
4920       && optab_handler (ftrunc_optab, fltmode) != CODE_FOR_nothing)
4921     {
4922       *truncp_ptr = 1;
4923       return icode;
4924     }
4925
4926   *truncp_ptr = 0;
4927   return CODE_FOR_nothing;
4928 }
4929
4930 enum insn_code
4931 can_float_p (enum machine_mode fltmode, enum machine_mode fixmode,
4932              int unsignedp)
4933 {
4934   convert_optab tab;
4935
4936   tab = unsignedp ? ufloat_optab : sfloat_optab;
4937   return convert_optab_handler (tab, fltmode, fixmode);
4938 }
4939
4940 /* Function supportable_convert_operation
4941
4942    Check whether an operation represented by the code CODE is a
4943    convert operation that is supported by the target platform in
4944    vector form (i.e., when operating on arguments of type VECTYPE_IN
4945    producing a result of type VECTYPE_OUT).
4946
4947    Convert operations we currently support directly are FIX_TRUNC and FLOAT.
4948    This function checks if these operations are supported
4949    by the target platform either directly (via vector tree-codes), or via
4950    target builtins.
4951
4952    Output:
4953    - CODE1 is code of vector operation to be used when
4954    vectorizing the operation, if available.
4955    - DECL is decl of target builtin functions to be used
4956    when vectorizing the operation, if available.  In this case,
4957    CODE1 is CALL_EXPR.  */
4958
4959 bool
4960 supportable_convert_operation (enum tree_code code,
4961                                     tree vectype_out, tree vectype_in,
4962                                     tree *decl, enum tree_code *code1)
4963 {
4964   enum machine_mode m1,m2;
4965   int truncp;
4966
4967   m1 = TYPE_MODE (vectype_out);
4968   m2 = TYPE_MODE (vectype_in);
4969
4970   /* First check if we can done conversion directly.  */
4971   if ((code == FIX_TRUNC_EXPR
4972        && can_fix_p (m1,m2,TYPE_UNSIGNED (vectype_out), &truncp)
4973           != CODE_FOR_nothing)
4974       || (code == FLOAT_EXPR
4975           && can_float_p (m1,m2,TYPE_UNSIGNED (vectype_in))
4976              != CODE_FOR_nothing))
4977     {
4978       *code1 = code;
4979       return true;
4980     }
4981
4982   /* Now check for builtin.  */
4983   if (targetm.vectorize.builtin_conversion
4984       && targetm.vectorize.builtin_conversion (code, vectype_out, vectype_in))
4985     {
4986       *code1 = CALL_EXPR;
4987       *decl = targetm.vectorize.builtin_conversion (code, vectype_out, vectype_in);
4988       return true;
4989     }
4990   return false;
4991 }
4992
4993 \f
4994 /* Generate code to convert FROM to floating point
4995    and store in TO.  FROM must be fixed point and not VOIDmode.
4996    UNSIGNEDP nonzero means regard FROM as unsigned.
4997    Normally this is done by correcting the final value
4998    if it is negative.  */
4999
5000 void
5001 expand_float (rtx to, rtx from, int unsignedp)
5002 {
5003   enum insn_code icode;
5004   rtx target = to;
5005   enum machine_mode fmode, imode;
5006   bool can_do_signed = false;
5007
5008   /* Crash now, because we won't be able to decide which mode to use.  */
5009   gcc_assert (GET_MODE (from) != VOIDmode);
5010
5011   /* Look for an insn to do the conversion.  Do it in the specified
5012      modes if possible; otherwise convert either input, output or both to
5013      wider mode.  If the integer mode is wider than the mode of FROM,
5014      we can do the conversion signed even if the input is unsigned.  */
5015
5016   for (fmode = GET_MODE (to); fmode != VOIDmode;
5017        fmode = GET_MODE_WIDER_MODE (fmode))
5018     for (imode = GET_MODE (from); imode != VOIDmode;
5019          imode = GET_MODE_WIDER_MODE (imode))
5020       {
5021         int doing_unsigned = unsignedp;
5022
5023         if (fmode != GET_MODE (to)
5024             && significand_size (fmode) < GET_MODE_PRECISION (GET_MODE (from)))
5025           continue;
5026
5027         icode = can_float_p (fmode, imode, unsignedp);
5028         if (icode == CODE_FOR_nothing && unsignedp)
5029           {
5030             enum insn_code scode = can_float_p (fmode, imode, 0);
5031             if (scode != CODE_FOR_nothing)
5032               can_do_signed = true;
5033             if (imode != GET_MODE (from))
5034               icode = scode, doing_unsigned = 0;
5035           }
5036
5037         if (icode != CODE_FOR_nothing)
5038           {
5039             if (imode != GET_MODE (from))
5040               from = convert_to_mode (imode, from, unsignedp);
5041
5042             if (fmode != GET_MODE (to))
5043               target = gen_reg_rtx (fmode);
5044
5045             emit_unop_insn (icode, target, from,
5046                             doing_unsigned ? UNSIGNED_FLOAT : FLOAT);
5047
5048             if (target != to)
5049               convert_move (to, target, 0);
5050             return;
5051           }
5052       }
5053
5054   /* Unsigned integer, and no way to convert directly.  Convert as signed,
5055      then unconditionally adjust the result.  */
5056   if (unsignedp && can_do_signed)
5057     {
5058       rtx label = gen_label_rtx ();
5059       rtx temp;
5060       REAL_VALUE_TYPE offset;
5061
5062       /* Look for a usable floating mode FMODE wider than the source and at
5063          least as wide as the target.  Using FMODE will avoid rounding woes
5064          with unsigned values greater than the signed maximum value.  */
5065
5066       for (fmode = GET_MODE (to);  fmode != VOIDmode;
5067            fmode = GET_MODE_WIDER_MODE (fmode))
5068         if (GET_MODE_PRECISION (GET_MODE (from)) < GET_MODE_BITSIZE (fmode)
5069             && can_float_p (fmode, GET_MODE (from), 0) != CODE_FOR_nothing)
5070           break;
5071
5072       if (fmode == VOIDmode)
5073         {
5074           /* There is no such mode.  Pretend the target is wide enough.  */
5075           fmode = GET_MODE (to);
5076
5077           /* Avoid double-rounding when TO is narrower than FROM.  */
5078           if ((significand_size (fmode) + 1)
5079               < GET_MODE_PRECISION (GET_MODE (from)))
5080             {
5081               rtx temp1;
5082               rtx neglabel = gen_label_rtx ();
5083
5084               /* Don't use TARGET if it isn't a register, is a hard register,
5085                  or is the wrong mode.  */
5086               if (!REG_P (target)
5087                   || REGNO (target) < FIRST_PSEUDO_REGISTER
5088                   || GET_MODE (target) != fmode)
5089                 target = gen_reg_rtx (fmode);
5090
5091               imode = GET_MODE (from);
5092               do_pending_stack_adjust ();
5093
5094               /* Test whether the sign bit is set.  */
5095               emit_cmp_and_jump_insns (from, const0_rtx, LT, NULL_RTX, imode,
5096                                        0, neglabel);
5097
5098               /* The sign bit is not set.  Convert as signed.  */
5099               expand_float (target, from, 0);
5100               emit_jump_insn (gen_jump (label));
5101               emit_barrier ();
5102
5103               /* The sign bit is set.
5104                  Convert to a usable (positive signed) value by shifting right
5105                  one bit, while remembering if a nonzero bit was shifted
5106                  out; i.e., compute  (from & 1) | (from >> 1).  */
5107
5108               emit_label (neglabel);
5109               temp = expand_binop (imode, and_optab, from, const1_rtx,
5110                                    NULL_RTX, 1, OPTAB_LIB_WIDEN);
5111               temp1 = expand_shift (RSHIFT_EXPR, imode, from, 1, NULL_RTX, 1);
5112               temp = expand_binop (imode, ior_optab, temp, temp1, temp, 1,
5113                                    OPTAB_LIB_WIDEN);
5114               expand_float (target, temp, 0);
5115
5116               /* Multiply by 2 to undo the shift above.  */
5117               temp = expand_binop (fmode, add_optab, target, target,
5118                                    target, 0, OPTAB_LIB_WIDEN);
5119               if (temp != target)
5120                 emit_move_insn (target, temp);
5121
5122               do_pending_stack_adjust ();
5123               emit_label (label);
5124               goto done;
5125             }
5126         }
5127
5128       /* If we are about to do some arithmetic to correct for an
5129          unsigned operand, do it in a pseudo-register.  */
5130
5131       if (GET_MODE (to) != fmode
5132           || !REG_P (to) || REGNO (to) < FIRST_PSEUDO_REGISTER)
5133         target = gen_reg_rtx (fmode);
5134
5135       /* Convert as signed integer to floating.  */
5136       expand_float (target, from, 0);
5137
5138       /* If FROM is negative (and therefore TO is negative),
5139          correct its value by 2**bitwidth.  */
5140
5141       do_pending_stack_adjust ();
5142       emit_cmp_and_jump_insns (from, const0_rtx, GE, NULL_RTX, GET_MODE (from),
5143                                0, label);
5144
5145
5146       real_2expN (&offset, GET_MODE_PRECISION (GET_MODE (from)), fmode);
5147       temp = expand_binop (fmode, add_optab, target,
5148                            CONST_DOUBLE_FROM_REAL_VALUE (offset, fmode),
5149                            target, 0, OPTAB_LIB_WIDEN);
5150       if (temp != target)
5151         emit_move_insn (target, temp);
5152
5153       do_pending_stack_adjust ();
5154       emit_label (label);
5155       goto done;
5156     }
5157
5158   /* No hardware instruction available; call a library routine.  */
5159     {
5160       rtx libfunc;
5161       rtx insns;
5162       rtx value;
5163       convert_optab tab = unsignedp ? ufloat_optab : sfloat_optab;
5164
5165       if (GET_MODE_SIZE (GET_MODE (from)) < GET_MODE_SIZE (SImode))
5166         from = convert_to_mode (SImode, from, unsignedp);
5167
5168       libfunc = convert_optab_libfunc (tab, GET_MODE (to), GET_MODE (from));
5169       gcc_assert (libfunc);
5170
5171       start_sequence ();
5172
5173       value = emit_library_call_value (libfunc, NULL_RTX, LCT_CONST,
5174                                        GET_MODE (to), 1, from,
5175                                        GET_MODE (from));
5176       insns = get_insns ();
5177       end_sequence ();
5178
5179       emit_libcall_block (insns, target, value,
5180                           gen_rtx_fmt_e (unsignedp ? UNSIGNED_FLOAT : FLOAT,
5181                                          GET_MODE (to), from));
5182     }
5183
5184  done:
5185
5186   /* Copy result to requested destination
5187      if we have been computing in a temp location.  */
5188
5189   if (target != to)
5190     {
5191       if (GET_MODE (target) == GET_MODE (to))
5192         emit_move_insn (to, target);
5193       else
5194         convert_move (to, target, 0);
5195     }
5196 }
5197 \f
5198 /* Generate code to convert FROM to fixed point and store in TO.  FROM
5199    must be floating point.  */
5200
5201 void
5202 expand_fix (rtx to, rtx from, int unsignedp)
5203 {
5204   enum insn_code icode;
5205   rtx target = to;
5206   enum machine_mode fmode, imode;
5207   int must_trunc = 0;
5208
5209   /* We first try to find a pair of modes, one real and one integer, at
5210      least as wide as FROM and TO, respectively, in which we can open-code
5211      this conversion.  If the integer mode is wider than the mode of TO,
5212      we can do the conversion either signed or unsigned.  */
5213
5214   for (fmode = GET_MODE (from); fmode != VOIDmode;
5215        fmode = GET_MODE_WIDER_MODE (fmode))
5216     for (imode = GET_MODE (to); imode != VOIDmode;
5217          imode = GET_MODE_WIDER_MODE (imode))
5218       {
5219         int doing_unsigned = unsignedp;
5220
5221         icode = can_fix_p (imode, fmode, unsignedp, &must_trunc);
5222         if (icode == CODE_FOR_nothing && imode != GET_MODE (to) && unsignedp)
5223           icode = can_fix_p (imode, fmode, 0, &must_trunc), doing_unsigned = 0;
5224
5225         if (icode != CODE_FOR_nothing)
5226           {
5227             rtx last = get_last_insn ();
5228             if (fmode != GET_MODE (from))
5229               from = convert_to_mode (fmode, from, 0);
5230
5231             if (must_trunc)
5232               {
5233                 rtx temp = gen_reg_rtx (GET_MODE (from));
5234                 from = expand_unop (GET_MODE (from), ftrunc_optab, from,
5235                                     temp, 0);
5236               }
5237
5238             if (imode != GET_MODE (to))
5239               target = gen_reg_rtx (imode);
5240
5241             if (maybe_emit_unop_insn (icode, target, from,
5242                                       doing_unsigned ? UNSIGNED_FIX : FIX))
5243               {
5244                 if (target != to)
5245                   convert_move (to, target, unsignedp);
5246                 return;
5247               }
5248             delete_insns_since (last);
5249           }
5250       }
5251
5252   /* For an unsigned conversion, there is one more way to do it.
5253      If we have a signed conversion, we generate code that compares
5254      the real value to the largest representable positive number.  If if
5255      is smaller, the conversion is done normally.  Otherwise, subtract
5256      one plus the highest signed number, convert, and add it back.
5257
5258      We only need to check all real modes, since we know we didn't find
5259      anything with a wider integer mode.
5260
5261      This code used to extend FP value into mode wider than the destination.
5262      This is needed for decimal float modes which cannot accurately
5263      represent one plus the highest signed number of the same size, but
5264      not for binary modes.  Consider, for instance conversion from SFmode
5265      into DImode.
5266
5267      The hot path through the code is dealing with inputs smaller than 2^63
5268      and doing just the conversion, so there is no bits to lose.
5269
5270      In the other path we know the value is positive in the range 2^63..2^64-1
5271      inclusive.  (as for other input overflow happens and result is undefined)
5272      So we know that the most important bit set in mantissa corresponds to
5273      2^63.  The subtraction of 2^63 should not generate any rounding as it
5274      simply clears out that bit.  The rest is trivial.  */
5275
5276   if (unsignedp && GET_MODE_PRECISION (GET_MODE (to)) <= HOST_BITS_PER_WIDE_INT)
5277     for (fmode = GET_MODE (from); fmode != VOIDmode;
5278          fmode = GET_MODE_WIDER_MODE (fmode))
5279       if (CODE_FOR_nothing != can_fix_p (GET_MODE (to), fmode, 0, &must_trunc)
5280           && (!DECIMAL_FLOAT_MODE_P (fmode)
5281               || GET_MODE_BITSIZE (fmode) > GET_MODE_PRECISION (GET_MODE (to))))
5282         {
5283           int bitsize;
5284           REAL_VALUE_TYPE offset;
5285           rtx limit, lab1, lab2, insn;
5286
5287           bitsize = GET_MODE_PRECISION (GET_MODE (to));
5288           real_2expN (&offset, bitsize - 1, fmode);
5289           limit = CONST_DOUBLE_FROM_REAL_VALUE (offset, fmode);
5290           lab1 = gen_label_rtx ();
5291           lab2 = gen_label_rtx ();
5292
5293           if (fmode != GET_MODE (from))
5294             from = convert_to_mode (fmode, from, 0);
5295
5296           /* See if we need to do the subtraction.  */
5297           do_pending_stack_adjust ();
5298           emit_cmp_and_jump_insns (from, limit, GE, NULL_RTX, GET_MODE (from),
5299                                    0, lab1);
5300
5301           /* If not, do the signed "fix" and branch around fixup code.  */
5302           expand_fix (to, from, 0);
5303           emit_jump_insn (gen_jump (lab2));
5304           emit_barrier ();
5305
5306           /* Otherwise, subtract 2**(N-1), convert to signed number,
5307              then add 2**(N-1).  Do the addition using XOR since this
5308              will often generate better code.  */
5309           emit_label (lab1);
5310           target = expand_binop (GET_MODE (from), sub_optab, from, limit,
5311                                  NULL_RTX, 0, OPTAB_LIB_WIDEN);
5312           expand_fix (to, target, 0);
5313           target = expand_binop (GET_MODE (to), xor_optab, to,
5314                                  gen_int_mode
5315                                  ((HOST_WIDE_INT) 1 << (bitsize - 1),
5316                                   GET_MODE (to)),
5317                                  to, 1, OPTAB_LIB_WIDEN);
5318
5319           if (target != to)
5320             emit_move_insn (to, target);
5321
5322           emit_label (lab2);
5323
5324           if (optab_handler (mov_optab, GET_MODE (to)) != CODE_FOR_nothing)
5325             {
5326               /* Make a place for a REG_NOTE and add it.  */
5327               insn = emit_move_insn (to, to);
5328               set_dst_reg_note (insn, REG_EQUAL,
5329                                 gen_rtx_fmt_e (UNSIGNED_FIX, GET_MODE (to),
5330                                                copy_rtx (from)),
5331                                 to);
5332             }
5333
5334           return;
5335         }
5336
5337   /* We can't do it with an insn, so use a library call.  But first ensure
5338      that the mode of TO is at least as wide as SImode, since those are the
5339      only library calls we know about.  */
5340
5341   if (GET_MODE_SIZE (GET_MODE (to)) < GET_MODE_SIZE (SImode))
5342     {
5343       target = gen_reg_rtx (SImode);
5344
5345       expand_fix (target, from, unsignedp);
5346     }
5347   else
5348     {
5349       rtx insns;
5350       rtx value;
5351       rtx libfunc;
5352
5353       convert_optab tab = unsignedp ? ufix_optab : sfix_optab;
5354       libfunc = convert_optab_libfunc (tab, GET_MODE (to), GET_MODE (from));
5355       gcc_assert (libfunc);
5356
5357       start_sequence ();
5358
5359       value = emit_library_call_value (libfunc, NULL_RTX, LCT_CONST,
5360                                        GET_MODE (to), 1, from,
5361                                        GET_MODE (from));
5362       insns = get_insns ();
5363       end_sequence ();
5364
5365       emit_libcall_block (insns, target, value,
5366                           gen_rtx_fmt_e (unsignedp ? UNSIGNED_FIX : FIX,
5367                                          GET_MODE (to), from));
5368     }
5369
5370   if (target != to)
5371     {
5372       if (GET_MODE (to) == GET_MODE (target))
5373         emit_move_insn (to, target);
5374       else
5375         convert_move (to, target, 0);
5376     }
5377 }
5378
5379 /* Generate code to convert FROM or TO a fixed-point.
5380    If UINTP is true, either TO or FROM is an unsigned integer.
5381    If SATP is true, we need to saturate the result.  */
5382
5383 void
5384 expand_fixed_convert (rtx to, rtx from, int uintp, int satp)
5385 {
5386   enum machine_mode to_mode = GET_MODE (to);
5387   enum machine_mode from_mode = GET_MODE (from);
5388   convert_optab tab;
5389   enum rtx_code this_code;
5390   enum insn_code code;
5391   rtx insns, value;
5392   rtx libfunc;
5393
5394   if (to_mode == from_mode)
5395     {
5396       emit_move_insn (to, from);
5397       return;
5398     }
5399
5400   if (uintp)
5401     {
5402       tab = satp ? satfractuns_optab : fractuns_optab;
5403       this_code = satp ? UNSIGNED_SAT_FRACT : UNSIGNED_FRACT_CONVERT;
5404     }
5405   else
5406     {
5407       tab = satp ? satfract_optab : fract_optab;
5408       this_code = satp ? SAT_FRACT : FRACT_CONVERT;
5409     }
5410   code = convert_optab_handler (tab, to_mode, from_mode);
5411   if (code != CODE_FOR_nothing)
5412     {
5413       emit_unop_insn (code, to, from, this_code);
5414       return;
5415     }
5416
5417   libfunc = convert_optab_libfunc (tab, to_mode, from_mode);
5418   gcc_assert (libfunc);
5419
5420   start_sequence ();
5421   value = emit_library_call_value (libfunc, NULL_RTX, LCT_CONST, to_mode,
5422                                    1, from, from_mode);
5423   insns = get_insns ();
5424   end_sequence ();
5425
5426   emit_libcall_block (insns, to, value,
5427                       gen_rtx_fmt_e (optab_to_code (tab), to_mode, from));
5428 }
5429
5430 /* Generate code to convert FROM to fixed point and store in TO.  FROM
5431    must be floating point, TO must be signed.  Use the conversion optab
5432    TAB to do the conversion.  */
5433
5434 bool
5435 expand_sfix_optab (rtx to, rtx from, convert_optab tab)
5436 {
5437   enum insn_code icode;
5438   rtx target = to;
5439   enum machine_mode fmode, imode;
5440
5441   /* We first try to find a pair of modes, one real and one integer, at
5442      least as wide as FROM and TO, respectively, in which we can open-code
5443      this conversion.  If the integer mode is wider than the mode of TO,
5444      we can do the conversion either signed or unsigned.  */
5445
5446   for (fmode = GET_MODE (from); fmode != VOIDmode;
5447        fmode = GET_MODE_WIDER_MODE (fmode))
5448     for (imode = GET_MODE (to); imode != VOIDmode;
5449          imode = GET_MODE_WIDER_MODE (imode))
5450       {
5451         icode = convert_optab_handler (tab, imode, fmode);
5452         if (icode != CODE_FOR_nothing)
5453           {
5454             rtx last = get_last_insn ();
5455             if (fmode != GET_MODE (from))
5456               from = convert_to_mode (fmode, from, 0);
5457
5458             if (imode != GET_MODE (to))
5459               target = gen_reg_rtx (imode);
5460
5461             if (!maybe_emit_unop_insn (icode, target, from, UNKNOWN))
5462               {
5463                 delete_insns_since (last);
5464                 continue;
5465               }
5466             if (target != to)
5467               convert_move (to, target, 0);
5468             return true;
5469           }
5470       }
5471
5472   return false;
5473 }
5474 \f
5475 /* Report whether we have an instruction to perform the operation
5476    specified by CODE on operands of mode MODE.  */
5477 int
5478 have_insn_for (enum rtx_code code, enum machine_mode mode)
5479 {
5480   return (code_to_optab (code)
5481           && (optab_handler (code_to_optab (code), mode)
5482               != CODE_FOR_nothing));
5483 }
5484
5485 /* Initialize the libfunc fields of an entire group of entries in some
5486    optab.  Each entry is set equal to a string consisting of a leading
5487    pair of underscores followed by a generic operation name followed by
5488    a mode name (downshifted to lowercase) followed by a single character
5489    representing the number of operands for the given operation (which is
5490    usually one of the characters '2', '3', or '4').
5491
5492    OPTABLE is the table in which libfunc fields are to be initialized.
5493    OPNAME is the generic (string) name of the operation.
5494    SUFFIX is the character which specifies the number of operands for
5495      the given generic operation.
5496    MODE is the mode to generate for.
5497 */
5498
5499 static void
5500 gen_libfunc (optab optable, const char *opname, int suffix,
5501              enum machine_mode mode)
5502 {
5503   unsigned opname_len = strlen (opname);
5504   const char *mname = GET_MODE_NAME (mode);
5505   unsigned mname_len = strlen (mname);
5506   int prefix_len = targetm.libfunc_gnu_prefix ? 6 : 2;
5507   int len = prefix_len + opname_len + mname_len + 1 + 1;
5508   char *libfunc_name = XALLOCAVEC (char, len);
5509   char *p;
5510   const char *q;
5511
5512   p = libfunc_name;
5513   *p++ = '_';
5514   *p++ = '_';
5515   if (targetm.libfunc_gnu_prefix)
5516     {
5517       *p++ = 'g';
5518       *p++ = 'n';
5519       *p++ = 'u';
5520       *p++ = '_';
5521     }
5522   for (q = opname; *q; )
5523     *p++ = *q++;
5524   for (q = mname; *q; q++)
5525     *p++ = TOLOWER (*q);
5526   *p++ = suffix;
5527   *p = '\0';
5528
5529   set_optab_libfunc (optable, mode,
5530                      ggc_alloc_string (libfunc_name, p - libfunc_name));
5531 }
5532
5533 /* Like gen_libfunc, but verify that integer operation is involved.  */
5534
5535 void
5536 gen_int_libfunc (optab optable, const char *opname, char suffix,
5537                  enum machine_mode mode)
5538 {
5539   int maxsize = 2 * BITS_PER_WORD;
5540
5541   if (GET_MODE_CLASS (mode) != MODE_INT)
5542     return;
5543   if (maxsize < LONG_LONG_TYPE_SIZE)
5544     maxsize = LONG_LONG_TYPE_SIZE;
5545   if (GET_MODE_CLASS (mode) != MODE_INT
5546       || GET_MODE_BITSIZE (mode) < BITS_PER_WORD
5547       || GET_MODE_BITSIZE (mode) > maxsize)
5548     return;
5549   gen_libfunc (optable, opname, suffix, mode);
5550 }
5551
5552 /* Like gen_libfunc, but verify that FP and set decimal prefix if needed.  */
5553
5554 void
5555 gen_fp_libfunc (optab optable, const char *opname, char suffix,
5556                 enum machine_mode mode)
5557 {
5558   char *dec_opname;
5559
5560   if (GET_MODE_CLASS (mode) == MODE_FLOAT)
5561     gen_libfunc (optable, opname, suffix, mode);
5562   if (DECIMAL_FLOAT_MODE_P (mode))
5563     {
5564       dec_opname = XALLOCAVEC (char, sizeof (DECIMAL_PREFIX) + strlen (opname));
5565       /* For BID support, change the name to have either a bid_ or dpd_ prefix
5566          depending on the low level floating format used.  */
5567       memcpy (dec_opname, DECIMAL_PREFIX, sizeof (DECIMAL_PREFIX) - 1);
5568       strcpy (dec_opname + sizeof (DECIMAL_PREFIX) - 1, opname);
5569       gen_libfunc (optable, dec_opname, suffix, mode);
5570     }
5571 }
5572
5573 /* Like gen_libfunc, but verify that fixed-point operation is involved.  */
5574
5575 void
5576 gen_fixed_libfunc (optab optable, const char *opname, char suffix,
5577                    enum machine_mode mode)
5578 {
5579   if (!ALL_FIXED_POINT_MODE_P (mode))
5580     return;
5581   gen_libfunc (optable, opname, suffix, mode);
5582 }
5583
5584 /* Like gen_libfunc, but verify that signed fixed-point operation is
5585    involved.  */
5586
5587 void
5588 gen_signed_fixed_libfunc (optab optable, const char *opname, char suffix,
5589                           enum machine_mode mode)
5590 {
5591   if (!SIGNED_FIXED_POINT_MODE_P (mode))
5592     return;
5593   gen_libfunc (optable, opname, suffix, mode);
5594 }
5595
5596 /* Like gen_libfunc, but verify that unsigned fixed-point operation is
5597    involved.  */
5598
5599 void
5600 gen_unsigned_fixed_libfunc (optab optable, const char *opname, char suffix,
5601                             enum machine_mode mode)
5602 {
5603   if (!UNSIGNED_FIXED_POINT_MODE_P (mode))
5604     return;
5605   gen_libfunc (optable, opname, suffix, mode);
5606 }
5607
5608 /* Like gen_libfunc, but verify that FP or INT operation is involved.  */
5609
5610 void
5611 gen_int_fp_libfunc (optab optable, const char *name, char suffix,
5612                     enum machine_mode mode)
5613 {
5614   if (DECIMAL_FLOAT_MODE_P (mode) || GET_MODE_CLASS (mode) == MODE_FLOAT)
5615     gen_fp_libfunc (optable, name, suffix, mode);
5616   if (INTEGRAL_MODE_P (mode))
5617     gen_int_libfunc (optable, name, suffix, mode);
5618 }
5619
5620 /* Like gen_libfunc, but verify that FP or INT operation is involved
5621    and add 'v' suffix for integer operation.  */
5622
5623 void
5624 gen_intv_fp_libfunc (optab optable, const char *name, char suffix,
5625                      enum machine_mode mode)
5626 {
5627   if (DECIMAL_FLOAT_MODE_P (mode) || GET_MODE_CLASS (mode) == MODE_FLOAT)
5628     gen_fp_libfunc (optable, name, suffix, mode);
5629   if (GET_MODE_CLASS (mode) == MODE_INT)
5630     {
5631       int len = strlen (name);
5632       char *v_name = XALLOCAVEC (char, len + 2);
5633       strcpy (v_name, name);
5634       v_name[len] = 'v';
5635       v_name[len + 1] = 0;
5636       gen_int_libfunc (optable, v_name, suffix, mode);
5637     }
5638 }
5639
5640 /* Like gen_libfunc, but verify that FP or INT or FIXED operation is
5641    involved.  */
5642
5643 void
5644 gen_int_fp_fixed_libfunc (optab optable, const char *name, char suffix,
5645                           enum machine_mode mode)
5646 {
5647   if (DECIMAL_FLOAT_MODE_P (mode) || GET_MODE_CLASS (mode) == MODE_FLOAT)
5648     gen_fp_libfunc (optable, name, suffix, mode);
5649   if (INTEGRAL_MODE_P (mode))
5650     gen_int_libfunc (optable, name, suffix, mode);
5651   if (ALL_FIXED_POINT_MODE_P (mode))
5652     gen_fixed_libfunc (optable, name, suffix, mode);
5653 }
5654
5655 /* Like gen_libfunc, but verify that FP or INT or signed FIXED operation is
5656    involved.  */
5657
5658 void
5659 gen_int_fp_signed_fixed_libfunc (optab optable, const char *name, char suffix,
5660                                  enum machine_mode mode)
5661 {
5662   if (DECIMAL_FLOAT_MODE_P (mode) || GET_MODE_CLASS (mode) == MODE_FLOAT)
5663     gen_fp_libfunc (optable, name, suffix, mode);
5664   if (INTEGRAL_MODE_P (mode))
5665     gen_int_libfunc (optable, name, suffix, mode);
5666   if (SIGNED_FIXED_POINT_MODE_P (mode))
5667     gen_signed_fixed_libfunc (optable, name, suffix, mode);
5668 }
5669
5670 /* Like gen_libfunc, but verify that INT or FIXED operation is
5671    involved.  */
5672
5673 void
5674 gen_int_fixed_libfunc (optab optable, const char *name, char suffix,
5675                        enum machine_mode mode)
5676 {
5677   if (INTEGRAL_MODE_P (mode))
5678     gen_int_libfunc (optable, name, suffix, mode);
5679   if (ALL_FIXED_POINT_MODE_P (mode))
5680     gen_fixed_libfunc (optable, name, suffix, mode);
5681 }
5682
5683 /* Like gen_libfunc, but verify that INT or signed FIXED operation is
5684    involved.  */
5685
5686 void
5687 gen_int_signed_fixed_libfunc (optab optable, const char *name, char suffix,
5688                               enum machine_mode mode)
5689 {
5690   if (INTEGRAL_MODE_P (mode))
5691     gen_int_libfunc (optable, name, suffix, mode);
5692   if (SIGNED_FIXED_POINT_MODE_P (mode))
5693     gen_signed_fixed_libfunc (optable, name, suffix, mode);
5694 }
5695
5696 /* Like gen_libfunc, but verify that INT or unsigned FIXED operation is
5697    involved.  */
5698
5699 void
5700 gen_int_unsigned_fixed_libfunc (optab optable, const char *name, char suffix,
5701                                 enum machine_mode mode)
5702 {
5703   if (INTEGRAL_MODE_P (mode))
5704     gen_int_libfunc (optable, name, suffix, mode);
5705   if (UNSIGNED_FIXED_POINT_MODE_P (mode))
5706     gen_unsigned_fixed_libfunc (optable, name, suffix, mode);
5707 }
5708
5709 /* Initialize the libfunc fields of an entire group of entries of an
5710    inter-mode-class conversion optab.  The string formation rules are
5711    similar to the ones for init_libfuncs, above, but instead of having
5712    a mode name and an operand count these functions have two mode names
5713    and no operand count.  */
5714
5715 void
5716 gen_interclass_conv_libfunc (convert_optab tab,
5717                              const char *opname,
5718                              enum machine_mode tmode,
5719                              enum machine_mode fmode)
5720 {
5721   size_t opname_len = strlen (opname);
5722   size_t mname_len = 0;
5723
5724   const char *fname, *tname;
5725   const char *q;
5726   int prefix_len = targetm.libfunc_gnu_prefix ? 6 : 2;
5727   char *libfunc_name, *suffix;
5728   char *nondec_name, *dec_name, *nondec_suffix, *dec_suffix;
5729   char *p;
5730
5731   /* If this is a decimal conversion, add the current BID vs. DPD prefix that
5732      depends on which underlying decimal floating point format is used.  */
5733   const size_t dec_len = sizeof (DECIMAL_PREFIX) - 1;
5734
5735   mname_len = strlen (GET_MODE_NAME (tmode)) + strlen (GET_MODE_NAME (fmode));
5736
5737   nondec_name = XALLOCAVEC (char, prefix_len + opname_len + mname_len + 1 + 1);
5738   nondec_name[0] = '_';
5739   nondec_name[1] = '_';
5740   if (targetm.libfunc_gnu_prefix)
5741     {
5742       nondec_name[2] = 'g';
5743       nondec_name[3] = 'n';
5744       nondec_name[4] = 'u';
5745       nondec_name[5] = '_';
5746     }
5747
5748   memcpy (&nondec_name[prefix_len], opname, opname_len);
5749   nondec_suffix = nondec_name + opname_len + prefix_len;
5750
5751   dec_name = XALLOCAVEC (char, 2 + dec_len + opname_len + mname_len + 1 + 1);
5752   dec_name[0] = '_';
5753   dec_name[1] = '_';
5754   memcpy (&dec_name[2], DECIMAL_PREFIX, dec_len);
5755   memcpy (&dec_name[2+dec_len], opname, opname_len);
5756   dec_suffix = dec_name + dec_len + opname_len + 2;
5757
5758   fname = GET_MODE_NAME (fmode);
5759   tname = GET_MODE_NAME (tmode);
5760
5761   if (DECIMAL_FLOAT_MODE_P (fmode) || DECIMAL_FLOAT_MODE_P (tmode))
5762     {
5763       libfunc_name = dec_name;
5764       suffix = dec_suffix;
5765     }
5766   else
5767     {
5768       libfunc_name = nondec_name;
5769       suffix = nondec_suffix;
5770     }
5771
5772   p = suffix;
5773   for (q = fname; *q; p++, q++)
5774     *p = TOLOWER (*q);
5775   for (q = tname; *q; p++, q++)
5776     *p = TOLOWER (*q);
5777
5778   *p = '\0';
5779
5780   set_conv_libfunc (tab, tmode, fmode,
5781                     ggc_alloc_string (libfunc_name, p - libfunc_name));
5782 }
5783
5784 /* Same as gen_interclass_conv_libfunc but verify that we are producing
5785    int->fp conversion.  */
5786
5787 void
5788 gen_int_to_fp_conv_libfunc (convert_optab tab,
5789                             const char *opname,
5790                             enum machine_mode tmode,
5791                             enum machine_mode fmode)
5792 {
5793   if (GET_MODE_CLASS (fmode) != MODE_INT)
5794     return;
5795   if (GET_MODE_CLASS (tmode) != MODE_FLOAT && !DECIMAL_FLOAT_MODE_P (tmode))
5796     return;
5797   gen_interclass_conv_libfunc (tab, opname, tmode, fmode);
5798 }
5799
5800 /* ufloat_optab is special by using floatun for FP and floatuns decimal fp
5801    naming scheme.  */
5802
5803 void
5804 gen_ufloat_conv_libfunc (convert_optab tab,
5805                          const char *opname ATTRIBUTE_UNUSED,
5806                          enum machine_mode tmode,
5807                          enum machine_mode fmode)
5808 {
5809   if (DECIMAL_FLOAT_MODE_P (tmode))
5810     gen_int_to_fp_conv_libfunc (tab, "floatuns", tmode, fmode);
5811   else
5812     gen_int_to_fp_conv_libfunc (tab, "floatun", tmode, fmode);
5813 }
5814
5815 /* Same as gen_interclass_conv_libfunc but verify that we are producing
5816    fp->int conversion.  */
5817
5818 void
5819 gen_int_to_fp_nondecimal_conv_libfunc (convert_optab tab,
5820                                        const char *opname,
5821                                        enum machine_mode tmode,
5822                                        enum machine_mode fmode)
5823 {
5824   if (GET_MODE_CLASS (fmode) != MODE_INT)
5825     return;
5826   if (GET_MODE_CLASS (tmode) != MODE_FLOAT)
5827     return;
5828   gen_interclass_conv_libfunc (tab, opname, tmode, fmode);
5829 }
5830
5831 /* Same as gen_interclass_conv_libfunc but verify that we are producing
5832    fp->int conversion with no decimal floating point involved.  */
5833
5834 void
5835 gen_fp_to_int_conv_libfunc (convert_optab tab,
5836                             const char *opname,
5837                             enum machine_mode tmode,
5838                             enum machine_mode fmode)
5839 {
5840   if (GET_MODE_CLASS (fmode) != MODE_FLOAT && !DECIMAL_FLOAT_MODE_P (fmode))
5841     return;
5842   if (GET_MODE_CLASS (tmode) != MODE_INT)
5843     return;
5844   gen_interclass_conv_libfunc (tab, opname, tmode, fmode);
5845 }
5846
5847 /* Initialize the libfunc fields of an of an intra-mode-class conversion optab.
5848    The string formation rules are
5849    similar to the ones for init_libfunc, above.  */
5850
5851 void
5852 gen_intraclass_conv_libfunc (convert_optab tab, const char *opname,
5853                              enum machine_mode tmode, enum machine_mode fmode)
5854 {
5855   size_t opname_len = strlen (opname);
5856   size_t mname_len = 0;
5857
5858   const char *fname, *tname;
5859   const char *q;
5860   int prefix_len = targetm.libfunc_gnu_prefix ? 6 : 2;
5861   char *nondec_name, *dec_name, *nondec_suffix, *dec_suffix;
5862   char *libfunc_name, *suffix;
5863   char *p;
5864
5865   /* If this is a decimal conversion, add the current BID vs. DPD prefix that
5866      depends on which underlying decimal floating point format is used.  */
5867   const size_t dec_len = sizeof (DECIMAL_PREFIX) - 1;
5868
5869   mname_len = strlen (GET_MODE_NAME (tmode)) + strlen (GET_MODE_NAME (fmode));
5870
5871   nondec_name = XALLOCAVEC (char, 2 + opname_len + mname_len + 1 + 1);
5872   nondec_name[0] = '_';
5873   nondec_name[1] = '_';
5874   if (targetm.libfunc_gnu_prefix)
5875     {
5876       nondec_name[2] = 'g';
5877       nondec_name[3] = 'n';
5878       nondec_name[4] = 'u';
5879       nondec_name[5] = '_';
5880     }
5881   memcpy (&nondec_name[prefix_len], opname, opname_len);
5882   nondec_suffix = nondec_name + opname_len + prefix_len;
5883
5884   dec_name = XALLOCAVEC (char, 2 + dec_len + opname_len + mname_len + 1 + 1);
5885   dec_name[0] = '_';
5886   dec_name[1] = '_';
5887   memcpy (&dec_name[2], DECIMAL_PREFIX, dec_len);
5888   memcpy (&dec_name[2 + dec_len], opname, opname_len);
5889   dec_suffix = dec_name + dec_len + opname_len + 2;
5890
5891   fname = GET_MODE_NAME (fmode);
5892   tname = GET_MODE_NAME (tmode);
5893
5894   if (DECIMAL_FLOAT_MODE_P (fmode) || DECIMAL_FLOAT_MODE_P (tmode))
5895     {
5896       libfunc_name = dec_name;
5897       suffix = dec_suffix;
5898     }
5899   else
5900     {
5901       libfunc_name = nondec_name;
5902       suffix = nondec_suffix;
5903     }
5904
5905   p = suffix;
5906   for (q = fname; *q; p++, q++)
5907     *p = TOLOWER (*q);
5908   for (q = tname; *q; p++, q++)
5909     *p = TOLOWER (*q);
5910
5911   *p++ = '2';
5912   *p = '\0';
5913
5914   set_conv_libfunc (tab, tmode, fmode,
5915                     ggc_alloc_string (libfunc_name, p - libfunc_name));
5916 }
5917
5918 /* Pick proper libcall for trunc_optab.  We need to chose if we do
5919    truncation or extension and interclass or intraclass.  */
5920
5921 void
5922 gen_trunc_conv_libfunc (convert_optab tab,
5923                          const char *opname,
5924                          enum machine_mode tmode,
5925                          enum machine_mode fmode)
5926 {
5927   if (GET_MODE_CLASS (tmode) != MODE_FLOAT && !DECIMAL_FLOAT_MODE_P (tmode))
5928     return;
5929   if (GET_MODE_CLASS (fmode) != MODE_FLOAT && !DECIMAL_FLOAT_MODE_P (fmode))
5930     return;
5931   if (tmode == fmode)
5932     return;
5933
5934   if ((GET_MODE_CLASS (tmode) == MODE_FLOAT && DECIMAL_FLOAT_MODE_P (fmode))
5935       || (GET_MODE_CLASS (fmode) == MODE_FLOAT && DECIMAL_FLOAT_MODE_P (tmode)))
5936      gen_interclass_conv_libfunc (tab, opname, tmode, fmode);
5937
5938   if (GET_MODE_PRECISION (fmode) <= GET_MODE_PRECISION (tmode))
5939     return;
5940
5941   if ((GET_MODE_CLASS (tmode) == MODE_FLOAT
5942        && GET_MODE_CLASS (fmode) == MODE_FLOAT)
5943       || (DECIMAL_FLOAT_MODE_P (fmode) && DECIMAL_FLOAT_MODE_P (tmode)))
5944     gen_intraclass_conv_libfunc (tab, opname, tmode, fmode);
5945 }
5946
5947 /* Pick proper libcall for extend_optab.  We need to chose if we do
5948    truncation or extension and interclass or intraclass.  */
5949
5950 void
5951 gen_extend_conv_libfunc (convert_optab tab,
5952                          const char *opname ATTRIBUTE_UNUSED,
5953                          enum machine_mode tmode,
5954                          enum machine_mode fmode)
5955 {
5956   if (GET_MODE_CLASS (tmode) != MODE_FLOAT && !DECIMAL_FLOAT_MODE_P (tmode))
5957     return;
5958   if (GET_MODE_CLASS (fmode) != MODE_FLOAT && !DECIMAL_FLOAT_MODE_P (fmode))
5959     return;
5960   if (tmode == fmode)
5961     return;
5962
5963   if ((GET_MODE_CLASS (tmode) == MODE_FLOAT && DECIMAL_FLOAT_MODE_P (fmode))
5964       || (GET_MODE_CLASS (fmode) == MODE_FLOAT && DECIMAL_FLOAT_MODE_P (tmode)))
5965      gen_interclass_conv_libfunc (tab, opname, tmode, fmode);
5966
5967   if (GET_MODE_PRECISION (fmode) > GET_MODE_PRECISION (tmode))
5968     return;
5969
5970   if ((GET_MODE_CLASS (tmode) == MODE_FLOAT
5971        && GET_MODE_CLASS (fmode) == MODE_FLOAT)
5972       || (DECIMAL_FLOAT_MODE_P (fmode) && DECIMAL_FLOAT_MODE_P (tmode)))
5973     gen_intraclass_conv_libfunc (tab, opname, tmode, fmode);
5974 }
5975
5976 /* Pick proper libcall for fract_optab.  We need to chose if we do
5977    interclass or intraclass.  */
5978
5979 void
5980 gen_fract_conv_libfunc (convert_optab tab,
5981                         const char *opname,
5982                         enum machine_mode tmode,
5983                         enum machine_mode fmode)
5984 {
5985   if (tmode == fmode)
5986     return;
5987   if (!(ALL_FIXED_POINT_MODE_P (tmode) || ALL_FIXED_POINT_MODE_P (fmode)))
5988     return;
5989
5990   if (GET_MODE_CLASS (tmode) == GET_MODE_CLASS (fmode))
5991     gen_intraclass_conv_libfunc (tab, opname, tmode, fmode);
5992   else
5993     gen_interclass_conv_libfunc (tab, opname, tmode, fmode);
5994 }
5995
5996 /* Pick proper libcall for fractuns_optab.  */
5997
5998 void
5999 gen_fractuns_conv_libfunc (convert_optab tab,
6000                            const char *opname,
6001                            enum machine_mode tmode,
6002                            enum machine_mode fmode)
6003 {
6004   if (tmode == fmode)
6005     return;
6006   /* One mode must be a fixed-point mode, and the other must be an integer
6007      mode. */
6008   if (!((ALL_FIXED_POINT_MODE_P (tmode) && GET_MODE_CLASS (fmode) == MODE_INT)
6009         || (ALL_FIXED_POINT_MODE_P (fmode)
6010             && GET_MODE_CLASS (tmode) == MODE_INT)))
6011     return;
6012
6013   gen_interclass_conv_libfunc (tab, opname, tmode, fmode);
6014 }
6015
6016 /* Pick proper libcall for satfract_optab.  We need to chose if we do
6017    interclass or intraclass.  */
6018
6019 void
6020 gen_satfract_conv_libfunc (convert_optab tab,
6021                            const char *opname,
6022                            enum machine_mode tmode,
6023                            enum machine_mode fmode)
6024 {
6025   if (tmode == fmode)
6026     return;
6027   /* TMODE must be a fixed-point mode.  */
6028   if (!ALL_FIXED_POINT_MODE_P (tmode))
6029     return;
6030
6031   if (GET_MODE_CLASS (tmode) == GET_MODE_CLASS (fmode))
6032     gen_intraclass_conv_libfunc (tab, opname, tmode, fmode);
6033   else
6034     gen_interclass_conv_libfunc (tab, opname, tmode, fmode);
6035 }
6036
6037 /* Pick proper libcall for satfractuns_optab.  */
6038
6039 void
6040 gen_satfractuns_conv_libfunc (convert_optab tab,
6041                               const char *opname,
6042                               enum machine_mode tmode,
6043                               enum machine_mode fmode)
6044 {
6045   if (tmode == fmode)
6046     return;
6047   /* TMODE must be a fixed-point mode, and FMODE must be an integer mode. */
6048   if (!(ALL_FIXED_POINT_MODE_P (tmode) && GET_MODE_CLASS (fmode) == MODE_INT))
6049     return;
6050
6051   gen_interclass_conv_libfunc (tab, opname, tmode, fmode);
6052 }
6053
6054 /* A table of previously-created libfuncs, hashed by name.  */
6055 static GTY ((param_is (union tree_node))) htab_t libfunc_decls;
6056
6057 /* Hashtable callbacks for libfunc_decls.  */
6058
6059 static hashval_t
6060 libfunc_decl_hash (const void *entry)
6061 {
6062   return IDENTIFIER_HASH_VALUE (DECL_NAME ((const_tree) entry));
6063 }
6064
6065 static int
6066 libfunc_decl_eq (const void *entry1, const void *entry2)
6067 {
6068   return DECL_NAME ((const_tree) entry1) == (const_tree) entry2;
6069 }
6070
6071 /* Build a decl for a libfunc named NAME. */
6072
6073 tree
6074 build_libfunc_function (const char *name)
6075 {
6076   tree decl = build_decl (UNKNOWN_LOCATION, FUNCTION_DECL,
6077                           get_identifier (name),
6078                           build_function_type (integer_type_node, NULL_TREE));
6079   /* ??? We don't have any type information except for this is
6080      a function.  Pretend this is "int foo()".  */
6081   DECL_ARTIFICIAL (decl) = 1;
6082   DECL_EXTERNAL (decl) = 1;
6083   TREE_PUBLIC (decl) = 1;
6084   gcc_assert (DECL_ASSEMBLER_NAME (decl));
6085
6086   /* Zap the nonsensical SYMBOL_REF_DECL for this.  What we're left with
6087      are the flags assigned by targetm.encode_section_info.  */
6088   SET_SYMBOL_REF_DECL (XEXP (DECL_RTL (decl), 0), NULL);
6089
6090   return decl;
6091 }
6092
6093 rtx
6094 init_one_libfunc (const char *name)
6095 {
6096   tree id, decl;
6097   void **slot;
6098   hashval_t hash;
6099
6100   if (libfunc_decls == NULL)
6101     libfunc_decls = htab_create_ggc (37, libfunc_decl_hash,
6102                                      libfunc_decl_eq, NULL);
6103
6104   /* See if we have already created a libfunc decl for this function.  */
6105   id = get_identifier (name);
6106   hash = IDENTIFIER_HASH_VALUE (id);
6107   slot = htab_find_slot_with_hash (libfunc_decls, id, hash, INSERT);
6108   decl = (tree) *slot;
6109   if (decl == NULL)
6110     {
6111       /* Create a new decl, so that it can be passed to
6112          targetm.encode_section_info.  */
6113       decl = build_libfunc_function (name);
6114       *slot = decl;
6115     }
6116   return XEXP (DECL_RTL (decl), 0);
6117 }
6118
6119 /* Adjust the assembler name of libfunc NAME to ASMSPEC.  */
6120
6121 rtx
6122 set_user_assembler_libfunc (const char *name, const char *asmspec)
6123 {
6124   tree id, decl;
6125   void **slot;
6126   hashval_t hash;
6127
6128   id = get_identifier (name);
6129   hash = IDENTIFIER_HASH_VALUE (id);
6130   slot = htab_find_slot_with_hash (libfunc_decls, id, hash, NO_INSERT);
6131   gcc_assert (slot);
6132   decl = (tree) *slot;
6133   set_user_assembler_name (decl, asmspec);
6134   return XEXP (DECL_RTL (decl), 0);
6135 }
6136
6137 /* Call this to reset the function entry for one optab (OPTABLE) in mode
6138    MODE to NAME, which should be either 0 or a string constant.  */
6139 void
6140 set_optab_libfunc (optab op, enum machine_mode mode, const char *name)
6141 {
6142   rtx val;
6143   struct libfunc_entry e;
6144   struct libfunc_entry **slot;
6145
6146   e.op = op;
6147   e.mode1 = mode;
6148   e.mode2 = VOIDmode;
6149
6150   if (name)
6151     val = init_one_libfunc (name);
6152   else
6153     val = 0;
6154   slot = (struct libfunc_entry **) htab_find_slot (libfunc_hash, &e, INSERT);
6155   if (*slot == NULL)
6156     *slot = ggc_alloc<libfunc_entry> ();
6157   (*slot)->op = op;
6158   (*slot)->mode1 = mode;
6159   (*slot)->mode2 = VOIDmode;
6160   (*slot)->libfunc = val;
6161 }
6162
6163 /* Call this to reset the function entry for one conversion optab
6164    (OPTABLE) from mode FMODE to mode TMODE to NAME, which should be
6165    either 0 or a string constant.  */
6166 void
6167 set_conv_libfunc (convert_optab optab, enum machine_mode tmode,
6168                   enum machine_mode fmode, const char *name)
6169 {
6170   rtx val;
6171   struct libfunc_entry e;
6172   struct libfunc_entry **slot;
6173
6174   e.op = optab;
6175   e.mode1 = tmode;
6176   e.mode2 = fmode;
6177
6178   if (name)
6179     val = init_one_libfunc (name);
6180   else
6181     val = 0;
6182   slot = (struct libfunc_entry **) htab_find_slot (libfunc_hash, &e, INSERT);
6183   if (*slot == NULL)
6184     *slot = ggc_alloc<libfunc_entry> ();
6185   (*slot)->op = optab;
6186   (*slot)->mode1 = tmode;
6187   (*slot)->mode2 = fmode;
6188   (*slot)->libfunc = val;
6189 }
6190
6191 /* Call this to initialize the contents of the optabs
6192    appropriately for the current target machine.  */
6193
6194 void
6195 init_optabs (void)
6196 {
6197   if (libfunc_hash)
6198     htab_empty (libfunc_hash);
6199   else
6200     libfunc_hash = htab_create_ggc (10, hash_libfunc, eq_libfunc, NULL);
6201
6202   /* Fill in the optabs with the insns we support.  */
6203   init_all_optabs (this_fn_optabs);
6204
6205   /* The ffs function operates on `int'.  Fall back on it if we do not
6206      have a libgcc2 function for that width.  */
6207   if (INT_TYPE_SIZE < BITS_PER_WORD)
6208     set_optab_libfunc (ffs_optab, mode_for_size (INT_TYPE_SIZE, MODE_INT, 0),
6209                        "ffs");
6210
6211   /* Explicitly initialize the bswap libfuncs since we need them to be
6212      valid for things other than word_mode.  */
6213   if (targetm.libfunc_gnu_prefix)
6214     {
6215       set_optab_libfunc (bswap_optab, SImode, "__gnu_bswapsi2");
6216       set_optab_libfunc (bswap_optab, DImode, "__gnu_bswapdi2");
6217     }
6218   else
6219     {
6220       set_optab_libfunc (bswap_optab, SImode, "__bswapsi2");
6221       set_optab_libfunc (bswap_optab, DImode, "__bswapdi2");
6222     }
6223
6224   /* Use cabs for double complex abs, since systems generally have cabs.
6225      Don't define any libcall for float complex, so that cabs will be used.  */
6226   if (complex_double_type_node)
6227     set_optab_libfunc (abs_optab, TYPE_MODE (complex_double_type_node),
6228                        "cabs");
6229
6230   abort_libfunc = init_one_libfunc ("abort");
6231   memcpy_libfunc = init_one_libfunc ("memcpy");
6232   memmove_libfunc = init_one_libfunc ("memmove");
6233   memcmp_libfunc = init_one_libfunc ("memcmp");
6234   memset_libfunc = init_one_libfunc ("memset");
6235   setbits_libfunc = init_one_libfunc ("__setbits");
6236
6237 #ifndef DONT_USE_BUILTIN_SETJMP
6238   setjmp_libfunc = init_one_libfunc ("__builtin_setjmp");
6239   longjmp_libfunc = init_one_libfunc ("__builtin_longjmp");
6240 #else
6241   setjmp_libfunc = init_one_libfunc ("setjmp");
6242   longjmp_libfunc = init_one_libfunc ("longjmp");
6243 #endif
6244   unwind_sjlj_register_libfunc = init_one_libfunc ("_Unwind_SjLj_Register");
6245   unwind_sjlj_unregister_libfunc
6246     = init_one_libfunc ("_Unwind_SjLj_Unregister");
6247
6248   /* For function entry/exit instrumentation.  */
6249   profile_function_entry_libfunc
6250     = init_one_libfunc ("__cyg_profile_func_enter");
6251   profile_function_exit_libfunc
6252     = init_one_libfunc ("__cyg_profile_func_exit");
6253
6254   gcov_flush_libfunc = init_one_libfunc ("__gcov_flush");
6255
6256   /* Allow the target to add more libcalls or rename some, etc.  */
6257   targetm.init_libfuncs ();
6258 }
6259
6260 /* Use the current target and options to initialize
6261    TREE_OPTIMIZATION_OPTABS (OPTNODE).  */
6262
6263 void
6264 init_tree_optimization_optabs (tree optnode)
6265 {
6266   /* Quick exit if we have already computed optabs for this target.  */
6267   if (TREE_OPTIMIZATION_BASE_OPTABS (optnode) == this_target_optabs)
6268     return;
6269
6270   /* Forget any previous information and set up for the current target.  */
6271   TREE_OPTIMIZATION_BASE_OPTABS (optnode) = this_target_optabs;
6272   struct target_optabs *tmp_optabs = (struct target_optabs *)
6273     TREE_OPTIMIZATION_OPTABS (optnode);
6274   if (tmp_optabs)
6275     memset (tmp_optabs, 0, sizeof (struct target_optabs));
6276   else
6277     tmp_optabs = ggc_alloc<target_optabs> ();
6278
6279   /* Generate a new set of optabs into tmp_optabs.  */
6280   init_all_optabs (tmp_optabs);
6281
6282   /* If the optabs changed, record it.  */
6283   if (memcmp (tmp_optabs, this_target_optabs, sizeof (struct target_optabs)))
6284     TREE_OPTIMIZATION_OPTABS (optnode) = tmp_optabs;
6285   else
6286     {
6287       TREE_OPTIMIZATION_OPTABS (optnode) = NULL;
6288       ggc_free (tmp_optabs);
6289     }
6290 }
6291
6292 /* A helper function for init_sync_libfuncs.  Using the basename BASE,
6293    install libfuncs into TAB for BASE_N for 1 <= N <= MAX.  */
6294
6295 static void
6296 init_sync_libfuncs_1 (optab tab, const char *base, int max)
6297 {
6298   enum machine_mode mode;
6299   char buf[64];
6300   size_t len = strlen (base);
6301   int i;
6302
6303   gcc_assert (max <= 8);
6304   gcc_assert (len + 3 < sizeof (buf));
6305
6306   memcpy (buf, base, len);
6307   buf[len] = '_';
6308   buf[len + 1] = '0';
6309   buf[len + 2] = '\0';
6310
6311   mode = QImode;
6312   for (i = 1; i <= max; i *= 2)
6313     {
6314       buf[len + 1] = '0' + i;
6315       set_optab_libfunc (tab, mode, buf);
6316       mode = GET_MODE_2XWIDER_MODE (mode);
6317     }
6318 }
6319
6320 void
6321 init_sync_libfuncs (int max)
6322 {
6323   if (!flag_sync_libcalls)
6324     return;
6325
6326   init_sync_libfuncs_1 (sync_compare_and_swap_optab,
6327                         "__sync_val_compare_and_swap", max);
6328   init_sync_libfuncs_1 (sync_lock_test_and_set_optab,
6329                         "__sync_lock_test_and_set", max);
6330
6331   init_sync_libfuncs_1 (sync_old_add_optab, "__sync_fetch_and_add", max);
6332   init_sync_libfuncs_1 (sync_old_sub_optab, "__sync_fetch_and_sub", max);
6333   init_sync_libfuncs_1 (sync_old_ior_optab, "__sync_fetch_and_or", max);
6334   init_sync_libfuncs_1 (sync_old_and_optab, "__sync_fetch_and_and", max);
6335   init_sync_libfuncs_1 (sync_old_xor_optab, "__sync_fetch_and_xor", max);
6336   init_sync_libfuncs_1 (sync_old_nand_optab, "__sync_fetch_and_nand", max);
6337
6338   init_sync_libfuncs_1 (sync_new_add_optab, "__sync_add_and_fetch", max);
6339   init_sync_libfuncs_1 (sync_new_sub_optab, "__sync_sub_and_fetch", max);
6340   init_sync_libfuncs_1 (sync_new_ior_optab, "__sync_or_and_fetch", max);
6341   init_sync_libfuncs_1 (sync_new_and_optab, "__sync_and_and_fetch", max);
6342   init_sync_libfuncs_1 (sync_new_xor_optab, "__sync_xor_and_fetch", max);
6343   init_sync_libfuncs_1 (sync_new_nand_optab, "__sync_nand_and_fetch", max);
6344 }
6345
6346 /* Print information about the current contents of the optabs on
6347    STDERR.  */
6348
6349 DEBUG_FUNCTION void
6350 debug_optab_libfuncs (void)
6351 {
6352   int i, j, k;
6353
6354   /* Dump the arithmetic optabs.  */
6355   for (i = FIRST_NORM_OPTAB; i <= LAST_NORMLIB_OPTAB; ++i)
6356     for (j = 0; j < NUM_MACHINE_MODES; ++j)
6357       {
6358         rtx l = optab_libfunc ((optab) i, (enum machine_mode) j);
6359         if (l)
6360           {
6361             gcc_assert (GET_CODE (l) == SYMBOL_REF);
6362             fprintf (stderr, "%s\t%s:\t%s\n",
6363                      GET_RTX_NAME (optab_to_code ((optab) i)),
6364                      GET_MODE_NAME (j),
6365                      XSTR (l, 0));
6366           }
6367       }
6368
6369   /* Dump the conversion optabs.  */
6370   for (i = FIRST_CONV_OPTAB; i <= LAST_CONVLIB_OPTAB; ++i)
6371     for (j = 0; j < NUM_MACHINE_MODES; ++j)
6372       for (k = 0; k < NUM_MACHINE_MODES; ++k)
6373         {
6374           rtx l = convert_optab_libfunc ((optab) i, (enum machine_mode) j,
6375                                          (enum machine_mode) k);
6376           if (l)
6377             {
6378               gcc_assert (GET_CODE (l) == SYMBOL_REF);
6379               fprintf (stderr, "%s\t%s\t%s:\t%s\n",
6380                        GET_RTX_NAME (optab_to_code ((optab) i)),
6381                        GET_MODE_NAME (j),
6382                        GET_MODE_NAME (k),
6383                        XSTR (l, 0));
6384             }
6385         }
6386 }
6387
6388 \f
6389 /* Generate insns to trap with code TCODE if OP1 and OP2 satisfy condition
6390    CODE.  Return 0 on failure.  */
6391
6392 rtx
6393 gen_cond_trap (enum rtx_code code, rtx op1, rtx op2, rtx tcode)
6394 {
6395   enum machine_mode mode = GET_MODE (op1);
6396   enum insn_code icode;
6397   rtx insn;
6398   rtx trap_rtx;
6399
6400   if (mode == VOIDmode)
6401     return 0;
6402
6403   icode = optab_handler (ctrap_optab, mode);
6404   if (icode == CODE_FOR_nothing)
6405     return 0;
6406
6407   /* Some targets only accept a zero trap code.  */
6408   if (!insn_operand_matches (icode, 3, tcode))
6409     return 0;
6410
6411   do_pending_stack_adjust ();
6412   start_sequence ();
6413   prepare_cmp_insn (op1, op2, code, NULL_RTX, false, OPTAB_DIRECT,
6414                     &trap_rtx, &mode);
6415   if (!trap_rtx)
6416     insn = NULL_RTX;
6417   else
6418     insn = GEN_FCN (icode) (trap_rtx, XEXP (trap_rtx, 0), XEXP (trap_rtx, 1),
6419                             tcode);
6420
6421   /* If that failed, then give up.  */
6422   if (insn == 0)
6423     {
6424       end_sequence ();
6425       return 0;
6426     }
6427
6428   emit_insn (insn);
6429   insn = get_insns ();
6430   end_sequence ();
6431   return insn;
6432 }
6433
6434 /* Return rtx code for TCODE. Use UNSIGNEDP to select signed
6435    or unsigned operation code.  */
6436
6437 static enum rtx_code
6438 get_rtx_code (enum tree_code tcode, bool unsignedp)
6439 {
6440   enum rtx_code code;
6441   switch (tcode)
6442     {
6443     case EQ_EXPR:
6444       code = EQ;
6445       break;
6446     case NE_EXPR:
6447       code = NE;
6448       break;
6449     case LT_EXPR:
6450       code = unsignedp ? LTU : LT;
6451       break;
6452     case LE_EXPR:
6453       code = unsignedp ? LEU : LE;
6454       break;
6455     case GT_EXPR:
6456       code = unsignedp ? GTU : GT;
6457       break;
6458     case GE_EXPR:
6459       code = unsignedp ? GEU : GE;
6460       break;
6461
6462     case UNORDERED_EXPR:
6463       code = UNORDERED;
6464       break;
6465     case ORDERED_EXPR:
6466       code = ORDERED;
6467       break;
6468     case UNLT_EXPR:
6469       code = UNLT;
6470       break;
6471     case UNLE_EXPR:
6472       code = UNLE;
6473       break;
6474     case UNGT_EXPR:
6475       code = UNGT;
6476       break;
6477     case UNGE_EXPR:
6478       code = UNGE;
6479       break;
6480     case UNEQ_EXPR:
6481       code = UNEQ;
6482       break;
6483     case LTGT_EXPR:
6484       code = LTGT;
6485       break;
6486
6487     default:
6488       gcc_unreachable ();
6489     }
6490   return code;
6491 }
6492
6493 /* Return comparison rtx for COND. Use UNSIGNEDP to select signed or
6494    unsigned operators. Do not generate compare instruction.  */
6495
6496 static rtx
6497 vector_compare_rtx (enum tree_code tcode, tree t_op0, tree t_op1,
6498                     bool unsignedp, enum insn_code icode)
6499 {
6500   struct expand_operand ops[2];
6501   rtx rtx_op0, rtx_op1;
6502   enum rtx_code rcode = get_rtx_code (tcode, unsignedp);
6503
6504   gcc_assert (TREE_CODE_CLASS (tcode) == tcc_comparison);
6505
6506   /* Expand operands.  */
6507   rtx_op0 = expand_expr (t_op0, NULL_RTX, TYPE_MODE (TREE_TYPE (t_op0)),
6508                          EXPAND_STACK_PARM);
6509   rtx_op1 = expand_expr (t_op1, NULL_RTX, TYPE_MODE (TREE_TYPE (t_op1)),
6510                          EXPAND_STACK_PARM);
6511
6512   create_input_operand (&ops[0], rtx_op0, GET_MODE (rtx_op0));
6513   create_input_operand (&ops[1], rtx_op1, GET_MODE (rtx_op1));
6514   if (!maybe_legitimize_operands (icode, 4, 2, ops))
6515     gcc_unreachable ();
6516   return gen_rtx_fmt_ee (rcode, VOIDmode, ops[0].value, ops[1].value);
6517 }
6518
6519 /* Return true if VEC_PERM_EXPR can be expanded using SIMD extensions
6520    of the CPU.  SEL may be NULL, which stands for an unknown constant.  */
6521
6522 bool
6523 can_vec_perm_p (enum machine_mode mode, bool variable,
6524                 const unsigned char *sel)
6525 {
6526   enum machine_mode qimode;
6527
6528   /* If the target doesn't implement a vector mode for the vector type,
6529      then no operations are supported.  */
6530   if (!VECTOR_MODE_P (mode))
6531     return false;
6532
6533   if (!variable)
6534     {
6535       if (direct_optab_handler (vec_perm_const_optab, mode) != CODE_FOR_nothing
6536           && (sel == NULL
6537               || targetm.vectorize.vec_perm_const_ok == NULL
6538               || targetm.vectorize.vec_perm_const_ok (mode, sel)))
6539         return true;
6540     }
6541
6542   if (direct_optab_handler (vec_perm_optab, mode) != CODE_FOR_nothing)
6543     return true;
6544
6545   /* We allow fallback to a QI vector mode, and adjust the mask.  */
6546   if (GET_MODE_INNER (mode) == QImode)
6547     return false;
6548   qimode = mode_for_vector (QImode, GET_MODE_SIZE (mode));
6549   if (!VECTOR_MODE_P (qimode))
6550     return false;
6551
6552   /* ??? For completeness, we ought to check the QImode version of
6553       vec_perm_const_optab.  But all users of this implicit lowering
6554       feature implement the variable vec_perm_optab.  */
6555   if (direct_optab_handler (vec_perm_optab, qimode) == CODE_FOR_nothing)
6556     return false;
6557
6558   /* In order to support the lowering of variable permutations,
6559      we need to support shifts and adds.  */
6560   if (variable)
6561     {
6562       if (GET_MODE_UNIT_SIZE (mode) > 2
6563           && optab_handler (ashl_optab, mode) == CODE_FOR_nothing
6564           && optab_handler (vashl_optab, mode) == CODE_FOR_nothing)
6565         return false;
6566       if (optab_handler (add_optab, qimode) == CODE_FOR_nothing)
6567         return false;
6568     }
6569
6570   return true;
6571 }
6572
6573 /* A subroutine of expand_vec_perm for expanding one vec_perm insn.  */
6574
6575 static rtx
6576 expand_vec_perm_1 (enum insn_code icode, rtx target,
6577                    rtx v0, rtx v1, rtx sel)
6578 {
6579   enum machine_mode tmode = GET_MODE (target);
6580   enum machine_mode smode = GET_MODE (sel);
6581   struct expand_operand ops[4];
6582
6583   create_output_operand (&ops[0], target, tmode);
6584   create_input_operand (&ops[3], sel, smode);
6585
6586   /* Make an effort to preserve v0 == v1.  The target expander is able to
6587      rely on this to determine if we're permuting a single input operand.  */
6588   if (rtx_equal_p (v0, v1))
6589     {
6590       if (!insn_operand_matches (icode, 1, v0))
6591         v0 = force_reg (tmode, v0);
6592       gcc_checking_assert (insn_operand_matches (icode, 1, v0));
6593       gcc_checking_assert (insn_operand_matches (icode, 2, v0));
6594
6595       create_fixed_operand (&ops[1], v0);
6596       create_fixed_operand (&ops[2], v0);
6597     }
6598   else
6599     {
6600       create_input_operand (&ops[1], v0, tmode);
6601       create_input_operand (&ops[2], v1, tmode);
6602     }
6603
6604   if (maybe_expand_insn (icode, 4, ops))
6605     return ops[0].value;
6606   return NULL_RTX;
6607 }
6608
6609 /* Generate instructions for vec_perm optab given its mode
6610    and three operands.  */
6611
6612 rtx
6613 expand_vec_perm (enum machine_mode mode, rtx v0, rtx v1, rtx sel, rtx target)
6614 {
6615   enum insn_code icode;
6616   enum machine_mode qimode;
6617   unsigned int i, w, e, u;
6618   rtx tmp, sel_qi = NULL;
6619   rtvec vec;
6620
6621   if (!target || GET_MODE (target) != mode)
6622     target = gen_reg_rtx (mode);
6623
6624   w = GET_MODE_SIZE (mode);
6625   e = GET_MODE_NUNITS (mode);
6626   u = GET_MODE_UNIT_SIZE (mode);
6627
6628   /* Set QIMODE to a different vector mode with byte elements.
6629      If no such mode, or if MODE already has byte elements, use VOIDmode.  */
6630   qimode = VOIDmode;
6631   if (GET_MODE_INNER (mode) != QImode)
6632     {
6633       qimode = mode_for_vector (QImode, w);
6634       if (!VECTOR_MODE_P (qimode))
6635         qimode = VOIDmode;
6636     }
6637
6638   /* If the input is a constant, expand it specially.  */
6639   gcc_assert (GET_MODE_CLASS (GET_MODE (sel)) == MODE_VECTOR_INT);
6640   if (GET_CODE (sel) == CONST_VECTOR)
6641     {
6642       icode = direct_optab_handler (vec_perm_const_optab, mode);
6643       if (icode != CODE_FOR_nothing)
6644         {
6645           tmp = expand_vec_perm_1 (icode, target, v0, v1, sel);
6646           if (tmp)
6647             return tmp;
6648         }
6649
6650       /* Fall back to a constant byte-based permutation.  */
6651       if (qimode != VOIDmode)
6652         {
6653           vec = rtvec_alloc (w);
6654           for (i = 0; i < e; ++i)
6655             {
6656               unsigned int j, this_e;
6657
6658               this_e = INTVAL (CONST_VECTOR_ELT (sel, i));
6659               this_e &= 2 * e - 1;
6660               this_e *= u;
6661
6662               for (j = 0; j < u; ++j)
6663                 RTVEC_ELT (vec, i * u + j) = GEN_INT (this_e + j);
6664             }
6665           sel_qi = gen_rtx_CONST_VECTOR (qimode, vec);
6666
6667           icode = direct_optab_handler (vec_perm_const_optab, qimode);
6668           if (icode != CODE_FOR_nothing)
6669             {
6670               tmp = mode != qimode ? gen_reg_rtx (qimode) : target;
6671               tmp = expand_vec_perm_1 (icode, tmp, gen_lowpart (qimode, v0),
6672                                        gen_lowpart (qimode, v1), sel_qi);
6673               if (tmp)
6674                 return gen_lowpart (mode, tmp);
6675             }
6676         }
6677     }
6678
6679   /* Otherwise expand as a fully variable permuation.  */
6680   icode = direct_optab_handler (vec_perm_optab, mode);
6681   if (icode != CODE_FOR_nothing)
6682     {
6683       tmp = expand_vec_perm_1 (icode, target, v0, v1, sel);
6684       if (tmp)
6685         return tmp;
6686     }
6687
6688   /* As a special case to aid several targets, lower the element-based
6689      permutation to a byte-based permutation and try again.  */
6690   if (qimode == VOIDmode)
6691     return NULL_RTX;
6692   icode = direct_optab_handler (vec_perm_optab, qimode);
6693   if (icode == CODE_FOR_nothing)
6694     return NULL_RTX;
6695
6696   if (sel_qi == NULL)
6697     {
6698       /* Multiply each element by its byte size.  */
6699       enum machine_mode selmode = GET_MODE (sel);
6700       if (u == 2)
6701         sel = expand_simple_binop (selmode, PLUS, sel, sel,
6702                                    sel, 0, OPTAB_DIRECT);
6703       else
6704         sel = expand_simple_binop (selmode, ASHIFT, sel,
6705                                    GEN_INT (exact_log2 (u)),
6706                                    sel, 0, OPTAB_DIRECT);
6707       gcc_assert (sel != NULL);
6708
6709       /* Broadcast the low byte each element into each of its bytes.  */
6710       vec = rtvec_alloc (w);
6711       for (i = 0; i < w; ++i)
6712         {
6713           int this_e = i / u * u;
6714           if (BYTES_BIG_ENDIAN)
6715             this_e += u - 1;
6716           RTVEC_ELT (vec, i) = GEN_INT (this_e);
6717         }
6718       tmp = gen_rtx_CONST_VECTOR (qimode, vec);
6719       sel = gen_lowpart (qimode, sel);
6720       sel = expand_vec_perm (qimode, sel, sel, tmp, NULL);
6721       gcc_assert (sel != NULL);
6722
6723       /* Add the byte offset to each byte element.  */
6724       /* Note that the definition of the indicies here is memory ordering,
6725          so there should be no difference between big and little endian.  */
6726       vec = rtvec_alloc (w);
6727       for (i = 0; i < w; ++i)
6728         RTVEC_ELT (vec, i) = GEN_INT (i % u);
6729       tmp = gen_rtx_CONST_VECTOR (qimode, vec);
6730       sel_qi = expand_simple_binop (qimode, PLUS, sel, tmp,
6731                                     sel, 0, OPTAB_DIRECT);
6732       gcc_assert (sel_qi != NULL);
6733     }
6734
6735   tmp = mode != qimode ? gen_reg_rtx (qimode) : target;
6736   tmp = expand_vec_perm_1 (icode, tmp, gen_lowpart (qimode, v0),
6737                            gen_lowpart (qimode, v1), sel_qi);
6738   if (tmp)
6739     tmp = gen_lowpart (mode, tmp);
6740   return tmp;
6741 }
6742
6743 /* Return insn code for a conditional operator with a comparison in
6744    mode CMODE, unsigned if UNS is true, resulting in a value of mode VMODE.  */
6745
6746 static inline enum insn_code
6747 get_vcond_icode (enum machine_mode vmode, enum machine_mode cmode, bool uns)
6748 {
6749   enum insn_code icode = CODE_FOR_nothing;
6750   if (uns)
6751     icode = convert_optab_handler (vcondu_optab, vmode, cmode);
6752   else
6753     icode = convert_optab_handler (vcond_optab, vmode, cmode);
6754   return icode;
6755 }
6756
6757 /* Return TRUE iff, appropriate vector insns are available
6758    for vector cond expr with vector type VALUE_TYPE and a comparison
6759    with operand vector types in CMP_OP_TYPE.  */
6760
6761 bool
6762 expand_vec_cond_expr_p (tree value_type, tree cmp_op_type)
6763 {
6764   enum machine_mode value_mode = TYPE_MODE (value_type);
6765   enum machine_mode cmp_op_mode = TYPE_MODE (cmp_op_type);
6766   if (GET_MODE_SIZE (value_mode) != GET_MODE_SIZE (cmp_op_mode)
6767       || GET_MODE_NUNITS (value_mode) != GET_MODE_NUNITS (cmp_op_mode)
6768       || get_vcond_icode (TYPE_MODE (value_type), TYPE_MODE (cmp_op_type),
6769                           TYPE_UNSIGNED (cmp_op_type)) == CODE_FOR_nothing)
6770     return false;
6771   return true;
6772 }
6773
6774 /* Generate insns for a VEC_COND_EXPR, given its TYPE and its
6775    three operands.  */
6776
6777 rtx
6778 expand_vec_cond_expr (tree vec_cond_type, tree op0, tree op1, tree op2,
6779                       rtx target)
6780 {
6781   struct expand_operand ops[6];
6782   enum insn_code icode;
6783   rtx comparison, rtx_op1, rtx_op2;
6784   enum machine_mode mode = TYPE_MODE (vec_cond_type);
6785   enum machine_mode cmp_op_mode;
6786   bool unsignedp;
6787   tree op0a, op0b;
6788   enum tree_code tcode;
6789
6790   if (COMPARISON_CLASS_P (op0))
6791     {
6792       op0a = TREE_OPERAND (op0, 0);
6793       op0b = TREE_OPERAND (op0, 1);
6794       tcode = TREE_CODE (op0);
6795     }
6796   else
6797     {
6798       /* Fake op0 < 0.  */
6799       gcc_assert (!TYPE_UNSIGNED (TREE_TYPE (op0)));
6800       op0a = op0;
6801       op0b = build_zero_cst (TREE_TYPE (op0));
6802       tcode = LT_EXPR;
6803     }
6804   unsignedp = TYPE_UNSIGNED (TREE_TYPE (op0a));
6805   cmp_op_mode = TYPE_MODE (TREE_TYPE (op0a));
6806
6807
6808   gcc_assert (GET_MODE_SIZE (mode) == GET_MODE_SIZE (cmp_op_mode)
6809               && GET_MODE_NUNITS (mode) == GET_MODE_NUNITS (cmp_op_mode));
6810
6811   icode = get_vcond_icode (mode, cmp_op_mode, unsignedp);
6812   if (icode == CODE_FOR_nothing)
6813     return 0;
6814
6815   comparison = vector_compare_rtx (tcode, op0a, op0b, unsignedp, icode);
6816   rtx_op1 = expand_normal (op1);
6817   rtx_op2 = expand_normal (op2);
6818
6819   create_output_operand (&ops[0], target, mode);
6820   create_input_operand (&ops[1], rtx_op1, mode);
6821   create_input_operand (&ops[2], rtx_op2, mode);
6822   create_fixed_operand (&ops[3], comparison);
6823   create_fixed_operand (&ops[4], XEXP (comparison, 0));
6824   create_fixed_operand (&ops[5], XEXP (comparison, 1));
6825   expand_insn (icode, 6, ops);
6826   return ops[0].value;
6827 }
6828
6829 /* Return non-zero if a highpart multiply is supported of can be synthisized.
6830    For the benefit of expand_mult_highpart, the return value is 1 for direct,
6831    2 for even/odd widening, and 3 for hi/lo widening.  */
6832
6833 int
6834 can_mult_highpart_p (enum machine_mode mode, bool uns_p)
6835 {
6836   optab op;
6837   unsigned char *sel;
6838   unsigned i, nunits;
6839
6840   op = uns_p ? umul_highpart_optab : smul_highpart_optab;
6841   if (optab_handler (op, mode) != CODE_FOR_nothing)
6842     return 1;
6843
6844   /* If the mode is an integral vector, synth from widening operations.  */
6845   if (GET_MODE_CLASS (mode) != MODE_VECTOR_INT)
6846     return 0;
6847
6848   nunits = GET_MODE_NUNITS (mode);
6849   sel = XALLOCAVEC (unsigned char, nunits);
6850
6851   op = uns_p ? vec_widen_umult_even_optab : vec_widen_smult_even_optab;
6852   if (optab_handler (op, mode) != CODE_FOR_nothing)
6853     {
6854       op = uns_p ? vec_widen_umult_odd_optab : vec_widen_smult_odd_optab;
6855       if (optab_handler (op, mode) != CODE_FOR_nothing)
6856         {
6857           for (i = 0; i < nunits; ++i)
6858             sel[i] = !BYTES_BIG_ENDIAN + (i & ~1) + ((i & 1) ? nunits : 0);
6859           if (can_vec_perm_p (mode, false, sel))
6860             return 2;
6861         }
6862     }
6863
6864   op = uns_p ? vec_widen_umult_hi_optab : vec_widen_smult_hi_optab;
6865   if (optab_handler (op, mode) != CODE_FOR_nothing)
6866     {
6867       op = uns_p ? vec_widen_umult_lo_optab : vec_widen_smult_lo_optab;
6868       if (optab_handler (op, mode) != CODE_FOR_nothing)
6869         {
6870           for (i = 0; i < nunits; ++i)
6871             sel[i] = 2 * i + (BYTES_BIG_ENDIAN ? 0 : 1);
6872           if (can_vec_perm_p (mode, false, sel))
6873             return 3;
6874         }
6875     }
6876
6877   return 0;
6878 }
6879
6880 /* Expand a highpart multiply.  */
6881
6882 rtx
6883 expand_mult_highpart (enum machine_mode mode, rtx op0, rtx op1,
6884                       rtx target, bool uns_p)
6885 {
6886   struct expand_operand eops[3];
6887   enum insn_code icode;
6888   int method, i, nunits;
6889   enum machine_mode wmode;
6890   rtx m1, m2, perm;
6891   optab tab1, tab2;
6892   rtvec v;
6893
6894   method = can_mult_highpart_p (mode, uns_p);
6895   switch (method)
6896     {
6897     case 0:
6898       return NULL_RTX;
6899     case 1:
6900       tab1 = uns_p ? umul_highpart_optab : smul_highpart_optab;
6901       return expand_binop (mode, tab1, op0, op1, target, uns_p,
6902                            OPTAB_LIB_WIDEN);
6903     case 2:
6904       tab1 = uns_p ? vec_widen_umult_even_optab : vec_widen_smult_even_optab;
6905       tab2 = uns_p ? vec_widen_umult_odd_optab : vec_widen_smult_odd_optab;
6906       break;
6907     case 3:
6908       tab1 = uns_p ? vec_widen_umult_lo_optab : vec_widen_smult_lo_optab;
6909       tab2 = uns_p ? vec_widen_umult_hi_optab : vec_widen_smult_hi_optab;
6910       if (BYTES_BIG_ENDIAN)
6911         {
6912           optab t = tab1;
6913           tab1 = tab2;
6914           tab2 = t;
6915         }
6916       break;
6917     default:
6918       gcc_unreachable ();
6919     }
6920
6921   icode = optab_handler (tab1, mode);
6922   nunits = GET_MODE_NUNITS (mode);
6923   wmode = insn_data[icode].operand[0].mode;
6924   gcc_checking_assert (2 * GET_MODE_NUNITS (wmode) == nunits);
6925   gcc_checking_assert (GET_MODE_SIZE (wmode) == GET_MODE_SIZE (mode));
6926
6927   create_output_operand (&eops[0], gen_reg_rtx (wmode), wmode);
6928   create_input_operand (&eops[1], op0, mode);
6929   create_input_operand (&eops[2], op1, mode);
6930   expand_insn (icode, 3, eops);
6931   m1 = gen_lowpart (mode, eops[0].value);
6932
6933   create_output_operand (&eops[0], gen_reg_rtx (wmode), wmode);
6934   create_input_operand (&eops[1], op0, mode);
6935   create_input_operand (&eops[2], op1, mode);
6936   expand_insn (optab_handler (tab2, mode), 3, eops);
6937   m2 = gen_lowpart (mode, eops[0].value);
6938
6939   v = rtvec_alloc (nunits);
6940   if (method == 2)
6941     {
6942       for (i = 0; i < nunits; ++i)
6943         RTVEC_ELT (v, i) = GEN_INT (!BYTES_BIG_ENDIAN + (i & ~1)
6944                                     + ((i & 1) ? nunits : 0));
6945     }
6946   else
6947     {
6948       for (i = 0; i < nunits; ++i)
6949         RTVEC_ELT (v, i) = GEN_INT (2 * i + (BYTES_BIG_ENDIAN ? 0 : 1));
6950     }
6951   perm = gen_rtx_CONST_VECTOR (mode, v);
6952
6953   return expand_vec_perm (mode, m1, m2, perm, target);
6954 }
6955
6956 /* Return true if target supports vector masked load/store for mode.  */
6957 bool
6958 can_vec_mask_load_store_p (enum machine_mode mode, bool is_load)
6959 {
6960   optab op = is_load ? maskload_optab : maskstore_optab;
6961   enum machine_mode vmode;
6962   unsigned int vector_sizes;
6963
6964   /* If mode is vector mode, check it directly.  */
6965   if (VECTOR_MODE_P (mode))
6966     return optab_handler (op, mode) != CODE_FOR_nothing;
6967
6968   /* Otherwise, return true if there is some vector mode with
6969      the mask load/store supported.  */
6970
6971   /* See if there is any chance the mask load or store might be
6972      vectorized.  If not, punt.  */
6973   vmode = targetm.vectorize.preferred_simd_mode (mode);
6974   if (!VECTOR_MODE_P (vmode))
6975     return false;
6976
6977   if (optab_handler (op, vmode) != CODE_FOR_nothing)
6978     return true;
6979
6980   vector_sizes = targetm.vectorize.autovectorize_vector_sizes ();
6981   while (vector_sizes != 0)
6982     {
6983       unsigned int cur = 1 << floor_log2 (vector_sizes);
6984       vector_sizes &= ~cur;
6985       if (cur <= GET_MODE_SIZE (mode))
6986         continue;
6987       vmode = mode_for_vector (mode, cur / GET_MODE_SIZE (mode));
6988       if (VECTOR_MODE_P (vmode)
6989           && optab_handler (op, vmode) != CODE_FOR_nothing)
6990         return true;
6991     }
6992   return false;
6993 }
6994 \f
6995 /* Return true if there is a compare_and_swap pattern.  */
6996
6997 bool
6998 can_compare_and_swap_p (enum machine_mode mode, bool allow_libcall)
6999 {
7000   enum insn_code icode;
7001
7002   /* Check for __atomic_compare_and_swap.  */
7003   icode = direct_optab_handler (atomic_compare_and_swap_optab, mode);
7004   if (icode != CODE_FOR_nothing)
7005     return true;
7006
7007   /* Check for __sync_compare_and_swap.  */
7008   icode = optab_handler (sync_compare_and_swap_optab, mode);
7009   if (icode != CODE_FOR_nothing)
7010     return true;
7011   if (allow_libcall && optab_libfunc (sync_compare_and_swap_optab, mode))
7012     return true;
7013
7014   /* No inline compare and swap.  */
7015   return false;
7016 }
7017
7018 /* Return true if an atomic exchange can be performed.  */
7019
7020 bool
7021 can_atomic_exchange_p (enum machine_mode mode, bool allow_libcall)
7022 {
7023   enum insn_code icode;
7024
7025   /* Check for __atomic_exchange.  */
7026   icode = direct_optab_handler (atomic_exchange_optab, mode);
7027   if (icode != CODE_FOR_nothing)
7028     return true;
7029
7030   /* Don't check __sync_test_and_set, as on some platforms that
7031      has reduced functionality.  Targets that really do support
7032      a proper exchange should simply be updated to the __atomics.  */
7033
7034   return can_compare_and_swap_p (mode, allow_libcall);
7035 }
7036
7037
7038 /* Helper function to find the MODE_CC set in a sync_compare_and_swap
7039    pattern.  */
7040
7041 static void
7042 find_cc_set (rtx x, const_rtx pat, void *data)
7043 {
7044   if (REG_P (x) && GET_MODE_CLASS (GET_MODE (x)) == MODE_CC
7045       && GET_CODE (pat) == SET)
7046     {
7047       rtx *p_cc_reg = (rtx *) data;
7048       gcc_assert (!*p_cc_reg);
7049       *p_cc_reg = x;
7050     }
7051 }
7052
7053 /* This is a helper function for the other atomic operations.  This function
7054    emits a loop that contains SEQ that iterates until a compare-and-swap
7055    operation at the end succeeds.  MEM is the memory to be modified.  SEQ is
7056    a set of instructions that takes a value from OLD_REG as an input and
7057    produces a value in NEW_REG as an output.  Before SEQ, OLD_REG will be
7058    set to the current contents of MEM.  After SEQ, a compare-and-swap will
7059    attempt to update MEM with NEW_REG.  The function returns true when the
7060    loop was generated successfully.  */
7061
7062 static bool
7063 expand_compare_and_swap_loop (rtx mem, rtx old_reg, rtx new_reg, rtx seq)
7064 {
7065   enum machine_mode mode = GET_MODE (mem);
7066   rtx label, cmp_reg, success, oldval;
7067
7068   /* The loop we want to generate looks like
7069
7070         cmp_reg = mem;
7071       label:
7072         old_reg = cmp_reg;
7073         seq;
7074         (success, cmp_reg) = compare-and-swap(mem, old_reg, new_reg)
7075         if (success)
7076           goto label;
7077
7078      Note that we only do the plain load from memory once.  Subsequent
7079      iterations use the value loaded by the compare-and-swap pattern.  */
7080
7081   label = gen_label_rtx ();
7082   cmp_reg = gen_reg_rtx (mode);
7083
7084   emit_move_insn (cmp_reg, mem);
7085   emit_label (label);
7086   emit_move_insn (old_reg, cmp_reg);
7087   if (seq)
7088     emit_insn (seq);
7089
7090   success = NULL_RTX;
7091   oldval = cmp_reg;
7092   if (!expand_atomic_compare_and_swap (&success, &oldval, mem, old_reg,
7093                                        new_reg, false, MEMMODEL_SEQ_CST,
7094                                        MEMMODEL_RELAXED))
7095     return false;
7096
7097   if (oldval != cmp_reg)
7098     emit_move_insn (cmp_reg, oldval);
7099
7100   /* Mark this jump predicted not taken.  */
7101   emit_cmp_and_jump_insns (success, const0_rtx, EQ, const0_rtx,
7102                            GET_MODE (success), 1, label, 0);
7103   return true;
7104 }
7105
7106
7107 /* This function tries to emit an atomic_exchange intruction.  VAL is written
7108    to *MEM using memory model MODEL. The previous contents of *MEM are returned,
7109    using TARGET if possible.  */
7110
7111 static rtx
7112 maybe_emit_atomic_exchange (rtx target, rtx mem, rtx val, enum memmodel model)
7113 {
7114   enum machine_mode mode = GET_MODE (mem);
7115   enum insn_code icode;
7116
7117   /* If the target supports the exchange directly, great.  */
7118   icode = direct_optab_handler (atomic_exchange_optab, mode);
7119   if (icode != CODE_FOR_nothing)
7120     {
7121       struct expand_operand ops[4];
7122
7123       create_output_operand (&ops[0], target, mode);
7124       create_fixed_operand (&ops[1], mem);
7125       create_input_operand (&ops[2], val, mode);
7126       create_integer_operand (&ops[3], model);
7127       if (maybe_expand_insn (icode, 4, ops))
7128         return ops[0].value;
7129     }
7130
7131   return NULL_RTX;
7132 }
7133
7134 /* This function tries to implement an atomic exchange operation using
7135    __sync_lock_test_and_set. VAL is written to *MEM using memory model MODEL.
7136    The previous contents of *MEM are returned, using TARGET if possible.
7137    Since this instructionn is an acquire barrier only, stronger memory
7138    models may require additional barriers to be emitted.  */
7139
7140 static rtx
7141 maybe_emit_sync_lock_test_and_set (rtx target, rtx mem, rtx val,
7142                                    enum memmodel model)
7143 {
7144   enum machine_mode mode = GET_MODE (mem);
7145   enum insn_code icode;
7146   rtx last_insn = get_last_insn ();
7147
7148   icode = optab_handler (sync_lock_test_and_set_optab, mode);
7149
7150   /* Legacy sync_lock_test_and_set is an acquire barrier.  If the pattern
7151      exists, and the memory model is stronger than acquire, add a release
7152      barrier before the instruction.  */
7153
7154   if ((model & MEMMODEL_MASK) == MEMMODEL_SEQ_CST
7155       || (model & MEMMODEL_MASK) == MEMMODEL_RELEASE
7156       || (model & MEMMODEL_MASK) == MEMMODEL_ACQ_REL)
7157     expand_mem_thread_fence (model);
7158
7159   if (icode != CODE_FOR_nothing)
7160     {
7161       struct expand_operand ops[3];
7162       create_output_operand (&ops[0], target, mode);
7163       create_fixed_operand (&ops[1], mem);
7164       create_input_operand (&ops[2], val, mode);
7165       if (maybe_expand_insn (icode, 3, ops))
7166         return ops[0].value;
7167     }
7168
7169   /* If an external test-and-set libcall is provided, use that instead of
7170      any external compare-and-swap that we might get from the compare-and-
7171      swap-loop expansion later.  */
7172   if (!can_compare_and_swap_p (mode, false))
7173     {
7174       rtx libfunc = optab_libfunc (sync_lock_test_and_set_optab, mode);
7175       if (libfunc != NULL)
7176         {
7177           rtx addr;
7178
7179           addr = convert_memory_address (ptr_mode, XEXP (mem, 0));
7180           return emit_library_call_value (libfunc, NULL_RTX, LCT_NORMAL,
7181                                           mode, 2, addr, ptr_mode,
7182                                           val, mode);
7183         }
7184     }
7185
7186   /* If the test_and_set can't be emitted, eliminate any barrier that might
7187      have been emitted.  */
7188   delete_insns_since (last_insn);
7189   return NULL_RTX;
7190 }
7191
7192 /* This function tries to implement an atomic exchange operation using a
7193    compare_and_swap loop. VAL is written to *MEM.  The previous contents of
7194    *MEM are returned, using TARGET if possible.  No memory model is required
7195    since a compare_and_swap loop is seq-cst.  */
7196
7197 static rtx
7198 maybe_emit_compare_and_swap_exchange_loop (rtx target, rtx mem, rtx val)
7199 {
7200   enum machine_mode mode = GET_MODE (mem);
7201
7202   if (can_compare_and_swap_p (mode, true))
7203     {
7204       if (!target || !register_operand (target, mode))
7205         target = gen_reg_rtx (mode);
7206       if (expand_compare_and_swap_loop (mem, target, val, NULL_RTX))
7207         return target;
7208     }
7209
7210   return NULL_RTX;
7211 }
7212
7213 /* This function tries to implement an atomic test-and-set operation
7214    using the atomic_test_and_set instruction pattern.  A boolean value
7215    is returned from the operation, using TARGET if possible.  */
7216
7217 #ifndef HAVE_atomic_test_and_set
7218 #define HAVE_atomic_test_and_set 0
7219 #define CODE_FOR_atomic_test_and_set CODE_FOR_nothing
7220 #endif
7221
7222 static rtx
7223 maybe_emit_atomic_test_and_set (rtx target, rtx mem, enum memmodel model)
7224 {
7225   enum machine_mode pat_bool_mode;
7226   struct expand_operand ops[3];
7227
7228   if (!HAVE_atomic_test_and_set)
7229     return NULL_RTX;
7230
7231   /* While we always get QImode from __atomic_test_and_set, we get
7232      other memory modes from __sync_lock_test_and_set.  Note that we
7233      use no endian adjustment here.  This matches the 4.6 behavior
7234      in the Sparc backend.  */
7235   gcc_checking_assert
7236     (insn_data[CODE_FOR_atomic_test_and_set].operand[1].mode == QImode);
7237   if (GET_MODE (mem) != QImode)
7238     mem = adjust_address_nv (mem, QImode, 0);
7239
7240   pat_bool_mode = insn_data[CODE_FOR_atomic_test_and_set].operand[0].mode;
7241   create_output_operand (&ops[0], target, pat_bool_mode);
7242   create_fixed_operand (&ops[1], mem);
7243   create_integer_operand (&ops[2], model);
7244
7245   if (maybe_expand_insn (CODE_FOR_atomic_test_and_set, 3, ops))
7246     return ops[0].value;
7247   return NULL_RTX;
7248 }
7249
7250 /* This function expands the legacy _sync_lock test_and_set operation which is
7251    generally an atomic exchange.  Some limited targets only allow the
7252    constant 1 to be stored.  This is an ACQUIRE operation.
7253
7254    TARGET is an optional place to stick the return value.
7255    MEM is where VAL is stored.  */
7256
7257 rtx
7258 expand_sync_lock_test_and_set (rtx target, rtx mem, rtx val)
7259 {
7260   rtx ret;
7261
7262   /* Try an atomic_exchange first.  */
7263   ret = maybe_emit_atomic_exchange (target, mem, val, MEMMODEL_ACQUIRE);
7264   if (ret)
7265     return ret;
7266
7267   ret = maybe_emit_sync_lock_test_and_set (target, mem, val, MEMMODEL_ACQUIRE);
7268   if (ret)
7269     return ret;
7270
7271   ret = maybe_emit_compare_and_swap_exchange_loop (target, mem, val);
7272   if (ret)
7273     return ret;
7274
7275   /* If there are no other options, try atomic_test_and_set if the value
7276      being stored is 1.  */
7277   if (val == const1_rtx)
7278     ret = maybe_emit_atomic_test_and_set (target, mem, MEMMODEL_ACQUIRE);
7279
7280   return ret;
7281 }
7282
7283 /* This function expands the atomic test_and_set operation:
7284    atomically store a boolean TRUE into MEM and return the previous value.
7285
7286    MEMMODEL is the memory model variant to use.
7287    TARGET is an optional place to stick the return value.  */
7288
7289 rtx
7290 expand_atomic_test_and_set (rtx target, rtx mem, enum memmodel model)
7291 {
7292   enum machine_mode mode = GET_MODE (mem);
7293   rtx ret, trueval, subtarget;
7294
7295   ret = maybe_emit_atomic_test_and_set (target, mem, model);
7296   if (ret)
7297     return ret;
7298
7299   /* Be binary compatible with non-default settings of trueval, and different
7300      cpu revisions.  E.g. one revision may have atomic-test-and-set, but
7301      another only has atomic-exchange.  */
7302   if (targetm.atomic_test_and_set_trueval == 1)
7303     {
7304       trueval = const1_rtx;
7305       subtarget = target ? target : gen_reg_rtx (mode);
7306     }
7307   else
7308     {
7309       trueval = gen_int_mode (targetm.atomic_test_and_set_trueval, mode);
7310       subtarget = gen_reg_rtx (mode);
7311     }
7312
7313   /* Try the atomic-exchange optab...  */
7314   ret = maybe_emit_atomic_exchange (subtarget, mem, trueval, model);
7315
7316   /* ... then an atomic-compare-and-swap loop ... */
7317   if (!ret)
7318     ret = maybe_emit_compare_and_swap_exchange_loop (subtarget, mem, trueval);
7319
7320   /* ... before trying the vaguely defined legacy lock_test_and_set. */
7321   if (!ret)
7322     ret = maybe_emit_sync_lock_test_and_set (subtarget, mem, trueval, model);
7323
7324   /* Recall that the legacy lock_test_and_set optab was allowed to do magic
7325      things with the value 1.  Thus we try again without trueval.  */
7326   if (!ret && targetm.atomic_test_and_set_trueval != 1)
7327     ret = maybe_emit_sync_lock_test_and_set (subtarget, mem, const1_rtx, model);
7328
7329   /* Failing all else, assume a single threaded environment and simply
7330      perform the operation.  */
7331   if (!ret)
7332     {
7333       emit_move_insn (subtarget, mem);
7334       emit_move_insn (mem, trueval);
7335       ret = subtarget;
7336     }
7337
7338   /* Recall that have to return a boolean value; rectify if trueval
7339      is not exactly one.  */
7340   if (targetm.atomic_test_and_set_trueval != 1)
7341     ret = emit_store_flag_force (target, NE, ret, const0_rtx, mode, 0, 1);
7342
7343   return ret;
7344 }
7345
7346 /* This function expands the atomic exchange operation:
7347    atomically store VAL in MEM and return the previous value in MEM.
7348
7349    MEMMODEL is the memory model variant to use.
7350    TARGET is an optional place to stick the return value.  */
7351
7352 rtx
7353 expand_atomic_exchange (rtx target, rtx mem, rtx val, enum memmodel model)
7354 {
7355   rtx ret;
7356
7357   ret = maybe_emit_atomic_exchange (target, mem, val, model);
7358
7359   /* Next try a compare-and-swap loop for the exchange.  */
7360   if (!ret)
7361     ret = maybe_emit_compare_and_swap_exchange_loop (target, mem, val);
7362
7363   return ret;
7364 }
7365
7366 /* This function expands the atomic compare exchange operation:
7367
7368    *PTARGET_BOOL is an optional place to store the boolean success/failure.
7369    *PTARGET_OVAL is an optional place to store the old value from memory.
7370    Both target parameters may be NULL to indicate that we do not care about
7371    that return value.  Both target parameters are updated on success to
7372    the actual location of the corresponding result.
7373
7374    MEMMODEL is the memory model variant to use.
7375
7376    The return value of the function is true for success.  */
7377
7378 bool
7379 expand_atomic_compare_and_swap (rtx *ptarget_bool, rtx *ptarget_oval,
7380                                 rtx mem, rtx expected, rtx desired,
7381                                 bool is_weak, enum memmodel succ_model,
7382                                 enum memmodel fail_model)
7383 {
7384   enum machine_mode mode = GET_MODE (mem);
7385   struct expand_operand ops[8];
7386   enum insn_code icode;
7387   rtx target_oval, target_bool = NULL_RTX;
7388   rtx libfunc;
7389
7390   /* Load expected into a register for the compare and swap.  */
7391   if (MEM_P (expected))
7392     expected = copy_to_reg (expected);
7393
7394   /* Make sure we always have some place to put the return oldval.
7395      Further, make sure that place is distinct from the input expected,
7396      just in case we need that path down below.  */
7397   if (ptarget_oval == NULL
7398       || (target_oval = *ptarget_oval) == NULL
7399       || reg_overlap_mentioned_p (expected, target_oval))
7400     target_oval = gen_reg_rtx (mode);
7401
7402   icode = direct_optab_handler (atomic_compare_and_swap_optab, mode);
7403   if (icode != CODE_FOR_nothing)
7404     {
7405       enum machine_mode bool_mode = insn_data[icode].operand[0].mode;
7406
7407       /* Make sure we always have a place for the bool operand.  */
7408       if (ptarget_bool == NULL
7409           || (target_bool = *ptarget_bool) == NULL
7410           || GET_MODE (target_bool) != bool_mode)
7411         target_bool = gen_reg_rtx (bool_mode);
7412
7413       /* Emit the compare_and_swap.  */
7414       create_output_operand (&ops[0], target_bool, bool_mode);
7415       create_output_operand (&ops[1], target_oval, mode);
7416       create_fixed_operand (&ops[2], mem);
7417       create_input_operand (&ops[3], expected, mode);
7418       create_input_operand (&ops[4], desired, mode);
7419       create_integer_operand (&ops[5], is_weak);
7420       create_integer_operand (&ops[6], succ_model);
7421       create_integer_operand (&ops[7], fail_model);
7422       if (maybe_expand_insn (icode, 8, ops))
7423         {
7424           /* Return success/failure.  */
7425           target_bool = ops[0].value;
7426           target_oval = ops[1].value;
7427           goto success;
7428         }
7429     }
7430
7431   /* Otherwise fall back to the original __sync_val_compare_and_swap
7432      which is always seq-cst.  */
7433   icode = optab_handler (sync_compare_and_swap_optab, mode);
7434   if (icode != CODE_FOR_nothing)
7435     {
7436       rtx cc_reg;
7437
7438       create_output_operand (&ops[0], target_oval, mode);
7439       create_fixed_operand (&ops[1], mem);
7440       create_input_operand (&ops[2], expected, mode);
7441       create_input_operand (&ops[3], desired, mode);
7442       if (!maybe_expand_insn (icode, 4, ops))
7443         return false;
7444
7445       target_oval = ops[0].value;
7446
7447       /* If the caller isn't interested in the boolean return value,
7448          skip the computation of it.  */
7449       if (ptarget_bool == NULL)
7450         goto success;
7451
7452       /* Otherwise, work out if the compare-and-swap succeeded.  */
7453       cc_reg = NULL_RTX;
7454       if (have_insn_for (COMPARE, CCmode))
7455         note_stores (PATTERN (get_last_insn ()), find_cc_set, &cc_reg);
7456       if (cc_reg)
7457         {
7458           target_bool = emit_store_flag_force (target_bool, EQ, cc_reg,
7459                                                const0_rtx, VOIDmode, 0, 1);
7460           goto success;
7461         }
7462       goto success_bool_from_val;
7463     }
7464
7465   /* Also check for library support for __sync_val_compare_and_swap.  */
7466   libfunc = optab_libfunc (sync_compare_and_swap_optab, mode);
7467   if (libfunc != NULL)
7468     {
7469       rtx addr = convert_memory_address (ptr_mode, XEXP (mem, 0));
7470       target_oval = emit_library_call_value (libfunc, NULL_RTX, LCT_NORMAL,
7471                                              mode, 3, addr, ptr_mode,
7472                                              expected, mode, desired, mode);
7473
7474       /* Compute the boolean return value only if requested.  */
7475       if (ptarget_bool)
7476         goto success_bool_from_val;
7477       else
7478         goto success;
7479     }
7480
7481   /* Failure.  */
7482   return false;
7483
7484  success_bool_from_val:
7485    target_bool = emit_store_flag_force (target_bool, EQ, target_oval,
7486                                         expected, VOIDmode, 1, 1);
7487  success:
7488   /* Make sure that the oval output winds up where the caller asked.  */
7489   if (ptarget_oval)
7490     *ptarget_oval = target_oval;
7491   if (ptarget_bool)
7492     *ptarget_bool = target_bool;
7493   return true;
7494 }
7495
7496 /* Generate asm volatile("" : : : "memory") as the memory barrier.  */
7497
7498 static void
7499 expand_asm_memory_barrier (void)
7500 {
7501   rtx asm_op, clob;
7502
7503   asm_op = gen_rtx_ASM_OPERANDS (VOIDmode, empty_string, empty_string, 0,
7504                                  rtvec_alloc (0), rtvec_alloc (0),
7505                                  rtvec_alloc (0), UNKNOWN_LOCATION);
7506   MEM_VOLATILE_P (asm_op) = 1;
7507
7508   clob = gen_rtx_SCRATCH (VOIDmode);
7509   clob = gen_rtx_MEM (BLKmode, clob);
7510   clob = gen_rtx_CLOBBER (VOIDmode, clob);
7511
7512   emit_insn (gen_rtx_PARALLEL (VOIDmode, gen_rtvec (2, asm_op, clob)));
7513 }
7514
7515 /* This routine will either emit the mem_thread_fence pattern or issue a
7516    sync_synchronize to generate a fence for memory model MEMMODEL.  */
7517
7518 #ifndef HAVE_mem_thread_fence
7519 # define HAVE_mem_thread_fence 0
7520 # define gen_mem_thread_fence(x) (gcc_unreachable (), NULL_RTX)
7521 #endif
7522 #ifndef HAVE_memory_barrier
7523 # define HAVE_memory_barrier 0
7524 # define gen_memory_barrier()  (gcc_unreachable (), NULL_RTX)
7525 #endif
7526
7527 void
7528 expand_mem_thread_fence (enum memmodel model)
7529 {
7530   if (HAVE_mem_thread_fence)
7531     emit_insn (gen_mem_thread_fence (GEN_INT (model)));
7532   else if ((model & MEMMODEL_MASK) != MEMMODEL_RELAXED)
7533     {
7534       if (HAVE_memory_barrier)
7535         emit_insn (gen_memory_barrier ());
7536       else if (synchronize_libfunc != NULL_RTX)
7537         emit_library_call (synchronize_libfunc, LCT_NORMAL, VOIDmode, 0);
7538       else
7539         expand_asm_memory_barrier ();
7540     }
7541 }
7542
7543 /* This routine will either emit the mem_signal_fence pattern or issue a
7544    sync_synchronize to generate a fence for memory model MEMMODEL.  */
7545
7546 #ifndef HAVE_mem_signal_fence
7547 # define HAVE_mem_signal_fence 0
7548 # define gen_mem_signal_fence(x) (gcc_unreachable (), NULL_RTX)
7549 #endif
7550
7551 void
7552 expand_mem_signal_fence (enum memmodel model)
7553 {
7554   if (HAVE_mem_signal_fence)
7555     emit_insn (gen_mem_signal_fence (GEN_INT (model)));
7556   else if ((model & MEMMODEL_MASK) != MEMMODEL_RELAXED)
7557     {
7558       /* By default targets are coherent between a thread and the signal
7559          handler running on the same thread.  Thus this really becomes a
7560          compiler barrier, in that stores must not be sunk past
7561          (or raised above) a given point.  */
7562       expand_asm_memory_barrier ();
7563     }
7564 }
7565
7566 /* This function expands the atomic load operation:
7567    return the atomically loaded value in MEM.
7568
7569    MEMMODEL is the memory model variant to use.
7570    TARGET is an option place to stick the return value.  */
7571
7572 rtx
7573 expand_atomic_load (rtx target, rtx mem, enum memmodel model)
7574 {
7575   enum machine_mode mode = GET_MODE (mem);
7576   enum insn_code icode;
7577
7578   /* If the target supports the load directly, great.  */
7579   icode = direct_optab_handler (atomic_load_optab, mode);
7580   if (icode != CODE_FOR_nothing)
7581     {
7582       struct expand_operand ops[3];
7583
7584       create_output_operand (&ops[0], target, mode);
7585       create_fixed_operand (&ops[1], mem);
7586       create_integer_operand (&ops[2], model);
7587       if (maybe_expand_insn (icode, 3, ops))
7588         return ops[0].value;
7589     }
7590
7591   /* If the size of the object is greater than word size on this target,
7592      then we assume that a load will not be atomic.  */
7593   if (GET_MODE_PRECISION (mode) > BITS_PER_WORD)
7594     {
7595       /* Issue val = compare_and_swap (mem, 0, 0).
7596          This may cause the occasional harmless store of 0 when the value is
7597          already 0, but it seems to be OK according to the standards guys.  */
7598       if (expand_atomic_compare_and_swap (NULL, &target, mem, const0_rtx,
7599                                           const0_rtx, false, model, model))
7600         return target;
7601       else
7602       /* Otherwise there is no atomic load, leave the library call.  */
7603         return NULL_RTX;
7604     }
7605
7606   /* Otherwise assume loads are atomic, and emit the proper barriers.  */
7607   if (!target || target == const0_rtx)
7608     target = gen_reg_rtx (mode);
7609
7610   /* For SEQ_CST, emit a barrier before the load.  */
7611   if ((model & MEMMODEL_MASK) == MEMMODEL_SEQ_CST)
7612     expand_mem_thread_fence (model);
7613
7614   emit_move_insn (target, mem);
7615
7616   /* Emit the appropriate barrier after the load.  */
7617   expand_mem_thread_fence (model);
7618
7619   return target;
7620 }
7621
7622 /* This function expands the atomic store operation:
7623    Atomically store VAL in MEM.
7624    MEMMODEL is the memory model variant to use.
7625    USE_RELEASE is true if __sync_lock_release can be used as a fall back.
7626    function returns const0_rtx if a pattern was emitted.  */
7627
7628 rtx
7629 expand_atomic_store (rtx mem, rtx val, enum memmodel model, bool use_release)
7630 {
7631   enum machine_mode mode = GET_MODE (mem);
7632   enum insn_code icode;
7633   struct expand_operand ops[3];
7634
7635   /* If the target supports the store directly, great.  */
7636   icode = direct_optab_handler (atomic_store_optab, mode);
7637   if (icode != CODE_FOR_nothing)
7638     {
7639       create_fixed_operand (&ops[0], mem);
7640       create_input_operand (&ops[1], val, mode);
7641       create_integer_operand (&ops[2], model);
7642       if (maybe_expand_insn (icode, 3, ops))
7643         return const0_rtx;
7644     }
7645
7646   /* If using __sync_lock_release is a viable alternative, try it.  */
7647   if (use_release)
7648     {
7649       icode = direct_optab_handler (sync_lock_release_optab, mode);
7650       if (icode != CODE_FOR_nothing)
7651         {
7652           create_fixed_operand (&ops[0], mem);
7653           create_input_operand (&ops[1], const0_rtx, mode);
7654           if (maybe_expand_insn (icode, 2, ops))
7655             {
7656               /* lock_release is only a release barrier.  */
7657               if ((model & MEMMODEL_MASK) == MEMMODEL_SEQ_CST)
7658                 expand_mem_thread_fence (model);
7659               return const0_rtx;
7660             }
7661         }
7662     }
7663
7664   /* If the size of the object is greater than word size on this target,
7665      a default store will not be atomic, Try a mem_exchange and throw away
7666      the result.  If that doesn't work, don't do anything.  */
7667   if (GET_MODE_PRECISION (mode) > BITS_PER_WORD)
7668     {
7669       rtx target = maybe_emit_atomic_exchange (NULL_RTX, mem, val, model);
7670       if (!target)
7671         target = maybe_emit_compare_and_swap_exchange_loop (NULL_RTX, mem, val);
7672       if (target)
7673         return const0_rtx;
7674       else
7675         return NULL_RTX;
7676     }
7677
7678   /* Otherwise assume stores are atomic, and emit the proper barriers.  */
7679   expand_mem_thread_fence (model);
7680
7681   emit_move_insn (mem, val);
7682
7683   /* For SEQ_CST, also emit a barrier after the store.  */
7684   if ((model & MEMMODEL_MASK) == MEMMODEL_SEQ_CST)
7685     expand_mem_thread_fence (model);
7686
7687   return const0_rtx;
7688 }
7689
7690
7691 /* Structure containing the pointers and values required to process the
7692    various forms of the atomic_fetch_op and atomic_op_fetch builtins.  */
7693
7694 struct atomic_op_functions
7695 {
7696   direct_optab mem_fetch_before;
7697   direct_optab mem_fetch_after;
7698   direct_optab mem_no_result;
7699   optab fetch_before;
7700   optab fetch_after;
7701   direct_optab no_result;
7702   enum rtx_code reverse_code;
7703 };
7704
7705
7706 /* Fill in structure pointed to by OP with the various optab entries for an
7707    operation of type CODE.  */
7708
7709 static void
7710 get_atomic_op_for_code (struct atomic_op_functions *op, enum rtx_code code)
7711 {
7712   gcc_assert (op!= NULL);
7713
7714   /* If SWITCHABLE_TARGET is defined, then subtargets can be switched
7715      in the source code during compilation, and the optab entries are not
7716      computable until runtime.  Fill in the values at runtime.  */
7717   switch (code)
7718     {
7719     case PLUS:
7720       op->mem_fetch_before = atomic_fetch_add_optab;
7721       op->mem_fetch_after = atomic_add_fetch_optab;
7722       op->mem_no_result = atomic_add_optab;
7723       op->fetch_before = sync_old_add_optab;
7724       op->fetch_after = sync_new_add_optab;
7725       op->no_result = sync_add_optab;
7726       op->reverse_code = MINUS;
7727       break;
7728     case MINUS:
7729       op->mem_fetch_before = atomic_fetch_sub_optab;
7730       op->mem_fetch_after = atomic_sub_fetch_optab;
7731       op->mem_no_result = atomic_sub_optab;
7732       op->fetch_before = sync_old_sub_optab;
7733       op->fetch_after = sync_new_sub_optab;
7734       op->no_result = sync_sub_optab;
7735       op->reverse_code = PLUS;
7736       break;
7737     case XOR:
7738       op->mem_fetch_before = atomic_fetch_xor_optab;
7739       op->mem_fetch_after = atomic_xor_fetch_optab;
7740       op->mem_no_result = atomic_xor_optab;
7741       op->fetch_before = sync_old_xor_optab;
7742       op->fetch_after = sync_new_xor_optab;
7743       op->no_result = sync_xor_optab;
7744       op->reverse_code = XOR;
7745       break;
7746     case AND:
7747       op->mem_fetch_before = atomic_fetch_and_optab;
7748       op->mem_fetch_after = atomic_and_fetch_optab;
7749       op->mem_no_result = atomic_and_optab;
7750       op->fetch_before = sync_old_and_optab;
7751       op->fetch_after = sync_new_and_optab;
7752       op->no_result = sync_and_optab;
7753       op->reverse_code = UNKNOWN;
7754       break;
7755     case IOR:
7756       op->mem_fetch_before = atomic_fetch_or_optab;
7757       op->mem_fetch_after = atomic_or_fetch_optab;
7758       op->mem_no_result = atomic_or_optab;
7759       op->fetch_before = sync_old_ior_optab;
7760       op->fetch_after = sync_new_ior_optab;
7761       op->no_result = sync_ior_optab;
7762       op->reverse_code = UNKNOWN;
7763       break;
7764     case NOT:
7765       op->mem_fetch_before = atomic_fetch_nand_optab;
7766       op->mem_fetch_after = atomic_nand_fetch_optab;
7767       op->mem_no_result = atomic_nand_optab;
7768       op->fetch_before = sync_old_nand_optab;
7769       op->fetch_after = sync_new_nand_optab;
7770       op->no_result = sync_nand_optab;
7771       op->reverse_code = UNKNOWN;
7772       break;
7773     default:
7774       gcc_unreachable ();
7775     }
7776 }
7777
7778 /* See if there is a more optimal way to implement the operation "*MEM CODE VAL"
7779    using memory order MODEL.  If AFTER is true the operation needs to return
7780    the value of *MEM after the operation, otherwise the previous value.
7781    TARGET is an optional place to place the result.  The result is unused if
7782    it is const0_rtx.
7783    Return the result if there is a better sequence, otherwise NULL_RTX.  */
7784
7785 static rtx
7786 maybe_optimize_fetch_op (rtx target, rtx mem, rtx val, enum rtx_code code,
7787                          enum memmodel model, bool after)
7788 {
7789   /* If the value is prefetched, or not used, it may be possible to replace
7790      the sequence with a native exchange operation.  */
7791   if (!after || target == const0_rtx)
7792     {
7793       /* fetch_and (&x, 0, m) can be replaced with exchange (&x, 0, m).  */
7794       if (code == AND && val == const0_rtx)
7795         {
7796           if (target == const0_rtx)
7797             target = gen_reg_rtx (GET_MODE (mem));
7798           return maybe_emit_atomic_exchange (target, mem, val, model);
7799         }
7800
7801       /* fetch_or (&x, -1, m) can be replaced with exchange (&x, -1, m).  */
7802       if (code == IOR && val == constm1_rtx)
7803         {
7804           if (target == const0_rtx)
7805             target = gen_reg_rtx (GET_MODE (mem));
7806           return maybe_emit_atomic_exchange (target, mem, val, model);
7807         }
7808     }
7809
7810   return NULL_RTX;
7811 }
7812
7813 /* Try to emit an instruction for a specific operation varaition.
7814    OPTAB contains the OP functions.
7815    TARGET is an optional place to return the result. const0_rtx means unused.
7816    MEM is the memory location to operate on.
7817    VAL is the value to use in the operation.
7818    USE_MEMMODEL is TRUE if the variation with a memory model should be tried.
7819    MODEL is the memory model, if used.
7820    AFTER is true if the returned result is the value after the operation.  */
7821
7822 static rtx
7823 maybe_emit_op (const struct atomic_op_functions *optab, rtx target, rtx mem,
7824                rtx val, bool use_memmodel, enum memmodel model, bool after)
7825 {
7826   enum machine_mode mode = GET_MODE (mem);
7827   struct expand_operand ops[4];
7828   enum insn_code icode;
7829   int op_counter = 0;
7830   int num_ops;
7831
7832   /* Check to see if there is a result returned.  */
7833   if (target == const0_rtx)
7834     {
7835       if (use_memmodel)
7836         {
7837           icode = direct_optab_handler (optab->mem_no_result, mode);
7838           create_integer_operand (&ops[2], model);
7839           num_ops = 3;
7840         }
7841       else
7842         {
7843           icode = direct_optab_handler (optab->no_result, mode);
7844           num_ops = 2;
7845         }
7846     }
7847   /* Otherwise, we need to generate a result.  */
7848   else
7849     {
7850       if (use_memmodel)
7851         {
7852           icode = direct_optab_handler (after ? optab->mem_fetch_after
7853                                         : optab->mem_fetch_before, mode);
7854           create_integer_operand (&ops[3], model);
7855           num_ops = 4;
7856         }
7857       else
7858         {
7859           icode = optab_handler (after ? optab->fetch_after
7860                                  : optab->fetch_before, mode);
7861           num_ops = 3;
7862         }
7863       create_output_operand (&ops[op_counter++], target, mode);
7864     }
7865   if (icode == CODE_FOR_nothing)
7866     return NULL_RTX;
7867
7868   create_fixed_operand (&ops[op_counter++], mem);
7869   /* VAL may have been promoted to a wider mode.  Shrink it if so.  */
7870   create_convert_operand_to (&ops[op_counter++], val, mode, true);
7871
7872   if (maybe_expand_insn (icode, num_ops, ops))
7873     return (target == const0_rtx ? const0_rtx : ops[0].value);
7874
7875   return NULL_RTX;
7876 }
7877
7878
7879 /* This function expands an atomic fetch_OP or OP_fetch operation:
7880    TARGET is an option place to stick the return value.  const0_rtx indicates
7881    the result is unused.
7882    atomically fetch MEM, perform the operation with VAL and return it to MEM.
7883    CODE is the operation being performed (OP)
7884    MEMMODEL is the memory model variant to use.
7885    AFTER is true to return the result of the operation (OP_fetch).
7886    AFTER is false to return the value before the operation (fetch_OP).
7887
7888    This function will *only* generate instructions if there is a direct
7889    optab. No compare and swap loops or libcalls will be generated. */
7890
7891 static rtx
7892 expand_atomic_fetch_op_no_fallback (rtx target, rtx mem, rtx val,
7893                                     enum rtx_code code, enum memmodel model,
7894                                     bool after)
7895 {
7896   enum machine_mode mode = GET_MODE (mem);
7897   struct atomic_op_functions optab;
7898   rtx result;
7899   bool unused_result = (target == const0_rtx);
7900
7901   get_atomic_op_for_code (&optab, code);
7902
7903   /* Check to see if there are any better instructions.  */
7904   result = maybe_optimize_fetch_op (target, mem, val, code, model, after);
7905   if (result)
7906     return result;
7907
7908   /* Check for the case where the result isn't used and try those patterns.  */
7909   if (unused_result)
7910     {
7911       /* Try the memory model variant first.  */
7912       result = maybe_emit_op (&optab, target, mem, val, true, model, true);
7913       if (result)
7914         return result;
7915
7916       /* Next try the old style withuot a memory model.  */
7917       result = maybe_emit_op (&optab, target, mem, val, false, model, true);
7918       if (result)
7919         return result;
7920
7921       /* There is no no-result pattern, so try patterns with a result.  */
7922       target = NULL_RTX;
7923     }
7924
7925   /* Try the __atomic version.  */
7926   result = maybe_emit_op (&optab, target, mem, val, true, model, after);
7927   if (result)
7928     return result;
7929
7930   /* Try the older __sync version.  */
7931   result = maybe_emit_op (&optab, target, mem, val, false, model, after);
7932   if (result)
7933     return result;
7934
7935   /* If the fetch value can be calculated from the other variation of fetch,
7936      try that operation.  */
7937   if (after || unused_result || optab.reverse_code != UNKNOWN)
7938     {
7939       /* Try the __atomic version, then the older __sync version.  */
7940       result = maybe_emit_op (&optab, target, mem, val, true, model, !after);
7941       if (!result)
7942         result = maybe_emit_op (&optab, target, mem, val, false, model, !after);
7943
7944       if (result)
7945         {
7946           /* If the result isn't used, no need to do compensation code.  */
7947           if (unused_result)
7948             return result;
7949
7950           /* Issue compensation code.  Fetch_after  == fetch_before OP val.
7951              Fetch_before == after REVERSE_OP val.  */
7952           if (!after)
7953             code = optab.reverse_code;
7954           if (code == NOT)
7955             {
7956               result = expand_simple_binop (mode, AND, result, val, NULL_RTX,
7957                                             true, OPTAB_LIB_WIDEN);
7958               result = expand_simple_unop (mode, NOT, result, target, true);
7959             }
7960           else
7961             result = expand_simple_binop (mode, code, result, val, target,
7962                                           true, OPTAB_LIB_WIDEN);
7963           return result;
7964         }
7965     }
7966
7967   /* No direct opcode can be generated.  */
7968   return NULL_RTX;
7969 }
7970
7971
7972
7973 /* This function expands an atomic fetch_OP or OP_fetch operation:
7974    TARGET is an option place to stick the return value.  const0_rtx indicates
7975    the result is unused.
7976    atomically fetch MEM, perform the operation with VAL and return it to MEM.
7977    CODE is the operation being performed (OP)
7978    MEMMODEL is the memory model variant to use.
7979    AFTER is true to return the result of the operation (OP_fetch).
7980    AFTER is false to return the value before the operation (fetch_OP).  */
7981 rtx
7982 expand_atomic_fetch_op (rtx target, rtx mem, rtx val, enum rtx_code code,
7983                         enum memmodel model, bool after)
7984 {
7985   enum machine_mode mode = GET_MODE (mem);
7986   rtx result;
7987   bool unused_result = (target == const0_rtx);
7988
7989   result = expand_atomic_fetch_op_no_fallback (target, mem, val, code, model,
7990                                                after);
7991
7992   if (result)
7993     return result;
7994
7995   /* Add/sub can be implemented by doing the reverse operation with -(val).  */
7996   if (code == PLUS || code == MINUS)
7997     {
7998       rtx tmp;
7999       enum rtx_code reverse = (code == PLUS ? MINUS : PLUS);
8000
8001       start_sequence ();
8002       tmp = expand_simple_unop (mode, NEG, val, NULL_RTX, true);
8003       result = expand_atomic_fetch_op_no_fallback (target, mem, tmp, reverse,
8004                                                    model, after);
8005       if (result)
8006         {
8007           /* PLUS worked so emit the insns and return.  */
8008           tmp = get_insns ();
8009           end_sequence ();
8010           emit_insn (tmp);
8011           return result;
8012         }
8013
8014       /* PLUS did not work, so throw away the negation code and continue.  */
8015       end_sequence ();
8016     }
8017
8018   /* Try the __sync libcalls only if we can't do compare-and-swap inline.  */
8019   if (!can_compare_and_swap_p (mode, false))
8020     {
8021       rtx libfunc;
8022       bool fixup = false;
8023       enum rtx_code orig_code = code;
8024       struct atomic_op_functions optab;
8025
8026       get_atomic_op_for_code (&optab, code);
8027       libfunc = optab_libfunc (after ? optab.fetch_after
8028                                : optab.fetch_before, mode);
8029       if (libfunc == NULL
8030           && (after || unused_result || optab.reverse_code != UNKNOWN))
8031         {
8032           fixup = true;
8033           if (!after)
8034             code = optab.reverse_code;
8035           libfunc = optab_libfunc (after ? optab.fetch_before
8036                                    : optab.fetch_after, mode);
8037         }
8038       if (libfunc != NULL)
8039         {
8040           rtx addr = convert_memory_address (ptr_mode, XEXP (mem, 0));
8041           result = emit_library_call_value (libfunc, NULL, LCT_NORMAL, mode,
8042                                             2, addr, ptr_mode, val, mode);
8043
8044           if (!unused_result && fixup)
8045             result = expand_simple_binop (mode, code, result, val, target,
8046                                           true, OPTAB_LIB_WIDEN);
8047           return result;
8048         }
8049
8050       /* We need the original code for any further attempts.  */
8051       code = orig_code;
8052     }
8053
8054   /* If nothing else has succeeded, default to a compare and swap loop.  */
8055   if (can_compare_and_swap_p (mode, true))
8056     {
8057       rtx insn;
8058       rtx t0 = gen_reg_rtx (mode), t1;
8059
8060       start_sequence ();
8061
8062       /* If the result is used, get a register for it.  */
8063       if (!unused_result)
8064         {
8065           if (!target || !register_operand (target, mode))
8066             target = gen_reg_rtx (mode);
8067           /* If fetch_before, copy the value now.  */
8068           if (!after)
8069             emit_move_insn (target, t0);
8070         }
8071       else
8072         target = const0_rtx;
8073
8074       t1 = t0;
8075       if (code == NOT)
8076         {
8077           t1 = expand_simple_binop (mode, AND, t1, val, NULL_RTX,
8078                                     true, OPTAB_LIB_WIDEN);
8079           t1 = expand_simple_unop (mode, code, t1, NULL_RTX, true);
8080         }
8081       else
8082         t1 = expand_simple_binop (mode, code, t1, val, NULL_RTX, true,
8083                                   OPTAB_LIB_WIDEN);
8084
8085       /* For after, copy the value now.  */
8086       if (!unused_result && after)
8087         emit_move_insn (target, t1);
8088       insn = get_insns ();
8089       end_sequence ();
8090
8091       if (t1 != NULL && expand_compare_and_swap_loop (mem, t0, t1, insn))
8092         return target;
8093     }
8094
8095   return NULL_RTX;
8096 }
8097 \f
8098 /* Return true if OPERAND is suitable for operand number OPNO of
8099    instruction ICODE.  */
8100
8101 bool
8102 insn_operand_matches (enum insn_code icode, unsigned int opno, rtx operand)
8103 {
8104   return (!insn_data[(int) icode].operand[opno].predicate
8105           || (insn_data[(int) icode].operand[opno].predicate
8106               (operand, insn_data[(int) icode].operand[opno].mode)));
8107 }
8108 \f
8109 /* TARGET is a target of a multiword operation that we are going to
8110    implement as a series of word-mode operations.  Return true if
8111    TARGET is suitable for this purpose.  */
8112
8113 bool
8114 valid_multiword_target_p (rtx target)
8115 {
8116   enum machine_mode mode;
8117   int i;
8118
8119   mode = GET_MODE (target);
8120   for (i = 0; i < GET_MODE_SIZE (mode); i += UNITS_PER_WORD)
8121     if (!validate_subreg (word_mode, mode, target, i))
8122       return false;
8123   return true;
8124 }
8125
8126 /* Like maybe_legitimize_operand, but do not change the code of the
8127    current rtx value.  */
8128
8129 static bool
8130 maybe_legitimize_operand_same_code (enum insn_code icode, unsigned int opno,
8131                                     struct expand_operand *op)
8132 {
8133   /* See if the operand matches in its current form.  */
8134   if (insn_operand_matches (icode, opno, op->value))
8135     return true;
8136
8137   /* If the operand is a memory whose address has no side effects,
8138      try forcing the address into a non-virtual pseudo register.
8139      The check for side effects is important because copy_to_mode_reg
8140      cannot handle things like auto-modified addresses.  */
8141   if (insn_data[(int) icode].operand[opno].allows_mem && MEM_P (op->value))
8142     {
8143       rtx addr, mem;
8144
8145       mem = op->value;
8146       addr = XEXP (mem, 0);
8147       if (!(REG_P (addr) && REGNO (addr) > LAST_VIRTUAL_REGISTER)
8148           && !side_effects_p (addr))
8149         {
8150           rtx last;
8151           enum machine_mode mode;
8152
8153           last = get_last_insn ();
8154           mode = get_address_mode (mem);
8155           mem = replace_equiv_address (mem, copy_to_mode_reg (mode, addr));
8156           if (insn_operand_matches (icode, opno, mem))
8157             {
8158               op->value = mem;
8159               return true;
8160             }
8161           delete_insns_since (last);
8162         }
8163     }
8164
8165   return false;
8166 }
8167
8168 /* Try to make OP match operand OPNO of instruction ICODE.  Return true
8169    on success, storing the new operand value back in OP.  */
8170
8171 static bool
8172 maybe_legitimize_operand (enum insn_code icode, unsigned int opno,
8173                           struct expand_operand *op)
8174 {
8175   enum machine_mode mode, imode;
8176   bool old_volatile_ok, result;
8177
8178   mode = op->mode;
8179   switch (op->type)
8180     {
8181     case EXPAND_FIXED:
8182       old_volatile_ok = volatile_ok;
8183       volatile_ok = true;
8184       result = maybe_legitimize_operand_same_code (icode, opno, op);
8185       volatile_ok = old_volatile_ok;
8186       return result;
8187
8188     case EXPAND_OUTPUT:
8189       gcc_assert (mode != VOIDmode);
8190       if (op->value
8191           && op->value != const0_rtx
8192           && GET_MODE (op->value) == mode
8193           && maybe_legitimize_operand_same_code (icode, opno, op))
8194         return true;
8195
8196       op->value = gen_reg_rtx (mode);
8197       break;
8198
8199     case EXPAND_INPUT:
8200     input:
8201       gcc_assert (mode != VOIDmode);
8202       gcc_assert (GET_MODE (op->value) == VOIDmode
8203                   || GET_MODE (op->value) == mode);
8204       if (maybe_legitimize_operand_same_code (icode, opno, op))
8205         return true;
8206
8207       op->value = copy_to_mode_reg (mode, op->value);
8208       break;
8209
8210     case EXPAND_CONVERT_TO:
8211       gcc_assert (mode != VOIDmode);
8212       op->value = convert_to_mode (mode, op->value, op->unsigned_p);
8213       goto input;
8214
8215     case EXPAND_CONVERT_FROM:
8216       if (GET_MODE (op->value) != VOIDmode)
8217         mode = GET_MODE (op->value);
8218       else
8219         /* The caller must tell us what mode this value has.  */
8220         gcc_assert (mode != VOIDmode);
8221
8222       imode = insn_data[(int) icode].operand[opno].mode;
8223       if (imode != VOIDmode && imode != mode)
8224         {
8225           op->value = convert_modes (imode, mode, op->value, op->unsigned_p);
8226           mode = imode;
8227         }
8228       goto input;
8229
8230     case EXPAND_ADDRESS:
8231       gcc_assert (mode != VOIDmode);
8232       op->value = convert_memory_address (mode, op->value);
8233       goto input;
8234
8235     case EXPAND_INTEGER:
8236       mode = insn_data[(int) icode].operand[opno].mode;
8237       if (mode != VOIDmode && const_int_operand (op->value, mode))
8238         goto input;
8239       break;
8240     }
8241   return insn_operand_matches (icode, opno, op->value);
8242 }
8243
8244 /* Make OP describe an input operand that should have the same value
8245    as VALUE, after any mode conversion that the target might request.
8246    TYPE is the type of VALUE.  */
8247
8248 void
8249 create_convert_operand_from_type (struct expand_operand *op,
8250                                   rtx value, tree type)
8251 {
8252   create_convert_operand_from (op, value, TYPE_MODE (type),
8253                                TYPE_UNSIGNED (type));
8254 }
8255
8256 /* Try to make operands [OPS, OPS + NOPS) match operands [OPNO, OPNO + NOPS)
8257    of instruction ICODE.  Return true on success, leaving the new operand
8258    values in the OPS themselves.  Emit no code on failure.  */
8259
8260 bool
8261 maybe_legitimize_operands (enum insn_code icode, unsigned int opno,
8262                            unsigned int nops, struct expand_operand *ops)
8263 {
8264   rtx last;
8265   unsigned int i;
8266
8267   last = get_last_insn ();
8268   for (i = 0; i < nops; i++)
8269     if (!maybe_legitimize_operand (icode, opno + i, &ops[i]))
8270       {
8271         delete_insns_since (last);
8272         return false;
8273       }
8274   return true;
8275 }
8276
8277 /* Try to generate instruction ICODE, using operands [OPS, OPS + NOPS)
8278    as its operands.  Return the instruction pattern on success,
8279    and emit any necessary set-up code.  Return null and emit no
8280    code on failure.  */
8281
8282 rtx
8283 maybe_gen_insn (enum insn_code icode, unsigned int nops,
8284                 struct expand_operand *ops)
8285 {
8286   gcc_assert (nops == (unsigned int) insn_data[(int) icode].n_generator_args);
8287   if (!maybe_legitimize_operands (icode, 0, nops, ops))
8288     return NULL_RTX;
8289
8290   switch (nops)
8291     {
8292     case 1:
8293       return GEN_FCN (icode) (ops[0].value);
8294     case 2:
8295       return GEN_FCN (icode) (ops[0].value, ops[1].value);
8296     case 3:
8297       return GEN_FCN (icode) (ops[0].value, ops[1].value, ops[2].value);
8298     case 4:
8299       return GEN_FCN (icode) (ops[0].value, ops[1].value, ops[2].value,
8300                               ops[3].value);
8301     case 5:
8302       return GEN_FCN (icode) (ops[0].value, ops[1].value, ops[2].value,
8303                               ops[3].value, ops[4].value);
8304     case 6:
8305       return GEN_FCN (icode) (ops[0].value, ops[1].value, ops[2].value,
8306                               ops[3].value, ops[4].value, ops[5].value);
8307     case 7:
8308       return GEN_FCN (icode) (ops[0].value, ops[1].value, ops[2].value,
8309                               ops[3].value, ops[4].value, ops[5].value,
8310                               ops[6].value);
8311     case 8:
8312       return GEN_FCN (icode) (ops[0].value, ops[1].value, ops[2].value,
8313                               ops[3].value, ops[4].value, ops[5].value,
8314                               ops[6].value, ops[7].value);
8315     case 9:
8316       return GEN_FCN (icode) (ops[0].value, ops[1].value, ops[2].value,
8317                               ops[3].value, ops[4].value, ops[5].value,
8318                               ops[6].value, ops[7].value, ops[8].value);
8319     }
8320   gcc_unreachable ();
8321 }
8322
8323 /* Try to emit instruction ICODE, using operands [OPS, OPS + NOPS)
8324    as its operands.  Return true on success and emit no code on failure.  */
8325
8326 bool
8327 maybe_expand_insn (enum insn_code icode, unsigned int nops,
8328                    struct expand_operand *ops)
8329 {
8330   rtx pat = maybe_gen_insn (icode, nops, ops);
8331   if (pat)
8332     {
8333       emit_insn (pat);
8334       return true;
8335     }
8336   return false;
8337 }
8338
8339 /* Like maybe_expand_insn, but for jumps.  */
8340
8341 bool
8342 maybe_expand_jump_insn (enum insn_code icode, unsigned int nops,
8343                         struct expand_operand *ops)
8344 {
8345   rtx pat = maybe_gen_insn (icode, nops, ops);
8346   if (pat)
8347     {
8348       emit_jump_insn (pat);
8349       return true;
8350     }
8351   return false;
8352 }
8353
8354 /* Emit instruction ICODE, using operands [OPS, OPS + NOPS)
8355    as its operands.  */
8356
8357 void
8358 expand_insn (enum insn_code icode, unsigned int nops,
8359              struct expand_operand *ops)
8360 {
8361   if (!maybe_expand_insn (icode, nops, ops))
8362     gcc_unreachable ();
8363 }
8364
8365 /* Like expand_insn, but for jumps.  */
8366
8367 void
8368 expand_jump_insn (enum insn_code icode, unsigned int nops,
8369                   struct expand_operand *ops)
8370 {
8371   if (!maybe_expand_jump_insn (icode, nops, ops))
8372     gcc_unreachable ();
8373 }
8374
8375 /* Reduce conditional compilation elsewhere.  */
8376 #ifndef HAVE_insv
8377 #define HAVE_insv       0
8378 #define CODE_FOR_insv   CODE_FOR_nothing
8379 #endif
8380 #ifndef HAVE_extv
8381 #define HAVE_extv       0
8382 #define CODE_FOR_extv   CODE_FOR_nothing
8383 #endif
8384 #ifndef HAVE_extzv
8385 #define HAVE_extzv      0
8386 #define CODE_FOR_extzv  CODE_FOR_nothing
8387 #endif
8388
8389 /* Enumerates the possible types of structure operand to an
8390    extraction_insn.  */
8391 enum extraction_type { ET_unaligned_mem, ET_reg };
8392
8393 /* Check whether insv, extv or extzv pattern ICODE can be used for an
8394    insertion or extraction of type TYPE on a structure of mode MODE.
8395    Return true if so and fill in *INSN accordingly.  STRUCT_OP is the
8396    operand number of the structure (the first sign_extract or zero_extract
8397    operand) and FIELD_OP is the operand number of the field (the other
8398    side of the set from the sign_extract or zero_extract).  */
8399
8400 static bool
8401 get_traditional_extraction_insn (extraction_insn *insn,
8402                                  enum extraction_type type,
8403                                  enum machine_mode mode,
8404                                  enum insn_code icode,
8405                                  int struct_op, int field_op)
8406 {
8407   const struct insn_data_d *data = &insn_data[icode];
8408
8409   enum machine_mode struct_mode = data->operand[struct_op].mode;
8410   if (struct_mode == VOIDmode)
8411     struct_mode = word_mode;
8412   if (mode != struct_mode)
8413     return false;
8414
8415   enum machine_mode field_mode = data->operand[field_op].mode;
8416   if (field_mode == VOIDmode)
8417     field_mode = word_mode;
8418
8419   enum machine_mode pos_mode = data->operand[struct_op + 2].mode;
8420   if (pos_mode == VOIDmode)
8421     pos_mode = word_mode;
8422
8423   insn->icode = icode;
8424   insn->field_mode = field_mode;
8425   insn->struct_mode = (type == ET_unaligned_mem ? byte_mode : struct_mode);
8426   insn->pos_mode = pos_mode;
8427   return true;
8428 }
8429
8430 /* Return true if an optab exists to perform an insertion or extraction
8431    of type TYPE in mode MODE.  Describe the instruction in *INSN if so.
8432
8433    REG_OPTAB is the optab to use for register structures and
8434    MISALIGN_OPTAB is the optab to use for misaligned memory structures.
8435    POS_OP is the operand number of the bit position.  */
8436
8437 static bool
8438 get_optab_extraction_insn (struct extraction_insn *insn,
8439                            enum extraction_type type,
8440                            enum machine_mode mode, direct_optab reg_optab,
8441                            direct_optab misalign_optab, int pos_op)
8442 {
8443   direct_optab optab = (type == ET_unaligned_mem ? misalign_optab : reg_optab);
8444   enum insn_code icode = direct_optab_handler (optab, mode);
8445   if (icode == CODE_FOR_nothing)
8446     return false;
8447
8448   const struct insn_data_d *data = &insn_data[icode];
8449
8450   insn->icode = icode;
8451   insn->field_mode = mode;
8452   insn->struct_mode = (type == ET_unaligned_mem ? BLKmode : mode);
8453   insn->pos_mode = data->operand[pos_op].mode;
8454   if (insn->pos_mode == VOIDmode)
8455     insn->pos_mode = word_mode;
8456   return true;
8457 }
8458
8459 /* Return true if an instruction exists to perform an insertion or
8460    extraction (PATTERN says which) of type TYPE in mode MODE.
8461    Describe the instruction in *INSN if so.  */
8462
8463 static bool
8464 get_extraction_insn (extraction_insn *insn,
8465                      enum extraction_pattern pattern,
8466                      enum extraction_type type,
8467                      enum machine_mode mode)
8468 {
8469   switch (pattern)
8470     {
8471     case EP_insv:
8472       if (HAVE_insv
8473           && get_traditional_extraction_insn (insn, type, mode,
8474                                               CODE_FOR_insv, 0, 3))
8475         return true;
8476       return get_optab_extraction_insn (insn, type, mode, insv_optab,
8477                                         insvmisalign_optab, 2);
8478
8479     case EP_extv:
8480       if (HAVE_extv
8481           && get_traditional_extraction_insn (insn, type, mode,
8482                                               CODE_FOR_extv, 1, 0))
8483         return true;
8484       return get_optab_extraction_insn (insn, type, mode, extv_optab,
8485                                         extvmisalign_optab, 3);
8486
8487     case EP_extzv:
8488       if (HAVE_extzv
8489           && get_traditional_extraction_insn (insn, type, mode,
8490                                               CODE_FOR_extzv, 1, 0))
8491         return true;
8492       return get_optab_extraction_insn (insn, type, mode, extzv_optab,
8493                                         extzvmisalign_optab, 3);
8494
8495     default:
8496       gcc_unreachable ();
8497     }
8498 }
8499
8500 /* Return true if an instruction exists to access a field of mode
8501    FIELDMODE in a structure that has STRUCT_BITS significant bits.
8502    Describe the "best" such instruction in *INSN if so.  PATTERN and
8503    TYPE describe the type of insertion or extraction we want to perform.
8504
8505    For an insertion, the number of significant structure bits includes
8506    all bits of the target.  For an extraction, it need only include the
8507    most significant bit of the field.  Larger widths are acceptable
8508    in both cases.  */
8509
8510 static bool
8511 get_best_extraction_insn (extraction_insn *insn,
8512                           enum extraction_pattern pattern,
8513                           enum extraction_type type,
8514                           unsigned HOST_WIDE_INT struct_bits,
8515                           enum machine_mode field_mode)
8516 {
8517   enum machine_mode mode = smallest_mode_for_size (struct_bits, MODE_INT);
8518   while (mode != VOIDmode)
8519     {
8520       if (get_extraction_insn (insn, pattern, type, mode))
8521         {
8522           while (mode != VOIDmode
8523                  && GET_MODE_SIZE (mode) <= GET_MODE_SIZE (field_mode)
8524                  && !TRULY_NOOP_TRUNCATION_MODES_P (insn->field_mode,
8525                                                     field_mode))
8526             {
8527               get_extraction_insn (insn, pattern, type, mode);
8528               mode = GET_MODE_WIDER_MODE (mode);
8529             }
8530           return true;
8531         }
8532       mode = GET_MODE_WIDER_MODE (mode);
8533     }
8534   return false;
8535 }
8536
8537 /* Return true if an instruction exists to access a field of mode
8538    FIELDMODE in a register structure that has STRUCT_BITS significant bits.
8539    Describe the "best" such instruction in *INSN if so.  PATTERN describes
8540    the type of insertion or extraction we want to perform.
8541
8542    For an insertion, the number of significant structure bits includes
8543    all bits of the target.  For an extraction, it need only include the
8544    most significant bit of the field.  Larger widths are acceptable
8545    in both cases.  */
8546
8547 bool
8548 get_best_reg_extraction_insn (extraction_insn *insn,
8549                               enum extraction_pattern pattern,
8550                               unsigned HOST_WIDE_INT struct_bits,
8551                               enum machine_mode field_mode)
8552 {
8553   return get_best_extraction_insn (insn, pattern, ET_reg, struct_bits,
8554                                    field_mode);
8555 }
8556
8557 /* Return true if an instruction exists to access a field of BITSIZE
8558    bits starting BITNUM bits into a memory structure.  Describe the
8559    "best" such instruction in *INSN if so.  PATTERN describes the type
8560    of insertion or extraction we want to perform and FIELDMODE is the
8561    natural mode of the extracted field.
8562
8563    The instructions considered here only access bytes that overlap
8564    the bitfield; they do not touch any surrounding bytes.  */
8565
8566 bool
8567 get_best_mem_extraction_insn (extraction_insn *insn,
8568                               enum extraction_pattern pattern,
8569                               HOST_WIDE_INT bitsize, HOST_WIDE_INT bitnum,
8570                               enum machine_mode field_mode)
8571 {
8572   unsigned HOST_WIDE_INT struct_bits = (bitnum % BITS_PER_UNIT
8573                                         + bitsize
8574                                         + BITS_PER_UNIT - 1);
8575   struct_bits -= struct_bits % BITS_PER_UNIT;
8576   return get_best_extraction_insn (insn, pattern, ET_unaligned_mem,
8577                                    struct_bits, field_mode);
8578 }
8579
8580 #include "gt-optabs.h"