/* tc-i386.c -- Assemble code for the Intel 80386
   Copyright (C) 1989-2023 Free Software Foundation, Inc.

   This file is part of GAS, the GNU Assembler.

   GAS is free software; you can redistribute it and/or modify
   it under the terms of the GNU General Public License as published by
   the Free Software Foundation; either version 3, or (at your option)
   any later version.

   GAS is distributed in the hope that it will be useful,
   but WITHOUT ANY WARRANTY; without even the implied warranty of
   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
   GNU General Public License for more details.

   You should have received a copy of the GNU General Public License
   along with GAS; see the file COPYING.  If not, write to the Free
   Software Foundation, 51 Franklin Street - Fifth Floor, Boston, MA
   02110-1301, USA.  */

/* Intel 80386 machine specific gas.
   Written by Eliot Dresselhaus (eliot@mgm.mit.edu).
   x86_64 support by Jan Hubicka (jh@suse.cz)
   VIA PadLock support by Michal Ludvig (mludvig@suse.cz)
   Bugs & suggestions are completely welcome.  This is free software.
   Please help us make it better.  */

#include "as.h"
#include "safe-ctype.h"
#include "subsegs.h"
#include "dwarf2dbg.h"
#include "dw2gencfi.h"
#include "gen-sframe.h"
#include "sframe.h"
#include "elf/x86-64.h"
#include "opcodes/i386-init.h"
#include "opcodes/i386-mnem.h"
#include <limits.h>

#ifndef INFER_ADDR_PREFIX
#define INFER_ADDR_PREFIX 1
#endif

#ifndef DEFAULT_ARCH
#define DEFAULT_ARCH "i386"
#endif

#ifndef INLINE
#if __GNUC__ >= 2
#define INLINE __inline__
#else
#define INLINE
#endif
#endif

/* Prefixes will be emitted in the order defined below.
   WAIT_PREFIX must be the first prefix since FWAIT really is an
   instruction, and so must come before any prefixes.
   The preferred prefix order is SEG_PREFIX, ADDR_PREFIX, DATA_PREFIX,
   REP_PREFIX/HLE_PREFIX, LOCK_PREFIX.  */
#define WAIT_PREFIX	0
#define SEG_PREFIX	1
#define ADDR_PREFIX	2
#define DATA_PREFIX	3
#define REP_PREFIX	4
#define HLE_PREFIX	REP_PREFIX
#define BND_PREFIX	REP_PREFIX
#define LOCK_PREFIX	5
#define REX_PREFIX	6	/* must come last.  */
#define MAX_PREFIXES	7	/* max prefixes per opcode */
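
/* Illustrative example (annotation, not from the original source): for
   "lock addw $1, %fs:(%eax)" in 32-bit code, i.prefix[SEG_PREFIX] holds
   0x64, i.prefix[DATA_PREFIX] 0x66 and i.prefix[LOCK_PREFIX] 0xf0; the
   bytes are emitted in slot order, with REX_PREFIX (64-bit mode only)
   always ending up immediately before the opcode.  */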

/* we define the syntax here (modulo base,index,scale syntax) */
#define REGISTER_PREFIX '%'
#define IMMEDIATE_PREFIX '$'
#define ABSOLUTE_PREFIX '*'

/* these are the instruction mnemonic suffixes in AT&T syntax or
   memory operand size in Intel syntax.  */
#define WORD_MNEM_SUFFIX  'w'
#define BYTE_MNEM_SUFFIX  'b'
#define SHORT_MNEM_SUFFIX 's'
#define LONG_MNEM_SUFFIX  'l'
#define QWORD_MNEM_SUFFIX 'q'

#define END_OF_INSN '\0'

#define OPERAND_TYPE_NONE { .bitfield = { .class = ClassNone } }

/* This matches the C -> StaticRounding alias in the opcode table.  */
#define commutative staticrounding

/*
  'templates' is for grouping together 'template' structures for opcodes
  of the same name.  This is only used for storing the insns in the grand
  ole hash table of insns.
  The templates themselves start at START and range up to (but not including)
  END.
  */
typedef struct
{
  const insn_template *start;
  const insn_template *end;
}
templates;
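
/* Illustrative note (annotation, not from the original source): all
   insn_template entries sharing one mnemonic, e.g. every form of "mov",
   occupy a contiguous slice of the opcode table; the mnemonic hash lookup
   yields such a pair, and match_template() then scans [start, end) for a
   form whose operands fit.  */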

/* 386 operand encoding bytes:  see 386 book for details of this.  */
typedef struct
{
  unsigned int regmem;	/* codes register or memory operand */
  unsigned int reg;	/* codes register operand (or extended opcode) */
  unsigned int mode;	/* how to interpret regmem & reg */
}
modrm_byte;

/* x86-64 extension prefix.  */
typedef int rex_byte;

/* 386 opcode byte to code indirect addressing.  */
typedef struct
{
  unsigned base;
  unsigned index;
  unsigned scale;
}
sib_byte;

/* x86 arch names, types and features */
typedef struct
{
  const char *name;		/* arch name */
  unsigned int len:8;		/* arch string length */
  bool skip:1;			/* show_arch should skip this. */
  enum processor_type type;	/* arch type */
  enum { vsz_none, vsz_set, vsz_reset } vsz; /* vector size control */
  i386_cpu_flags enable;	/* cpu feature enable flags */
  i386_cpu_flags disable;	/* cpu feature disable flags */
}
arch_entry;

static void update_code_flag (int, int);
static void s_insn (int);
static void set_code_flag (int);
static void set_16bit_gcc_code_flag (int);
static void set_intel_syntax (int);
static void set_intel_mnemonic (int);
static void set_allow_index_reg (int);
static void set_check (int);
static void set_cpu_arch (int);
#ifdef TE_PE
static void pe_directive_secrel (int);
static void pe_directive_secidx (int);
#endif
static void signed_cons (int);
static char *output_invalid (int c);
static int i386_finalize_immediate (segT, expressionS *, i386_operand_type,
				    const char *);
static int i386_finalize_displacement (segT, expressionS *, i386_operand_type,
				       const char *);
static int i386_att_operand (char *);
static int i386_intel_operand (char *, int);
static int i386_intel_simplify (expressionS *);
static int i386_intel_parse_name (const char *, expressionS *);
static const reg_entry *parse_register (const char *, char **);
static const char *parse_insn (const char *, char *, bool);
static char *parse_operands (char *, const char *);
static void swap_operands (void);
static void swap_2_operands (unsigned int, unsigned int);
static enum flag_code i386_addressing_mode (void);
static void optimize_imm (void);
static bool optimize_disp (const insn_template *t);
static const insn_template *match_template (char);
static int check_string (void);
static int process_suffix (void);
static int check_byte_reg (void);
static int check_long_reg (void);
static int check_qword_reg (void);
static int check_word_reg (void);
static int finalize_imm (void);
static int process_operands (void);
static const reg_entry *build_modrm_byte (void);
static void output_insn (void);
static void output_imm (fragS *, offsetT);
static void output_disp (fragS *, offsetT);
#ifndef I386COFF
static void s_bss (int);
#endif
#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
static void handle_large_common (int small ATTRIBUTE_UNUSED);

/* GNU_PROPERTY_X86_ISA_1_USED.  */
static unsigned int x86_isa_1_used;
/* GNU_PROPERTY_X86_FEATURE_2_USED.  */
static unsigned int x86_feature_2_used;
/* Generate x86 used ISA and feature properties.  */
static unsigned int x86_used_note = DEFAULT_X86_USED_NOTE;
#endif

static const char *default_arch = DEFAULT_ARCH;

/* parse_register() returns this when a register alias cannot be used.  */
static const reg_entry bad_reg = { "<bad>", OPERAND_TYPE_NONE, 0, 0,
				   { Dw2Inval, Dw2Inval } };

static const reg_entry *reg_eax;
static const reg_entry *reg_ds;
static const reg_entry *reg_es;
static const reg_entry *reg_ss;
static const reg_entry *reg_st0;
static const reg_entry *reg_k0;

/* VEX prefix.  */
typedef struct
{
  /* VEX prefix is either 2 byte or 3 byte.  EVEX is 4 byte.  */
  unsigned char bytes[4];
  unsigned int length;
  /* Destination or source register specifier.  */
  const reg_entry *register_specifier;
} vex_prefix;

/* 'md_assemble ()' gathers together information and puts it into a
   i386_insn.  */

union i386_op
{
  expressionS *disps;
  expressionS *imms;
  const reg_entry *regs;
};

enum i386_error
{
  no_error, /* Must be first.  */
  operand_size_mismatch,
  operand_type_mismatch,
  register_type_mismatch,
  number_of_operands_mismatch,
  invalid_instruction_suffix,
  bad_imm4,
  unsupported_with_intel_mnemonic,
  unsupported_syntax,
  unsupported,
  unsupported_on_arch,
  unsupported_64bit,
  invalid_sib_address,
  invalid_vsib_address,
  invalid_vector_register_set,
  invalid_tmm_register_set,
  invalid_dest_and_src_register_set,
  unsupported_vector_index_register,
  unsupported_broadcast,
  broadcast_needed,
  unsupported_masking,
  mask_not_on_destination,
  no_default_mask,
  unsupported_rc_sae,
  invalid_register_operand,
  internal_error,
};

struct _i386_insn
{
  /* TM holds the template for the insn we're currently assembling.  */
  insn_template tm;

  /* SUFFIX holds the instruction size suffix for byte, word, dword
     or qword, if given.  */
  char suffix;

  /* OPCODE_LENGTH holds the number of base opcode bytes.  */
  unsigned char opcode_length;

  /* OPERANDS gives the number of given operands.  */
  unsigned int operands;

  /* REG_OPERANDS, DISP_OPERANDS, MEM_OPERANDS, IMM_OPERANDS give the number
     of given register, displacement, memory operands and immediate
     operands.  */
  unsigned int reg_operands, disp_operands, mem_operands, imm_operands;

  /* TYPES [i] is the type (see above #defines) which tells us how to
     use OP[i] for the corresponding operand.  */
  i386_operand_type types[MAX_OPERANDS];

  /* Displacement expression, immediate expression, or register for each
     operand.  */
  union i386_op op[MAX_OPERANDS];

  /* Flags for operands.  */
  unsigned int flags[MAX_OPERANDS];
#define Operand_PCrel 1
#define Operand_Mem   2
#define Operand_Signed 4 /* .insn only */

  /* Relocation type for operand */
  enum bfd_reloc_code_real reloc[MAX_OPERANDS];

  /* BASE_REG, INDEX_REG, and LOG2_SCALE_FACTOR are used to encode
     the base index byte below.  */
  const reg_entry *base_reg;
  const reg_entry *index_reg;
  unsigned int log2_scale_factor;

  /* SEG gives the seg_entries of this insn.  They are zero unless
     explicit segment overrides are given.  */
  const reg_entry *seg[2];

  /* PREFIX holds all the given prefix opcodes (usually null).
     PREFIXES is the number of prefix opcodes.  */
  unsigned int prefixes;
  unsigned char prefix[MAX_PREFIXES];

  /* .insn allows for reserved opcode spaces.  */
  unsigned char insn_opcode_space;

  /* .insn also allows (requires) specifying immediate size.  */
  unsigned char imm_bits[MAX_OPERANDS];

  /* Register is in low 3 bits of opcode.  */
  bool short_form;

  /* The operand to a branch insn indicates an absolute branch.  */
  bool jumpabsolute;

  /* The operand to a branch insn indicates a far branch.  */
  bool far_branch;

  /* There is a memory operand of (%dx) which should be only used
     with input/output instructions.  */
  bool input_output_operand;

  /* Extended states.  */
  enum
    {
      /* Use MMX state.  */
      xstate_mmx = 1 << 0,
      /* Use XMM state.  */
      xstate_xmm = 1 << 1,
      /* Use YMM state.  */
      xstate_ymm = 1 << 2 | xstate_xmm,
      /* Use ZMM state.  */
      xstate_zmm = 1 << 3 | xstate_ymm,
      /* Use TMM state.  */
      xstate_tmm = 1 << 4,
      /* Use MASK state.  */
      xstate_mask = 1 << 5
    } xstate;

  /* Has GOTPC or TLS relocation.  */
  bool has_gotpc_tls_reloc;

  /* RM and SIB are the modrm byte and the sib byte where the
     addressing modes of this insn are encoded.  */
  modrm_byte rm;
  rex_byte rex;
  rex_byte vrex;
  sib_byte sib;
  vex_prefix vex;

  /* Masking attributes.

     The struct describes masking, applied to OPERAND in the instruction.
     REG is a pointer to the corresponding mask register.  ZEROING tells
     whether merging or zeroing mask is used.  */
  struct Mask_Operation
  {
    const reg_entry *reg;
    unsigned int zeroing;
    /* The operand where this operation is associated.  */
    unsigned int operand;
  } mask;

  /* Rounding control and SAE attributes.  */
  struct RC_Operation
  {
    enum rc_type
      {
	rc_none = -1,
	rne,
	rd,
	ru,
	rz,
	saeonly
      } type;
    /* In Intel syntax the operand modifier form is supposed to be used, but
       we continue to accept the immediate forms as well.  */
    bool modifier;
  } rounding;

  /* Broadcasting attributes.

     The struct describes broadcasting, applied to OPERAND.  TYPE
     expresses the broadcast factor.  */
  struct Broadcast_Operation
  {
    /* Type of broadcast: {1to2}, {1to4}, {1to8}, {1to16} or {1to32}.  */
    unsigned int type;

    /* Index of broadcasted operand.  */
    unsigned int operand;

    /* Number of bytes to broadcast.  */
    unsigned int bytes;
  } broadcast;

  /* Compressed disp8*N attribute.  */
  unsigned int memshift;

  /* Prefer load or store in encoding.  */
  enum
    {
      dir_encoding_default = 0,
      dir_encoding_load,
      dir_encoding_store,
      dir_encoding_swap
    } dir_encoding;

  /* Prefer 8bit, 16bit, 32bit displacement in encoding.  */
  enum
    {
      disp_encoding_default = 0,
      disp_encoding_8bit,
      disp_encoding_16bit,
      disp_encoding_32bit
    } disp_encoding;

  /* Prefer the REX byte in encoding.  */
  bool rex_encoding;

  /* Disable instruction size optimization.  */
  bool no_optimize;

  /* How to encode vector instructions.  */
  enum
    {
      vex_encoding_default = 0,
      vex_encoding_vex,
      vex_encoding_vex3,
      vex_encoding_evex,
      vex_encoding_evex512,
      vex_encoding_error
    } vec_encoding;

  /* REP prefix.  */
  const char *rep_prefix;

  /* HLE prefix.  */
  const char *hle_prefix;

  /* Have BND prefix.  */
  const char *bnd_prefix;

  /* Have NOTRACK prefix.  */
  const char *notrack_prefix;

  /* Error message.  */
  enum i386_error error;
};

typedef struct _i386_insn i386_insn;

/* Link RC type with corresponding string, that'll be looked for in
   asm.  */
struct RC_name
{
  enum rc_type type;
  const char *name;
  unsigned int len;
};

static const struct RC_name RC_NamesTable[] =
{
  { rne, STRING_COMMA_LEN ("rn-sae") },
  { rd,  STRING_COMMA_LEN ("rd-sae") },
  { ru,  STRING_COMMA_LEN ("ru-sae") },
  { rz,  STRING_COMMA_LEN ("rz-sae") },
  { saeonly, STRING_COMMA_LEN ("sae") },
};

/* To be indexed by segment register number.  */
static const unsigned char i386_seg_prefixes[] = {
  ES_PREFIX_OPCODE,
  CS_PREFIX_OPCODE,
  SS_PREFIX_OPCODE,
  DS_PREFIX_OPCODE,
  FS_PREFIX_OPCODE,
  GS_PREFIX_OPCODE
};

/* List of chars besides those in app.c:symbol_chars that can start an
   operand.  Used to prevent the scrubber eating vital white-space.  */
const char extra_symbol_chars[] = "*%-([{}"
#ifdef LEX_AT
	"@"
#endif
#ifdef LEX_QM
	"?"
#endif
	;

#if ((defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)) \
     && !defined (TE_GNU) \
     && !defined (TE_LINUX) \
     && !defined (TE_Haiku) \
     && !defined (TE_FreeBSD) \
     && !defined (TE_DragonFly) \
     && !defined (TE_NetBSD))
/* This array holds the chars that always start a comment.  If the
   pre-processor is disabled, these aren't very useful.  The option
   --divide will remove '/' from this list.  */
const char *i386_comment_chars = "#/";
#define SVR4_COMMENT_CHARS 1
#define PREFIX_SEPARATOR '\\'

#else
const char *i386_comment_chars = "#";
#define PREFIX_SEPARATOR '/'
#endif

/* This array holds the chars that only start a comment at the beginning of
   a line.  If the line seems to have the form '# 123 filename'
   .line and .file directives will appear in the pre-processed output.
   Note that input_file.c hand checks for '#' at the beginning of the
   first line of the input file.  This is because the compiler outputs
   #NO_APP at the beginning of its output.
   Also note that comments started like this one will always work if
   '/' isn't otherwise defined.  */
const char line_comment_chars[] = "#/";

const char line_separator_chars[] = ";";

/* Chars that can be used to separate mant from exp in floating point
   nums.  */
const char EXP_CHARS[] = "eE";

/* Chars that mean this number is a floating point constant
   As in 0f12.456
   or 0d1.2345e12.  */
const char FLT_CHARS[] = "fFdDxXhHbB";

/* Tables for lexical analysis.  */
static char mnemonic_chars[256];
static char register_chars[256];
static char operand_chars[256];

/* Lexical macros.  */
#define is_operand_char(x) (operand_chars[(unsigned char) x])
#define is_register_char(x) (register_chars[(unsigned char) x])
#define is_space_char(x) ((x) == ' ')

/* All non-digit non-letter characters that may occur in an operand and
   which aren't already in extra_symbol_chars[].  */
static const char operand_special_chars[] = "$+,)._~/<>|&^!=:@]";

/* md_assemble() always leaves the strings it's passed unaltered.  To
   effect this we maintain a stack of saved characters that we've smashed
   with '\0's (indicating end of strings for various sub-fields of the
   assembler instruction).  */
static char save_stack[32];
static char *save_stack_p;
#define END_STRING_AND_SAVE(s) \
	do { *save_stack_p++ = *(s); *(s) = '\0'; } while (0)
#define RESTORE_END_STRING(s) \
	do { *(s) = *--save_stack_p; } while (0)
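
/* Illustrative usage sketch (annotation, not from the original source):

     char *op_end = ...;               (end of a mnemonic/operand field)
     END_STRING_AND_SAVE (op_end);     (NUL-terminate and save *op_end)
     ...parse the NUL-terminated sub-string...
     RESTORE_END_STRING (op_end);      (put the original character back)

   Saves and restores must nest properly and stay within the 32 slots
   of save_stack.  */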

/* The instruction we're assembling.  */
static i386_insn i;

/* Possible templates for current insn.  */
static const templates *current_templates;

/* Per instruction expressionS buffers: max displacements & immediates.  */
static expressionS disp_expressions[MAX_MEMORY_OPERANDS];
static expressionS im_expressions[MAX_IMMEDIATE_OPERANDS];

/* Current operand we are working on.  */
static int this_operand = -1;

/* Are we processing a .insn directive?  */
#define dot_insn() (i.tm.mnem_off == MN__insn)

/* We support four different modes.  FLAG_CODE variable is used to distinguish
   these.  */

enum flag_code {
	CODE_32BIT,
	CODE_16BIT,
	CODE_64BIT };

static enum flag_code flag_code;
static unsigned int object_64bit;
static unsigned int disallow_64bit_reloc;
static int use_rela_relocations = 0;
/* __tls_get_addr/___tls_get_addr symbol for TLS.  */
static const char *tls_get_addr;

#if ((defined (OBJ_MAYBE_COFF) && defined (OBJ_MAYBE_AOUT)) \
     || defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
     || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))

/* The ELF ABI to use.  */
enum x86_elf_abi
{
  I386_ABI,
  X86_64_ABI,
  X86_64_X32_ABI
};

static enum x86_elf_abi x86_elf_abi = I386_ABI;
#endif

#if defined (TE_PE) || defined (TE_PEP)
/* Use big object file format.  */
static int use_big_obj = 0;
#endif

#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
/* 1 if generating code for a shared library.  */
static int shared = 0;

unsigned int x86_sframe_cfa_sp_reg;
/* The other CFA base register for SFrame stack trace info.  */
unsigned int x86_sframe_cfa_fp_reg;
unsigned int x86_sframe_cfa_ra_reg;

#endif

/* 1 for intel syntax,
   0 if att syntax.  */
static int intel_syntax = 0;

static enum x86_64_isa
{
  amd64 = 1,	/* AMD64 ISA.  */
  intel64	/* Intel64 ISA.  */
} isa64;

/* 1 for intel mnemonic,
   0 if att mnemonic.  */
static int intel_mnemonic = !SYSV386_COMPAT;

/* 1 if pseudo registers are permitted.  */
static int allow_pseudo_reg = 0;

/* 1 if register prefix % not required.  */
static int allow_naked_reg = 0;

/* 1 if the assembler should add BND prefix for all control-transferring
   instructions supporting it, even if this prefix wasn't specified
   explicitly.  */
static int add_bnd_prefix = 0;

/* 1 if pseudo index register, eiz/riz, is allowed.  */
static int allow_index_reg = 0;

/* 1 if the assembler should ignore LOCK prefix, even if it was
   specified explicitly.  */
static int omit_lock_prefix = 0;

/* 1 if the assembler should encode lfence, mfence, and sfence as
   "lock addl $0, (%{re}sp)".  */
static int avoid_fence = 0;

/* 1 if lfence should be inserted after every load.  */
static int lfence_after_load = 0;

/* Non-zero if lfence should be inserted before indirect branch.  */
static enum lfence_before_indirect_branch_kind
  {
    lfence_branch_none = 0,
    lfence_branch_register,
    lfence_branch_memory,
    lfence_branch_all
  }
lfence_before_indirect_branch;

/* Non-zero if lfence should be inserted before ret.  */
static enum lfence_before_ret_kind
  {
    lfence_before_ret_none = 0,
    lfence_before_ret_not,
    lfence_before_ret_or,
    lfence_before_ret_shl
  }
lfence_before_ret;

/* Kind of the previous instruction: other, a .byte-style directive, or
   a prefix.  */
static struct
  {
    segT seg;
    const char *file;
    const char *name;
    unsigned int line;
    enum last_insn_kind
      {
	last_insn_other = 0,
	last_insn_directive,
	last_insn_prefix
      } kind;
  } last_insn;

/* 1 if the assembler should generate relax relocations.  */

static int generate_relax_relocations
  = DEFAULT_GENERATE_X86_RELAX_RELOCATIONS;

static enum check_kind
  {
    check_none = 0,
    check_warning,
    check_error
  }
sse_check, operand_check = check_warning;

/* Non-zero if branches should be aligned within power of 2 boundary.  */
static int align_branch_power = 0;

/* Types of branches to align.  */
enum align_branch_kind
  {
    align_branch_none = 0,
    align_branch_jcc = 1,
    align_branch_fused = 2,
    align_branch_jmp = 3,
    align_branch_call = 4,
    align_branch_indirect = 5,
    align_branch_ret = 6
  };

/* Type bits of branches to align.  */
enum align_branch_bit
  {
    align_branch_jcc_bit = 1 << align_branch_jcc,
    align_branch_fused_bit = 1 << align_branch_fused,
    align_branch_jmp_bit = 1 << align_branch_jmp,
    align_branch_call_bit = 1 << align_branch_call,
    align_branch_indirect_bit = 1 << align_branch_indirect,
    align_branch_ret_bit = 1 << align_branch_ret
  };

static unsigned int align_branch = (align_branch_jcc_bit
				    | align_branch_fused_bit
				    | align_branch_jmp_bit);

/* Types of condition jump used by macro-fusion.  */
enum mf_jcc_kind
  {
    mf_jcc_jo = 0,  /* base opcode 0x70  */
    mf_jcc_jc,      /* base opcode 0x72  */
    mf_jcc_je,      /* base opcode 0x74  */
    mf_jcc_jna,     /* base opcode 0x76  */
    mf_jcc_js,      /* base opcode 0x78  */
    mf_jcc_jp,      /* base opcode 0x7a  */
    mf_jcc_jl,      /* base opcode 0x7c  */
    mf_jcc_jle,     /* base opcode 0x7e  */
  };

/* Types of compare flag-modifying instructions used by macro-fusion.  */
enum mf_cmp_kind
  {
    mf_cmp_test_and, /* test/cmp */
    mf_cmp_alu_cmp,  /* add/sub/cmp */
    mf_cmp_incdec    /* inc/dec */
  };

/* The maximum padding size for fused jcc.  CMP like instruction can
   be 9 bytes and jcc can be 6 bytes.  Leave room just in case for
   prefixes.  */
#define MAX_FUSED_JCC_PADDING_SIZE 20

/* The maximum number of prefixes added for an instruction.  */
static unsigned int align_branch_prefix_size = 5;

/* Optimization:
   1. Clear the REX_W bit with register operand if possible.
   2. Above plus use 128bit vector instruction to clear the full vector
      register.
 */
static int optimize = 0;

/* Optimization:
   1. Clear the REX_W bit with register operand if possible.
   2. Above plus use 128bit vector instruction to clear the full vector
      register.
   3. Above plus optimize "test{q,l,w} $imm8,%r{64,32,16}" to
      "testb $imm7,%r8".
 */
static int optimize_for_space = 0;

/* Register prefix used for error message.  */
static const char *register_prefix = "%";

/* Used in 16 bit gcc mode to add an l suffix to call, ret, enter,
   leave, push, and pop instructions so that gcc has the same stack
   frame as in 32 bit mode.  */
static char stackop_size = '\0';

/* Non-zero to optimize code alignment.  */
int optimize_align_code = 1;

/* Non-zero to quieten some warnings.  */
static int quiet_warnings = 0;

/* Guard to avoid repeated warnings about non-16-bit code on 16-bit CPUs.  */
static bool pre_386_16bit_warned;

/* CPU name.  */
static const char *cpu_arch_name = NULL;
static char *cpu_sub_arch_name = NULL;

/* CPU feature flags.  */
static i386_cpu_flags cpu_arch_flags = CPU_UNKNOWN_FLAGS;

/* If we have selected a cpu we are generating instructions for.  */
static int cpu_arch_tune_set = 0;

/* Cpu we are generating instructions for.  */
enum processor_type cpu_arch_tune = PROCESSOR_UNKNOWN;

/* CPU instruction set architecture used.  */
enum processor_type cpu_arch_isa = PROCESSOR_UNKNOWN;

/* CPU feature flags of instruction set architecture used.  */
i386_cpu_flags cpu_arch_isa_flags;

/* If set, conditional jumps are not automatically promoted to handle
   larger than a byte offset.  */
static bool no_cond_jump_promotion = false;

/* This will be set from an expression parser hook if there's any
   applicable operator involved in an expression.  */
static enum {
  expr_operator_none,
  expr_operator_present,
  expr_large_value,
} expr_mode;

/* Encode SSE instructions with VEX prefix.  */
static unsigned int sse2avx;

/* Encode aligned vector move as unaligned vector move.  */
static unsigned int use_unaligned_vector_move;

/* Maximum permitted vector size.  */
#define VSZ_DEFAULT VSZ512
static unsigned int vector_size = VSZ_DEFAULT;

/* Encode scalar AVX instructions with specific vector length.  */
static enum
  {
    vex128 = 0,
    vex256
  } avxscalar;

/* Encode VEX WIG instructions with specific vex.w.  */
static enum
  {
    vexw0 = 0,
    vexw1
  } vexwig;

/* Encode scalar EVEX LIG instructions with specific vector length.  */
static enum
  {
    evexl128 = 0,
    evexl256,
    evexl512
  } evexlig;

/* Encode EVEX WIG instructions with specific evex.w.  */
static enum
  {
    evexw0 = 0,
    evexw1
  } evexwig;

/* Value to encode in EVEX RC bits, for SAE-only instructions.  */
static enum rc_type evexrcig = rne;

/* Pre-defined "_GLOBAL_OFFSET_TABLE_".  */
static symbolS *GOT_symbol;

/* The dwarf2 return column, adjusted for 32 or 64 bit.  */
unsigned int x86_dwarf2_return_column;

/* The dwarf2 data alignment, adjusted for 32 or 64 bit.  */
int x86_cie_data_alignment;

/* Interface to relax_segment.
   There are 3 major relax states for 386 jump insns because the
   different types of jumps add different sizes to frags when we're
   figuring out what sort of jump to choose to reach a given label.

   BRANCH_PADDING, BRANCH_PREFIX and FUSED_JCC_PADDING are used to align
   branches which are handled by md_estimate_size_before_relax() and
   i386_generic_table_relax_frag().  */

/* Types.  */
#define UNCOND_JUMP 0
#define COND_JUMP 1
#define COND_JUMP86 2
#define BRANCH_PADDING 3
#define BRANCH_PREFIX 4
#define FUSED_JCC_PADDING 5

/* Sizes.  */
#define CODE16	1
#define SMALL	0
#define SMALL16 (SMALL | CODE16)
#define BIG	2
#define BIG16	(BIG | CODE16)

#ifndef INLINE
#ifdef __GNUC__
#define INLINE __inline__
#else
#define INLINE
#endif
#endif

#define ENCODE_RELAX_STATE(type, size) \
  ((relax_substateT) (((type) << 2) | (size)))
#define TYPE_FROM_RELAX_STATE(s) \
  ((s) >> 2)
#define DISP_SIZE_FROM_RELAX_STATE(s) \
    ((((s) & 3) == BIG ? 4 : (((s) & 3) == BIG16 ? 2 : 1)))
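
/* Worked example (annotation, not from the original source):
   ENCODE_RELAX_STATE (COND_JUMP, BIG) is (1 << 2) | 2 == 6;
   TYPE_FROM_RELAX_STATE (6) == COND_JUMP and
   DISP_SIZE_FROM_RELAX_STATE (6) == 4, i.e. a conditional jump taking a
   4-byte displacement.  */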

/* This table is used by relax_frag to promote short jumps to long
   ones where necessary.  SMALL (short) jumps may be promoted to BIG
   (32 bit long) ones, and SMALL16 jumps to BIG16 (16 bit long).  We
   don't allow a short jump in a 32 bit code segment to be promoted to
   a 16 bit offset jump because it's slower (requires data size
   prefix), and doesn't work, unless the destination is in the bottom
   64k of the code segment (The top 16 bits of eip are zeroed).  */

const relax_typeS md_relax_table[] =
{
  /* The fields are:
     1) most positive reach of this state,
     2) most negative reach of this state,
     3) how many bytes this mode will have in the variable part of the frag
     4) which index into the table to try if we can't fit into this one.  */

  /* UNCOND_JUMP states.  */
  {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (UNCOND_JUMP, BIG)},
  {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (UNCOND_JUMP, BIG16)},
  /* dword jmp adds 4 bytes to frag:
     0 extra opcode bytes, 4 displacement bytes.  */
  {0, 0, 4, 0},
  /* word jmp adds 2 bytes to frag:
     0 extra opcode bytes, 2 displacement bytes.  */
  {0, 0, 2, 0},

  /* COND_JUMP states.  */
  {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP, BIG)},
  {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP, BIG16)},
  /* dword conditionals add 5 bytes to frag:
     1 extra opcode byte, 4 displacement bytes.  */
  {0, 0, 5, 0},
  /* word conditionals add 3 bytes to frag:
     1 extra opcode byte, 2 displacement bytes.  */
  {0, 0, 3, 0},

  /* COND_JUMP86 states.  */
  {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP86, BIG)},
  {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP86, BIG16)},
  /* dword conditionals add 5 bytes to frag:
     1 extra opcode byte, 4 displacement bytes.  */
  {0, 0, 5, 0},
  /* word conditionals add 4 bytes to frag:
     1 displacement byte and a 3 byte long branch insn.  */
  {0, 0, 4, 0}
};

#define ARCH(n, t, f, s) \
  { STRING_COMMA_LEN (#n), s, PROCESSOR_ ## t, vsz_none, CPU_ ## f ## _FLAGS, \
    CPU_NONE_FLAGS }
#define SUBARCH(n, e, d, s) \
  { STRING_COMMA_LEN (#n), s, PROCESSOR_NONE, vsz_none, CPU_ ## e ## _FLAGS, \
    CPU_ ## d ## _FLAGS }
#define VECARCH(n, e, d, v) \
  { STRING_COMMA_LEN (#n), false, PROCESSOR_NONE, vsz_ ## v, \
    CPU_ ## e ## _FLAGS, CPU_ ## d ## _FLAGS }

static const arch_entry cpu_arch[] =
{
  /* Do not replace the first two entries - i386_target_format() and
     set_cpu_arch() rely on them being there in this order.  */
  ARCH (generic32, GENERIC32, GENERIC32, false),
  ARCH (generic64, GENERIC64, GENERIC64, false),
  ARCH (i8086, UNKNOWN, NONE, false),
  ARCH (i186, UNKNOWN, 186, false),
  ARCH (i286, UNKNOWN, 286, false),
  ARCH (i386, I386, 386, false),
  ARCH (i486, I486, 486, false),
  ARCH (i586, PENTIUM, 586, false),
  ARCH (i686, PENTIUMPRO, 686, false),
  ARCH (pentium, PENTIUM, 586, false),
  ARCH (pentiumpro, PENTIUMPRO, PENTIUMPRO, false),
  ARCH (pentiumii, PENTIUMPRO, P2, false),
  ARCH (pentiumiii, PENTIUMPRO, P3, false),
  ARCH (pentium4, PENTIUM4, P4, false),
  ARCH (prescott, NOCONA, CORE, false),
  ARCH (nocona, NOCONA, NOCONA, false),
  ARCH (yonah, CORE, CORE, true),
  ARCH (core, CORE, CORE, false),
  ARCH (merom, CORE2, CORE2, true),
  ARCH (core2, CORE2, CORE2, false),
  ARCH (corei7, COREI7, COREI7, false),
  ARCH (iamcu, IAMCU, IAMCU, false),
  ARCH (k6, K6, K6, false),
  ARCH (k6_2, K6, K6_2, false),
  ARCH (athlon, ATHLON, ATHLON, false),
  ARCH (sledgehammer, K8, K8, true),
  ARCH (opteron, K8, K8, false),
  ARCH (k8, K8, K8, false),
  ARCH (amdfam10, AMDFAM10, AMDFAM10, false),
  ARCH (bdver1, BD, BDVER1, false),
  ARCH (bdver2, BD, BDVER2, false),
  ARCH (bdver3, BD, BDVER3, false),
  ARCH (bdver4, BD, BDVER4, false),
  ARCH (znver1, ZNVER, ZNVER1, false),
  ARCH (znver2, ZNVER, ZNVER2, false),
  ARCH (znver3, ZNVER, ZNVER3, false),
  ARCH (znver4, ZNVER, ZNVER4, false),
  ARCH (btver1, BT, BTVER1, false),
  ARCH (btver2, BT, BTVER2, false),

  SUBARCH (8087, 8087, ANY_8087, false),
  SUBARCH (87, NONE, ANY_8087, false), /* Disable only!  */
  SUBARCH (287, 287, ANY_287, false),
  SUBARCH (387, 387, ANY_387, false),
  SUBARCH (687, 687, ANY_687, false),
  SUBARCH (cmov, CMOV, CMOV, false),
  SUBARCH (fxsr, FXSR, ANY_FXSR, false),
  SUBARCH (mmx, MMX, ANY_MMX, false),
  SUBARCH (sse, SSE, ANY_SSE, false),
  SUBARCH (sse2, SSE2, ANY_SSE2, false),
  SUBARCH (sse3, SSE3, ANY_SSE3, false),
  SUBARCH (sse4a, SSE4A, ANY_SSE4A, false),
  SUBARCH (ssse3, SSSE3, ANY_SSSE3, false),
  SUBARCH (sse4.1, SSE4_1, ANY_SSE4_1, false),
  SUBARCH (sse4.2, SSE4_2, ANY_SSE4_2, false),
  SUBARCH (sse4, SSE4_2, ANY_SSE4_1, false),
  VECARCH (avx, AVX, ANY_AVX, reset),
  VECARCH (avx2, AVX2, ANY_AVX2, reset),
  VECARCH (avx512f, AVX512F, ANY_AVX512F, reset),
  VECARCH (avx512cd, AVX512CD, ANY_AVX512CD, reset),
  VECARCH (avx512er, AVX512ER, ANY_AVX512ER, reset),
  VECARCH (avx512pf, AVX512PF, ANY_AVX512PF, reset),
  VECARCH (avx512dq, AVX512DQ, ANY_AVX512DQ, reset),
  VECARCH (avx512bw, AVX512BW, ANY_AVX512BW, reset),
  VECARCH (avx512vl, AVX512VL, ANY_AVX512VL, reset),
  SUBARCH (monitor, MONITOR, MONITOR, false),
  SUBARCH (vmx, VMX, ANY_VMX, false),
  SUBARCH (vmfunc, VMFUNC, ANY_VMFUNC, false),
  SUBARCH (smx, SMX, SMX, false),
  SUBARCH (xsave, XSAVE, ANY_XSAVE, false),
  SUBARCH (xsaveopt, XSAVEOPT, ANY_XSAVEOPT, false),
  SUBARCH (xsavec, XSAVEC, ANY_XSAVEC, false),
  SUBARCH (xsaves, XSAVES, ANY_XSAVES, false),
  SUBARCH (aes, AES, ANY_AES, false),
  SUBARCH (pclmul, PCLMULQDQ, ANY_PCLMULQDQ, false),
  SUBARCH (clmul, PCLMULQDQ, ANY_PCLMULQDQ, true),
  SUBARCH (fsgsbase, FSGSBASE, FSGSBASE, false),
  SUBARCH (rdrnd, RDRND, RDRND, false),
  SUBARCH (f16c, F16C, ANY_F16C, false),
  SUBARCH (bmi2, BMI2, BMI2, false),
  SUBARCH (fma, FMA, ANY_FMA, false),
  SUBARCH (fma4, FMA4, ANY_FMA4, false),
  SUBARCH (xop, XOP, ANY_XOP, false),
  SUBARCH (lwp, LWP, ANY_LWP, false),
  SUBARCH (movbe, MOVBE, MOVBE, false),
  SUBARCH (cx16, CX16, CX16, false),
  SUBARCH (lahf_sahf, LAHF_SAHF, LAHF_SAHF, false),
  SUBARCH (ept, EPT, ANY_EPT, false),
  SUBARCH (lzcnt, LZCNT, LZCNT, false),
  SUBARCH (popcnt, POPCNT, POPCNT, false),
  SUBARCH (hle, HLE, HLE, false),
  SUBARCH (rtm, RTM, ANY_RTM, false),
  SUBARCH (tsx, TSX, TSX, false),
  SUBARCH (invpcid, INVPCID, INVPCID, false),
  SUBARCH (clflush, CLFLUSH, CLFLUSH, false),
  SUBARCH (nop, NOP, NOP, false),
  SUBARCH (syscall, SYSCALL, SYSCALL, false),
  SUBARCH (rdtscp, RDTSCP, RDTSCP, false),
  SUBARCH (3dnow, 3DNOW, ANY_3DNOW, false),
  SUBARCH (3dnowa, 3DNOWA, ANY_3DNOWA, false),
  SUBARCH (padlock, PADLOCK, PADLOCK, false),
  SUBARCH (pacifica, SVME, ANY_SVME, true),
  SUBARCH (svme, SVME, ANY_SVME, false),
  SUBARCH (abm, ABM, ABM, false),
  SUBARCH (bmi, BMI, BMI, false),
  SUBARCH (tbm, TBM, TBM, false),
  SUBARCH (adx, ADX, ADX, false),
  SUBARCH (rdseed, RDSEED, RDSEED, false),
  SUBARCH (prfchw, PRFCHW, PRFCHW, false),
  SUBARCH (smap, SMAP, SMAP, false),
  SUBARCH (mpx, MPX, ANY_MPX, false),
  SUBARCH (sha, SHA, ANY_SHA, false),
  SUBARCH (clflushopt, CLFLUSHOPT, CLFLUSHOPT, false),
  SUBARCH (prefetchwt1, PREFETCHWT1, PREFETCHWT1, false),
  SUBARCH (se1, SE1, SE1, false),
  SUBARCH (clwb, CLWB, CLWB, false),
  VECARCH (avx512ifma, AVX512IFMA, ANY_AVX512IFMA, reset),
  VECARCH (avx512vbmi, AVX512VBMI, ANY_AVX512VBMI, reset),
  VECARCH (avx512_4fmaps, AVX512_4FMAPS, ANY_AVX512_4FMAPS, reset),
  VECARCH (avx512_4vnniw, AVX512_4VNNIW, ANY_AVX512_4VNNIW, reset),
  VECARCH (avx512_vpopcntdq, AVX512_VPOPCNTDQ, ANY_AVX512_VPOPCNTDQ, reset),
  VECARCH (avx512_vbmi2, AVX512_VBMI2, ANY_AVX512_VBMI2, reset),
  VECARCH (avx512_vnni, AVX512_VNNI, ANY_AVX512_VNNI, reset),
  VECARCH (avx512_bitalg, AVX512_BITALG, ANY_AVX512_BITALG, reset),
  VECARCH (avx_vnni, AVX_VNNI, ANY_AVX_VNNI, reset),
  SUBARCH (clzero, CLZERO, CLZERO, false),
  SUBARCH (mwaitx, MWAITX, MWAITX, false),
  SUBARCH (ospke, OSPKE, ANY_OSPKE, false),
  SUBARCH (rdpid, RDPID, RDPID, false),
  SUBARCH (ptwrite, PTWRITE, PTWRITE, false),
  SUBARCH (ibt, IBT, IBT, false),
  SUBARCH (shstk, SHSTK, SHSTK, false),
  SUBARCH (gfni, GFNI, ANY_GFNI, false),
  VECARCH (vaes, VAES, ANY_VAES, reset),
  VECARCH (vpclmulqdq, VPCLMULQDQ, ANY_VPCLMULQDQ, reset),
  SUBARCH (wbnoinvd, WBNOINVD, WBNOINVD, false),
  SUBARCH (pconfig, PCONFIG, PCONFIG, false),
  SUBARCH (waitpkg, WAITPKG, WAITPKG, false),
  SUBARCH (cldemote, CLDEMOTE, CLDEMOTE, false),
  SUBARCH (amx_int8, AMX_INT8, ANY_AMX_INT8, false),
  SUBARCH (amx_bf16, AMX_BF16, ANY_AMX_BF16, false),
  SUBARCH (amx_fp16, AMX_FP16, ANY_AMX_FP16, false),
  SUBARCH (amx_complex, AMX_COMPLEX, ANY_AMX_COMPLEX, false),
  SUBARCH (amx_tile, AMX_TILE, ANY_AMX_TILE, false),
  SUBARCH (movdiri, MOVDIRI, MOVDIRI, false),
  SUBARCH (movdir64b, MOVDIR64B, MOVDIR64B, false),
  VECARCH (avx512_bf16, AVX512_BF16, ANY_AVX512_BF16, reset),
  VECARCH (avx512_vp2intersect, AVX512_VP2INTERSECT,
	   ANY_AVX512_VP2INTERSECT, reset),
  SUBARCH (tdx, TDX, TDX, false),
  SUBARCH (enqcmd, ENQCMD, ENQCMD, false),
  SUBARCH (serialize, SERIALIZE, SERIALIZE, false),
  SUBARCH (rdpru, RDPRU, RDPRU, false),
  SUBARCH (mcommit, MCOMMIT, MCOMMIT, false),
  SUBARCH (sev_es, SEV_ES, ANY_SEV_ES, false),
  SUBARCH (tsxldtrk, TSXLDTRK, ANY_TSXLDTRK, false),
  SUBARCH (kl, KL, ANY_KL, false),
  SUBARCH (widekl, WIDEKL, ANY_WIDEKL, false),
  SUBARCH (uintr, UINTR, UINTR, false),
  SUBARCH (hreset, HRESET, HRESET, false),
  VECARCH (avx512_fp16, AVX512_FP16, ANY_AVX512_FP16, reset),
  SUBARCH (prefetchi, PREFETCHI, PREFETCHI, false),
  VECARCH (avx_ifma, AVX_IFMA, ANY_AVX_IFMA, reset),
  VECARCH (avx_vnni_int8, AVX_VNNI_INT8, ANY_AVX_VNNI_INT8, reset),
  SUBARCH (cmpccxadd, CMPCCXADD, CMPCCXADD, false),
  SUBARCH (wrmsrns, WRMSRNS, WRMSRNS, false),
  SUBARCH (msrlist, MSRLIST, MSRLIST, false),
  VECARCH (avx_ne_convert, AVX_NE_CONVERT, ANY_AVX_NE_CONVERT, reset),
  SUBARCH (rao_int, RAO_INT, RAO_INT, false),
  SUBARCH (rmpquery, RMPQUERY, ANY_RMPQUERY, false),
  SUBARCH (fred, FRED, ANY_FRED, false),
  SUBARCH (lkgs, LKGS, ANY_LKGS, false),
  VECARCH (avx_vnni_int16, AVX_VNNI_INT16, ANY_AVX_VNNI_INT16, reset),
  VECARCH (sha512, SHA512, ANY_SHA512, reset),
  VECARCH (sm3, SM3, ANY_SM3, reset),
  VECARCH (sm4, SM4, ANY_SM4, reset),
  SUBARCH (pbndkb, PBNDKB, PBNDKB, false),
  VECARCH (avx10.1, AVX10_1, ANY_AVX512F, set),
};

#undef SUBARCH
#undef ARCH

#ifdef I386COFF
/* Like s_lcomm_internal in gas/read.c but the alignment string
   is allowed to be optional.  */

static symbolS *
pe_lcomm_internal (int needs_align, symbolS *symbolP, addressT size)
{
  addressT align = 0;

  SKIP_WHITESPACE ();

  if (needs_align
      && *input_line_pointer == ',')
    {
      align = parse_align (needs_align - 1);

      if (align == (addressT) -1)
	return NULL;
    }
  else
    {
      if (size >= 8)
	align = 3;
      else if (size >= 4)
	align = 2;
      else if (size >= 2)
	align = 1;
      else
	align = 0;
    }

  bss_alloc (symbolP, size, align);
  return symbolP;
}

static void
pe_lcomm (int needs_align)
{
  s_comm_internal (needs_align * 2, pe_lcomm_internal);
}
#endif

const pseudo_typeS md_pseudo_table[] =
{
#if !defined(OBJ_AOUT) && !defined(USE_ALIGN_PTWO)
  {"align", s_align_bytes, 0},
#else
  {"align", s_align_ptwo, 0},
#endif
  {"arch", set_cpu_arch, 0},
#ifndef I386COFF
  {"bss", s_bss, 0},
#else
  {"lcomm", pe_lcomm, 1},
#endif
  {"ffloat", float_cons, 'f'},
  {"dfloat", float_cons, 'd'},
  {"tfloat", float_cons, 'x'},
  {"hfloat", float_cons, 'h'},
  {"bfloat16", float_cons, 'b'},
  {"value", cons, 2},
  {"slong", signed_cons, 4},
  {"insn", s_insn, 0},
  {"noopt", s_ignore, 0},
  {"optim", s_ignore, 0},
  {"code16gcc", set_16bit_gcc_code_flag, CODE_16BIT},
  {"code16", set_code_flag, CODE_16BIT},
  {"code32", set_code_flag, CODE_32BIT},
#ifdef BFD64
  {"code64", set_code_flag, CODE_64BIT},
#endif
  {"intel_syntax", set_intel_syntax, 1},
  {"att_syntax", set_intel_syntax, 0},
  {"intel_mnemonic", set_intel_mnemonic, 1},
  {"att_mnemonic", set_intel_mnemonic, 0},
  {"allow_index_reg", set_allow_index_reg, 1},
  {"disallow_index_reg", set_allow_index_reg, 0},
  {"sse_check", set_check, 0},
  {"operand_check", set_check, 1},
#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
  {"largecomm", handle_large_common, 0},
#else
  {"file", dwarf2_directive_file, 0},
  {"loc", dwarf2_directive_loc, 0},
  {"loc_mark_labels", dwarf2_directive_loc_mark_labels, 0},
#endif
#ifdef TE_PE
  {"secrel32", pe_directive_secrel, 0},
  {"secidx", pe_directive_secidx, 0},
#endif
  {0, 0, 0}
};

/* For interface with expression ().  */
extern char *input_line_pointer;

/* Hash table for instruction mnemonic lookup.  */
static htab_t op_hash;

/* Hash table for register lookup.  */
static htab_t reg_hash;

/* Various efficient no-op patterns for aligning code labels.
   Note: Don't try to assemble the instructions in the comments.
   0L and 0w are not legal.  */
static const unsigned char f32_1[] =
  {0x90};			/* nop			*/
static const unsigned char f32_2[] =
  {0x66,0x90};			/* xchg %ax,%ax		*/
static const unsigned char f32_3[] =
  {0x8d,0x76,0x00};		/* leal 0(%esi),%esi	*/
static const unsigned char f32_4[] =
  {0x8d,0x74,0x26,0x00};	/* leal 0(%esi,1),%esi	*/
static const unsigned char f32_6[] =
  {0x8d,0xb6,0x00,0x00,0x00,0x00};	/* leal 0L(%esi),%esi	*/
static const unsigned char f32_7[] =
  {0x8d,0xb4,0x26,0x00,0x00,0x00,0x00};	/* leal 0L(%esi,1),%esi */
static const unsigned char f16_3[] =
  {0x8d,0x74,0x00};			/* lea 0(%si),%si	*/
static const unsigned char f16_4[] =
  {0x8d,0xb4,0x00,0x00};		/* lea 0W(%si),%si	*/
static const unsigned char jump_disp8[] =
  {0xeb};				/* jmp disp8	       */
static const unsigned char jump32_disp32[] =
  {0xe9};				/* jmp disp32	       */
static const unsigned char jump16_disp32[] =
  {0x66,0xe9};				/* jmp disp32	       */
/* 32-bit NOP patterns.  */
static const unsigned char *const f32_patt[] = {
  f32_1, f32_2, f32_3, f32_4, NULL, f32_6, f32_7
};
/* 16-bit NOP patterns.  */
static const unsigned char *const f16_patt[] = {
  f32_1, f32_2, f16_3, f16_4
};
/* nopl (%[re]ax) */
static const unsigned char alt_3[] =
  {0x0f,0x1f,0x00};
/* nopl 0(%[re]ax) */
static const unsigned char alt_4[] =
  {0x0f,0x1f,0x40,0x00};
/* nopl 0(%[re]ax,%[re]ax,1) */
static const unsigned char alt_5[] =
  {0x0f,0x1f,0x44,0x00,0x00};
/* nopw 0(%[re]ax,%[re]ax,1) */
static const unsigned char alt_6[] =
  {0x66,0x0f,0x1f,0x44,0x00,0x00};
/* nopl 0L(%[re]ax) */
static const unsigned char alt_7[] =
  {0x0f,0x1f,0x80,0x00,0x00,0x00,0x00};
/* nopl 0L(%[re]ax,%[re]ax,1) */
static const unsigned char alt_8[] =
  {0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
/* nopw 0L(%[re]ax,%[re]ax,1) */
static const unsigned char alt_9[] =
  {0x66,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
/* nopw %cs:0L(%[re]ax,%[re]ax,1) */
static const unsigned char alt_10[] =
  {0x66,0x2e,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
/* data16 nopw %cs:0L(%eax,%eax,1) */
static const unsigned char alt_11[] =
  {0x66,0x66,0x2e,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
/* 32-bit and 64-bit NOP patterns.  */
static const unsigned char *const alt_patt[] = {
  f32_1, f32_2, alt_3, alt_4, alt_5, alt_6, alt_7, alt_8,
  alt_9, alt_10, alt_11
};
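
/* Illustrative note (annotation, not from the original source): a 4-byte
   pad on a CPU with the long-NOP extension uses alt_patt[4 - 1], i.e. the
   0f 1f 40 00 "nopl 0(%[re]ax)" sequence, while pre-686 tuning falls back
   to f32_patt[4 - 1], the 8d 74 26 00 lea form.  */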

/* Generate COUNT bytes of NOPs to WHERE from PATT with the maximum
   size of a single NOP instruction MAX_SINGLE_NOP_SIZE.  */

static void
i386_output_nops (char *where, const unsigned char *const *patt,
		  int count, int max_single_nop_size)

{
  /* Place the longer NOP first.  */
  int last;
  int offset;
  const unsigned char *nops;

  if (max_single_nop_size < 1)
    {
      as_fatal (_("i386_output_nops called to generate nops of at most %d bytes!"),
		max_single_nop_size);
      return;
    }

  nops = patt[max_single_nop_size - 1];

  /* Use the smaller one if the requested one isn't available.  */
  if (nops == NULL)
    {
      max_single_nop_size--;
      nops = patt[max_single_nop_size - 1];
    }

  last = count % max_single_nop_size;

  count -= last;
  for (offset = 0; offset < count; offset += max_single_nop_size)
    memcpy (where + offset, nops, max_single_nop_size);

  if (last)
    {
      nops = patt[last - 1];
      if (nops == NULL)
	{
	  /* Use the smaller one plus one-byte NOP if the needed one
	     isn't available.  */
	  last--;
	  nops = patt[last - 1];
	  memcpy (where + offset, nops, last);
	  where[offset + last] = *patt[0];
	}
      else
	memcpy (where + offset, nops, last);
    }
}
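
/* Worked example (annotation, not from the original source):
   i386_output_nops (where, alt_patt, 25, 11) emits two 11-byte NOPs
   followed by alt_patt[3 - 1], the 3-byte "nopl (%[re]ax)".  A remainder
   with no exact pattern, e.g. 5 with f32_patt, is covered by the next
   shorter pattern plus a one-byte NOP.  */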

static INLINE int
fits_in_imm7 (offsetT num)
{
  return (num & 0x7f) == num;
}

static INLINE int
fits_in_imm31 (offsetT num)
{
  return (num & 0x7fffffff) == num;
}

/* Generate COUNT bytes of NOPs to WHERE with the maximum size of a
   single NOP instruction LIMIT.  */

void
i386_generate_nops (fragS *fragP, char *where, offsetT count, int limit)
{
  const unsigned char *const *patt = NULL;
  int max_single_nop_size;
  /* Maximum number of NOPs before switching to jump over NOPs.  */
  int max_number_of_nops;

  switch (fragP->fr_type)
    {
    case rs_fill_nop:
    case rs_align_code:
      break;
    case rs_machine_dependent:
      /* Allow NOP padding for jumps and calls.  */
      if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PADDING
	  || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == FUSED_JCC_PADDING)
	break;
      /* Fall through.  */
    default:
      return;
    }

  /* We need to decide which NOP sequence to use for 32bit and
     64bit.  When -mtune= is used:

     1. For PROCESSOR_I386, PROCESSOR_I486, PROCESSOR_PENTIUM and
	PROCESSOR_GENERIC32, f32_patt will be used.
     2. For the rest, alt_patt will be used.

     When -mtune= isn't used, alt_patt will be used if
     cpu_arch_isa_flags has CpuNop.  Otherwise, f32_patt will
     be used.

     When -march= or .arch is used, we can't use anything beyond
     cpu_arch_isa_flags.  */

  if (flag_code == CODE_16BIT)
    {
      patt = f16_patt;
      max_single_nop_size = sizeof (f16_patt) / sizeof (f16_patt[0]);
      /* Limit number of NOPs to 2 in 16-bit mode.  */
      max_number_of_nops = 2;
    }
  else
    {
      if (fragP->tc_frag_data.isa == PROCESSOR_UNKNOWN)
	{
	  /* PROCESSOR_UNKNOWN means that all ISAs may be used.  */
	  switch (cpu_arch_tune)
	    {
	    case PROCESSOR_UNKNOWN:
	      /* We use cpu_arch_isa_flags to check if we SHOULD
		 optimize with nops.  */
	      if (fragP->tc_frag_data.isa_flags.bitfield.cpunop)
		patt = alt_patt;
	      else
		patt = f32_patt;
	      break;
	    case PROCESSOR_PENTIUM4:
	    case PROCESSOR_NOCONA:
	    case PROCESSOR_CORE:
	    case PROCESSOR_CORE2:
	    case PROCESSOR_COREI7:
	    case PROCESSOR_GENERIC64:
	    case PROCESSOR_K6:
	    case PROCESSOR_ATHLON:
	    case PROCESSOR_K8:
	    case PROCESSOR_AMDFAM10:
	    case PROCESSOR_BD:
	    case PROCESSOR_ZNVER:
	    case PROCESSOR_BT:
	      patt = alt_patt;
	      break;
	    case PROCESSOR_I386:
	    case PROCESSOR_I486:
	    case PROCESSOR_PENTIUM:
	    case PROCESSOR_PENTIUMPRO:
	    case PROCESSOR_IAMCU:
	    case PROCESSOR_GENERIC32:
	      patt = f32_patt;
	      break;
	    case PROCESSOR_NONE:
	      abort ();
	    }
	}
      else
	{
	  switch (fragP->tc_frag_data.tune)
	    {
	    case PROCESSOR_UNKNOWN:
	      /* When cpu_arch_isa is set, cpu_arch_tune shouldn't be
		 PROCESSOR_UNKNOWN.  */
	      abort ();
	      break;

	    case PROCESSOR_I386:
	    case PROCESSOR_I486:
	    case PROCESSOR_PENTIUM:
	    case PROCESSOR_IAMCU:
	    case PROCESSOR_K6:
	    case PROCESSOR_ATHLON:
	    case PROCESSOR_K8:
	    case PROCESSOR_AMDFAM10:
	    case PROCESSOR_BD:
	    case PROCESSOR_ZNVER:
	    case PROCESSOR_BT:
	    case PROCESSOR_GENERIC32:
	      /* We use cpu_arch_isa_flags to check if we CAN optimize
		 with nops.  */
	      if (fragP->tc_frag_data.isa_flags.bitfield.cpunop)
		patt = alt_patt;
	      else
		patt = f32_patt;
	      break;
	    case PROCESSOR_PENTIUMPRO:
	    case PROCESSOR_PENTIUM4:
	    case PROCESSOR_NOCONA:
	    case PROCESSOR_CORE:
	    case PROCESSOR_CORE2:
	    case PROCESSOR_COREI7:
	      if (fragP->tc_frag_data.isa_flags.bitfield.cpunop)
		patt = alt_patt;
	      else
		patt = f32_patt;
	      break;
	    case PROCESSOR_GENERIC64:
	      patt = alt_patt;
	      break;
	    case PROCESSOR_NONE:
	      abort ();
	    }
	}

      if (patt == f32_patt)
	{
	  max_single_nop_size = sizeof (f32_patt) / sizeof (f32_patt[0]);
	  /* Limit number of NOPs to 2 for older processors.  */
	  max_number_of_nops = 2;
	}
      else
	{
	  max_single_nop_size = sizeof (alt_patt) / sizeof (alt_patt[0]);
	  /* Limit number of NOPs to 7 for newer processors.  */
	  max_number_of_nops = 7;
	}
    }

  if (limit == 0)
    limit = max_single_nop_size;

  if (fragP->fr_type == rs_fill_nop)
    {
      /* Output NOPs for .nop directive.  */
      if (limit > max_single_nop_size)
	{
	  as_bad_where (fragP->fr_file, fragP->fr_line,
			_("invalid single nop size: %d "
			  "(expect within [0, %d])"),
			limit, max_single_nop_size);
	  return;
	}
    }
  else if (fragP->fr_type != rs_machine_dependent)
    fragP->fr_var = count;

  if ((count / max_single_nop_size) > max_number_of_nops)
    {
      /* Generate jump over NOPs.  */
      offsetT disp = count - 2;
      if (fits_in_imm7 (disp))
	{
	  /* Use "jmp disp8" if possible.  */
	  count = disp;
	  where[0] = jump_disp8[0];
	  where[1] = count;
	  where += 2;
	}
      else
	{
	  unsigned int size_of_jump;

	  if (flag_code == CODE_16BIT)
	    {
	      where[0] = jump16_disp32[0];
	      where[1] = jump16_disp32[1];
	      size_of_jump = 2;
	    }
	  else
	    {
	      where[0] = jump32_disp32[0];
	      size_of_jump = 1;
	    }

	  count -= size_of_jump + 4;
	  if (!fits_in_imm31 (count))
	    {
	      as_bad_where (fragP->fr_file, fragP->fr_line,
			    _("jump over nop padding out of range"));
	      return;
	    }

	  md_number_to_chars (where + size_of_jump, count, 4);
	  where += size_of_jump + 4;
	}
    }

  /* Generate multiple NOPs.  */
  i386_output_nops (where, patt, count, limit);
}

static INLINE int
operand_type_all_zero (const union i386_operand_type *x)
{
  switch (ARRAY_SIZE(x->array))
    {
    case 3:
      if (x->array[2])
	return 0;
      /* Fall through.  */
    case 2:
      if (x->array[1])
	return 0;
      /* Fall through.  */
    case 1:
      return !x->array[0];
    default:
      abort ();
    }
}

static INLINE void
operand_type_set (union i386_operand_type *x, unsigned int v)
{
  switch (ARRAY_SIZE(x->array))
    {
    case 3:
      x->array[2] = v;
      /* Fall through.  */
    case 2:
      x->array[1] = v;
      /* Fall through.  */
    case 1:
      x->array[0] = v;
      /* Fall through.  */
      break;
    default:
      abort ();
    }

  x->bitfield.class = ClassNone;
  x->bitfield.instance = InstanceNone;
}

static INLINE int
operand_type_equal (const union i386_operand_type *x,
		    const union i386_operand_type *y)
{
  switch (ARRAY_SIZE(x->array))
    {
    case 3:
      if (x->array[2] != y->array[2])
	return 0;
      /* Fall through.  */
    case 2:
      if (x->array[1] != y->array[1])
	return 0;
      /* Fall through.  */
    case 1:
      return x->array[0] == y->array[0];
      break;
    default:
      abort ();
    }
}

static INLINE bool
is_cpu (const insn_template *t, enum i386_cpu cpu)
{
  switch (cpu)
    {
    case Cpu287:      return t->cpu.bitfield.cpu287;
    case Cpu387:      return t->cpu.bitfield.cpu387;
    case Cpu3dnow:    return t->cpu.bitfield.cpu3dnow;
    case Cpu3dnowA:   return t->cpu.bitfield.cpu3dnowa;
    case CpuAVX:      return t->cpu.bitfield.cpuavx;
    case CpuHLE:      return t->cpu.bitfield.cpuhle;
    case CpuAVX512F:  return t->cpu.bitfield.cpuavx512f;
    case CpuAVX512VL: return t->cpu.bitfield.cpuavx512vl;
    case Cpu64:       return t->cpu.bitfield.cpu64;
    case CpuNo64:     return t->cpu.bitfield.cpuno64;
    default:
      gas_assert (cpu < CpuAttrEnums);
    }
  return t->cpu.bitfield.isa == cpu + 1u;
}

static i386_cpu_flags cpu_flags_from_attr (i386_cpu_attr a)
{
  const unsigned int bps = sizeof (a.array[0]) * CHAR_BIT;
  i386_cpu_flags f = { .array[0] = 0 };

  switch (ARRAY_SIZE(a.array))
    {
    case 1:
      f.array[CpuAttrEnums / bps]
	|= (a.array[0] >> CpuIsaBits) << (CpuAttrEnums % bps);
      if (CpuAttrEnums % bps > CpuIsaBits)
	f.array[CpuAttrEnums / bps + 1]
	  = (a.array[0] >> CpuIsaBits) >> (bps - CpuAttrEnums % bps);
      break;
    default:
      abort ();
    }

  if (a.bitfield.isa)
    f.array[(a.bitfield.isa - 1) / bps] |= 1u << ((a.bitfield.isa - 1) % bps);

  return f;
}

static INLINE int
cpu_flags_all_zero (const union i386_cpu_flags *x)
{
  switch (ARRAY_SIZE(x->array))
    {
    case 5:
      if (x->array[4])
	return 0;
      /* Fall through.  */
    case 4:
      if (x->array[3])
	return 0;
      /* Fall through.  */
    case 3:
      if (x->array[2])
	return 0;
      /* Fall through.  */
    case 2:
      if (x->array[1])
	return 0;
      /* Fall through.  */
    case 1:
      return !x->array[0];
    default:
      abort ();
    }
}

static INLINE int
cpu_flags_equal (const union i386_cpu_flags *x,
		 const union i386_cpu_flags *y)
{
  switch (ARRAY_SIZE(x->array))
    {
    case 5:
      if (x->array[4] != y->array[4])
	return 0;
      /* Fall through.  */
    case 4:
      if (x->array[3] != y->array[3])
	return 0;
      /* Fall through.  */
    case 3:
      if (x->array[2] != y->array[2])
	return 0;
      /* Fall through.  */
    case 2:
      if (x->array[1] != y->array[1])
	return 0;
      /* Fall through.  */
    case 1:
      return x->array[0] == y->array[0];
      break;
    default:
      abort ();
    }
}

static INLINE int
cpu_flags_check_cpu64 (const insn_template *t)
{
  return flag_code == CODE_64BIT
	 ? !t->cpu.bitfield.cpuno64
	 : !t->cpu.bitfield.cpu64;
}

static INLINE i386_cpu_flags
cpu_flags_and (i386_cpu_flags x, i386_cpu_flags y)
{
  switch (ARRAY_SIZE (x.array))
    {
    case 5:
      x.array [4] &= y.array [4];
      /* Fall through.  */
    case 4:
      x.array [3] &= y.array [3];
      /* Fall through.  */
    case 3:
      x.array [2] &= y.array [2];
      /* Fall through.  */
    case 2:
      x.array [1] &= y.array [1];
      /* Fall through.  */
    case 1:
      x.array [0] &= y.array [0];
      break;
    default:
      abort ();
    }
  return x;
}

static INLINE i386_cpu_flags
cpu_flags_or (i386_cpu_flags x, i386_cpu_flags y)
{
  switch (ARRAY_SIZE (x.array))
    {
    case 5:
      x.array [4] |= y.array [4];
      /* Fall through.  */
    case 4:
      x.array [3] |= y.array [3];
      /* Fall through.  */
    case 3:
      x.array [2] |= y.array [2];
      /* Fall through.  */
    case 2:
      x.array [1] |= y.array [1];
      /* Fall through.  */
    case 1:
      x.array [0] |= y.array [0];
      break;
    default:
      abort ();
    }
  return x;
}

static INLINE i386_cpu_flags
cpu_flags_and_not (i386_cpu_flags x, i386_cpu_flags y)
{
  switch (ARRAY_SIZE (x.array))
    {
    case 5:
      x.array [4] &= ~y.array [4];
      /* Fall through.  */
    case 4:
      x.array [3] &= ~y.array [3];
      /* Fall through.  */
    case 3:
      x.array [2] &= ~y.array [2];
      /* Fall through.  */
    case 2:
      x.array [1] &= ~y.array [1];
      /* Fall through.  */
    case 1:
      x.array [0] &= ~y.array [0];
      break;
    default:
      abort ();
    }
  return x;
}
1871
1872 static const i386_cpu_flags avx512 = CPU_ANY_AVX512F_FLAGS;
1873
1874 static INLINE bool need_evex_encoding (void)
1875 {
1876 return i.vec_encoding == vex_encoding_evex
1877 || i.vec_encoding == vex_encoding_evex512
1878 || i.mask.reg;
1879 }
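
/* For example, an {evex} pseudo prefix or the use of a mask register,
   as in "vaddps %xmm2, %xmm1, %xmm0{%k1}", makes this predicate return
   true, steering a dual VEX/EVEX template towards its EVEX form. */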
1880
1881 #define CPU_FLAGS_ARCH_MATCH 0x1
1882 #define CPU_FLAGS_64BIT_MATCH 0x2
1883
1884 #define CPU_FLAGS_PERFECT_MATCH \
1885 (CPU_FLAGS_ARCH_MATCH | CPU_FLAGS_64BIT_MATCH)
1886
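/* A template is usable only on a perfect match, i.e. when both the ISA
   extension and the 64-bit-mode constraints are satisfied; returning the
   bits separately lets callers distinguish "wrong mode" from "missing
   ISA extension" when diagnosing a failed match. */
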
1887 /* Return CPU flags match bits. */
1888
1889 static int
1890 cpu_flags_match (const insn_template *t)
1891 {
1892 i386_cpu_flags x = cpu_flags_from_attr (t->cpu);
1893 int match = cpu_flags_check_cpu64 (t) ? CPU_FLAGS_64BIT_MATCH : 0;
1894
1895 x.bitfield.cpu64 = 0;
1896 x.bitfield.cpuno64 = 0;
1897
1898 if (cpu_flags_all_zero (&x))
1899 {
1900 /* This instruction is available on all archs. */
1901 match |= CPU_FLAGS_ARCH_MATCH;
1902 }
1903 else
1904 {
1905 /* This instruction is available only on some archs. */
1906 i386_cpu_flags cpu = cpu_arch_flags;
1907
1908 /* Dual VEX/EVEX templates may need stripping of one of the flags. */
1909 if (t->opcode_modifier.vex && t->opcode_modifier.evex)
1910 {
1911 /* Dual AVX/AVX512F templates need to retain AVX512F only if we already
1912 know that EVEX encoding will be needed. */
1913 if ((x.bitfield.cpuavx || x.bitfield.cpuavx2)
1914 && x.bitfield.cpuavx512f)
1915 {
1916 if (need_evex_encoding ())
1917 {
1918 x.bitfield.cpuavx = 0;
1919 x.bitfield.cpuavx2 = 0;
1920 }
1921 /* need_evex_encoding() isn't reliable before operands have been
1922 parsed. */
1923 else if (i.operands)
1924 {
1925 x.bitfield.cpuavx512f = 0;
1926 x.bitfield.cpuavx512vl = 0;
1927 if (x.bitfield.cpufma && !cpu.bitfield.cpufma)
1928 x.bitfield.cpuavx = 0;
1929 }
1930 }
1931 }
1932
1933 /* AVX512VL is not a standalone feature - match it and then strip it. */
1934 if (x.bitfield.cpuavx512vl && !cpu.bitfield.cpuavx512vl)
1935 return match;
1936 x.bitfield.cpuavx512vl = 0;
1937
1938 /* AVX and AVX2 present at the same time express an operand size
1939 dependency - strip AVX2 for the purposes here. The operand size
1940 dependent check occurs in check_vecOperands(). */
1941 if (x.bitfield.cpuavx && x.bitfield.cpuavx2)
1942 x.bitfield.cpuavx2 = 0;
1943
1944 cpu = cpu_flags_and (x, cpu);
1945 if (!cpu_flags_all_zero (&cpu))
1946 {
1947 if (t->cpu.bitfield.cpuavx && t->cpu.bitfield.cpuavx512f)
1948 {
1949 if ((need_evex_encoding ()
1950 ? cpu.bitfield.cpuavx512f
1951 : cpu.bitfield.cpuavx)
1952 && (!x.bitfield.cpufma || cpu.bitfield.cpufma
1953 || cpu_arch_flags.bitfield.cpuavx512f)
1954 && (!x.bitfield.cpugfni || cpu.bitfield.cpugfni)
1955 && (!x.bitfield.cpuvaes || cpu.bitfield.cpuvaes)
1956 && (!x.bitfield.cpuvpclmulqdq || cpu.bitfield.cpuvpclmulqdq))
1957 match |= CPU_FLAGS_ARCH_MATCH;
1958 }
1959 else if (x.bitfield.cpuavx)
1960 {
1961 /* We need to check a few extra flags with AVX. */
1962 if (cpu.bitfield.cpuavx
1963 && (!t->opcode_modifier.sse2avx
1964 || (sse2avx && !i.prefix[DATA_PREFIX]))
1965 && (!x.bitfield.cpuaes || cpu.bitfield.cpuaes)
1966 && (!x.bitfield.cpugfni || cpu.bitfield.cpugfni)
1967 && (!x.bitfield.cpupclmulqdq || cpu.bitfield.cpupclmulqdq))
1968 match |= CPU_FLAGS_ARCH_MATCH;
1969 }
1970 else if (x.bitfield.cpuavx2 && cpu.bitfield.cpuavx2)
1971 match |= CPU_FLAGS_ARCH_MATCH;
1972 else if (x.bitfield.cpuavx512f)
1973 {
1974 /* We need to check a few extra flags with AVX512F. */
1975 if (cpu.bitfield.cpuavx512f
1976 && (!x.bitfield.cpugfni || cpu.bitfield.cpugfni))
1977 match |= CPU_FLAGS_ARCH_MATCH;
1978 }
1979 else
1980 match |= CPU_FLAGS_ARCH_MATCH;
1981 }
1982 }
1983 return match;
1984 }
1985
1986 static INLINE i386_operand_type
1987 operand_type_and (i386_operand_type x, i386_operand_type y)
1988 {
1989 if (x.bitfield.class != y.bitfield.class)
1990 x.bitfield.class = ClassNone;
1991 if (x.bitfield.instance != y.bitfield.instance)
1992 x.bitfield.instance = InstanceNone;
1993
1994 switch (ARRAY_SIZE (x.array))
1995 {
1996 case 3:
1997 x.array [2] &= y.array [2];
1998 /* Fall through. */
1999 case 2:
2000 x.array [1] &= y.array [1];
2001 /* Fall through. */
2002 case 1:
2003 x.array [0] &= y.array [0];
2004 break;
2005 default:
2006 abort ();
2007 }
2008 return x;
2009 }
2010
2011 static INLINE i386_operand_type
2012 operand_type_and_not (i386_operand_type x, i386_operand_type y)
2013 {
2014 gas_assert (y.bitfield.class == ClassNone);
2015 gas_assert (y.bitfield.instance == InstanceNone);
2016
2017 switch (ARRAY_SIZE (x.array))
2018 {
2019 case 3:
2020 x.array [2] &= ~y.array [2];
2021 /* Fall through. */
2022 case 2:
2023 x.array [1] &= ~y.array [1];
2024 /* Fall through. */
2025 case 1:
2026 x.array [0] &= ~y.array [0];
2027 break;
2028 default:
2029 abort ();
2030 }
2031 return x;
2032 }
2033
2034 static INLINE i386_operand_type
2035 operand_type_or (i386_operand_type x, i386_operand_type y)
2036 {
2037 gas_assert (x.bitfield.class == ClassNone ||
2038 y.bitfield.class == ClassNone ||
2039 x.bitfield.class == y.bitfield.class);
2040 gas_assert (x.bitfield.instance == InstanceNone ||
2041 y.bitfield.instance == InstanceNone ||
2042 x.bitfield.instance == y.bitfield.instance);
2043
2044 switch (ARRAY_SIZE (x.array))
2045 {
2046 case 3:
2047 x.array [2] |= y.array [2];
2048 /* Fall through. */
2049 case 2:
2050 x.array [1] |= y.array [1];
2051 /* Fall through. */
2052 case 1:
2053 x.array [0] |= y.array [0];
2054 break;
2055 default:
2056 abort ();
2057 }
2058 return x;
2059 }
2060
2061 static INLINE i386_operand_type
2062 operand_type_xor (i386_operand_type x, i386_operand_type y)
2063 {
2064 gas_assert (y.bitfield.class == ClassNone);
2065 gas_assert (y.bitfield.instance == InstanceNone);
2066
2067 switch (ARRAY_SIZE (x.array))
2068 {
2069 case 3:
2070 x.array [2] ^= y.array [2];
2071 /* Fall through. */
2072 case 2:
2073 x.array [1] ^= y.array [1];
2074 /* Fall through. */
2075 case 1:
2076 x.array [0] ^= y.array [0];
2077 break;
2078 default:
2079 abort ();
2080 }
2081 return x;
2082 }
2083
2084 static const i386_operand_type anydisp = {
2085 .bitfield = { .disp8 = 1, .disp16 = 1, .disp32 = 1, .disp64 = 1 }
2086 };
2087
2088 enum operand_type
2089 {
2090 reg,
2091 imm,
2092 disp,
2093 anymem
2094 };
2095
2096 static INLINE int
2097 operand_type_check (i386_operand_type t, enum operand_type c)
2098 {
2099 switch (c)
2100 {
2101 case reg:
2102 return t.bitfield.class == Reg;
2103
2104 case imm:
2105 return (t.bitfield.imm8
2106 || t.bitfield.imm8s
2107 || t.bitfield.imm16
2108 || t.bitfield.imm32
2109 || t.bitfield.imm32s
2110 || t.bitfield.imm64);
2111
2112 case disp:
2113 return (t.bitfield.disp8
2114 || t.bitfield.disp16
2115 || t.bitfield.disp32
2116 || t.bitfield.disp64);
2117
2118 case anymem:
2119 return (t.bitfield.disp8
2120 || t.bitfield.disp16
2121 || t.bitfield.disp32
2122 || t.bitfield.disp64
2123 || t.bitfield.baseindex);
2124
2125 default:
2126 abort ();
2127 }
2128
2129 return 0;
2130 }
2131
2132 /* Return 1 if there is no conflict in 8bit/16bit/32bit/64bit/80bit size
2133 between operand GIVEN and operand WANTED for instruction template T. */
2134
2135 static INLINE int
2136 match_operand_size (const insn_template *t, unsigned int wanted,
2137 unsigned int given)
2138 {
2139 return !((i.types[given].bitfield.byte
2140 && !t->operand_types[wanted].bitfield.byte)
2141 || (i.types[given].bitfield.word
2142 && !t->operand_types[wanted].bitfield.word)
2143 || (i.types[given].bitfield.dword
2144 && !t->operand_types[wanted].bitfield.dword)
2145 || (i.types[given].bitfield.qword
2146 && (!t->operand_types[wanted].bitfield.qword
2147 /* Don't allow 64-bit (memory) operands outside of 64-bit
2148 mode, when they're used where a 64-bit GPR could also
2149 be used. Checking is needed for Intel Syntax only. */
2150 || (intel_syntax
2151 && flag_code != CODE_64BIT
2152 && (t->operand_types[wanted].bitfield.class == Reg
2153 || t->operand_types[wanted].bitfield.class == Accum
2154 || t->opcode_modifier.isstring))))
2155 || (i.types[given].bitfield.tbyte
2156 && !t->operand_types[wanted].bitfield.tbyte));
2157 }
2158
2159 /* Return 1 if there is no conflict in SIMD register between operand
2160 GIVEN and operand WANTED for instruction template T. */
2161
2162 static INLINE int
2163 match_simd_size (const insn_template *t, unsigned int wanted,
2164 unsigned int given)
2165 {
2166 return !((i.types[given].bitfield.xmmword
2167 && !t->operand_types[wanted].bitfield.xmmword)
2168 || (i.types[given].bitfield.ymmword
2169 && !t->operand_types[wanted].bitfield.ymmword)
2170 || (i.types[given].bitfield.zmmword
2171 && !t->operand_types[wanted].bitfield.zmmword)
2172 || (i.types[given].bitfield.tmmword
2173 && !t->operand_types[wanted].bitfield.tmmword));
2174 }
2175
2176 /* Return 1 if there is no conflict in any size between operand GIVEN
2177 and operand WANTED for instruction template T. */
2178
2179 static INLINE int
2180 match_mem_size (const insn_template *t, unsigned int wanted,
2181 unsigned int given)
2182 {
2183 return (match_operand_size (t, wanted, given)
2184 && !((i.types[given].bitfield.unspecified
2185 && !i.broadcast.type
2186 && !i.broadcast.bytes
2187 && !t->operand_types[wanted].bitfield.unspecified)
2188 || (i.types[given].bitfield.fword
2189 && !t->operand_types[wanted].bitfield.fword)
2190 /* For scalar opcode templates to allow register and memory
2191 operands at the same time, some special casing is needed
2192 here. Also for v{,p}broadcast*, {,v}pmov{s,z}*, and
2193 down-conversion vpmov*. */
2194 || ((t->operand_types[wanted].bitfield.class == RegSIMD
2195 && t->operand_types[wanted].bitfield.byte
2196 + t->operand_types[wanted].bitfield.word
2197 + t->operand_types[wanted].bitfield.dword
2198 + t->operand_types[wanted].bitfield.qword
2199 > !!t->opcode_modifier.broadcast)
2200 ? (i.types[given].bitfield.xmmword
2201 || i.types[given].bitfield.ymmword
2202 || i.types[given].bitfield.zmmword)
2203 : !match_simd_size(t, wanted, given))));
2204 }
2205
2206 /* Return value has MATCH_STRAIGHT set if there is no size conflict on any
2207 operands for instruction template T, and it has MATCH_REVERSE set if there
2208 is no size conflict on any operands for the template with operands reversed
2209 (and the template allows for reversing in the first place). */
2210
2211 #define MATCH_STRAIGHT 1
2212 #define MATCH_REVERSE 2
2213
2214 static INLINE unsigned int
2215 operand_size_match (const insn_template *t)
2216 {
2217 unsigned int j, match = MATCH_STRAIGHT;
2218
2219 /* Don't check non-absolute jump instructions. */
2220 if (t->opcode_modifier.jump
2221 && t->opcode_modifier.jump != JUMP_ABSOLUTE)
2222 return match;
2223
2224 /* Check memory and accumulator operand size. */
2225 for (j = 0; j < i.operands; j++)
2226 {
2227 if (i.types[j].bitfield.class != Reg
2228 && i.types[j].bitfield.class != RegSIMD
2229 && t->opcode_modifier.operandconstraint == ANY_SIZE)
2230 continue;
2231
2232 if (t->operand_types[j].bitfield.class == Reg
2233 && !match_operand_size (t, j, j))
2234 {
2235 match = 0;
2236 break;
2237 }
2238
2239 if (t->operand_types[j].bitfield.class == RegSIMD
2240 && !match_simd_size (t, j, j))
2241 {
2242 match = 0;
2243 break;
2244 }
2245
2246 if (t->operand_types[j].bitfield.instance == Accum
2247 && (!match_operand_size (t, j, j) || !match_simd_size (t, j, j)))
2248 {
2249 match = 0;
2250 break;
2251 }
2252
2253 if ((i.flags[j] & Operand_Mem) && !match_mem_size (t, j, j))
2254 {
2255 match = 0;
2256 break;
2257 }
2258 }
2259
2260 if (!t->opcode_modifier.d)
2261 return match;
2262
2263 /* Check reverse. */
2264 gas_assert (i.operands >= 2);
2265
2266 for (j = 0; j < i.operands; j++)
2267 {
2268 unsigned int given = i.operands - j - 1;
2269
2270 /* For FMA4 and XOP insns VEX.W controls just the first two
2271 register operands. */
2272 if (is_cpu (t, CpuFMA4) || is_cpu (t, CpuXOP))
2273 given = j < 2 ? 1 - j : j;
2274
2275 if (t->operand_types[j].bitfield.class == Reg
2276 && !match_operand_size (t, j, given))
2277 return match;
2278
2279 if (t->operand_types[j].bitfield.class == RegSIMD
2280 && !match_simd_size (t, j, given))
2281 return match;
2282
2283 if (t->operand_types[j].bitfield.instance == Accum
2284 && (!match_operand_size (t, j, given)
2285 || !match_simd_size (t, j, given)))
2286 return match;
2287
2288 if ((i.flags[given] & Operand_Mem) && !match_mem_size (t, j, given))
2289 return match;
2290 }
2291
2292 return match | MATCH_REVERSE;
2293 }
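
/* For instance, most two-operand arithmetic templates carry the D
   (direction) modifier: for "addl %eax, %ebx" both operand orders are
   size-compatible, so MATCH_STRAIGHT | MATCH_REVERSE is returned and
   template matching may later pick the reversed encoding (opcode 0x01
   vs 0x03 for ADD, for example). */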
2294
2295 static INLINE int
2296 operand_type_match (i386_operand_type overlap,
2297 i386_operand_type given)
2298 {
2299 i386_operand_type temp = overlap;
2300
2301 temp.bitfield.unspecified = 0;
2302 temp.bitfield.byte = 0;
2303 temp.bitfield.word = 0;
2304 temp.bitfield.dword = 0;
2305 temp.bitfield.fword = 0;
2306 temp.bitfield.qword = 0;
2307 temp.bitfield.tbyte = 0;
2308 temp.bitfield.xmmword = 0;
2309 temp.bitfield.ymmword = 0;
2310 temp.bitfield.zmmword = 0;
2311 temp.bitfield.tmmword = 0;
2312 if (operand_type_all_zero (&temp))
2313 goto mismatch;
2314
2315 if (given.bitfield.baseindex == overlap.bitfield.baseindex)
2316 return 1;
2317
2318 mismatch:
2319 i.error = operand_type_mismatch;
2320 return 0;
2321 }
2322
2323 /* If the given types g0 and g1 are registers, they must be of the same type
2324 unless the expected operand type register overlap is null.
2325 Intel syntax sized memory operands are also checked here. */
2326
2327 static INLINE int
2328 operand_type_register_match (i386_operand_type g0,
2329 i386_operand_type t0,
2330 i386_operand_type g1,
2331 i386_operand_type t1)
2332 {
2333 if (g0.bitfield.class != Reg
2334 && g0.bitfield.class != RegSIMD
2335 && (g0.bitfield.unspecified
2336 || !operand_type_check (g0, anymem)))
2337 return 1;
2338
2339 if (g1.bitfield.class != Reg
2340 && g1.bitfield.class != RegSIMD
2341 && (g1.bitfield.unspecified
2342 || !operand_type_check (g1, anymem)))
2343 return 1;
2344
2345 if (g0.bitfield.byte == g1.bitfield.byte
2346 && g0.bitfield.word == g1.bitfield.word
2347 && g0.bitfield.dword == g1.bitfield.dword
2348 && g0.bitfield.qword == g1.bitfield.qword
2349 && g0.bitfield.xmmword == g1.bitfield.xmmword
2350 && g0.bitfield.ymmword == g1.bitfield.ymmword
2351 && g0.bitfield.zmmword == g1.bitfield.zmmword)
2352 return 1;
2353
2354 /* If expectations overlap in no more than a single size, all is fine. */
2355 g0 = operand_type_and (t0, t1);
2356 if (g0.bitfield.byte
2357 + g0.bitfield.word
2358 + g0.bitfield.dword
2359 + g0.bitfield.qword
2360 + g0.bitfield.xmmword
2361 + g0.bitfield.ymmword
2362 + g0.bitfield.zmmword <= 1)
2363 return 1;
2364
2365 i.error = register_type_mismatch;
2366
2367 return 0;
2368 }
2369
2370 static INLINE unsigned int
2371 register_number (const reg_entry *r)
2372 {
2373 unsigned int nr = r->reg_num;
2374
2375 if (r->reg_flags & RegRex)
2376 nr += 8;
2377
2378 if (r->reg_flags & RegVRex)
2379 nr += 16;
2380
2381 return nr;
2382 }
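
/* E.g. %r9 is stored as reg_num 1 with RegRex set, yielding 9, and
   %xmm21 as reg_num 5 with RegVRex set, yielding 21 - i.e. the full
   5-bit register number used when composing REX/VEX/EVEX fields. */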
2383
2384 static INLINE unsigned int
2385 mode_from_disp_size (i386_operand_type t)
2386 {
2387 if (t.bitfield.disp8)
2388 return 1;
2389 else if (t.bitfield.disp16
2390 || t.bitfield.disp32)
2391 return 2;
2392 else
2393 return 0;
2394 }
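
/* The value returned corresponds to the ModR/M "mod" field: 1 selects
   a byte displacement, 2 a word/dword displacement, and 0 means no
   displacement size was requested. */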
2395
2396 static INLINE int
2397 fits_in_signed_byte (addressT num)
2398 {
2399 return num + 0x80 <= 0xff;
2400 }
2401
2402 static INLINE int
2403 fits_in_unsigned_byte (addressT num)
2404 {
2405 return num <= 0xff;
2406 }
2407
2408 static INLINE int
2409 fits_in_unsigned_word (addressT num)
2410 {
2411 return num <= 0xffff;
2412 }
2413
2414 static INLINE int
2415 fits_in_signed_word (addressT num)
2416 {
2417 return num + 0x8000 <= 0xffff;
2418 }
2419
2420 static INLINE int
2421 fits_in_signed_long (addressT num ATTRIBUTE_UNUSED)
2422 {
2423 #ifndef BFD64
2424 return 1;
2425 #else
2426 return num + 0x80000000 <= 0xffffffff;
2427 #endif
2428 } /* fits_in_signed_long() */
2429
2430 static INLINE int
2431 fits_in_unsigned_long (addressT num ATTRIBUTE_UNUSED)
2432 {
2433 #ifndef BFD64
2434 return 1;
2435 #else
2436 return num <= 0xffffffff;
2437 #endif
2438 } /* fits_in_unsigned_long() */
2439
2440 static INLINE valueT extend_to_32bit_address (addressT num)
2441 {
2442 #ifdef BFD64
2443 if (fits_in_unsigned_long(num))
2444 return (num ^ ((addressT) 1 << 31)) - ((addressT) 1 << 31);
2445
2446 if (!fits_in_signed_long (num))
2447 return num & 0xffffffff;
2448 #endif
2449
2450 return num;
2451 }
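
/* Example: 0xfffff000 is sign-extended to 0xfffffffffffff000 so that
   32-bit addresses wrap consistently, while a value fitting neither a
   signed nor an unsigned 32-bit range is truncated to its low 32 bits. */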
2452
2453 static INLINE int
2454 fits_in_disp8 (offsetT num)
2455 {
2456 int shift = i.memshift;
2457 unsigned int mask;
2458
2459 if (shift == -1)
2460 abort ();
2461
2462 mask = (1 << shift) - 1;
2463
2464 /* Return 0 if NUM isn't properly aligned. */
2465 if ((num & mask))
2466 return 0;
2467
2468 /* Check if NUM will fit in 8bit after shift. */
2469 return fits_in_signed_byte (num >> shift);
2470 }
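
/* This implements the EVEX disp8*N compressed displacement: e.g. with
   i.memshift == 6 (a full 64-byte ZMM memory operand) a displacement of
   0x100 is encodable as a disp8 of 4, whereas 0x44 is rejected - it is
   not 64-byte aligned - and has to use disp32 instead. */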
2471
2472 static INLINE int
2473 fits_in_imm4 (offsetT num)
2474 {
2475 /* Despite the name, check for imm3 if we're dealing with EVEX. */
2476 return (num & (i.vec_encoding != vex_encoding_evex ? 0xf : 7)) == num;
2477 }
2478
2479 static i386_operand_type
2480 smallest_imm_type (offsetT num)
2481 {
2482 i386_operand_type t;
2483
2484 operand_type_set (&t, 0);
2485 t.bitfield.imm64 = 1;
2486
2487 if (cpu_arch_tune != PROCESSOR_I486 && num == 1)
2488 {
2489 /* This code is disabled on the 486 because all the Imm1 forms
2490 in the opcode table are slower on the i486. They're the
2491 versions with the implicitly specified single-position
2492 displacement, which has another syntax if you really want to
2493 use that form. */
2494 t.bitfield.imm1 = 1;
2495 t.bitfield.imm8 = 1;
2496 t.bitfield.imm8s = 1;
2497 t.bitfield.imm16 = 1;
2498 t.bitfield.imm32 = 1;
2499 t.bitfield.imm32s = 1;
2500 }
2501 else if (fits_in_signed_byte (num))
2502 {
2503 if (fits_in_unsigned_byte (num))
2504 t.bitfield.imm8 = 1;
2505 t.bitfield.imm8s = 1;
2506 t.bitfield.imm16 = 1;
2507 t.bitfield.imm32 = 1;
2508 t.bitfield.imm32s = 1;
2509 }
2510 else if (fits_in_unsigned_byte (num))
2511 {
2512 t.bitfield.imm8 = 1;
2513 t.bitfield.imm16 = 1;
2514 t.bitfield.imm32 = 1;
2515 t.bitfield.imm32s = 1;
2516 }
2517 else if (fits_in_signed_word (num) || fits_in_unsigned_word (num))
2518 {
2519 t.bitfield.imm16 = 1;
2520 t.bitfield.imm32 = 1;
2521 t.bitfield.imm32s = 1;
2522 }
2523 else if (fits_in_signed_long (num))
2524 {
2525 t.bitfield.imm32 = 1;
2526 t.bitfield.imm32s = 1;
2527 }
2528 else if (fits_in_unsigned_long (num))
2529 t.bitfield.imm32 = 1;
2530
2531 return t;
2532 }
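
/* Examples: 200 fits an unsigned but not a signed byte, so it gets
   imm8|imm16|imm32|imm32s (no imm8s); -1 gets imm8s|imm16|imm32|imm32s
   (no imm8); and 1 additionally gets imm1, so that the shift-by-one
   forms can match (except when tuning for the i486, as noted above). */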
2533
2534 static offsetT
2535 offset_in_range (offsetT val, int size)
2536 {
2537 addressT mask;
2538
2539 switch (size)
2540 {
2541 case 1: mask = ((addressT) 1 << 8) - 1; break;
2542 case 2: mask = ((addressT) 1 << 16) - 1; break;
2543 #ifdef BFD64
2544 case 4: mask = ((addressT) 1 << 32) - 1; break;
2545 #endif
2546 case sizeof (val): return val;
2547 default: abort ();
2548 }
2549
2550 if ((val & ~mask) != 0 && (-val & ~mask) != 0)
2551 as_warn (_("0x%" PRIx64 " shortened to 0x%" PRIx64),
2552 (uint64_t) val, (uint64_t) (val & mask));
2553
2554 return val & mask;
2555 }
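
/* E.g. offset_in_range (0x12345, 2) warns "0x12345 shortened to 0x2345"
   and returns 0x2345, while values whose discarded high bits are plain
   sign- or zero-extension pass through silently. */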
2556
2557 static INLINE const char *insn_name (const insn_template *t)
2558 {
2559 return &i386_mnemonics[t->mnem_off];
2560 }
2561
2562 enum PREFIX_GROUP
2563 {
2564 PREFIX_EXIST = 0,
2565 PREFIX_LOCK,
2566 PREFIX_REP,
2567 PREFIX_DS,
2568 PREFIX_OTHER
2569 };
2570
2571 /* Returns
2572 a. PREFIX_EXIST if attempting to add a prefix where one from the
2573 same class already exists.
2574 b. PREFIX_LOCK if lock prefix is added.
2575 c. PREFIX_REP if rep/repne prefix is added.
2576 d. PREFIX_DS if ds prefix is added.
2577 e. PREFIX_OTHER if other prefix is added.
2578 */
2579
2580 static enum PREFIX_GROUP
2581 add_prefix (unsigned int prefix)
2582 {
2583 enum PREFIX_GROUP ret = PREFIX_OTHER;
2584 unsigned int q;
2585
2586 if (prefix >= REX_OPCODE && prefix < REX_OPCODE + 16
2587 && flag_code == CODE_64BIT)
2588 {
2589 if ((i.prefix[REX_PREFIX] & prefix & REX_W)
2590 || (i.prefix[REX_PREFIX] & prefix & REX_R)
2591 || (i.prefix[REX_PREFIX] & prefix & REX_X)
2592 || (i.prefix[REX_PREFIX] & prefix & REX_B))
2593 ret = PREFIX_EXIST;
2594 q = REX_PREFIX;
2595 }
2596 else
2597 {
2598 switch (prefix)
2599 {
2600 default:
2601 abort ();
2602
2603 case DS_PREFIX_OPCODE:
2604 ret = PREFIX_DS;
2605 /* Fall through. */
2606 case CS_PREFIX_OPCODE:
2607 case ES_PREFIX_OPCODE:
2608 case FS_PREFIX_OPCODE:
2609 case GS_PREFIX_OPCODE:
2610 case SS_PREFIX_OPCODE:
2611 q = SEG_PREFIX;
2612 break;
2613
2614 case REPNE_PREFIX_OPCODE:
2615 case REPE_PREFIX_OPCODE:
2616 q = REP_PREFIX;
2617 ret = PREFIX_REP;
2618 break;
2619
2620 case LOCK_PREFIX_OPCODE:
2621 q = LOCK_PREFIX;
2622 ret = PREFIX_LOCK;
2623 break;
2624
2625 case FWAIT_OPCODE:
2626 q = WAIT_PREFIX;
2627 break;
2628
2629 case ADDR_PREFIX_OPCODE:
2630 q = ADDR_PREFIX;
2631 break;
2632
2633 case DATA_PREFIX_OPCODE:
2634 q = DATA_PREFIX;
2635 break;
2636 }
2637 if (i.prefix[q] != 0)
2638 ret = PREFIX_EXIST;
2639 }
2640
2641 if (ret)
2642 {
2643 if (!i.prefix[q])
2644 ++i.prefixes;
2645 i.prefix[q] |= prefix;
2646 }
2647 else
2648 as_bad (_("same type of prefix used twice"));
2649
2650 return ret;
2651 }
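
/* E.g. assembling "lock incl (%eax)" routes 0xf0 into the LOCK_PREFIX
   slot and returns PREFIX_LOCK; a second LOCK on the same insn would
   yield PREFIX_EXIST and the "same type of prefix used twice" error.
   REX prefixes are special in that their W/R/X/B bits may be OR-ed
   together, as long as no individual bit is requested twice. */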
2652
2653 static void
2654 update_code_flag (int value, int check)
2655 {
2656 PRINTF_LIKE ((*as_error)) = check ? as_fatal : as_bad;
2657
2658 if (value == CODE_64BIT && !cpu_arch_flags.bitfield.cpu64 )
2659 {
2660 as_error (_("64bit mode not supported on `%s'."),
2661 cpu_arch_name ? cpu_arch_name : default_arch);
2662 return;
2663 }
2664
2665 if (value == CODE_32BIT && !cpu_arch_flags.bitfield.cpui386)
2666 {
2667 as_error (_("32bit mode not supported on `%s'."),
2668 cpu_arch_name ? cpu_arch_name : default_arch);
2669 return;
2670 }
2671
2672 flag_code = (enum flag_code) value;
2673
2674 stackop_size = '\0';
2675 }
2676
2677 static void
2678 set_code_flag (int value)
2679 {
2680 update_code_flag (value, 0);
2681 }
2682
2683 static void
2684 set_16bit_gcc_code_flag (int new_code_flag)
2685 {
2686 flag_code = (enum flag_code) new_code_flag;
2687 if (flag_code != CODE_16BIT)
2688 abort ();
2689 stackop_size = LONG_MNEM_SUFFIX;
2690 }
2691
2692 static void
2693 set_intel_syntax (int syntax_flag)
2694 {
2695 /* Find out if register prefixing is specified. */
2696 int ask_naked_reg = 0;
2697
2698 SKIP_WHITESPACE ();
2699 if (!is_end_of_line[(unsigned char) *input_line_pointer])
2700 {
2701 char *string;
2702 int e = get_symbol_name (&string);
2703
2704 if (strcmp (string, "prefix") == 0)
2705 ask_naked_reg = 1;
2706 else if (strcmp (string, "noprefix") == 0)
2707 ask_naked_reg = -1;
2708 else
2709 as_bad (_("bad argument to syntax directive."));
2710 (void) restore_line_pointer (e);
2711 }
2712 demand_empty_rest_of_line ();
2713
2714 intel_syntax = syntax_flag;
2715
2716 if (ask_naked_reg == 0)
2717 allow_naked_reg = (intel_syntax
2718 && (bfd_get_symbol_leading_char (stdoutput) != '\0'));
2719 else
2720 allow_naked_reg = (ask_naked_reg < 0);
2721
2722 expr_set_rank (O_full_ptr, syntax_flag ? 10 : 0);
2723
2724 register_prefix = allow_naked_reg ? "" : "%";
2725 }
2726
2727 static void
2728 set_intel_mnemonic (int mnemonic_flag)
2729 {
2730 intel_mnemonic = mnemonic_flag;
2731 }
2732
2733 static void
2734 set_allow_index_reg (int flag)
2735 {
2736 allow_index_reg = flag;
2737 }
2738
2739 static void
2740 set_check (int what)
2741 {
2742 enum check_kind *kind;
2743 const char *str;
2744
2745 if (what)
2746 {
2747 kind = &operand_check;
2748 str = "operand";
2749 }
2750 else
2751 {
2752 kind = &sse_check;
2753 str = "sse";
2754 }
2755
2756 SKIP_WHITESPACE ();
2757
2758 if (!is_end_of_line[(unsigned char) *input_line_pointer])
2759 {
2760 char *string;
2761 int e = get_symbol_name (&string);
2762
2763 if (strcmp (string, "none") == 0)
2764 *kind = check_none;
2765 else if (strcmp (string, "warning") == 0)
2766 *kind = check_warning;
2767 else if (strcmp (string, "error") == 0)
2768 *kind = check_error;
2769 else
2770 as_bad (_("bad argument to %s_check directive."), str);
2771 (void) restore_line_pointer (e);
2772 }
2773 else
2774 as_bad (_("missing argument for %s_check directive"), str);
2775
2776 demand_empty_rest_of_line ();
2777 }
2778
2779 static void
2780 check_cpu_arch_compatible (const char *name ATTRIBUTE_UNUSED,
2781 i386_cpu_flags new_flag ATTRIBUTE_UNUSED)
2782 {
2783 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
2784 static const char *arch;
2785
2786 /* Intel MCU is only supported on ELF. */
2787 if (!IS_ELF)
2788 return;
2789
2790 if (!arch)
2791 {
2792 /* Use cpu_arch_name if it is set in md_parse_option. Otherwise
2793 use default_arch. */
2794 arch = cpu_arch_name;
2795 if (!arch)
2796 arch = default_arch;
2797 }
2798
2799 /* If we are targeting Intel MCU, we must enable it. */
2800 if ((get_elf_backend_data (stdoutput)->elf_machine_code == EM_IAMCU)
2801 == new_flag.bitfield.cpuiamcu)
2802 return;
2803
2804 as_bad (_("`%s' is not supported on `%s'"), name, arch);
2805 #endif
2806 }
2807
2808 static void
2809 extend_cpu_sub_arch_name (const char *pfx, const char *name)
2810 {
2811 if (cpu_sub_arch_name)
2812 cpu_sub_arch_name = reconcat (cpu_sub_arch_name, cpu_sub_arch_name,
2813 pfx, name, (const char *) NULL);
2814 else
2815 cpu_sub_arch_name = concat (pfx, name, (const char *) NULL);
2816 }
2817
2818 static void isa_enable (unsigned int idx)
2819 {
2820 i386_cpu_flags flags = cpu_flags_or (cpu_arch_flags, cpu_arch[idx].enable);
2821
2822 if (!cpu_flags_equal (&flags, &cpu_arch_flags))
2823 {
2824 extend_cpu_sub_arch_name (".", cpu_arch[idx].name);
2825 cpu_arch_flags = flags;
2826 }
2827
2828 cpu_arch_isa_flags = cpu_flags_or (cpu_arch_isa_flags, cpu_arch[idx].enable);
2829 }
2830
2831 static void isa_disable (unsigned int idx)
2832 {
2833 i386_cpu_flags flags
2834 = cpu_flags_and_not (cpu_arch_flags, cpu_arch[idx].disable);
2835
2836 if (!cpu_flags_equal (&flags, &cpu_arch_flags))
2837 {
2838 extend_cpu_sub_arch_name (".no", cpu_arch[idx].name);
2839 cpu_arch_flags = flags;
2840 }
2841
2842 cpu_arch_isa_flags
2843 = cpu_flags_and_not (cpu_arch_isa_flags, cpu_arch[idx].disable);
2844 }
2845
2846 static void
2847 set_cpu_arch (int dummy ATTRIBUTE_UNUSED)
2848 {
2849 typedef struct arch_stack_entry
2850 {
2851 const struct arch_stack_entry *prev;
2852 const char *name;
2853 char *sub_name;
2854 i386_cpu_flags flags;
2855 i386_cpu_flags isa_flags;
2856 enum processor_type isa;
2857 enum flag_code flag_code;
2858 unsigned int vector_size;
2859 char stackop_size;
2860 bool no_cond_jump_promotion;
2861 } arch_stack_entry;
2862 static const arch_stack_entry *arch_stack_top;
2863 char *s;
2864 int e;
2865 const char *string;
2866 unsigned int j = 0;
2867
2868 SKIP_WHITESPACE ();
2869
2870 if (is_end_of_line[(unsigned char) *input_line_pointer])
2871 {
2872 as_bad (_("missing cpu architecture"));
2873 input_line_pointer++;
2874 return;
2875 }
2876
2877 e = get_symbol_name (&s);
2878 string = s;
2879
2880 if (strcmp (string, "push") == 0)
2881 {
2882 arch_stack_entry *top = XNEW (arch_stack_entry);
2883
2884 top->name = cpu_arch_name;
2885 if (cpu_sub_arch_name)
2886 top->sub_name = xstrdup (cpu_sub_arch_name);
2887 else
2888 top->sub_name = NULL;
2889 top->flags = cpu_arch_flags;
2890 top->isa = cpu_arch_isa;
2891 top->isa_flags = cpu_arch_isa_flags;
2892 top->flag_code = flag_code;
2893 top->vector_size = vector_size;
2894 top->stackop_size = stackop_size;
2895 top->no_cond_jump_promotion = no_cond_jump_promotion;
2896
2897 top->prev = arch_stack_top;
2898 arch_stack_top = top;
2899
2900 (void) restore_line_pointer (e);
2901 demand_empty_rest_of_line ();
2902 return;
2903 }
2904
2905 if (strcmp (string, "pop") == 0)
2906 {
2907 const arch_stack_entry *top = arch_stack_top;
2908
2909 if (!top)
2910 as_bad (_(".arch stack is empty"));
2911 else if (top->flag_code != flag_code
2912 || top->stackop_size != stackop_size)
2913 {
2914 static const unsigned int bits[] = {
2915 [CODE_16BIT] = 16,
2916 [CODE_32BIT] = 32,
2917 [CODE_64BIT] = 64,
2918 };
2919
2920 as_bad (_("this `.arch pop' requires `.code%u%s' to be in effect"),
2921 bits[top->flag_code],
2922 top->stackop_size == LONG_MNEM_SUFFIX ? "gcc" : "");
2923 }
2924 else
2925 {
2926 arch_stack_top = top->prev;
2927
2928 cpu_arch_name = top->name;
2929 free (cpu_sub_arch_name);
2930 cpu_sub_arch_name = top->sub_name;
2931 cpu_arch_flags = top->flags;
2932 cpu_arch_isa = top->isa;
2933 cpu_arch_isa_flags = top->isa_flags;
2934 vector_size = top->vector_size;
2935 no_cond_jump_promotion = top->no_cond_jump_promotion;
2936
2937 XDELETE (top);
2938 }
2939
2940 (void) restore_line_pointer (e);
2941 demand_empty_rest_of_line ();
2942 return;
2943 }
2944
2945 if (strcmp (string, "default") == 0)
2946 {
2947 if (strcmp (default_arch, "iamcu") == 0)
2948 string = default_arch;
2949 else
2950 {
2951 static const i386_cpu_flags cpu_unknown_flags = CPU_UNKNOWN_FLAGS;
2952
2953 cpu_arch_name = NULL;
2954 free (cpu_sub_arch_name);
2955 cpu_sub_arch_name = NULL;
2956 cpu_arch_flags = cpu_unknown_flags;
2957 cpu_arch_isa = PROCESSOR_UNKNOWN;
2958 cpu_arch_isa_flags = cpu_arch[flag_code == CODE_64BIT].enable;
2959 if (!cpu_arch_tune_set)
2960 cpu_arch_tune = PROCESSOR_UNKNOWN;
2961
2962 vector_size = VSZ_DEFAULT;
2963
2964 j = ARRAY_SIZE (cpu_arch) + 1;
2965 }
2966 }
2967
2968 for (; j < ARRAY_SIZE (cpu_arch); j++)
2969 {
2970 if (strcmp (string + (*string == '.'), cpu_arch[j].name) == 0
2971 && (*string == '.') == (cpu_arch[j].type == PROCESSOR_NONE))
2972 {
2973 if (*string != '.')
2974 {
2975 check_cpu_arch_compatible (string, cpu_arch[j].enable);
2976
2977 if (flag_code == CODE_64BIT && !cpu_arch[j].enable.bitfield.cpu64 )
2978 {
2979 as_bad (_("64bit mode not supported on `%s'."),
2980 cpu_arch[j].name);
2981 (void) restore_line_pointer (e);
2982 ignore_rest_of_line ();
2983 return;
2984 }
2985
2986 if (flag_code == CODE_32BIT && !cpu_arch[j].enable.bitfield.cpui386)
2987 {
2988 as_bad (_("32bit mode not supported on `%s'."),
2989 cpu_arch[j].name);
2990 (void) restore_line_pointer (e);
2991 ignore_rest_of_line ();
2992 return;
2993 }
2994
2995 cpu_arch_name = cpu_arch[j].name;
2996 free (cpu_sub_arch_name);
2997 cpu_sub_arch_name = NULL;
2998 cpu_arch_flags = cpu_arch[j].enable;
2999 cpu_arch_isa = cpu_arch[j].type;
3000 cpu_arch_isa_flags = cpu_arch[j].enable;
3001 if (!cpu_arch_tune_set)
3002 cpu_arch_tune = cpu_arch_isa;
3003
3004 vector_size = VSZ_DEFAULT;
3005
3006 pre_386_16bit_warned = false;
3007 break;
3008 }
3009
3010 if (cpu_flags_all_zero (&cpu_arch[j].enable))
3011 continue;
3012
3013 isa_enable (j);
3014
3015 (void) restore_line_pointer (e);
3016
3017 switch (cpu_arch[j].vsz)
3018 {
3019 default:
3020 break;
3021
3022 case vsz_set:
3023 #ifdef SVR4_COMMENT_CHARS
3024 if (*input_line_pointer == ':' || *input_line_pointer == '/')
3025 #else
3026 if (*input_line_pointer == '/')
3027 #endif
3028 {
3029 ++input_line_pointer;
3030 switch (get_absolute_expression ())
3031 {
3032 case 512: vector_size = VSZ512; break;
3033 case 256: vector_size = VSZ256; break;
3034 case 128: vector_size = VSZ128; break;
3035 default:
3036 as_bad (_("Unrecognized vector size specifier"));
3037 ignore_rest_of_line ();
3038 return;
3039 }
3040 break;
3041 }
3042 /* Fall through. */
3043 case vsz_reset:
3044 vector_size = VSZ_DEFAULT;
3045 break;
3046 }
3047
3048 demand_empty_rest_of_line ();
3049 return;
3050 }
3051 }
3052
3053 if (startswith (string, ".no") && j >= ARRAY_SIZE (cpu_arch))
3054 {
3055 /* Disable an ISA extension. */
3056 for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
3057 if (cpu_arch[j].type == PROCESSOR_NONE
3058 && strcmp (string + 3, cpu_arch[j].name) == 0)
3059 {
3060 isa_disable (j);
3061
3062 if (cpu_arch[j].vsz == vsz_set)
3063 vector_size = VSZ_DEFAULT;
3064
3065 (void) restore_line_pointer (e);
3066 demand_empty_rest_of_line ();
3067 return;
3068 }
3069 }
3070
3071 if (j == ARRAY_SIZE (cpu_arch))
3072 as_bad (_("no such architecture: `%s'"), string);
3073
3074 *input_line_pointer = e;
3075
3076 no_cond_jump_promotion = 0;
3077 if (*input_line_pointer == ','
3078 && !is_end_of_line[(unsigned char) input_line_pointer[1]])
3079 {
3080 ++input_line_pointer;
3081 e = get_symbol_name (&s);
3082 string = s;
3083
3084 if (strcmp (string, "nojumps") == 0)
3085 no_cond_jump_promotion = 1;
3086 else if (strcmp (string, "jumps") == 0)
3087 ;
3088 else
3089 as_bad (_("no such architecture modifier: `%s'"), string);
3090
3091 (void) restore_line_pointer (e);
3092 }
3093
3094 demand_empty_rest_of_line ();
3095 }
3096
3097 enum bfd_architecture
3098 i386_arch (void)
3099 {
3100 if (cpu_arch_isa == PROCESSOR_IAMCU)
3101 {
3102 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
3103 || flag_code == CODE_64BIT)
3104 as_fatal (_("Intel MCU is 32bit ELF only"));
3105 return bfd_arch_iamcu;
3106 }
3107 else
3108 return bfd_arch_i386;
3109 }
3110
3111 unsigned long
3112 i386_mach (void)
3113 {
3114 if (startswith (default_arch, "x86_64"))
3115 {
3116 if (default_arch[6] == '\0')
3117 return bfd_mach_x86_64;
3118 else
3119 return bfd_mach_x64_32;
3120 }
3121 else if (!strcmp (default_arch, "i386")
3122 || !strcmp (default_arch, "iamcu"))
3123 {
3124 if (cpu_arch_isa == PROCESSOR_IAMCU)
3125 {
3126 if (OUTPUT_FLAVOR != bfd_target_elf_flavour)
3127 as_fatal (_("Intel MCU is 32bit ELF only"));
3128 return bfd_mach_i386_iamcu;
3129 }
3130 else
3131 return bfd_mach_i386_i386;
3132 }
3133 else
3134 as_fatal (_("unknown architecture"));
3135 }
3136 \f
3137 #include "opcodes/i386-tbl.h"
3138
3139 void
3140 md_begin (void)
3141 {
3142 /* Support pseudo prefixes like {disp32}. */
3143 lex_type ['{'] = LEX_BEGIN_NAME;
3144
3145 /* Initialize op_hash hash table. */
3146 op_hash = str_htab_create ();
3147
3148 {
3149 const insn_template *const *sets = i386_op_sets;
3150 const insn_template *const *end = sets + ARRAY_SIZE (i386_op_sets) - 1;
3151
3152 /* Type checks to compensate for the conversion through void * which
3153 occurs during hash table insertion / lookup. */
3154 (void) sizeof (sets == &current_templates->start);
3155 (void) sizeof (end == &current_templates->end);
3156 for (; sets < end; ++sets)
3157 if (str_hash_insert (op_hash, insn_name (*sets), sets, 0))
3158 as_fatal (_("duplicate %s"), insn_name (*sets));
3159 }
3160
3161 /* Initialize reg_hash hash table. */
3162 reg_hash = str_htab_create ();
3163 {
3164 const reg_entry *regtab;
3165 unsigned int regtab_size = i386_regtab_size;
3166
3167 for (regtab = i386_regtab; regtab_size--; regtab++)
3168 {
3169 switch (regtab->reg_type.bitfield.class)
3170 {
3171 case Reg:
3172 if (regtab->reg_type.bitfield.dword)
3173 {
3174 if (regtab->reg_type.bitfield.instance == Accum)
3175 reg_eax = regtab;
3176 }
3177 else if (regtab->reg_type.bitfield.tbyte)
3178 {
3179 /* There's no point inserting st(<N>) in the hash table, as
3180 parentheses aren't included in register_chars[] anyway. */
3181 if (regtab->reg_type.bitfield.instance != Accum)
3182 continue;
3183 reg_st0 = regtab;
3184 }
3185 break;
3186
3187 case SReg:
3188 switch (regtab->reg_num)
3189 {
3190 case 0: reg_es = regtab; break;
3191 case 2: reg_ss = regtab; break;
3192 case 3: reg_ds = regtab; break;
3193 }
3194 break;
3195
3196 case RegMask:
3197 if (!regtab->reg_num)
3198 reg_k0 = regtab;
3199 break;
3200 }
3201
3202 if (str_hash_insert (reg_hash, regtab->reg_name, regtab, 0) != NULL)
3203 as_fatal (_("duplicate %s"), regtab->reg_name);
3204 }
3205 }
3206
3207 /* Fill in lexical tables: mnemonic_chars, operand_chars. */
3208 {
3209 int c;
3210 const char *p;
3211
3212 for (c = 0; c < 256; c++)
3213 {
3214 if (ISDIGIT (c) || ISLOWER (c))
3215 {
3216 mnemonic_chars[c] = c;
3217 register_chars[c] = c;
3218 operand_chars[c] = c;
3219 }
3220 else if (ISUPPER (c))
3221 {
3222 mnemonic_chars[c] = TOLOWER (c);
3223 register_chars[c] = mnemonic_chars[c];
3224 operand_chars[c] = c;
3225 }
3226 #ifdef SVR4_COMMENT_CHARS
3227 else if (c == '\\' && strchr (i386_comment_chars, '/'))
3228 operand_chars[c] = c;
3229 #endif
3230
3231 if (c >= 128)
3232 operand_chars[c] = c;
3233 }
3234
3235 mnemonic_chars['_'] = '_';
3236 mnemonic_chars['-'] = '-';
3237 mnemonic_chars['.'] = '.';
3238
3239 for (p = extra_symbol_chars; *p != '\0'; p++)
3240 operand_chars[(unsigned char) *p] = *p;
3241 for (p = operand_special_chars; *p != '\0'; p++)
3242 operand_chars[(unsigned char) *p] = *p;
3243 }
3244
3245 if (flag_code == CODE_64BIT)
3246 {
3247 #if defined (OBJ_COFF) && defined (TE_PE)
3248 x86_dwarf2_return_column = (OUTPUT_FLAVOR == bfd_target_coff_flavour
3249 ? 32 : 16);
3250 #else
3251 x86_dwarf2_return_column = 16;
3252 #endif
3253 x86_cie_data_alignment = -8;
3254 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
3255 x86_sframe_cfa_sp_reg = 7;
3256 x86_sframe_cfa_fp_reg = 6;
3257 #endif
3258 }
3259 else
3260 {
3261 x86_dwarf2_return_column = 8;
3262 x86_cie_data_alignment = -4;
3263 }
3264
3265 /* NB: FUSED_JCC_PADDING frag must have sufficient room so that it
3266 can be turned into BRANCH_PREFIX frag. */
3267 if (align_branch_prefix_size > MAX_FUSED_JCC_PADDING_SIZE)
3268 abort ();
3269 }
3270
3271 void
3272 i386_print_statistics (FILE *file)
3273 {
3274 htab_print_statistics (file, "i386 opcode", op_hash);
3275 htab_print_statistics (file, "i386 register", reg_hash);
3276 }
3277
3278 void
3279 i386_md_end (void)
3280 {
3281 htab_delete (op_hash);
3282 htab_delete (reg_hash);
3283 }
3284 \f
3285 #ifdef DEBUG386
3286
3287 /* Debugging routines for md_assemble. */
3288 static void pte (insn_template *);
3289 static void pt (i386_operand_type);
3290 static void pe (expressionS *);
3291 static void ps (symbolS *);
3292
3293 static void
3294 pi (const char *line, i386_insn *x)
3295 {
3296 unsigned int j;
3297
3298 fprintf (stdout, "%s: template ", line);
3299 pte (&x->tm);
3300 fprintf (stdout, " address: base %s index %s scale %x\n",
3301 x->base_reg ? x->base_reg->reg_name : "none",
3302 x->index_reg ? x->index_reg->reg_name : "none",
3303 x->log2_scale_factor);
3304 fprintf (stdout, " modrm: mode %x reg %x reg/mem %x\n",
3305 x->rm.mode, x->rm.reg, x->rm.regmem);
3306 fprintf (stdout, " sib: base %x index %x scale %x\n",
3307 x->sib.base, x->sib.index, x->sib.scale);
3308 fprintf (stdout, " rex: 64bit %x extX %x extY %x extZ %x\n",
3309 (x->rex & REX_W) != 0,
3310 (x->rex & REX_R) != 0,
3311 (x->rex & REX_X) != 0,
3312 (x->rex & REX_B) != 0);
3313 for (j = 0; j < x->operands; j++)
3314 {
3315 fprintf (stdout, " #%d: ", j + 1);
3316 pt (x->types[j]);
3317 fprintf (stdout, "\n");
3318 if (x->types[j].bitfield.class == Reg
3319 || x->types[j].bitfield.class == RegMMX
3320 || x->types[j].bitfield.class == RegSIMD
3321 || x->types[j].bitfield.class == RegMask
3322 || x->types[j].bitfield.class == SReg
3323 || x->types[j].bitfield.class == RegCR
3324 || x->types[j].bitfield.class == RegDR
3325 || x->types[j].bitfield.class == RegTR
3326 || x->types[j].bitfield.class == RegBND)
3327 fprintf (stdout, "%s\n", x->op[j].regs->reg_name);
3328 if (operand_type_check (x->types[j], imm))
3329 pe (x->op[j].imms);
3330 if (operand_type_check (x->types[j], disp))
3331 pe (x->op[j].disps);
3332 }
3333 }
3334
3335 static void
3336 pte (insn_template *t)
3337 {
3338 static const unsigned char opc_pfx[] = { 0, 0x66, 0xf3, 0xf2 };
3339 static const char *const opc_spc[] = {
3340 NULL, "0f", "0f38", "0f3a", NULL, "evexmap5", "evexmap6", NULL,
3341 "XOP08", "XOP09", "XOP0A",
3342 };
3343 unsigned int j;
3344
3345 fprintf (stdout, " %d operands ", t->operands);
3346 if (opc_pfx[t->opcode_modifier.opcodeprefix])
3347 fprintf (stdout, "pfx %x ", opc_pfx[t->opcode_modifier.opcodeprefix]);
3348 if (opc_spc[t->opcode_space])
3349 fprintf (stdout, "space %s ", opc_spc[t->opcode_space]);
3350 fprintf (stdout, "opcode %x ", t->base_opcode);
3351 if (t->extension_opcode != None)
3352 fprintf (stdout, "ext %x ", t->extension_opcode);
3353 if (t->opcode_modifier.d)
3354 fprintf (stdout, "D");
3355 if (t->opcode_modifier.w)
3356 fprintf (stdout, "W");
3357 fprintf (stdout, "\n");
3358 for (j = 0; j < t->operands; j++)
3359 {
3360 fprintf (stdout, " #%d type ", j + 1);
3361 pt (t->operand_types[j]);
3362 fprintf (stdout, "\n");
3363 }
3364 }
3365
3366 static void
3367 pe (expressionS *e)
3368 {
3369 fprintf (stdout, " operation %d\n", e->X_op);
3370 fprintf (stdout, " add_number %" PRId64 " (%" PRIx64 ")\n",
3371 (int64_t) e->X_add_number, (uint64_t) (valueT) e->X_add_number);
3372 if (e->X_add_symbol)
3373 {
3374 fprintf (stdout, " add_symbol ");
3375 ps (e->X_add_symbol);
3376 fprintf (stdout, "\n");
3377 }
3378 if (e->X_op_symbol)
3379 {
3380 fprintf (stdout, " op_symbol ");
3381 ps (e->X_op_symbol);
3382 fprintf (stdout, "\n");
3383 }
3384 }
3385
3386 static void
3387 ps (symbolS *s)
3388 {
3389 fprintf (stdout, "%s type %s%s",
3390 S_GET_NAME (s),
3391 S_IS_EXTERNAL (s) ? "EXTERNAL " : "",
3392 segment_name (S_GET_SEGMENT (s)));
3393 }
3394
3395 static struct type_name
3396 {
3397 i386_operand_type mask;
3398 const char *name;
3399 }
3400 const type_names[] =
3401 {
3402 { { .bitfield = { .class = Reg, .byte = 1 } }, "r8" },
3403 { { .bitfield = { .class = Reg, .word = 1 } }, "r16" },
3404 { { .bitfield = { .class = Reg, .dword = 1 } }, "r32" },
3405 { { .bitfield = { .class = Reg, .qword = 1 } }, "r64" },
3406 { { .bitfield = { .instance = Accum, .byte = 1 } }, "acc8" },
3407 { { .bitfield = { .instance = Accum, .word = 1 } }, "acc16" },
3408 { { .bitfield = { .instance = Accum, .dword = 1 } }, "acc32" },
3409 { { .bitfield = { .instance = Accum, .qword = 1 } }, "acc64" },
3410 { { .bitfield = { .imm8 = 1 } }, "i8" },
3411 { { .bitfield = { .imm8s = 1 } }, "i8s" },
3412 { { .bitfield = { .imm16 = 1 } }, "i16" },
3413 { { .bitfield = { .imm32 = 1 } }, "i32" },
3414 { { .bitfield = { .imm32s = 1 } }, "i32s" },
3415 { { .bitfield = { .imm64 = 1 } }, "i64" },
3416 { { .bitfield = { .imm1 = 1 } }, "i1" },
3417 { { .bitfield = { .baseindex = 1 } }, "BaseIndex" },
3418 { { .bitfield = { .disp8 = 1 } }, "d8" },
3419 { { .bitfield = { .disp16 = 1 } }, "d16" },
3420 { { .bitfield = { .disp32 = 1 } }, "d32" },
3421 { { .bitfield = { .disp64 = 1 } }, "d64" },
3422 { { .bitfield = { .instance = RegD, .word = 1 } }, "InOutPortReg" },
3423 { { .bitfield = { .instance = RegC, .byte = 1 } }, "ShiftCount" },
3424 { { .bitfield = { .class = RegCR } }, "control reg" },
3425 { { .bitfield = { .class = RegTR } }, "test reg" },
3426 { { .bitfield = { .class = RegDR } }, "debug reg" },
3427 { { .bitfield = { .class = Reg, .tbyte = 1 } }, "FReg" },
3428 { { .bitfield = { .instance = Accum, .tbyte = 1 } }, "FAcc" },
3429 { { .bitfield = { .class = SReg } }, "SReg" },
3430 { { .bitfield = { .class = RegMMX } }, "rMMX" },
3431 { { .bitfield = { .class = RegSIMD, .xmmword = 1 } }, "rXMM" },
3432 { { .bitfield = { .class = RegSIMD, .ymmword = 1 } }, "rYMM" },
3433 { { .bitfield = { .class = RegSIMD, .zmmword = 1 } }, "rZMM" },
3434 { { .bitfield = { .class = RegSIMD, .tmmword = 1 } }, "rTMM" },
3435 { { .bitfield = { .class = RegMask } }, "Mask reg" },
3436 };
3437
3438 static void
3439 pt (i386_operand_type t)
3440 {
3441 unsigned int j;
3442 i386_operand_type a;
3443
3444 for (j = 0; j < ARRAY_SIZE (type_names); j++)
3445 {
3446 a = operand_type_and (t, type_names[j].mask);
3447 if (operand_type_equal (&a, &type_names[j].mask))
3448 fprintf (stdout, "%s, ", type_names[j].name);
3449 }
3450 fflush (stdout);
3451 }
3452
3453 #endif /* DEBUG386 */
3454 \f
3455 static bfd_reloc_code_real_type
3456 reloc (unsigned int size,
3457 int pcrel,
3458 int sign,
3459 bfd_reloc_code_real_type other)
3460 {
3461 if (other != NO_RELOC)
3462 {
3463 reloc_howto_type *rel;
3464
3465 if (size == 8)
3466 switch (other)
3467 {
3468 case BFD_RELOC_X86_64_GOT32:
3469 return BFD_RELOC_X86_64_GOT64;
3471 case BFD_RELOC_X86_64_GOTPLT64:
3472 return BFD_RELOC_X86_64_GOTPLT64;
3474 case BFD_RELOC_X86_64_PLTOFF64:
3475 return BFD_RELOC_X86_64_PLTOFF64;
3477 case BFD_RELOC_X86_64_GOTPC32:
3478 other = BFD_RELOC_X86_64_GOTPC64;
3479 break;
3480 case BFD_RELOC_X86_64_GOTPCREL:
3481 other = BFD_RELOC_X86_64_GOTPCREL64;
3482 break;
3483 case BFD_RELOC_X86_64_TPOFF32:
3484 other = BFD_RELOC_X86_64_TPOFF64;
3485 break;
3486 case BFD_RELOC_X86_64_DTPOFF32:
3487 other = BFD_RELOC_X86_64_DTPOFF64;
3488 break;
3489 default:
3490 break;
3491 }
3492
3493 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
3494 if (other == BFD_RELOC_SIZE32)
3495 {
3496 if (size == 8)
3497 other = BFD_RELOC_SIZE64;
3498 if (pcrel)
3499 {
3500 as_bad (_("there are no pc-relative size relocations"));
3501 return NO_RELOC;
3502 }
3503 }
3504 #endif
3505
3506 /* Sign-checking 4-byte relocations in 16-/32-bit code is pointless. */
3507 if (size == 4 && (flag_code != CODE_64BIT || disallow_64bit_reloc))
3508 sign = -1;
3509
3510 rel = bfd_reloc_type_lookup (stdoutput, other);
3511 if (!rel)
3512 as_bad (_("unknown relocation (%u)"), other);
3513 else if (size != bfd_get_reloc_size (rel))
3514 as_bad (_("%u-byte relocation cannot be applied to %u-byte field"),
3515 bfd_get_reloc_size (rel),
3516 size);
3517 else if (pcrel && !rel->pc_relative)
3518 as_bad (_("non-pc-relative relocation for pc-relative field"));
3519 else if ((rel->complain_on_overflow == complain_overflow_signed
3520 && !sign)
3521 || (rel->complain_on_overflow == complain_overflow_unsigned
3522 && sign > 0))
3523 as_bad (_("relocated field and relocation type differ in signedness"));
3524 else
3525 return other;
3526 return NO_RELOC;
3527 }
3528
3529 if (pcrel)
3530 {
3531 if (!sign)
3532 as_bad (_("there are no unsigned pc-relative relocations"));
3533 switch (size)
3534 {
3535 case 1: return BFD_RELOC_8_PCREL;
3536 case 2: return BFD_RELOC_16_PCREL;
3537 case 4: return BFD_RELOC_32_PCREL;
3538 case 8: return BFD_RELOC_64_PCREL;
3539 }
3540 as_bad (_("cannot do %u byte pc-relative relocation"), size);
3541 }
3542 else
3543 {
3544 if (sign > 0)
3545 switch (size)
3546 {
3547 case 4: return BFD_RELOC_X86_64_32S;
3548 }
3549 else
3550 switch (size)
3551 {
3552 case 1: return BFD_RELOC_8;
3553 case 2: return BFD_RELOC_16;
3554 case 4: return BFD_RELOC_32;
3555 case 8: return BFD_RELOC_64;
3556 }
3557 as_bad (_("cannot do %s %u byte relocation"),
3558 sign > 0 ? "signed" : "unsigned", size);
3559 }
3560
3561 return NO_RELOC;
3562 }
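
/* Examples of the mapping above: a 4-byte pc-relative fixup with no
   special relocation yields BFD_RELOC_32_PCREL, while "...@GOTPCREL"
   applied to an 8-byte field is widened from BFD_RELOC_X86_64_GOTPCREL
   to BFD_RELOC_X86_64_GOTPCREL64 before the size/signedness checks. */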
3563
3564 /* Here we decide which fixups can be adjusted to make them relative to
3565 the beginning of the section instead of the symbol. Basically we need
3566 to make sure that the dynamic relocations are done correctly, so in
3567 some cases we force the original symbol to be used. */
3568
3569 int
3570 tc_i386_fix_adjustable (fixS *fixP ATTRIBUTE_UNUSED)
3571 {
3572 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
3573 if (!IS_ELF)
3574 return 1;
3575
3576 /* Don't adjust pc-relative references to merge sections in 64-bit
3577 mode. */
3578 if (use_rela_relocations
3579 && (S_GET_SEGMENT (fixP->fx_addsy)->flags & SEC_MERGE) != 0
3580 && fixP->fx_pcrel)
3581 return 0;
3582
3583 /* The x86_64 GOTPCREL are represented as 32bit PCrel relocations
3584 and changed later by validate_fix. */
3585 if (GOT_symbol && fixP->fx_subsy == GOT_symbol
3586 && fixP->fx_r_type == BFD_RELOC_32_PCREL)
3587 return 0;
3588
3589 /* Adjust_reloc_syms doesn't know about the GOT. Need to keep symbol
3590 for size relocations. */
3591 if (fixP->fx_r_type == BFD_RELOC_SIZE32
3592 || fixP->fx_r_type == BFD_RELOC_SIZE64
3593 || fixP->fx_r_type == BFD_RELOC_386_GOTOFF
3594 || fixP->fx_r_type == BFD_RELOC_386_GOT32
3595 || fixP->fx_r_type == BFD_RELOC_386_GOT32X
3596 || fixP->fx_r_type == BFD_RELOC_386_TLS_GD
3597 || fixP->fx_r_type == BFD_RELOC_386_TLS_LDM
3598 || fixP->fx_r_type == BFD_RELOC_386_TLS_LDO_32
3599 || fixP->fx_r_type == BFD_RELOC_386_TLS_IE_32
3600 || fixP->fx_r_type == BFD_RELOC_386_TLS_IE
3601 || fixP->fx_r_type == BFD_RELOC_386_TLS_GOTIE
3602 || fixP->fx_r_type == BFD_RELOC_386_TLS_LE_32
3603 || fixP->fx_r_type == BFD_RELOC_386_TLS_LE
3604 || fixP->fx_r_type == BFD_RELOC_386_TLS_GOTDESC
3605 || fixP->fx_r_type == BFD_RELOC_386_TLS_DESC_CALL
3606 || fixP->fx_r_type == BFD_RELOC_X86_64_GOT32
3607 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTPCREL
3608 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTPCRELX
3609 || fixP->fx_r_type == BFD_RELOC_X86_64_REX_GOTPCRELX
3610 || fixP->fx_r_type == BFD_RELOC_X86_64_TLSGD
3611 || fixP->fx_r_type == BFD_RELOC_X86_64_TLSLD
3612 || fixP->fx_r_type == BFD_RELOC_X86_64_DTPOFF32
3613 || fixP->fx_r_type == BFD_RELOC_X86_64_DTPOFF64
3614 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTTPOFF
3615 || fixP->fx_r_type == BFD_RELOC_X86_64_TPOFF32
3616 || fixP->fx_r_type == BFD_RELOC_X86_64_TPOFF64
3617 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTOFF64
3618 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTPC32_TLSDESC
3619 || fixP->fx_r_type == BFD_RELOC_X86_64_TLSDESC_CALL
3620 || fixP->fx_r_type == BFD_RELOC_VTABLE_INHERIT
3621 || fixP->fx_r_type == BFD_RELOC_VTABLE_ENTRY)
3622 return 0;
3623 #endif
3624 return 1;
3625 }
3626
3627 static INLINE bool
3628 want_disp32 (const insn_template *t)
3629 {
3630 return flag_code != CODE_64BIT
3631 || i.prefix[ADDR_PREFIX]
3632 || (t->mnem_off == MN_lea
3633 && (!i.types[1].bitfield.qword
3634 || t->opcode_modifier.size == SIZE32));
3635 }
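
/* In 64-bit mode displacements are normally sign-extended from 32 bits,
   so want_disp32 only returns true when 32-bit addressing is in effect
   or when e.g. "leal sym, %eax" computes a 32-bit result anyway. */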
3636
3637 static int
3638 intel_float_operand (const char *mnemonic)
3639 {
3640 /* Note that the value returned is meaningful only for opcodes with (memory)
3641 operands; for better performance and smaller code the logic here makes
3642 no attempt to classify operand-less opcodes correctly. */
3643
3644 if (mnemonic[0] != 'f')
3645 return 0; /* non-math */
3646
3647 switch (mnemonic[1])
3648 {
3649 /* fclex, fdecstp, fdisi, femms, feni, fincstp, finit, fsetpm, and
3650 the fs segment override prefix are not currently handled, because
3651 no call path can bring opcodes without operands here. */
3652 case 'i':
3653 return 2 /* integer op */;
3654 case 'l':
3655 if (mnemonic[2] == 'd' && (mnemonic[3] == 'c' || mnemonic[3] == 'e'))
3656 return 3; /* fldcw/fldenv */
3657 break;
3658 case 'n':
3659 if (mnemonic[2] != 'o' /* fnop */)
3660 return 3; /* non-waiting control op */
3661 break;
3662 case 'r':
3663 if (mnemonic[2] == 's')
3664 return 3; /* frstor/frstpm */
3665 break;
3666 case 's':
3667 if (mnemonic[2] == 'a')
3668 return 3; /* fsave */
3669 if (mnemonic[2] == 't')
3670 {
3671 switch (mnemonic[3])
3672 {
3673 case 'c': /* fstcw */
3674 case 'd': /* fstdw */
3675 case 'e': /* fstenv */
3676 case 's': /* fsts[gw] */
3677 return 3;
3678 }
3679 }
3680 break;
3681 case 'x':
3682 if (mnemonic[2] == 'r' || mnemonic[2] == 's')
3683 return 0; /* fxsave/fxrstor are not really math ops */
3684 break;
3685 }
3686
3687 return 1;
3688 }
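
/* Examples of the classification: "fadd" yields 1 (plain FP math),
   "fisttp" yields 2 (integer operand), "fnstcw" yields 3 (non-waiting
   control op), and "fxsave" yields 0 as it isn't really a math op. */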
3689
3690 static INLINE void
3691 install_template (const insn_template *t)
3692 {
3693 unsigned int l;
3694
3695 i.tm = *t;
3696
3697 /* Dual VEX/EVEX templates need stripping one of the possible variants. */
3698 if (t->opcode_modifier.vex && t->opcode_modifier.evex)
3699 {
3700 if ((is_cpu (t, CpuAVX) || is_cpu (t, CpuAVX2))
3701 && is_cpu (t, CpuAVX512F))
3702 {
3703 if (need_evex_encoding ())
3704 {
3705 i.tm.opcode_modifier.vex = 0;
3706 i.tm.cpu.bitfield.cpuavx = 0;
3707 if (is_cpu (&i.tm, CpuAVX2))
3708 i.tm.cpu.bitfield.isa = 0;
3709 }
3710 else
3711 {
3712 i.tm.opcode_modifier.evex = 0;
3713 i.tm.cpu.bitfield.cpuavx512f = 0;
3714 }
3715 }
3716 }
3717
3718 /* Note that for pseudo prefixes this produces a length of 1. But for them
3719 the length isn't interesting at all. */
3720 for (l = 1; l < 4; ++l)
3721 if (!(t->base_opcode >> (8 * l)))
3722 break;
3723
3724 i.opcode_length = l;
3725 }
3726
3727 /* Build the VEX prefix. */
3728
3729 static void
3730 build_vex_prefix (const insn_template *t)
3731 {
3732 unsigned int register_specifier;
3733 unsigned int vector_length;
3734 unsigned int w;
3735
3736 /* Check register specifier. */
3737 if (i.vex.register_specifier)
3738 {
3739 register_specifier =
3740 ~register_number (i.vex.register_specifier) & 0xf;
3741 gas_assert ((i.vex.register_specifier->reg_flags & RegVRex) == 0);
3742 }
3743 else
3744 register_specifier = 0xf;
3745
3746 /* Use 2-byte VEX prefix by swapping destination and source operands
3747 if there is more than one register operand. */
3748 if (i.reg_operands > 1
3749 && i.vec_encoding != vex_encoding_vex3
3750 && i.dir_encoding == dir_encoding_default
3751 && i.operands == i.reg_operands
3752 && operand_type_equal (&i.types[0], &i.types[i.operands - 1])
3753 && i.tm.opcode_space == SPACE_0F
3754 && (i.tm.opcode_modifier.load || i.tm.opcode_modifier.d)
3755 && i.rex == REX_B)
3756 {
3757 unsigned int xchg;
3758
3759 swap_2_operands (0, i.operands - 1);
3760
3761 gas_assert (i.rm.mode == 3);
3762
3763 i.rex = REX_R;
3764 xchg = i.rm.regmem;
3765 i.rm.regmem = i.rm.reg;
3766 i.rm.reg = xchg;
3767
3768 if (i.tm.opcode_modifier.d)
3769 i.tm.base_opcode ^= (i.tm.base_opcode & 0xee) != 0x6e
3770 ? Opcode_ExtD : Opcode_SIMD_IntD;
3771 else /* Use the next insn. */
3772 install_template (&t[1]);
3773 }
3774
3775 /* Use 2-byte VEX prefix by swapping commutative source operands if there
3776 are no memory operands and at least 3 register ones. */
3777 if (i.reg_operands >= 3
3778 && i.vec_encoding != vex_encoding_vex3
3779 && i.reg_operands == i.operands - i.imm_operands
3780 && i.tm.opcode_modifier.vex
3781 && i.tm.opcode_modifier.commutative
3782 && (i.tm.opcode_modifier.sse2avx
3783 || (optimize > 1 && !i.no_optimize))
3784 && i.rex == REX_B
3785 && i.vex.register_specifier
3786 && !(i.vex.register_specifier->reg_flags & RegRex))
3787 {
3788 unsigned int xchg = i.operands - i.reg_operands;
3789
3790 gas_assert (i.tm.opcode_space == SPACE_0F);
3791 gas_assert (!i.tm.opcode_modifier.sae);
3792 gas_assert (operand_type_equal (&i.types[i.operands - 2],
3793 &i.types[i.operands - 3]));
3794 gas_assert (i.rm.mode == 3);
3795
3796 swap_2_operands (xchg, xchg + 1);
3797
3798 i.rex = 0;
3799 xchg = i.rm.regmem | 8;
3800 i.rm.regmem = ~register_specifier & 0xf;
3801 gas_assert (!(i.rm.regmem & 8));
3802 i.vex.register_specifier += xchg - i.rm.regmem;
3803 register_specifier = ~xchg & 0xf;
3804 }
3805
3806 if (i.tm.opcode_modifier.vex == VEXScalar)
3807 vector_length = avxscalar;
3808 else if (i.tm.opcode_modifier.vex == VEX256)
3809 vector_length = 1;
3810 else if (dot_insn () && i.tm.opcode_modifier.vex == VEX128)
3811 vector_length = 0;
3812 else
3813 {
3814 unsigned int op;
3815
3816 /* Determine vector length from the last multi-length vector
3817 operand. */
3818 vector_length = 0;
3819 for (op = t->operands; op--;)
3820 if (t->operand_types[op].bitfield.xmmword
3821 && t->operand_types[op].bitfield.ymmword
3822 && i.types[op].bitfield.ymmword)
3823 {
3824 vector_length = 1;
3825 break;
3826 }
3827 }
3828
3829 /* Check the REX.W bit and VEXW. */
3830 if (i.tm.opcode_modifier.vexw == VEXWIG)
3831 w = (vexwig == vexw1 || (i.rex & REX_W)) ? 1 : 0;
3832 else if (i.tm.opcode_modifier.vexw)
3833 w = i.tm.opcode_modifier.vexw == VEXW1 ? 1 : 0;
3834 else
3835 w = (flag_code == CODE_64BIT ? i.rex & REX_W : vexwig == vexw1) ? 1 : 0;
3836
3837 /* Use 2-byte VEX prefix if possible. */
3838 if (w == 0
3839 && i.vec_encoding != vex_encoding_vex3
3840 && i.tm.opcode_space == SPACE_0F
3841 && (i.rex & (REX_W | REX_X | REX_B)) == 0)
3842 {
3843 /* 2-byte VEX prefix. */
3844 unsigned int r;
3845
3846 i.vex.length = 2;
3847 i.vex.bytes[0] = 0xc5;
3848
3849 /* Check the REX.R bit. */
3850 r = (i.rex & REX_R) ? 0 : 1;
3851 i.vex.bytes[1] = (r << 7
3852 | register_specifier << 3
3853 | vector_length << 2
3854 | i.tm.opcode_modifier.opcodeprefix);
3855 }
3856 else
3857 {
3858 /* 3-byte VEX prefix. */
3859 i.vex.length = 3;
3860
3861 switch (i.tm.opcode_space)
3862 {
3863 case SPACE_0F:
3864 case SPACE_0F38:
3865 case SPACE_0F3A:
3866 i.vex.bytes[0] = 0xc4;
3867 break;
3868 case SPACE_XOP08:
3869 case SPACE_XOP09:
3870 case SPACE_XOP0A:
3871 i.vex.bytes[0] = 0x8f;
3872 break;
3873 default:
3874 abort ();
3875 }
3876
3877 /* The high 3 bits of the second VEX byte are one's complement of the
3878 RXB bits from REX. */
3879 i.vex.bytes[1] = ((~i.rex & 7) << 5)
3880 | (!dot_insn () ? i.tm.opcode_space
3881 : i.insn_opcode_space);
3882
3883 i.vex.bytes[2] = (w << 7
3884 | register_specifier << 3
3885 | vector_length << 2
3886 | i.tm.opcode_modifier.opcodeprefix);
3887 }
3888 }
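
/* Worked example (standard VEX encoding, independent of the logic
   above): "vaddps %ymm2, %ymm1, %ymm0" qualifies for the 2-byte form
   and emits c5 f4 58 c2, 0xf4 being ~R=1, ~vvvv=0b1110 (%ymm1), L=1
   (256-bit) and pp=00. */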
3889
3890 static INLINE bool
3891 is_evex_encoding (const insn_template *t)
3892 {
3893 return t->opcode_modifier.evex || t->opcode_modifier.disp8memshift
3894 || t->opcode_modifier.broadcast || t->opcode_modifier.masking
3895 || t->opcode_modifier.sae;
3896 }
3897
3898 static INLINE bool
3899 is_any_vex_encoding (const insn_template *t)
3900 {
3901 return t->opcode_modifier.vex || is_evex_encoding (t);
3902 }
3903
3904 static unsigned int
3905 get_broadcast_bytes (const insn_template *t, bool diag)
3906 {
3907 unsigned int op, bytes;
3908 const i386_operand_type *types;
3909
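/* For an explicit {1to<n>} broadcast the element size is encoded in
   the Broadcast modifier (1 << (modifier - 1) bytes), so the total is
   simply its product with <n>. */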
3910 if (i.broadcast.type)
3911 return (1 << (t->opcode_modifier.broadcast - 1)) * i.broadcast.type;
3912
3913 gas_assert (intel_syntax);
3914
3915 for (op = 0; op < t->operands; ++op)
3916 if (t->operand_types[op].bitfield.baseindex)
3917 break;
3918
3919 gas_assert (op < t->operands);
3920
3921 if (t->opcode_modifier.evex
3922 && t->opcode_modifier.evex != EVEXDYN)
3923 switch (i.broadcast.bytes)
3924 {
3925 case 1:
3926 if (t->operand_types[op].bitfield.word)
3927 return 2;
3928 /* Fall through. */
3929 case 2:
3930 if (t->operand_types[op].bitfield.dword)
3931 return 4;
3932 /* Fall through. */
3933 case 4:
3934 if (t->operand_types[op].bitfield.qword)
3935 return 8;
3936 /* Fall through. */
3937 case 8:
3938 if (t->operand_types[op].bitfield.xmmword)
3939 return 16;
3940 if (t->operand_types[op].bitfield.ymmword)
3941 return 32;
3942 if (t->operand_types[op].bitfield.zmmword)
3943 return 64;
3944 /* Fall through. */
3945 default:
3946 abort ();
3947 }
3948
3949 gas_assert (op + 1 < t->operands);
3950
3951 if (t->operand_types[op + 1].bitfield.xmmword
3952 + t->operand_types[op + 1].bitfield.ymmword
3953 + t->operand_types[op + 1].bitfield.zmmword > 1)
3954 {
3955 types = &i.types[op + 1];
3956 diag = false;
3957 }
3958 else /* Ambiguous - guess with a preference to non-AVX512VL forms. */
3959 types = &t->operand_types[op];
3960
3961 if (types->bitfield.zmmword)
3962 bytes = 64;
3963 else if (types->bitfield.ymmword)
3964 bytes = 32;
3965 else
3966 bytes = 16;
3967
3968 if (diag)
3969 as_warn (_("ambiguous broadcast for `%s', using %u-bit form"),
3970 insn_name (t), bytes * 8);
3971
3972 return bytes;
3973 }
3974
3975 /* Build the EVEX prefix. */
3976
3977 static void
3978 build_evex_prefix (void)
3979 {
3980 unsigned int register_specifier, w;
3981 rex_byte vrex_used = 0;
3982
3983 /* Check register specifier. */
3984 if (i.vex.register_specifier)
3985 {
3986 gas_assert ((i.vrex & REX_X) == 0);
3987
3988 register_specifier = i.vex.register_specifier->reg_num;
3989 if ((i.vex.register_specifier->reg_flags & RegRex))
3990 register_specifier += 8;
3991 /* The upper 16 registers are encoded in the fourth byte of the
3992 EVEX prefix. */
3993 if (!(i.vex.register_specifier->reg_flags & RegVRex))
3994 i.vex.bytes[3] = 0x8;
3995 register_specifier = ~register_specifier & 0xf;
3996 }
3997 else
3998 {
3999 register_specifier = 0xf;
4000
4001 /* Encode upper 16 vector index register in the fourth byte of
4002 the EVEX prefix. */
4003 if (!(i.vrex & REX_X))
4004 i.vex.bytes[3] = 0x8;
4005 else
4006 vrex_used |= REX_X;
4007 }
4008
4009 /* 4 byte EVEX prefix. */
4010 i.vex.length = 4;
4011 i.vex.bytes[0] = 0x62;
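/* Byte layout: 0x62, P0 = ~R.~X.~B.~R'.0.mmm, P1 = W.~vvvv.U.pp,
   P2 = z.L'L.b.~V'.aaa. */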
4012
4013 /* The high 3 bits of the second EVEX byte are the 1's complement of the
4014 RXB bits from REX. */
4015 gas_assert (i.tm.opcode_space >= SPACE_0F);
4016 gas_assert (i.tm.opcode_space <= SPACE_EVEXMAP6);
4017 i.vex.bytes[1] = ((~i.rex & 7) << 5)
4018 | (!dot_insn () ? i.tm.opcode_space
4019 : i.insn_opcode_space);
4020
4021 /* The fifth bit of the second EVEX byte is the 1's complement of the
4022 REX_R bit in VREX. */
4023 if (!(i.vrex & REX_R))
4024 i.vex.bytes[1] |= 0x10;
4025 else
4026 vrex_used |= REX_R;
4027
4028 if ((i.reg_operands + i.imm_operands) == i.operands)
4029 {
4030 /* When all operands are registers, the REX_X bit in REX is not
4031 used. We reuse it to encode the upper 16 registers, which is
4032 indicated by the REX_B bit in VREX. The REX_X bit is encoded
4033 as 1's complement. */
4034 if ((i.vrex & REX_B))
4035 {
4036 vrex_used |= REX_B;
4037 i.vex.bytes[1] &= ~0x40;
4038 }
4039 }
4040
4041 /* EVEX instructions shouldn't need the REX prefix. */
4042 i.vrex &= ~vrex_used;
4043 gas_assert (i.vrex == 0);
4044
4045 /* Check the REX.W bit and VEXW. */
4046 if (i.tm.opcode_modifier.vexw == VEXWIG)
4047 w = (evexwig == evexw1 || (i.rex & REX_W)) ? 1 : 0;
4048 else if (i.tm.opcode_modifier.vexw)
4049 w = i.tm.opcode_modifier.vexw == VEXW1 ? 1 : 0;
4050 else
4051 w = (flag_code == CODE_64BIT ? i.rex & REX_W : evexwig == evexw1) ? 1 : 0;
4052
4053 /* The third byte of the EVEX prefix. */
4054 i.vex.bytes[2] = ((w << 7)
4055 | (register_specifier << 3)
4056 | 4 /* Encode the U bit. */
4057 | i.tm.opcode_modifier.opcodeprefix);
4058
4059 /* The fourth byte of the EVEX prefix. */
4060 /* The zeroing-masking bit. */
4061 if (i.mask.reg && i.mask.zeroing)
4062 i.vex.bytes[3] |= 0x80;
4063
4064 /* Without rounding control (RC), encode the vector length and set the
broadcast bit only for an actual broadcast. */
4065 if (i.rounding.type == rc_none)
4066 {
4067 /* Encode the vector length. */
4068 unsigned int vec_length;
4069
4070 if (!i.tm.opcode_modifier.evex
4071 || i.tm.opcode_modifier.evex == EVEXDYN)
4072 {
4073 unsigned int op;
4074
4075 /* Determine vector length from the last multi-length vector
4076 operand. */
4077 for (op = i.operands; op--;)
4078 if (i.tm.operand_types[op].bitfield.xmmword
4079 + i.tm.operand_types[op].bitfield.ymmword
4080 + i.tm.operand_types[op].bitfield.zmmword > 1)
4081 {
4082 if (i.types[op].bitfield.zmmword)
4083 {
4084 i.tm.opcode_modifier.evex = EVEX512;
4085 break;
4086 }
4087 else if (i.types[op].bitfield.ymmword)
4088 {
4089 i.tm.opcode_modifier.evex = EVEX256;
4090 break;
4091 }
4092 else if (i.types[op].bitfield.xmmword)
4093 {
4094 i.tm.opcode_modifier.evex = EVEX128;
4095 break;
4096 }
4097 else if ((i.broadcast.type || i.broadcast.bytes)
4098 && op == i.broadcast.operand)
4099 {
4100 switch (get_broadcast_bytes (&i.tm, true))
4101 {
4102 case 64:
4103 i.tm.opcode_modifier.evex = EVEX512;
4104 break;
4105 case 32:
4106 i.tm.opcode_modifier.evex = EVEX256;
4107 break;
4108 case 16:
4109 i.tm.opcode_modifier.evex = EVEX128;
4110 break;
4111 default:
4112 abort ();
4113 }
4114 break;
4115 }
4116 }
4117
4118 if (op >= MAX_OPERANDS)
4119 abort ();
4120 }
4121
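/* L'L occupies bits 6:5 of the fourth prefix byte, hence the << 5
   in every case below. */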
4122 switch (i.tm.opcode_modifier.evex)
4123 {
4124 case EVEXLIG: /* LL' is ignored */
4125 vec_length = evexlig << 5;
4126 break;
4127 case EVEX128:
4128 vec_length = 0 << 5;
4129 break;
4130 case EVEX256:
4131 vec_length = 1 << 5;
4132 break;
4133 case EVEX512:
4134 vec_length = 2 << 5;
4135 break;
4136 case EVEX_L3:
4137 if (dot_insn ())
4138 {
4139 vec_length = 3 << 5;
4140 break;
4141 }
4142 /* Fall through. */
4143 default:
4144 abort ();
4145 break;
4146 }
4147 i.vex.bytes[3] |= vec_length;
4148 /* Encode the broadcast bit. */
4149 if (i.broadcast.type || i.broadcast.bytes)
4150 i.vex.bytes[3] |= 0x10;
4151 }
4152 else if (i.rounding.type != saeonly)
4153 i.vex.bytes[3] |= 0x10 | (i.rounding.type << 5);
4154 else
4155 i.vex.bytes[3] |= 0x10 | (evexrcig << 5);
4156
4157 if (i.mask.reg)
4158 i.vex.bytes[3] |= i.mask.reg->reg_num;
4159 }
4160
4161 static void
4162 process_immext (void)
4163 {
4164 expressionS *exp;
4165
4166 /* These AMD 3DNow! and SSE2 instructions have an opcode suffix
4167 which is coded in the same place as an 8-bit immediate field
4168 would be. Here we fake an 8-bit immediate operand from the
4169 opcode suffix stored in tm.extension_opcode.
4170
4171 AVX instructions also use this encoding for some of their
4172 3-operand instructions. */
4173
4174 gas_assert (i.imm_operands <= 1
4175 && (i.operands <= 2
4176 || (is_any_vex_encoding (&i.tm)
4177 && i.operands <= 4)));
4178
4179 exp = &im_expressions[i.imm_operands++];
4180 i.op[i.operands].imms = exp;
4181 i.types[i.operands].bitfield.imm8 = 1;
4182 i.operands++;
4183 exp->X_op = O_constant;
4184 exp->X_add_number = i.tm.extension_opcode;
4185 i.tm.extension_opcode = None;
4186 }
4187
4188
4189 static int
4190 check_hle (void)
4191 {
4192 switch (i.tm.opcode_modifier.prefixok)
4193 {
4194 default:
4195 abort ();
4196 case PrefixLock:
4197 case PrefixNone:
4198 case PrefixNoTrack:
4199 case PrefixRep:
4200 as_bad (_("invalid instruction `%s' after `%s'"),
4201 insn_name (&i.tm), i.hle_prefix);
4202 return 0;
4203 case PrefixHLELock:
4204 if (i.prefix[LOCK_PREFIX])
4205 return 1;
4206 as_bad (_("missing `lock' with `%s'"), i.hle_prefix);
4207 return 0;
4208 case PrefixHLEAny:
4209 return 1;
4210 case PrefixHLERelease:
4211 if (i.prefix[HLE_PREFIX] != XRELEASE_PREFIX_OPCODE)
4212 {
4213 as_bad (_("instruction `%s' after `xacquire' not allowed"),
4214 insn_name (&i.tm));
4215 return 0;
4216 }
4217 if (i.mem_operands == 0 || !(i.flags[i.operands - 1] & Operand_Mem))
4218 {
4219 as_bad (_("memory destination needed for instruction `%s'"
4220 " after `xrelease'"), insn_name (&i.tm));
4221 return 0;
4222 }
4223 return 1;
4224 }
4225 }
4226
4227 /* Encode aligned vector move as unaligned vector move. */
4228
4229 static void
4230 encode_with_unaligned_vector_move (void)
4231 {
4232 switch (i.tm.base_opcode)
4233 {
4234 case 0x28: /* Load instructions. */
4235 case 0x29: /* Store instructions. */
4236 /* movaps/movapd/vmovaps/vmovapd. */
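/* The aligned opcodes 0x28/0x29 map to the unaligned 0x10/0x11;
   the low bit distinguishing load from store is preserved. */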
4237 if (i.tm.opcode_space == SPACE_0F
4238 && i.tm.opcode_modifier.opcodeprefix <= PREFIX_0X66)
4239 i.tm.base_opcode = 0x10 | (i.tm.base_opcode & 1);
4240 break;
4241 case 0x6f: /* Load instructions. */
4242 case 0x7f: /* Store instructions. */
4243 /* movdqa/vmovdqa/vmovdqa64/vmovdqa32. */
4244 if (i.tm.opcode_space == SPACE_0F
4245 && i.tm.opcode_modifier.opcodeprefix == PREFIX_0X66)
4246 i.tm.opcode_modifier.opcodeprefix = PREFIX_0XF3;
4247 break;
4248 default:
4249 break;
4250 }
4251 }
4252
4253 /* Try the shortest encoding by shortening operand size. */
4254
4255 static void
4256 optimize_encoding (void)
4257 {
4258 unsigned int j;
4259
4260 if (i.tm.mnem_off == MN_lea)
4261 {
4262 /* Optimize: -O:
4263 lea symbol, %rN -> mov $symbol, %rN
4264 lea (%rM), %rN -> mov %rM, %rN
4265 lea (,%rM,1), %rN -> mov %rM, %rN
4266
4267 and in 32-bit mode for 16-bit addressing
4268
4269 lea (%rM), %rN -> movzx %rM, %rN
4270
4271 and in 64-bit mode zap 32-bit addressing in favor of using a
4272 32-bit (or less) destination.
4273 */
4274 if (flag_code == CODE_64BIT && i.prefix[ADDR_PREFIX])
4275 {
4276 if (!i.op[1].regs->reg_type.bitfield.word)
4277 i.tm.opcode_modifier.size = SIZE32;
4278 i.prefix[ADDR_PREFIX] = 0;
4279 }
4280
4281 if (!i.index_reg && !i.base_reg)
4282 {
4283 /* Handle:
4284 lea symbol, %rN -> mov $symbol, %rN
4285 */
4286 if (flag_code == CODE_64BIT)
4287 {
4288 /* Don't transform a relocation to a 16-bit one. */
4289 if (i.op[0].disps
4290 && i.op[0].disps->X_op != O_constant
4291 && i.op[1].regs->reg_type.bitfield.word)
4292 return;
4293
4294 if (!i.op[1].regs->reg_type.bitfield.qword
4295 || i.tm.opcode_modifier.size == SIZE32)
4296 {
4297 i.tm.base_opcode = 0xb8;
4298 i.tm.opcode_modifier.modrm = 0;
4299 if (!i.op[1].regs->reg_type.bitfield.word)
4300 i.types[0].bitfield.imm32 = 1;
4301 else
4302 {
4303 i.tm.opcode_modifier.size = SIZE16;
4304 i.types[0].bitfield.imm16 = 1;
4305 }
4306 }
4307 else
4308 {
4309 /* Subject to further optimization below. */
4310 i.tm.base_opcode = 0xc7;
4311 i.tm.extension_opcode = 0;
4312 i.types[0].bitfield.imm32s = 1;
4313 i.types[0].bitfield.baseindex = 0;
4314 }
4315 }
4316 /* Outside of 64-bit mode address and operand sizes have to match if
4317 a relocation is involved, as otherwise we wouldn't (currently) or
4318 even couldn't express the relocation correctly. */
4319 else if (i.op[0].disps
4320 && i.op[0].disps->X_op != O_constant
4321 && ((!i.prefix[ADDR_PREFIX])
4322 != (flag_code == CODE_32BIT
4323 ? i.op[1].regs->reg_type.bitfield.dword
4324 : i.op[1].regs->reg_type.bitfield.word)))
4325 return;
4326 /* In 16-bit mode converting LEA with 16-bit addressing and a 32-bit
4327 destination is going to grow encoding size. */
4328 else if (flag_code == CODE_16BIT
4329 && (optimize <= 1 || optimize_for_space)
4330 && !i.prefix[ADDR_PREFIX]
4331 && i.op[1].regs->reg_type.bitfield.dword)
4332 return;
4333 else
4334 {
4335 i.tm.base_opcode = 0xb8;
4336 i.tm.opcode_modifier.modrm = 0;
4337 if (i.op[1].regs->reg_type.bitfield.dword)
4338 i.types[0].bitfield.imm32 = 1;
4339 else
4340 i.types[0].bitfield.imm16 = 1;
4341
4342 if (i.op[0].disps
4343 && i.op[0].disps->X_op == O_constant
4344 && i.op[1].regs->reg_type.bitfield.dword
4345 /* NB: Add () to !i.prefix[ADDR_PREFIX] to silence
4346 GCC 5. */
4347 && (!i.prefix[ADDR_PREFIX]) != (flag_code == CODE_32BIT))
4348 i.op[0].disps->X_add_number &= 0xffff;
4349 }
4350
4351 i.tm.operand_types[0] = i.types[0];
4352 i.imm_operands = 1;
4353 if (!i.op[0].imms)
4354 {
4355 i.op[0].imms = &im_expressions[0];
4356 i.op[0].imms->X_op = O_absent;
4357 }
4358 }
4359 else if (i.op[0].disps
4360 && (i.op[0].disps->X_op != O_constant
4361 || i.op[0].disps->X_add_number))
4362 return;
4363 else
4364 {
4365 /* Handle:
4366 lea (%rM), %rN -> mov %rM, %rN
4367 lea (,%rM,1), %rN -> mov %rM, %rN
4368 lea (%rM), %rN -> movzx %rM, %rN
4369 */
4370 const reg_entry *addr_reg;
4371
4372 if (!i.index_reg && i.base_reg->reg_num != RegIP)
4373 addr_reg = i.base_reg;
4374 else if (!i.base_reg
4375 && i.index_reg->reg_num != RegIZ
4376 && !i.log2_scale_factor)
4377 addr_reg = i.index_reg;
4378 else
4379 return;
4380
4381 if (addr_reg->reg_type.bitfield.word
4382 && i.op[1].regs->reg_type.bitfield.dword)
4383 {
4384 if (flag_code != CODE_32BIT)
4385 return;
4386 i.tm.opcode_space = SPACE_0F;
4387 i.tm.base_opcode = 0xb7;
4388 }
4389 else
4390 i.tm.base_opcode = 0x8b;
4391
4392 if (addr_reg->reg_type.bitfield.dword
4393 && i.op[1].regs->reg_type.bitfield.qword)
4394 i.tm.opcode_modifier.size = SIZE32;
4395
4396 i.op[0].regs = addr_reg;
4397 i.reg_operands = 2;
4398 }
4399
4400 i.mem_operands = 0;
4401 i.disp_operands = 0;
4402 i.prefix[ADDR_PREFIX] = 0;
4403 i.prefix[SEG_PREFIX] = 0;
4404 i.seg[0] = NULL;
4405 }
4406
4407 if (optimize_for_space
4408 && i.tm.mnem_off == MN_test
4409 && i.reg_operands == 1
4410 && i.imm_operands == 1
4411 && !i.types[1].bitfield.byte
4412 && i.op[0].imms->X_op == O_constant
4413 && fits_in_imm7 (i.op[0].imms->X_add_number))
4414 {
4415 /* Optimize: -Os:
4416 test $imm7, %r64/%r32/%r16 -> test $imm7, %r8
4417 */
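/* Outside of 64-bit mode only %al, %cl, %dl and %bl are usable here:
   %spl, %bpl, %sil and %dil require a REX prefix. */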
4418 unsigned int base_regnum = i.op[1].regs->reg_num;
4419 if (flag_code == CODE_64BIT || base_regnum < 4)
4420 {
4421 i.types[1].bitfield.byte = 1;
4422 /* Ignore the suffix. */
4423 i.suffix = 0;
4424 /* Convert to byte registers. */
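/* The offsets below rely on the fixed layout of the register table:
   same-numbered registers of each size sit a constant distance apart,
   so stepping the entry pointer back yields the byte-sized variant. */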
4425 if (i.types[1].bitfield.word)
4426 j = 16;
4427 else if (i.types[1].bitfield.dword)
4428 j = 32;
4429 else
4430 j = 48;
4431 if (!(i.op[1].regs->reg_flags & RegRex) && base_regnum < 4)
4432 j += 8;
4433 i.op[1].regs -= j;
4434 }
4435 }
4436 else if (flag_code == CODE_64BIT
4437 && i.tm.opcode_space == SPACE_BASE
4438 && ((i.types[1].bitfield.qword
4439 && i.reg_operands == 1
4440 && i.imm_operands == 1
4441 && i.op[0].imms->X_op == O_constant
4442 && ((i.tm.base_opcode == 0xb8
4443 && i.tm.extension_opcode == None
4444 && fits_in_unsigned_long (i.op[0].imms->X_add_number))
4445 || (fits_in_imm31 (i.op[0].imms->X_add_number)
4446 && (i.tm.base_opcode == 0x24
4447 || (i.tm.base_opcode == 0x80
4448 && i.tm.extension_opcode == 0x4)
4449 || i.tm.mnem_off == MN_test
4450 || ((i.tm.base_opcode | 1) == 0xc7
4451 && i.tm.extension_opcode == 0x0)))
4452 || (fits_in_imm7 (i.op[0].imms->X_add_number)
4453 && i.tm.base_opcode == 0x83
4454 && i.tm.extension_opcode == 0x4)))
4455 || (i.types[0].bitfield.qword
4456 && ((i.reg_operands == 2
4457 && i.op[0].regs == i.op[1].regs
4458 && (i.tm.mnem_off == MN_xor
4459 || i.tm.mnem_off == MN_sub))
4460 || i.tm.mnem_off == MN_clr))))
4461 {
4462 /* Optimize: -O:
4463 andq $imm31, %r64 -> andl $imm31, %r32
4464 andq $imm7, %r64 -> andl $imm7, %r32
4465 testq $imm31, %r64 -> testl $imm31, %r32
4466 xorq %r64, %r64 -> xorl %r32, %r32
4467 subq %r64, %r64 -> subl %r32, %r32
4468 movq $imm31, %r64 -> movl $imm31, %r32
4469 movq $imm32, %r64 -> movl $imm32, %r32
4470 */
4471 i.tm.opcode_modifier.size = SIZE32;
4472 if (i.imm_operands)
4473 {
4474 i.types[0].bitfield.imm32 = 1;
4475 i.types[0].bitfield.imm32s = 0;
4476 i.types[0].bitfield.imm64 = 0;
4477 }
4478 else
4479 {
4480 i.types[0].bitfield.dword = 1;
4481 i.types[0].bitfield.qword = 0;
4482 }
4483 i.types[1].bitfield.dword = 1;
4484 i.types[1].bitfield.qword = 0;
4485 if (i.tm.mnem_off == MN_mov || i.tm.mnem_off == MN_lea)
4486 {
4487 /* Handle
4488 movq $imm31, %r64 -> movl $imm31, %r32
4489 movq $imm32, %r64 -> movl $imm32, %r32
4490 */
4491 i.tm.operand_types[0].bitfield.imm32 = 1;
4492 i.tm.operand_types[0].bitfield.imm32s = 0;
4493 i.tm.operand_types[0].bitfield.imm64 = 0;
4494 if ((i.tm.base_opcode | 1) == 0xc7)
4495 {
4496 /* Handle
4497 movq $imm31, %r64 -> movl $imm31, %r32
4498 */
4499 i.tm.base_opcode = 0xb8;
4500 i.tm.extension_opcode = None;
4501 i.tm.opcode_modifier.w = 0;
4502 i.tm.opcode_modifier.modrm = 0;
4503 }
4504 }
4505 }
4506 else if (optimize > 1
4507 && !optimize_for_space
4508 && i.reg_operands == 2
4509 && i.op[0].regs == i.op[1].regs
4510 && (i.tm.mnem_off == MN_and || i.tm.mnem_off == MN_or)
4511 && (flag_code != CODE_64BIT || !i.types[0].bitfield.dword))
4512 {
4513 /* Optimize: -O2:
4514 andb %rN, %rN -> testb %rN, %rN
4515 andw %rN, %rN -> testw %rN, %rN
4516 andq %rN, %rN -> testq %rN, %rN
4517 orb %rN, %rN -> testb %rN, %rN
4518 orw %rN, %rN -> testw %rN, %rN
4519 orq %rN, %rN -> testq %rN, %rN
4520
4521 and outside of 64-bit mode
4522
4523 andl %rN, %rN -> testl %rN, %rN
4524 orl %rN, %rN -> testl %rN, %rN
4525 */
4526 i.tm.base_opcode = 0x84 | (i.tm.base_opcode & 1);
4527 }
4528 else if (i.tm.base_opcode == 0xba
4529 && i.tm.opcode_space == SPACE_0F
4530 && i.reg_operands == 1
4531 && i.op[0].imms->X_op == O_constant
4532 && i.op[0].imms->X_add_number >= 0)
4533 {
4534 /* Optimize: -O:
4535 btw $n, %rN -> btl $n, %rN (outside of 16-bit mode, n < 16)
4536 btq $n, %rN -> btl $n, %rN (in 64-bit mode, n < 32, N < 8)
4537 btl $n, %rN -> btw $n, %rN (in 16-bit mode, n < 16)
4538
4539 With <BT> one of bts, btr, and btc also:
4540 <BT>w $n, %rN -> <BT>l $n, %rN (in 32-bit mode, n < 16)
4541 <BT>l $n, %rN -> <BT>w $n, %rN (in 16-bit mode, n < 16)
4542 */
4543 switch (flag_code)
4544 {
4545 case CODE_64BIT:
4546 if (i.tm.extension_opcode != 4)
4547 break;
4548 if (i.types[1].bitfield.qword
4549 && i.op[0].imms->X_add_number < 32
4550 && !(i.op[1].regs->reg_flags & RegRex))
4551 i.tm.opcode_modifier.size = SIZE32;
4552 /* Fall through. */
4553 case CODE_32BIT:
4554 if (i.types[1].bitfield.word
4555 && i.op[0].imms->X_add_number < 16)
4556 i.tm.opcode_modifier.size = SIZE32;
4557 break;
4558 case CODE_16BIT:
4559 if (i.op[0].imms->X_add_number < 16)
4560 i.tm.opcode_modifier.size = SIZE16;
4561 break;
4562 }
4563 }
4564 else if (i.reg_operands == 3
4565 && i.op[0].regs == i.op[1].regs
4566 && !i.types[2].bitfield.xmmword
4567 && (i.tm.opcode_modifier.vex
4568 || ((!i.mask.reg || i.mask.zeroing)
4569 && is_evex_encoding (&i.tm)
4570 && (i.vec_encoding != vex_encoding_evex
4571 || cpu_arch_isa_flags.bitfield.cpuavx512vl
4572 || is_cpu (&i.tm, CpuAVX512VL)
4573 || (i.tm.operand_types[2].bitfield.zmmword
4574 && i.types[2].bitfield.ymmword))))
4575 && i.tm.opcode_space == SPACE_0F
4576 && ((i.tm.base_opcode | 2) == 0x57
4577 || i.tm.base_opcode == 0xdf
4578 || i.tm.base_opcode == 0xef
4579 || (i.tm.base_opcode | 3) == 0xfb
4580 || i.tm.base_opcode == 0x42
4581 || i.tm.base_opcode == 0x47))
4582 {
4583 /* Optimize: -O1:
4584 VOP, one of vandnps, vandnpd, vxorps, vxorpd, vpsubb, vpsubd,
4585 vpsubq and vpsubw:
4586 EVEX VOP %zmmM, %zmmM, %zmmN
4587 -> VEX VOP %xmmM, %xmmM, %xmmN (M and N < 16)
4588 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4589 EVEX VOP %ymmM, %ymmM, %ymmN
4590 -> VEX VOP %xmmM, %xmmM, %xmmN (M and N < 16)
4591 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4592 VEX VOP %ymmM, %ymmM, %ymmN
4593 -> VEX VOP %xmmM, %xmmM, %xmmN
4594 VOP, one of vpandn and vpxor:
4595 VEX VOP %ymmM, %ymmM, %ymmN
4596 -> VEX VOP %xmmM, %xmmM, %xmmN
4597 VOP, one of vpandnd and vpandnq:
4598 EVEX VOP %zmmM, %zmmM, %zmmN
4599 -> VEX vpandn %xmmM, %xmmM, %xmmN (M and N < 16)
4600 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4601 EVEX VOP %ymmM, %ymmM, %ymmN
4602 -> VEX vpandn %xmmM, %xmmM, %xmmN (M and N < 16)
4603 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4604 VOP, one of vpxord and vpxorq:
4605 EVEX VOP %zmmM, %zmmM, %zmmN
4606 -> VEX vpxor %xmmM, %xmmM, %xmmN (M and N < 16)
4607 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4608 EVEX VOP %ymmM, %ymmM, %ymmN
4609 -> VEX vpxor %xmmM, %xmmM, %xmmN (M and N < 16)
4610 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4611 VOP, one of kxord and kxorq:
4612 VEX VOP %kM, %kM, %kN
4613 -> VEX kxorw %kM, %kM, %kN
4614 VOP, one of kandnd and kandnq:
4615 VEX VOP %kM, %kM, %kN
4616 -> VEX kandnw %kM, %kM, %kN
4617 */
4618 if (is_evex_encoding (&i.tm))
4619 {
4620 if (i.vec_encoding != vex_encoding_evex)
4621 {
4622 i.tm.opcode_modifier.vex = VEX128;
4623 i.tm.opcode_modifier.vexw = VEXW0;
4624 i.tm.opcode_modifier.evex = 0;
4625 i.vec_encoding = vex_encoding_vex;
4626 i.mask.reg = NULL;
4627 }
4628 else if (optimize > 1)
4629 i.tm.opcode_modifier.evex = EVEX128;
4630 else
4631 return;
4632 }
4633 else if (i.tm.operand_types[0].bitfield.class == RegMask)
4634 {
4635 i.tm.opcode_modifier.opcodeprefix = PREFIX_NONE;
4636 i.tm.opcode_modifier.vexw = VEXW0;
4637 }
4638 else
4639 i.tm.opcode_modifier.vex = VEX128;
4640
4641 if (i.tm.opcode_modifier.vex)
4642 for (j = 0; j < 3; j++)
4643 {
4644 i.types[j].bitfield.xmmword = 1;
4645 i.types[j].bitfield.ymmword = 0;
4646 }
4647 }
4648 else if (i.vec_encoding != vex_encoding_evex
4649 && !i.types[0].bitfield.zmmword
4650 && !i.types[1].bitfield.zmmword
4651 && !i.mask.reg
4652 && !i.broadcast.type
4653 && !i.broadcast.bytes
4654 && is_evex_encoding (&i.tm)
4655 && ((i.tm.base_opcode & ~Opcode_SIMD_IntD) == 0x6f
4656 || (i.tm.base_opcode & ~4) == 0xdb
4657 || (i.tm.base_opcode & ~4) == 0xeb)
4658 && i.tm.extension_opcode == None)
4659 {
4660 /* Optimize: -O1:
4661 VOP, one of vmovdqa32, vmovdqa64, vmovdqu8, vmovdqu16,
4662 vmovdqu32 and vmovdqu64:
4663 EVEX VOP %xmmM, %xmmN
4664 -> VEX vmovdqa|vmovdqu %xmmM, %xmmN (M and N < 16)
4665 EVEX VOP %ymmM, %ymmN
4666 -> VEX vmovdqa|vmovdqu %ymmM, %ymmN (M and N < 16)
4667 EVEX VOP %xmmM, mem
4668 -> VEX vmovdqa|vmovdqu %xmmM, mem (M < 16)
4669 EVEX VOP %ymmM, mem
4670 -> VEX vmovdqa|vmovdqu %ymmM, mem (M < 16)
4671 EVEX VOP mem, %xmmN
4672 -> VEX vmovdqa|vmovdqu mem, %xmmN (N < 16)
4673 EVEX VOP mem, %ymmN
4674 -> VEX vmovdqa|vmovdqu mem, %ymmN (N < 16)
4675 VOP, one of vpand, vpandn, vpor, vpxor:
4676 EVEX VOP{d,q} %xmmL, %xmmM, %xmmN
4677 -> VEX VOP %xmmL, %xmmM, %xmmN (L, M, and N < 16)
4678 EVEX VOP{d,q} %ymmL, %ymmM, %ymmN
4679 -> VEX VOP %ymmL, %ymmM, %ymmN (L, M, and N < 16)
4680 EVEX VOP{d,q} mem, %xmmM, %xmmN
4681 -> VEX VOP mem, %xmmM, %xmmN (M and N < 16)
4682 EVEX VOP{d,q} mem, %ymmM, %ymmN
4683 -> VEX VOP mem, %ymmM, %ymmN (M and N < 16)
4684 */
4685 for (j = 0; j < i.operands; j++)
4686 if (operand_type_check (i.types[j], disp)
4687 && i.op[j].disps->X_op == O_constant)
4688 {
4689 /* Since the VEX prefix is 2 or 3 bytes while the EVEX prefix
4690 is 4 bytes, and EVEX Disp8 is 1 byte while VEX Disp32 is 4
4691 bytes, we choose EVEX Disp8 over VEX Disp32. */
4692 int evex_disp8, vex_disp8;
4693 unsigned int memshift = i.memshift;
4694 offsetT n = i.op[j].disps->X_add_number;
4695
4696 evex_disp8 = fits_in_disp8 (n);
4697 i.memshift = 0;
4698 vex_disp8 = fits_in_disp8 (n);
4699 if (evex_disp8 != vex_disp8)
4700 {
4701 i.memshift = memshift;
4702 return;
4703 }
4704
4705 i.types[j].bitfield.disp8 = vex_disp8;
4706 break;
4707 }
4708 if ((i.tm.base_opcode & ~Opcode_SIMD_IntD) == 0x6f
4709 && i.tm.opcode_modifier.opcodeprefix == PREFIX_0XF2)
4710 i.tm.opcode_modifier.opcodeprefix = PREFIX_0XF3;
4711 i.tm.opcode_modifier.vex
4712 = i.types[0].bitfield.ymmword ? VEX256 : VEX128;
4713 i.tm.opcode_modifier.vexw = VEXW0;
4714 /* VPAND, VPOR, and VPXOR are commutative. */
4715 if (i.reg_operands == 3 && i.tm.base_opcode != 0xdf)
4716 i.tm.opcode_modifier.commutative = 1;
4717 i.tm.opcode_modifier.evex = 0;
4718 i.tm.opcode_modifier.masking = 0;
4719 i.tm.opcode_modifier.broadcast = 0;
4720 i.tm.opcode_modifier.disp8memshift = 0;
4721 i.memshift = 0;
4722 if (j < i.operands)
4723 i.types[j].bitfield.disp8
4724 = fits_in_disp8 (i.op[j].disps->X_add_number);
4725 }
4726 else if (optimize_for_space
4727 && i.tm.base_opcode == 0x29
4728 && i.tm.opcode_space == SPACE_0F38
4729 && i.operands == i.reg_operands
4730 && i.op[0].regs == i.op[1].regs
4731 && (!i.tm.opcode_modifier.vex
4732 || !(i.op[0].regs->reg_flags & RegRex))
4733 && !is_evex_encoding (&i.tm))
4734 {
4735 /* Optimize: -Os:
4736 pcmpeqq %xmmN, %xmmN -> pcmpeqd %xmmN, %xmmN
4737 vpcmpeqq %xmmN, %xmmN, %xmmM -> vpcmpeqd %xmmN, %xmmN, %xmmM (N < 8)
4738 vpcmpeqq %ymmN, %ymmN, %ymmM -> vpcmpeqd %ymmN, %ymmN, %ymmM (N < 8)
4739 */
4740 i.tm.opcode_space = SPACE_0F;
4741 i.tm.base_opcode = 0x76;
4742 }
4743 else if (((i.tm.base_opcode >= 0x64
4744 && i.tm.base_opcode <= 0x66
4745 && i.tm.opcode_space == SPACE_0F)
4746 || (i.tm.base_opcode == 0x37
4747 && i.tm.opcode_space == SPACE_0F38))
4748 && i.operands == i.reg_operands
4749 && i.op[0].regs == i.op[1].regs
4750 && !is_evex_encoding (&i.tm))
4751 {
4752 /* Optimize: -O:
4753 pcmpgt[bwd] %mmN, %mmN -> pxor %mmN, %mmN
4754 pcmpgt[bwdq] %xmmN, %xmmN -> pxor %xmmN, %xmmN
4755 vpcmpgt[bwdq] %xmmN, %xmmN, %xmmM -> vpxor %xmmN, %xmmN, %xmmM (N < 8)
4756 vpcmpgt[bwdq] %xmmN, %xmmN, %xmmM -> vpxor %xmm0, %xmm0, %xmmM (N > 7)
4757 vpcmpgt[bwdq] %ymmN, %ymmN, %ymmM -> vpxor %ymmN, %ymmN, %ymmM (N < 8)
4758 vpcmpgt[bwdq] %ymmN, %ymmN, %ymmM -> vpxor %ymm0, %ymm0, %ymmM (N > 7)
4759 */
4760 i.tm.opcode_space = SPACE_0F;
4761 i.tm.base_opcode = 0xef;
4762 if (i.tm.opcode_modifier.vex && (i.op[0].regs->reg_flags & RegRex))
4763 {
4764 if (i.operands == 2)
4765 {
4766 gas_assert (i.tm.opcode_modifier.sse2avx);
4767
4768 i.operands = 3;
4769 i.reg_operands = 3;
4770 i.tm.operands = 3;
4771
4772 i.op[2].regs = i.op[0].regs;
4773 i.types[2] = i.types[0];
4774 i.flags[2] = i.flags[0];
4775 i.tm.operand_types[2] = i.tm.operand_types[0];
4776
4777 i.tm.opcode_modifier.sse2avx = 0;
4778 }
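/* Rewind both sources to register 0 (%xmm0/%ymm0): XORing any
   register with itself yields zero, and a low register avoids the
   REX bits which would force the 3-byte VEX form. */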
4779 i.op[0].regs -= i.op[0].regs->reg_num + 8;
4780 i.op[1].regs = i.op[0].regs;
4781 }
4782 }
4783 else if (optimize_for_space
4784 && i.tm.base_opcode == 0x59
4785 && i.tm.opcode_space == SPACE_0F38
4786 && i.operands == i.reg_operands
4787 && i.tm.opcode_modifier.vex
4788 && !(i.op[0].regs->reg_flags & RegRex)
4789 && i.op[0].regs->reg_type.bitfield.xmmword
4790 && i.vec_encoding != vex_encoding_vex3)
4791 {
4792 /* Optimize: -Os:
4793 vpbroadcastq %xmmN, %xmmM -> vpunpcklqdq %xmmN, %xmmN, %xmmM (N < 8)
4794 */
4795 i.tm.opcode_space = SPACE_0F;
4796 i.tm.base_opcode = 0x6c;
4797 i.tm.opcode_modifier.vexvvvv = 1;
4798
4799 ++i.operands;
4800 ++i.reg_operands;
4801 ++i.tm.operands;
4802
4803 i.op[2].regs = i.op[0].regs;
4804 i.types[2] = i.types[0];
4805 i.flags[2] = i.flags[0];
4806 i.tm.operand_types[2] = i.tm.operand_types[0];
4807
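/* Operands are now %xmmN, %xmmM, %xmmN; swap the last two so the
   duplicated source lands in the middle (VEX.vvvv) slot, giving
   vpunpcklqdq %xmmN, %xmmN, %xmmM. */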
4808 swap_2_operands (1, 2);
4809 }
4810 }
4811
4812 /* Return non-zero for load instruction. */
4813
4814 static int
4815 load_insn_p (void)
4816 {
4817 unsigned int dest;
4818 int any_vex_p = is_any_vex_encoding (&i.tm);
4819 unsigned int base_opcode = i.tm.base_opcode | 1;
4820
4821 if (!any_vex_p)
4822 {
4823 /* Anysize insns: lea, invlpg, clflush, prefetch*, bndmk, bndcl, bndcu,
4824 bndcn, bndstx, bndldx, clflushopt, clwb, cldemote. */
4825 if (i.tm.opcode_modifier.operandconstraint == ANY_SIZE)
4826 return 0;
4827
4828 /* pop. */
4829 if (i.tm.mnem_off == MN_pop)
4830 return 1;
4831 }
4832
4833 if (i.tm.opcode_space == SPACE_BASE)
4834 {
4835 /* popf, popa. */
4836 if (i.tm.base_opcode == 0x9d
4837 || i.tm.base_opcode == 0x61)
4838 return 1;
4839
4840 /* movs, cmps, lods, scas. */
4841 if ((i.tm.base_opcode | 0xb) == 0xaf)
4842 return 1;
4843
4844 /* outs, xlatb. */
4845 if (base_opcode == 0x6f
4846 || i.tm.base_opcode == 0xd7)
4847 return 1;
4848 /* NB: AMD-specific insns with implicit memory operands are
4849 intentionally not covered. */
4850 }
4851
4852 /* No memory operand. */
4853 if (!i.mem_operands)
4854 return 0;
4855
4856 if (any_vex_p)
4857 {
4858 if (i.tm.mnem_off == MN_vldmxcsr)
4859 return 1;
4860 }
4861 else if (i.tm.opcode_space == SPACE_BASE)
4862 {
4863 /* test, not, neg, mul, imul, div, idiv. */
4864 if (base_opcode == 0xf7 && i.tm.extension_opcode != 1)
4865 return 1;
4866
4867 /* inc, dec. */
4868 if (base_opcode == 0xff && i.tm.extension_opcode <= 1)
4869 return 1;
4870
4871 /* add, or, adc, sbb, and, sub, xor, cmp. */
4872 if (i.tm.base_opcode >= 0x80 && i.tm.base_opcode <= 0x83)
4873 return 1;
4874
4875 /* rol, ror, rcl, rcr, shl/sal, shr, sar. */
4876 if ((base_opcode == 0xc1 || (base_opcode | 2) == 0xd3)
4877 && i.tm.extension_opcode != 6)
4878 return 1;
4879
4880 /* Check for x87 instructions. */
4881 if ((base_opcode | 6) == 0xdf)
4882 {
4883 /* Skip fst, fstp, fstenv, fstcw. */
4884 if (i.tm.base_opcode == 0xd9
4885 && (i.tm.extension_opcode == 2
4886 || i.tm.extension_opcode == 3
4887 || i.tm.extension_opcode == 6
4888 || i.tm.extension_opcode == 7))
4889 return 0;
4890
4891 /* Skip fisttp, fist, fistp, fstp. */
4892 if (i.tm.base_opcode == 0xdb
4893 && (i.tm.extension_opcode == 1
4894 || i.tm.extension_opcode == 2
4895 || i.tm.extension_opcode == 3
4896 || i.tm.extension_opcode == 7))
4897 return 0;
4898
4899 /* Skip fisttp, fst, fstp, fsave, fstsw. */
4900 if (i.tm.base_opcode == 0xdd
4901 && (i.tm.extension_opcode == 1
4902 || i.tm.extension_opcode == 2
4903 || i.tm.extension_opcode == 3
4904 || i.tm.extension_opcode == 6
4905 || i.tm.extension_opcode == 7))
4906 return 0;
4907
4908 /* Skip fisttp, fist, fistp, fbstp, fistp. */
4909 if (i.tm.base_opcode == 0xdf
4910 && (i.tm.extension_opcode == 1
4911 || i.tm.extension_opcode == 2
4912 || i.tm.extension_opcode == 3
4913 || i.tm.extension_opcode == 6
4914 || i.tm.extension_opcode == 7))
4915 return 0;
4916
4917 return 1;
4918 }
4919 }
4920 else if (i.tm.opcode_space == SPACE_0F)
4921 {
4922 /* bt, bts, btr, btc. */
4923 if (i.tm.base_opcode == 0xba
4924 && (i.tm.extension_opcode | 3) == 7)
4925 return 1;
4926
4927 /* cmpxchg8b, cmpxchg16b, xrstors, vmptrld. */
4928 if (i.tm.base_opcode == 0xc7
4929 && i.tm.opcode_modifier.opcodeprefix == PREFIX_NONE
4930 && (i.tm.extension_opcode == 1 || i.tm.extension_opcode == 3
4931 || i.tm.extension_opcode == 6))
4932 return 1;
4933
4934 /* fxrstor, ldmxcsr, xrstor. */
4935 if (i.tm.base_opcode == 0xae
4936 && (i.tm.extension_opcode == 1
4937 || i.tm.extension_opcode == 2
4938 || i.tm.extension_opcode == 5))
4939 return 1;
4940
4941 /* lgdt, lidt, lmsw. */
4942 if (i.tm.base_opcode == 0x01
4943 && (i.tm.extension_opcode == 2
4944 || i.tm.extension_opcode == 3
4945 || i.tm.extension_opcode == 6))
4946 return 1;
4947 }
4948
4949 dest = i.operands - 1;
4950
4951 /* Check fake imm8 operand and 3 source operands. */
4952 if ((i.tm.opcode_modifier.immext
4953 || i.reg_operands + i.mem_operands == 4)
4954 && i.types[dest].bitfield.imm8)
4955 dest--;
4956
4957 /* add, or, adc, sbb, and, sub, xor, cmp, test, xchg. */
4958 if (i.tm.opcode_space == SPACE_BASE
4959 && ((base_opcode | 0x38) == 0x39
4960 || (base_opcode | 2) == 0x87))
4961 return 1;
4962
4963 if (i.tm.mnem_off == MN_xadd)
4964 return 1;
4965
4966 /* Check for load instruction. */
4967 return (i.types[dest].bitfield.class != ClassNone
4968 || i.types[dest].bitfield.instance == Accum);
4969 }
4970
4971 /* Output lfence (0x0f 0xae 0xe8) after the instruction. */
4972
4973 static void
4974 insert_lfence_after (void)
4975 {
4976 if (lfence_after_load && load_insn_p ())
4977 {
4978 /* There are also two REP string instructions that require
4979 special treatment. Specifically, the compare string (CMPS)
4980 and scan string (SCAS) instructions set EFLAGS in a manner
4981 that depends on the data being compared/scanned. When used
4982 with a REP prefix, the number of iterations may therefore
4983 vary depending on this data. If the data is a program secret
4984 chosen by the adversary using an LVI method,
4985 then this data-dependent behavior may leak some aspect
4986 of the secret. */
4987 if (((i.tm.base_opcode | 0x9) == 0xaf)
4988 && i.prefix[REP_PREFIX])
4989 {
4990 as_warn (_("`%s` changes flags which would affect control flow behavior"),
4991 insn_name (&i.tm));
4992 }
4993 char *p = frag_more (3);
4994 *p++ = 0xf;
4995 *p++ = 0xae;
4996 *p = 0xe8;
4997 }
4998 }
4999
5000 /* Output lfence (0x0f 0xae 0xe8) before the instruction. */
5001
5002 static void
5003 insert_lfence_before (void)
5004 {
5005 char *p;
5006
5007 if (i.tm.opcode_space != SPACE_BASE)
5008 return;
5009
5010 if (i.tm.base_opcode == 0xff
5011 && (i.tm.extension_opcode == 2 || i.tm.extension_opcode == 4))
5012 {
5013 /* Insert lfence before indirect branch if needed. */
5014
5015 if (lfence_before_indirect_branch == lfence_branch_none)
5016 return;
5017
5018 if (i.operands != 1)
5019 abort ();
5020
5021 if (i.reg_operands == 1)
5022 {
5023 /* Indirect branch via register. Don't insert lfence with
5024 -mlfence-after-load=yes. */
5025 if (lfence_after_load
5026 || lfence_before_indirect_branch == lfence_branch_memory)
5027 return;
5028 }
5029 else if (i.mem_operands == 1
5030 && lfence_before_indirect_branch != lfence_branch_register)
5031 {
5032 as_warn (_("indirect `%s` with memory operand should be avoided"),
5033 insn_name (&i.tm));
5034 return;
5035 }
5036 else
5037 return;
5038
5039 if (last_insn.kind != last_insn_other
5040 && last_insn.seg == now_seg)
5041 {
5042 as_warn_where (last_insn.file, last_insn.line,
5043 _("`%s` skips -mlfence-before-indirect-branch on `%s`"),
5044 last_insn.name, insn_name (&i.tm));
5045 return;
5046 }
5047
5048 p = frag_more (3);
5049 *p++ = 0xf;
5050 *p++ = 0xae;
5051 *p = 0xe8;
5052 return;
5053 }
5054
5055 /* Output or/not/shl and lfence before near ret. */
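/* Each inserted sequence is a value-preserving read-modify-write of
   the return address at the top of the stack (orl $0, two nots, or
   shll $0), so that the value consumed by ret has passed through a
   load the trailing lfence can fence. */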
5056 if (lfence_before_ret != lfence_before_ret_none
5057 && (i.tm.base_opcode | 1) == 0xc3)
5058 {
5059 if (last_insn.kind != last_insn_other
5060 && last_insn.seg == now_seg)
5061 {
5062 as_warn_where (last_insn.file, last_insn.line,
5063 _("`%s` skips -mlfence-before-ret on `%s`"),
5064 last_insn.name, insn_name (&i.tm));
5065 return;
5066 }
5067
5068 /* A near ret ignores the operand size override in 64-bit mode. */
5069 char prefix = flag_code == CODE_64BIT
5070 ? 0x48
5071 : i.prefix[DATA_PREFIX] ? 0x66 : 0x0;
5072
5073 if (lfence_before_ret == lfence_before_ret_not)
5074 {
5075 /* not: 0xf71424, may add prefix
5076 for operand size override or 64-bit code. */
5077 p = frag_more ((prefix ? 2 : 0) + 6 + 3);
5078 if (prefix)
5079 *p++ = prefix;
5080 *p++ = 0xf7;
5081 *p++ = 0x14;
5082 *p++ = 0x24;
5083 if (prefix)
5084 *p++ = prefix;
5085 *p++ = 0xf7;
5086 *p++ = 0x14;
5087 *p++ = 0x24;
5088 }
5089 else
5090 {
5091 p = frag_more ((prefix ? 1 : 0) + 4 + 3);
5092 if (prefix)
5093 *p++ = prefix;
5094 if (lfence_before_ret == lfence_before_ret_or)
5095 {
5096 /* or: 0x830c2400, may add prefix
5097 for operand size override or 64-bit code. */
5098 *p++ = 0x83;
5099 *p++ = 0x0c;
5100 }
5101 else
5102 {
5103 /* shl: 0xc1242400, may add prefix
5104 for operand size override or 64-bit code. */
5105 *p++ = 0xc1;
5106 *p++ = 0x24;
5107 }
5108
5109 *p++ = 0x24;
5110 *p++ = 0x0;
5111 }
5112
5113 *p++ = 0xf;
5114 *p++ = 0xae;
5115 *p = 0xe8;
5116 }
5117 }
5118
5119 /* Shared helper for md_assemble() and s_insn(). */
5120 static void init_globals (void)
5121 {
5122 unsigned int j;
5123
5124 memset (&i, '\0', sizeof (i));
5125 i.rounding.type = rc_none;
5126 for (j = 0; j < MAX_OPERANDS; j++)
5127 i.reloc[j] = NO_RELOC;
5128 memset (disp_expressions, '\0', sizeof (disp_expressions));
5129 memset (im_expressions, '\0', sizeof (im_expressions));
5130 save_stack_p = save_stack;
5131 }
5132
5133 /* Helper for md_assemble() to decide whether to prepare for a possible 2nd
5134 parsing pass. Instead of introducing a rarely used new insn attribute, this
5135 utilizes a common pattern between affected templates. It is deemed
5136 acceptable that this will lead to unnecessary pass 2 preparations in a
5137 limited set of cases. */
5138 static INLINE bool may_need_pass2 (const insn_template *t)
5139 {
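/* The pattern covers SSE2AVX templates with a SIMD register as last
   operand, the movsx forms 0F BE/BF, and base opcode 0x63 (arpl or
   movslq, depending on mode). */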
5140 return t->opcode_modifier.sse2avx
5141 /* Note that all SSE2AVX templates have at least one operand. */
5142 ? t->operand_types[t->operands - 1].bitfield.class == RegSIMD
5143 : (t->opcode_space == SPACE_0F
5144 && (t->base_opcode | 1) == 0xbf)
5145 || (t->opcode_space == SPACE_BASE
5146 && t->base_opcode == 0x63);
5147 }
5148
5149 /* This is the guts of the machine-dependent assembler. LINE points to a
5150 machine dependent instruction. This function is supposed to emit
5151 the frags/bytes it assembles to. */
5152
5153 void
5154 md_assemble (char *line)
5155 {
5156 unsigned int j;
5157 char mnemonic[MAX_MNEM_SIZE], mnem_suffix = 0, *copy = NULL;
5158 const char *end, *pass1_mnem = NULL;
5159 enum i386_error pass1_err = 0;
5160 const insn_template *t;
5161
5162 /* Initialize globals. */
5163 current_templates = NULL;
5164 retry:
5165 init_globals ();
5166
5167 /* First parse an instruction mnemonic & call i386_operand for the operands.
5168 We assume that the scrubber has arranged it so that line[0] is the valid
5169 start of a (possibly prefixed) mnemonic. */
5170
5171 end = parse_insn (line, mnemonic, false);
5172 if (end == NULL)
5173 {
5174 if (pass1_mnem != NULL)
5175 goto match_error;
5176 if (i.error != no_error)
5177 {
5178 gas_assert (current_templates != NULL);
5179 if (may_need_pass2 (current_templates->start) && !i.suffix)
5180 goto no_match;
5181 /* No point in trying a 2nd pass - it'll only find the same suffix
5182 again. */
5183 mnem_suffix = i.suffix;
5184 goto match_error;
5185 }
5186 return;
5187 }
5188 t = current_templates->start;
5189 if (may_need_pass2 (t))
5190 {
5191 /* Make a copy of the full line in case we need to retry. */
5192 copy = xstrdup (line);
5193 }
5194 line += end - line;
5195 mnem_suffix = i.suffix;
5196
5197 line = parse_operands (line, mnemonic);
5198 this_operand = -1;
5199 if (line == NULL)
5200 {
5201 free (copy);
5202 return;
5203 }
5204
5205 /* Now we've parsed the mnemonic into a set of templates, and have the
5206 operands at hand. */
5207
5208 /* All Intel opcodes have reversed operands except for "bound", "enter",
5209 "invlpg*", "monitor*", "mwait*", "tpause", "umwait", "pvalidate",
5210 "rmpadjust", "rmpupdate", and "rmpquery". We also don't reverse
5211 intersegment "jmp" and "call" instructions with 2 immediate operands so
5212 that the immediate segment precedes the offset consistently in Intel and
5213 AT&T modes. */
5214 if (intel_syntax
5215 && i.operands > 1
5216 && (t->mnem_off != MN_bound)
5217 && !startswith (mnemonic, "invlpg")
5218 && !startswith (mnemonic, "monitor")
5219 && !startswith (mnemonic, "mwait")
5220 && (t->mnem_off != MN_pvalidate)
5221 && !startswith (mnemonic, "rmp")
5222 && (t->mnem_off != MN_tpause)
5223 && (t->mnem_off != MN_umwait)
5224 && !(i.operands == 2
5225 && operand_type_check (i.types[0], imm)
5226 && operand_type_check (i.types[1], imm)))
5227 swap_operands ();
5228
5229 /* The order of the immediates should be reversed
5230 for 2 immediates extrq and insertq instructions */
5231 if (i.imm_operands == 2
5232 && (t->mnem_off == MN_extrq || t->mnem_off == MN_insertq))
5233 swap_2_operands (0, 1);
5234
5235 if (i.imm_operands)
5236 optimize_imm ();
5237
5238 if (i.disp_operands && !optimize_disp (t))
5239 return;
5240
5241 /* Next, we find a template that matches the given insn,
5242 making sure the overlap of the given operands types is consistent
5243 with the template operand types. */
5244
5245 if (!(t = match_template (mnem_suffix)))
5246 {
5247 const char *err_msg;
5248
5249 if (copy && !mnem_suffix)
5250 {
5251 line = copy;
5252 copy = NULL;
5253 no_match:
5254 pass1_err = i.error;
5255 pass1_mnem = insn_name (current_templates->start);
5256 goto retry;
5257 }
5258
5259 /* If a non-/only-64bit template (group) was found in pass 1, and if
5260 _some_ template (group) was found in pass 2, squash pass 1's
5261 error. */
5262 if (pass1_err == unsupported_64bit)
5263 pass1_mnem = NULL;
5264
5265 match_error:
5266 free (copy);
5267
5268 switch (pass1_mnem ? pass1_err : i.error)
5269 {
5270 default:
5271 abort ();
5272 case operand_size_mismatch:
5273 err_msg = _("operand size mismatch");
5274 break;
5275 case operand_type_mismatch:
5276 err_msg = _("operand type mismatch");
5277 break;
5278 case register_type_mismatch:
5279 err_msg = _("register type mismatch");
5280 break;
5281 case number_of_operands_mismatch:
5282 err_msg = _("number of operands mismatch");
5283 break;
5284 case invalid_instruction_suffix:
5285 err_msg = _("invalid instruction suffix");
5286 break;
5287 case bad_imm4:
5288 err_msg = _("constant doesn't fit in 4 bits");
5289 break;
5290 case unsupported_with_intel_mnemonic:
5291 err_msg = _("unsupported with Intel mnemonic");
5292 break;
5293 case unsupported_syntax:
5294 err_msg = _("unsupported syntax");
5295 break;
5296 case unsupported:
5297 as_bad (_("unsupported instruction `%s'"),
5298 pass1_mnem ? pass1_mnem : insn_name (current_templates->start));
5299 return;
5300 case unsupported_on_arch:
5301 as_bad (_("`%s' is not supported on `%s%s'"),
5302 pass1_mnem ? pass1_mnem : insn_name (current_templates->start),
5303 cpu_arch_name ? cpu_arch_name : default_arch,
5304 cpu_sub_arch_name ? cpu_sub_arch_name : "");
5305 return;
5306 case unsupported_64bit:
5307 if (ISLOWER (mnem_suffix))
5308 {
5309 if (flag_code == CODE_64BIT)
5310 as_bad (_("`%s%c' is not supported in 64-bit mode"),
5311 pass1_mnem ? pass1_mnem : insn_name (current_templates->start),
5312 mnem_suffix);
5313 else
5314 as_bad (_("`%s%c' is only supported in 64-bit mode"),
5315 pass1_mnem ? pass1_mnem : insn_name (current_templates->start),
5316 mnem_suffix);
5317 }
5318 else
5319 {
5320 if (flag_code == CODE_64BIT)
5321 as_bad (_("`%s' is not supported in 64-bit mode"),
5322 pass1_mnem ? pass1_mnem : insn_name (current_templates->start));
5323 else
5324 as_bad (_("`%s' is only supported in 64-bit mode"),
5325 pass1_mnem ? pass1_mnem : insn_name (current_templates->start));
5326 }
5327 return;
5328 case invalid_sib_address:
5329 err_msg = _("invalid SIB address");
5330 break;
5331 case invalid_vsib_address:
5332 err_msg = _("invalid VSIB address");
5333 break;
5334 case invalid_vector_register_set:
5335 err_msg = _("mask, index, and destination registers must be distinct");
5336 break;
5337 case invalid_tmm_register_set:
5338 err_msg = _("all tmm registers must be distinct");
5339 break;
5340 case invalid_dest_and_src_register_set:
5341 err_msg = _("destination and source registers must be distinct");
5342 break;
5343 case unsupported_vector_index_register:
5344 err_msg = _("unsupported vector index register");
5345 break;
5346 case unsupported_broadcast:
5347 err_msg = _("unsupported broadcast");
5348 break;
5349 case broadcast_needed:
5350 err_msg = _("broadcast is needed for operand of such type");
5351 break;
5352 case unsupported_masking:
5353 err_msg = _("unsupported masking");
5354 break;
5355 case mask_not_on_destination:
5356 err_msg = _("mask not on destination operand");
5357 break;
5358 case no_default_mask:
5359 err_msg = _("default mask isn't allowed");
5360 break;
5361 case unsupported_rc_sae:
5362 err_msg = _("unsupported static rounding/sae");
5363 break;
5364 case invalid_register_operand:
5365 err_msg = _("invalid register operand");
5366 break;
5367 case internal_error:
5368 err_msg = _("internal error");
5369 break;
5370 }
5371 as_bad (_("%s for `%s'"), err_msg,
5372 pass1_mnem ? pass1_mnem : insn_name (current_templates->start));
5373 return;
5374 }
5375
5376 free (copy);
5377
5378 if (sse_check != check_none
5379 /* The opcode space check isn't strictly needed; it's there only to
5380 bypass the logic below when easily possible. */
5381 && t->opcode_space >= SPACE_0F
5382 && t->opcode_space <= SPACE_0F3A
5383 && !is_cpu (&i.tm, CpuSSE4a)
5384 && !is_any_vex_encoding (t))
5385 {
5386 bool simd = false;
5387
5388 for (j = 0; j < t->operands; ++j)
5389 {
5390 if (t->operand_types[j].bitfield.class == RegMMX)
5391 break;
5392 if (t->operand_types[j].bitfield.class == RegSIMD)
5393 simd = true;
5394 }
5395
5396 if (j >= t->operands && simd)
5397 (sse_check == check_warning
5398 ? as_warn
5399 : as_bad) (_("SSE instruction `%s' is used"), insn_name (&i.tm));
5400 }
5401
5402 if (i.tm.opcode_modifier.fwait)
5403 if (!add_prefix (FWAIT_OPCODE))
5404 return;
5405
5406 /* Check if REP prefix is OK. */
5407 if (i.rep_prefix && i.tm.opcode_modifier.prefixok != PrefixRep)
5408 {
5409 as_bad (_("invalid instruction `%s' after `%s'"),
5410 insn_name (&i.tm), i.rep_prefix);
5411 return;
5412 }
5413
5414 /* Check for lock without a lockable instruction. Destination operand
5415 must be memory unless it is xchg (0x86). */
5416 if (i.prefix[LOCK_PREFIX])
5417 {
5418 if (i.tm.opcode_modifier.prefixok < PrefixLock
5419 || i.mem_operands == 0
5420 || (i.tm.base_opcode != 0x86
5421 && !(i.flags[i.operands - 1] & Operand_Mem)))
5422 {
5423 as_bad (_("expecting lockable instruction after `lock'"));
5424 return;
5425 }
5426
5427 /* Zap the redundant prefix from XCHG when optimizing. */
5428 if (i.tm.base_opcode == 0x86 && optimize && !i.no_optimize)
5429 i.prefix[LOCK_PREFIX] = 0;
5430 }
5431
5432 if (is_any_vex_encoding (&i.tm)
5433 || i.tm.operand_types[i.imm_operands].bitfield.class >= RegMMX
5434 || i.tm.operand_types[i.imm_operands + 1].bitfield.class >= RegMMX)
5435 {
5436 /* Check for data size prefix on VEX/XOP/EVEX encoded and SIMD insns. */
5437 if (i.prefix[DATA_PREFIX])
5438 {
5439 as_bad (_("data size prefix invalid with `%s'"), insn_name (&i.tm));
5440 return;
5441 }
5442
5443 /* Don't allow e.g. KMOV in TLS code sequences. */
5444 for (j = i.imm_operands; j < i.operands; ++j)
5445 switch (i.reloc[j])
5446 {
5447 case BFD_RELOC_386_TLS_GOTIE:
5448 case BFD_RELOC_386_TLS_LE_32:
5449 case BFD_RELOC_X86_64_GOTTPOFF:
5450 case BFD_RELOC_X86_64_TLSLD:
5451 as_bad (_("TLS relocation cannot be used with `%s'"), insn_name (&i.tm));
5452 return;
5453 default:
5454 break;
5455 }
5456 }
5457
5458 /* Check if HLE prefix is OK. */
5459 if (i.hle_prefix && !check_hle ())
5460 return;
5461
5462 /* Check BND prefix. */
5463 if (i.bnd_prefix && !i.tm.opcode_modifier.bndprefixok)
5464 as_bad (_("expecting valid branch instruction after `bnd'"));
5465
5466 /* Check NOTRACK prefix. */
5467 if (i.notrack_prefix && i.tm.opcode_modifier.prefixok != PrefixNoTrack)
5468 as_bad (_("expecting indirect branch instruction after `notrack'"));
5469
5470 if (is_cpu (&i.tm, CpuMPX))
5471 {
5472 if (flag_code == CODE_64BIT && i.prefix[ADDR_PREFIX])
5473 as_bad (_("32-bit address isn't allowed in 64-bit MPX instructions."));
5474 else if (flag_code != CODE_16BIT
5475 ? i.prefix[ADDR_PREFIX]
5476 : i.mem_operands && !i.prefix[ADDR_PREFIX])
5477 as_bad (_("16-bit address isn't allowed in MPX instructions"));
5478 }
5479
5480 /* Insert BND prefix. */
5481 if (add_bnd_prefix && i.tm.opcode_modifier.bndprefixok)
5482 {
5483 if (!i.prefix[BND_PREFIX])
5484 add_prefix (BND_PREFIX_OPCODE);
5485 else if (i.prefix[BND_PREFIX] != BND_PREFIX_OPCODE)
5486 {
5487 as_warn (_("replacing `rep'/`repe' prefix by `bnd'"));
5488 i.prefix[BND_PREFIX] = BND_PREFIX_OPCODE;
5489 }
5490 }
5491
5492 /* Check string instruction segment overrides. */
5493 if (i.tm.opcode_modifier.isstring >= IS_STRING_ES_OP0)
5494 {
5495 gas_assert (i.mem_operands);
5496 if (!check_string ())
5497 return;
5498 i.disp_operands = 0;
5499 }
5500
5501 /* The (%dx) memory operand should only be used with input/output
5502 instructions (base opcodes: 0x6c, 0x6e, 0xec, 0xee). */
5503 if (i.input_output_operand
5504 && ((i.tm.base_opcode | 0x82) != 0xee
5505 || i.tm.opcode_space != SPACE_BASE))
5506 {
5507 as_bad (_("input/output port address isn't allowed with `%s'"),
5508 insn_name (&i.tm));
5509 return;
5510 }
5511
5512 if (optimize && !i.no_optimize && i.tm.opcode_modifier.optimize)
5513 optimize_encoding ();
5514
5515 /* Past optimization, there's no need to distinguish vex_encoding_evex
5516 from vex_encoding_evex512 anymore. */
5517 if (i.vec_encoding == vex_encoding_evex512)
5518 i.vec_encoding = vex_encoding_evex;
5519
5520 if (use_unaligned_vector_move)
5521 encode_with_unaligned_vector_move ();
5522
5523 if (!process_suffix ())
5524 return;
5525
5526 /* Check if IP-relative addressing requirements can be satisfied. */
5527 if (is_cpu (&i.tm, CpuPREFETCHI)
5528 && !(i.base_reg && i.base_reg->reg_num == RegIP))
5529 as_warn (_("'%s' only supports RIP-relative address"), insn_name (&i.tm));
5530
5531 /* Update operand types and check extended states. */
5532 for (j = 0; j < i.operands; j++)
5533 {
5534 i.types[j] = operand_type_and (i.types[j], i.tm.operand_types[j]);
5535 switch (i.tm.operand_types[j].bitfield.class)
5536 {
5537 default:
5538 break;
5539 case RegMMX:
5540 i.xstate |= xstate_mmx;
5541 break;
5542 case RegMask:
5543 i.xstate |= xstate_mask;
5544 break;
5545 case RegSIMD:
5546 if (i.tm.operand_types[j].bitfield.tmmword)
5547 i.xstate |= xstate_tmm;
5548 else if (i.tm.operand_types[j].bitfield.zmmword
5549 && !i.tm.opcode_modifier.vex
5550 && vector_size >= VSZ512)
5551 i.xstate |= xstate_zmm;
5552 else if (i.tm.operand_types[j].bitfield.ymmword
5553 && vector_size >= VSZ256)
5554 i.xstate |= xstate_ymm;
5555 else if (i.tm.operand_types[j].bitfield.xmmword)
5556 i.xstate |= xstate_xmm;
5557 break;
5558 }
5559 }
5560
5561 /* Make still unresolved immediate matches conform to size of immediate
5562 given in i.suffix. */
5563 if (!finalize_imm ())
5564 return;
5565
5566 if (i.types[0].bitfield.imm1)
5567 i.imm_operands = 0; /* kludge for shift insns. */
5568
5569 /* For insns with operands there are more diddles to do to the opcode. */
5570 if (i.operands)
5571 {
5572 if (!process_operands ())
5573 return;
5574 }
5575 else if (!quiet_warnings && i.tm.opcode_modifier.operandconstraint == UGH)
5576 {
5577 /* UnixWare's fsub with no args is an alias for fsubp; likewise fadd -> faddp, etc. */
5578 as_warn (_("translating to `%sp'"), insn_name (&i.tm));
5579 }
5580
5581 if (is_any_vex_encoding (&i.tm))
5582 {
5583 if (!cpu_arch_flags.bitfield.cpui286)
5584 {
5585 as_bad (_("instruction `%s' isn't supported outside of protected mode."),
5586 insn_name (&i.tm));
5587 return;
5588 }
5589
5590 /* Check for explicit REX prefix. */
5591 if (i.prefix[REX_PREFIX] || i.rex_encoding)
5592 {
5593 as_bad (_("REX prefix invalid with `%s'"), insn_name (&i.tm));
5594 return;
5595 }
5596
5597 if (i.tm.opcode_modifier.vex)
5598 build_vex_prefix (t);
5599 else
5600 build_evex_prefix ();
5601
5602 /* The individual REX.RXBW bits got consumed. */
5603 i.rex &= REX_OPCODE;
5604 }
5605
5606 /* Handle conversion of 'int $3' --> special int3 insn. */
5607 if (i.tm.mnem_off == MN_int
5608 && i.op[0].imms->X_add_number == 3)
5609 {
5610 i.tm.base_opcode = INT3_OPCODE;
5611 i.imm_operands = 0;
5612 }
5613
5614 if ((i.tm.opcode_modifier.jump == JUMP
5615 || i.tm.opcode_modifier.jump == JUMP_BYTE
5616 || i.tm.opcode_modifier.jump == JUMP_DWORD)
5617 && i.op[0].disps->X_op == O_constant)
5618 {
5619 /* Convert "jmp constant" (and "call constant") to a jump (call) to
5620 the absolute address given by the constant. Since ix86 jumps and
5621 calls are pc relative, we need to generate a reloc. */
5622 i.op[0].disps->X_add_symbol = &abs_symbol;
5623 i.op[0].disps->X_op = O_symbol;
5624 }
5625
5626 /* For 8 bit registers we need an empty rex prefix. Also if the
5627 instruction already has a prefix, we need to convert old
5628 registers to new ones. */
5629
5630 if ((i.types[0].bitfield.class == Reg && i.types[0].bitfield.byte
5631 && (i.op[0].regs->reg_flags & RegRex64) != 0)
5632 || (i.types[1].bitfield.class == Reg && i.types[1].bitfield.byte
5633 && (i.op[1].regs->reg_flags & RegRex64) != 0)
5634 || (((i.types[0].bitfield.class == Reg && i.types[0].bitfield.byte)
5635 || (i.types[1].bitfield.class == Reg && i.types[1].bitfield.byte))
5636 && i.rex != 0))
5637 {
5638 int x;
5639
5640 i.rex |= REX_OPCODE;
5641 for (x = 0; x < 2; x++)
5642 {
5643 /* Look for 8 bit operand that uses old registers. */
5644 if (i.types[x].bitfield.class == Reg && i.types[x].bitfield.byte
5645 && (i.op[x].regs->reg_flags & RegRex64) == 0)
5646 {
5647 gas_assert (!(i.op[x].regs->reg_flags & RegRex));
5648 /* In case it is "hi" register, give up. */
5649 if (i.op[x].regs->reg_num > 3)
5650 as_bad (_("can't encode register '%s%s' in an "
5651 "instruction requiring REX prefix."),
5652 register_prefix, i.op[x].regs->reg_name);
5653
5654 /* Otherwise it is equivalent to the extended register.
5655 Since the encoding doesn't change this is merely
5656 cosmetic cleanup for debug output. */
5657
5658 i.op[x].regs = i.op[x].regs + 8;
5659 }
5660 }
5661 }
5662
5663 if (i.rex == 0 && i.rex_encoding)
5664 {
5665 /* Check if we can add a REX_OPCODE byte. Look for 8 bit operand
5666 that uses legacy register. If it is "hi" register, don't add
5667 the REX_OPCODE byte. */
5668 int x;
5669 for (x = 0; x < 2; x++)
5670 if (i.types[x].bitfield.class == Reg
5671 && i.types[x].bitfield.byte
5672 && (i.op[x].regs->reg_flags & RegRex64) == 0
5673 && i.op[x].regs->reg_num > 3)
5674 {
5675 gas_assert (!(i.op[x].regs->reg_flags & RegRex));
5676 i.rex_encoding = false;
5677 break;
5678 }
5679
5680 if (i.rex_encoding)
5681 i.rex = REX_OPCODE;
5682 }
5683
5684 if (i.rex != 0)
5685 add_prefix (REX_OPCODE | i.rex);
5686
5687 insert_lfence_before ();
5688
5689 /* We are ready to output the insn. */
5690 output_insn ();
5691
5692 insert_lfence_after ();
5693
5694 last_insn.seg = now_seg;
5695
5696 if (i.tm.opcode_modifier.isprefix)
5697 {
5698 last_insn.kind = last_insn_prefix;
5699 last_insn.name = insn_name (&i.tm);
5700 last_insn.file = as_where (&last_insn.line);
5701 }
5702 else
5703 last_insn.kind = last_insn_other;
5704 }
5705
5706 /* The Q suffix is generally valid only in 64-bit mode, with very few
5707 exceptions: fild, fistp, fisttp, and cmpxchg8b. Note that for fild
5708 and fisttp only one of their two templates is matched below: That's
5709 sufficient since other relevant attributes are the same between both
5710 respective templates. */
5711 static INLINE bool q_suffix_allowed(const insn_template *t)
5712 {
5713 return flag_code == CODE_64BIT
5714 || (t->opcode_space == SPACE_BASE
5715 && t->base_opcode == 0xdf
5716 && (t->extension_opcode & 1)) /* fild / fistp / fisttp */
5717 || t->mnem_off == MN_cmpxchg8b;
5718 }
5719
5720 static const char *
5721 parse_insn (const char *line, char *mnemonic, bool prefix_only)
5722 {
5723 const char *l = line, *token_start = l;
5724 char *mnem_p;
5725 bool pass1 = !current_templates;
5726 int supported;
5727 const insn_template *t;
5728 char *dot_p = NULL;
5729
5730 while (1)
5731 {
5732 mnem_p = mnemonic;
5733 /* Pseudo-prefixes start with an opening figure brace. */
5734 if ((*mnem_p = *l) == '{')
5735 {
5736 ++mnem_p;
5737 ++l;
5738 }
5739 while ((*mnem_p = mnemonic_chars[(unsigned char) *l]) != 0)
5740 {
5741 if (*mnem_p == '.')
5742 dot_p = mnem_p;
5743 mnem_p++;
5744 if (mnem_p >= mnemonic + MAX_MNEM_SIZE)
5745 {
5746 too_long:
5747 as_bad (_("no such instruction: `%s'"), token_start);
5748 return NULL;
5749 }
5750 l++;
5751 }
5752 /* Pseudo-prefixes end with a closing figure brace. */
5753 if (*mnemonic == '{' && *l == '}')
5754 {
5755 *mnem_p++ = *l++;
5756 if (mnem_p >= mnemonic + MAX_MNEM_SIZE)
5757 goto too_long;
5758 *mnem_p = '\0';
5759
5760 /* Point l at the closing brace if there's no other separator. */
5761 if (*l != END_OF_INSN && !is_space_char (*l)
5762 && *l != PREFIX_SEPARATOR)
5763 --l;
5764 }
5765 else if (!is_space_char (*l)
5766 && *l != END_OF_INSN
5767 && (intel_syntax
5768 || (*l != PREFIX_SEPARATOR && *l != ',')))
5769 {
5770 if (prefix_only)
5771 break;
5772 as_bad (_("invalid character %s in mnemonic"),
5773 output_invalid (*l));
5774 return NULL;
5775 }
5776 if (token_start == l)
5777 {
5778 if (!intel_syntax && *l == PREFIX_SEPARATOR)
5779 as_bad (_("expecting prefix; got nothing"));
5780 else
5781 as_bad (_("expecting mnemonic; got nothing"));
5782 return NULL;
5783 }
5784
5785 /* Look up instruction (or prefix) via hash table. */
5786 current_templates = (const templates *) str_hash_find (op_hash, mnemonic);
5787
5788 if (*l != END_OF_INSN
5789 && (!is_space_char (*l) || l[1] != END_OF_INSN)
5790 && current_templates
5791 && current_templates->start->opcode_modifier.isprefix)
5792 {
5793 if (!cpu_flags_check_cpu64 (current_templates->start))
5794 {
5795 as_bad ((flag_code != CODE_64BIT
5796 ? _("`%s' is only supported in 64-bit mode")
5797 : _("`%s' is not supported in 64-bit mode")),
5798 insn_name (current_templates->start));
5799 return NULL;
5800 }
5801 /* If we are in 16-bit mode, do not allow addr16 or data16.
5802 Similarly, in 32-bit mode, do not allow addr32 or data32. */
5803 if ((current_templates->start->opcode_modifier.size == SIZE16
5804 || current_templates->start->opcode_modifier.size == SIZE32)
5805 && flag_code != CODE_64BIT
5806 && ((current_templates->start->opcode_modifier.size == SIZE32)
5807 ^ (flag_code == CODE_16BIT)))
5808 {
5809 as_bad (_("redundant %s prefix"),
5810 insn_name (current_templates->start));
5811 return NULL;
5812 }
5813
5814 if (current_templates->start->base_opcode == PSEUDO_PREFIX)
5815 {
5816 /* Handle pseudo prefixes. */
5817 switch (current_templates->start->extension_opcode)
5818 {
5819 case Prefix_Disp8:
5820 /* {disp8} */
5821 i.disp_encoding = disp_encoding_8bit;
5822 break;
5823 case Prefix_Disp16:
5824 /* {disp16} */
5825 i.disp_encoding = disp_encoding_16bit;
5826 break;
5827 case Prefix_Disp32:
5828 /* {disp32} */
5829 i.disp_encoding = disp_encoding_32bit;
5830 break;
5831 case Prefix_Load:
5832 /* {load} */
5833 i.dir_encoding = dir_encoding_load;
5834 break;
5835 case Prefix_Store:
5836 /* {store} */
5837 i.dir_encoding = dir_encoding_store;
5838 break;
5839 case Prefix_VEX:
5840 /* {vex} */
5841 i.vec_encoding = vex_encoding_vex;
5842 break;
5843 case Prefix_VEX3:
5844 /* {vex3} */
5845 i.vec_encoding = vex_encoding_vex3;
5846 break;
5847 case Prefix_EVEX:
5848 /* {evex} */
5849 i.vec_encoding = vex_encoding_evex;
5850 break;
5851 case Prefix_REX:
5852 /* {rex} */
5853 i.rex_encoding = true;
5854 break;
5855 case Prefix_NoOptimize:
5856 /* {nooptimize} */
5857 i.no_optimize = true;
5858 break;
5859 default:
5860 abort ();
5861 }
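/* For example (illustrative only): "{load} mov %eax, %ebx" selects the
 0x8b (load) encoding instead of the default 0x89 store form, while
 "{disp32} jmp .L1" forces a 32-bit branch displacement even when an
 8-bit one would do. */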
5862 }
5863 else
5864 {
5865 /* Add prefix, checking for repeated prefixes. */
5866 switch (add_prefix (current_templates->start->base_opcode))
5867 {
5868 case PREFIX_EXIST:
5869 return NULL;
5870 case PREFIX_DS:
5871 if (is_cpu (current_templates->start, CpuIBT))
5872 i.notrack_prefix = insn_name (current_templates->start);
5873 break;
5874 case PREFIX_REP:
5875 if (is_cpu (current_templates->start, CpuHLE))
5876 i.hle_prefix = insn_name (current_templates->start);
5877 else if (is_cpu (current_templates->start, CpuMPX))
5878 i.bnd_prefix = insn_name (current_templates->start);
5879 else
5880 i.rep_prefix = insn_name (current_templates->start);
5881 break;
5882 default:
5883 break;
5884 }
5885 }
5886 /* Skip past PREFIX_SEPARATOR and reset token_start. */
5887 token_start = ++l;
5888 }
5889 else
5890 break;
5891 }
5892
5893 if (prefix_only)
5894 return token_start;
5895
5896 if (!current_templates)
5897 {
5898 /* Deprecated functionality (new code should use pseudo-prefixes instead):
5899 Check if we should swap operands or force a 32-bit displacement in
5900 the encoding. */
5901 if (mnem_p - 2 == dot_p && dot_p[1] == 's')
5902 i.dir_encoding = dir_encoding_swap;
5903 else if (mnem_p - 3 == dot_p
5904 && dot_p[1] == 'd'
5905 && dot_p[2] == '8')
5906 i.disp_encoding = disp_encoding_8bit;
5907 else if (mnem_p - 4 == dot_p
5908 && dot_p[1] == 'd'
5909 && dot_p[2] == '3'
5910 && dot_p[3] == '2')
5911 i.disp_encoding = disp_encoding_32bit;
5912 else
5913 goto check_suffix;
5914 mnem_p = dot_p;
5915 *dot_p = '\0';
5916 current_templates = (const templates *) str_hash_find (op_hash, mnemonic);
5917 }
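/* Illustrative equivalents (a sketch): "mov.s %eax, %ebx" requests the
 swapped (non-default) encoding, "mov.d8 (%ebp), %eax" forces an 8-bit
 displacement, and "mov.d32 (%ebp), %eax" a 32-bit one. */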
5918
5919 if (!current_templates || !pass1)
5920 {
5921 current_templates = NULL;
5922
5923 check_suffix:
5924 if (mnem_p > mnemonic)
5925 {
5926 /* See if we can get a match by trimming off a suffix. */
5927 switch (mnem_p[-1])
5928 {
5929 case WORD_MNEM_SUFFIX:
5930 if (intel_syntax && (intel_float_operand (mnemonic) & 2))
5931 i.suffix = SHORT_MNEM_SUFFIX;
5932 else
5933 /* Fall through. */
5934 case BYTE_MNEM_SUFFIX:
5935 case QWORD_MNEM_SUFFIX:
5936 i.suffix = mnem_p[-1];
5937 mnem_p[-1] = '\0';
5938 current_templates
5939 = (const templates *) str_hash_find (op_hash, mnemonic);
5940 break;
5941 case SHORT_MNEM_SUFFIX:
5942 case LONG_MNEM_SUFFIX:
5943 if (!intel_syntax)
5944 {
5945 i.suffix = mnem_p[-1];
5946 mnem_p[-1] = '\0';
5947 current_templates
5948 = (const templates *) str_hash_find (op_hash, mnemonic);
5949 }
5950 break;
5951
5952 /* Intel Syntax. */
5953 case 'd':
5954 if (intel_syntax)
5955 {
5956 if (intel_float_operand (mnemonic) == 1)
5957 i.suffix = SHORT_MNEM_SUFFIX;
5958 else
5959 i.suffix = LONG_MNEM_SUFFIX;
5960 mnem_p[-1] = '\0';
5961 current_templates
5962 = (const templates *) str_hash_find (op_hash, mnemonic);
5963 }
5964 /* For compatibility reasons accept MOVSD and CMPSD without
5965 operands even in AT&T mode. */
5966 else if (*l == END_OF_INSN
5967 || (is_space_char (*l) && l[1] == END_OF_INSN))
5968 {
5969 mnem_p[-1] = '\0';
5970 current_templates
5971 = (const templates *) str_hash_find (op_hash, mnemonic);
5972 if (current_templates != NULL
5973 /* MOVS or CMPS */
5974 && (current_templates->start->base_opcode | 2) == 0xa6
5975 && current_templates->start->opcode_space
5976 == SPACE_BASE
5977 && mnem_p[-2] == 's')
5978 {
5979 as_warn (_("found `%sd'; assuming `%sl' was meant"),
5980 mnemonic, mnemonic);
5981 i.suffix = LONG_MNEM_SUFFIX;
5982 }
5983 else
5984 {
5985 current_templates = NULL;
5986 mnem_p[-1] = 'd';
5987 }
5988 }
5989 break;
5990 }
5991 }
5992
5993 if (!current_templates)
5994 {
5995 if (pass1)
5996 as_bad (_("no such instruction: `%s'"), token_start);
5997 return NULL;
5998 }
5999 }
6000
6001 if (current_templates->start->opcode_modifier.jump == JUMP
6002 || current_templates->start->opcode_modifier.jump == JUMP_BYTE)
6003 {
6004 /* Check for a branch hint. We allow ",pt" and ",pn" for
6005 predict taken and predict not taken respectively.
6006 I'm not sure that branch hints actually do anything on loop
6007 and jcxz insns (JumpByte) for current Pentium4 chips. They
6008 may work in the future and it doesn't hurt to accept them
6009 now. */
6010 if (l[0] == ',' && l[1] == 'p')
6011 {
6012 if (l[2] == 't')
6013 {
6014 if (!add_prefix (DS_PREFIX_OPCODE))
6015 return NULL;
6016 l += 3;
6017 }
6018 else if (l[2] == 'n')
6019 {
6020 if (!add_prefix (CS_PREFIX_OPCODE))
6021 return NULL;
6022 l += 3;
6023 }
6024 }
6025 }
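/* E.g. "jne,pt .Lfoo" emits a 0x3e (%ds) prefix byte before the branch
 and "jne,pn .Lfoo" a 0x2e (%cs) one. */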
6026 /* Any other comma loses. */
6027 if (*l == ',')
6028 {
6029 as_bad (_("invalid character %s in mnemonic"),
6030 output_invalid (*l));
6031 return NULL;
6032 }
6033
6034 /* Check if instruction is supported on specified architecture. */
6035 supported = 0;
6036 for (t = current_templates->start; t < current_templates->end; ++t)
6037 {
6038 supported |= cpu_flags_match (t);
6039
6040 if (i.suffix == QWORD_MNEM_SUFFIX && !q_suffix_allowed (t))
6041 supported &= ~CPU_FLAGS_64BIT_MATCH;
6042
6043 if (supported == CPU_FLAGS_PERFECT_MATCH)
6044 return l;
6045 }
6046
6047 if (pass1)
6048 {
6049 if (supported & CPU_FLAGS_64BIT_MATCH)
6050 i.error = unsupported_on_arch;
6051 else
6052 i.error = unsupported_64bit;
6053 }
6054
6055 return NULL;
6056 }
6057
6058 static char *
6059 parse_operands (char *l, const char *mnemonic)
6060 {
6061 char *token_start;
6062
6063 /* 1 if operand is pending after ','. */
6064 unsigned int expecting_operand = 0;
6065
6066 while (*l != END_OF_INSN)
6067 {
6068 /* Non-zero if operand parens not balanced. */
6069 unsigned int paren_not_balanced = 0;
6070 /* True if inside double quotes. */
6071 bool in_quotes = false;
6072
6073 /* Skip optional white space before operand. */
6074 if (is_space_char (*l))
6075 ++l;
6076 if (!is_operand_char (*l) && *l != END_OF_INSN && *l != '"')
6077 {
6078 as_bad (_("invalid character %s before operand %d"),
6079 output_invalid (*l),
6080 i.operands + 1);
6081 return NULL;
6082 }
6083 token_start = l; /* After white space. */
6084 while (in_quotes || paren_not_balanced || *l != ',')
6085 {
6086 if (*l == END_OF_INSN)
6087 {
6088 if (in_quotes)
6089 {
6090 as_bad (_("unbalanced double quotes in operand %d."),
6091 i.operands + 1);
6092 return NULL;
6093 }
6094 if (paren_not_balanced)
6095 {
6096 know (!intel_syntax);
6097 as_bad (_("unbalanced parenthesis in operand %d."),
6098 i.operands + 1);
6099 return NULL;
6100 }
6101 else
6102 break; /* we are done */
6103 }
6104 else if (*l == '\\' && l[1] == '"')
6105 ++l;
6106 else if (*l == '"')
6107 in_quotes = !in_quotes;
6108 else if (!in_quotes && !is_operand_char (*l) && !is_space_char (*l))
6109 {
6110 as_bad (_("invalid character %s in operand %d"),
6111 output_invalid (*l),
6112 i.operands + 1);
6113 return NULL;
6114 }
6115 if (!intel_syntax && !in_quotes)
6116 {
6117 if (*l == '(')
6118 ++paren_not_balanced;
6119 if (*l == ')')
6120 --paren_not_balanced;
6121 }
6122 l++;
6123 }
6124 if (l != token_start)
6125 { /* Yes, we've read in another operand. */
6126 unsigned int operand_ok;
6127 this_operand = i.operands++;
6128 if (i.operands > MAX_OPERANDS)
6129 {
6130 as_bad (_("spurious operands; (%d operands/instruction max)"),
6131 MAX_OPERANDS);
6132 return NULL;
6133 }
6134 i.types[this_operand].bitfield.unspecified = 1;
6135 /* Now parse operand adding info to 'i' as we go along. */
6136 END_STRING_AND_SAVE (l);
6137
6138 if (i.mem_operands > 1)
6139 {
6140 as_bad (_("too many memory references for `%s'"),
6141 mnemonic);
6142 return NULL;
6143 }
6144
6145 if (intel_syntax)
6146 operand_ok =
6147 i386_intel_operand (token_start,
6148 intel_float_operand (mnemonic));
6149 else
6150 operand_ok = i386_att_operand (token_start);
6151
6152 RESTORE_END_STRING (l);
6153 if (!operand_ok)
6154 return NULL;
6155 }
6156 else
6157 {
6158 if (expecting_operand)
6159 {
6160 expecting_operand_after_comma:
6161 as_bad (_("expecting operand after ','; got nothing"));
6162 return NULL;
6163 }
6164 if (*l == ',')
6165 {
6166 as_bad (_("expecting operand before ','; got nothing"));
6167 return NULL;
6168 }
6169 }
6170
6171 /* Now *l must be either ',' or END_OF_INSN. */
6172 if (*l == ',')
6173 {
6174 if (*++l == END_OF_INSN)
6175 {
6176 /* Skip the comma; complain if nothing follows it. */
6177 goto expecting_operand_after_comma;
6178 }
6179 expecting_operand = 1;
6180 }
6181 }
6182 return l;
6183 }
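/* E.g. for "movl 4(%esp), %eax" the loop above splits the operand string
 at the top-level comma (commas inside parentheses or double quotes don't
 count) and hands "4(%esp)" and "%eax" to i386_att_operand () in turn. */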
6184
6185 static void
6186 swap_2_operands (unsigned int xchg1, unsigned int xchg2)
6187 {
6188 union i386_op temp_op;
6189 i386_operand_type temp_type;
6190 unsigned int temp_flags;
6191 enum bfd_reloc_code_real temp_reloc;
6192
6193 temp_type = i.types[xchg2];
6194 i.types[xchg2] = i.types[xchg1];
6195 i.types[xchg1] = temp_type;
6196
6197 temp_flags = i.flags[xchg2];
6198 i.flags[xchg2] = i.flags[xchg1];
6199 i.flags[xchg1] = temp_flags;
6200
6201 temp_op = i.op[xchg2];
6202 i.op[xchg2] = i.op[xchg1];
6203 i.op[xchg1] = temp_op;
6204
6205 temp_reloc = i.reloc[xchg2];
6206 i.reloc[xchg2] = i.reloc[xchg1];
6207 i.reloc[xchg1] = temp_reloc;
6208
6209 temp_flags = i.imm_bits[xchg2];
6210 i.imm_bits[xchg2] = i.imm_bits[xchg1];
6211 i.imm_bits[xchg1] = temp_flags;
6212
6213 if (i.mask.reg)
6214 {
6215 if (i.mask.operand == xchg1)
6216 i.mask.operand = xchg2;
6217 else if (i.mask.operand == xchg2)
6218 i.mask.operand = xchg1;
6219 }
6220 if (i.broadcast.type || i.broadcast.bytes)
6221 {
6222 if (i.broadcast.operand == xchg1)
6223 i.broadcast.operand = xchg2;
6224 else if (i.broadcast.operand == xchg2)
6225 i.broadcast.operand = xchg1;
6226 }
6227 }
6228
6229 static void
6230 swap_operands (void)
6231 {
6232 switch (i.operands)
6233 {
6234 case 5:
6235 case 4:
6236 swap_2_operands (1, i.operands - 2);
6237 /* Fall through. */
6238 case 3:
6239 case 2:
6240 swap_2_operands (0, i.operands - 1);
6241 break;
6242 default:
6243 abort ();
6244 }
6245
6246 if (i.mem_operands == 2)
6247 {
6248 const reg_entry *temp_seg;
6249 temp_seg = i.seg[0];
6250 i.seg[0] = i.seg[1];
6251 i.seg[1] = temp_seg;
6252 }
6253 }
6254
6255 /* Try to ensure constant immediates are represented in the smallest
6256 opcode possible. */
6257 static void
6258 optimize_imm (void)
6259 {
6260 char guess_suffix = 0;
6261 int op;
6262
6263 if (i.suffix)
6264 guess_suffix = i.suffix;
6265 else if (i.reg_operands)
6266 {
6267 /* Figure out a suffix from the last register operand specified.
6268 We can't do this properly yet, i.e. excluding special register
6269 instances, but the following works for instructions with
6270 immediates. In any case, we can't set i.suffix yet. */
6271 for (op = i.operands; --op >= 0;)
6272 if (i.types[op].bitfield.class != Reg)
6273 continue;
6274 else if (i.types[op].bitfield.byte)
6275 {
6276 guess_suffix = BYTE_MNEM_SUFFIX;
6277 break;
6278 }
6279 else if (i.types[op].bitfield.word)
6280 {
6281 guess_suffix = WORD_MNEM_SUFFIX;
6282 break;
6283 }
6284 else if (i.types[op].bitfield.dword)
6285 {
6286 guess_suffix = LONG_MNEM_SUFFIX;
6287 break;
6288 }
6289 else if (i.types[op].bitfield.qword)
6290 {
6291 guess_suffix = QWORD_MNEM_SUFFIX;
6292 break;
6293 }
6294 }
6295 else if ((flag_code == CODE_16BIT)
6296 ^ (i.prefix[DATA_PREFIX] != 0 && !(i.prefix[REX_PREFIX] & REX_W)))
6297 guess_suffix = WORD_MNEM_SUFFIX;
6298 else if (flag_code != CODE_64BIT
6299 || (!(i.prefix[REX_PREFIX] & REX_W)
6300 /* A more generic (but also more involved) way of dealing
6301 with the special case(s) would be to go look for
6302 DefaultSize attributes on any of the templates. */
6303 && current_templates->start->mnem_off != MN_push))
6304 guess_suffix = LONG_MNEM_SUFFIX;
6305
6306 for (op = i.operands; --op >= 0;)
6307 if (operand_type_check (i.types[op], imm))
6308 {
6309 switch (i.op[op].imms->X_op)
6310 {
6311 case O_constant:
6312 /* If a suffix is given, this operand may be shortened. */
6313 switch (guess_suffix)
6314 {
6315 case LONG_MNEM_SUFFIX:
6316 i.types[op].bitfield.imm32 = 1;
6317 i.types[op].bitfield.imm64 = 1;
6318 break;
6319 case WORD_MNEM_SUFFIX:
6320 i.types[op].bitfield.imm16 = 1;
6321 i.types[op].bitfield.imm32 = 1;
6322 i.types[op].bitfield.imm32s = 1;
6323 i.types[op].bitfield.imm64 = 1;
6324 break;
6325 case BYTE_MNEM_SUFFIX:
6326 i.types[op].bitfield.imm8 = 1;
6327 i.types[op].bitfield.imm8s = 1;
6328 i.types[op].bitfield.imm16 = 1;
6329 i.types[op].bitfield.imm32 = 1;
6330 i.types[op].bitfield.imm32s = 1;
6331 i.types[op].bitfield.imm64 = 1;
6332 break;
6333 }
6334
6335 /* If this operand is at most 16 bits, convert it
6336 to a signed 16 bit number before trying to see
6337 whether it will fit in an even smaller size.
6338 This allows a 16-bit operand such as $0xffe0 to
6339 be recognised as within Imm8S range. */
6340 if ((i.types[op].bitfield.imm16)
6341 && fits_in_unsigned_word (i.op[op].imms->X_add_number))
6342 {
6343 i.op[op].imms->X_add_number = ((i.op[op].imms->X_add_number
6344 ^ 0x8000) - 0x8000);
6345 }
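/* Worked example: for $0xffe0, 0xffe0 ^ 0x8000 == 0x7fe0 and
 0x7fe0 - 0x8000 == -0x20, which fits in Imm8S. */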
6346 #ifdef BFD64
6347 /* Store 32-bit immediate in 64-bit for 64-bit BFD. */
6348 if ((i.types[op].bitfield.imm32)
6349 && fits_in_unsigned_long (i.op[op].imms->X_add_number))
6350 {
6351 i.op[op].imms->X_add_number = ((i.op[op].imms->X_add_number
6352 ^ ((offsetT) 1 << 31))
6353 - ((offsetT) 1 << 31));
6354 }
6355 #endif
6356 i.types[op]
6357 = operand_type_or (i.types[op],
6358 smallest_imm_type (i.op[op].imms->X_add_number));
6359
6360 /* We must avoid matching Imm32 templates when only a 64-bit
6361 immediate is available. */
6362 if (guess_suffix == QWORD_MNEM_SUFFIX)
6363 i.types[op].bitfield.imm32 = 0;
6364 break;
6365
6366 case O_absent:
6367 case O_register:
6368 abort ();
6369
6370 /* Symbols and expressions. */
6371 default:
6372 /* Convert symbolic operand to proper sizes for matching, but don't
6373 prevent matching a set of insns that only supports sizes other
6374 than those matching the insn suffix. */
6375 {
6376 i386_operand_type mask, allowed;
6377 const insn_template *t = current_templates->start;
6378
6379 operand_type_set (&mask, 0);
6380 switch (guess_suffix)
6381 {
6382 case QWORD_MNEM_SUFFIX:
6383 mask.bitfield.imm64 = 1;
6384 mask.bitfield.imm32s = 1;
6385 break;
6386 case LONG_MNEM_SUFFIX:
6387 mask.bitfield.imm32 = 1;
6388 break;
6389 case WORD_MNEM_SUFFIX:
6390 mask.bitfield.imm16 = 1;
6391 break;
6392 case BYTE_MNEM_SUFFIX:
6393 mask.bitfield.imm8 = 1;
6394 break;
6395 default:
6396 break;
6397 }
6398
6399 allowed = operand_type_and (t->operand_types[op], mask);
6400 while (++t < current_templates->end)
6401 {
6402 allowed = operand_type_or (allowed, t->operand_types[op]);
6403 allowed = operand_type_and (allowed, mask);
6404 }
6405
6406 if (!operand_type_all_zero (&allowed))
6407 i.types[op] = operand_type_and (i.types[op], mask);
6408 }
6409 break;
6410 }
6411 }
6412 }
6413
6414 /* Try to use the smallest displacement type too. */
6415 static bool
6416 optimize_disp (const insn_template *t)
6417 {
6418 unsigned int op;
6419
6420 if (!want_disp32 (t)
6421 && (!t->opcode_modifier.jump
6422 || i.jumpabsolute || i.types[0].bitfield.baseindex))
6423 {
6424 for (op = 0; op < i.operands; ++op)
6425 {
6426 const expressionS *exp = i.op[op].disps;
6427
6428 if (!operand_type_check (i.types[op], disp))
6429 continue;
6430
6431 if (exp->X_op != O_constant)
6432 continue;
6433
6434 /* Since the displacement is sign-extended to 64 bits, don't allow
6435 disp32 if it is out of range. */
6436 if (fits_in_signed_long (exp->X_add_number))
6437 continue;
6438
6439 i.types[op].bitfield.disp32 = 0;
6440 if (i.types[op].bitfield.baseindex)
6441 {
6442 as_bad (_("0x%" PRIx64 " out of range of signed 32bit displacement"),
6443 (uint64_t) exp->X_add_number);
6444 return false;
6445 }
6446 }
6447 }
6448
6449 /* Don't optimize the displacement for movabs, since it only takes a
6450 64-bit displacement. */
6451 if (i.disp_encoding > disp_encoding_8bit
6452 || (flag_code == CODE_64BIT && t->mnem_off == MN_movabs))
6453 return true;
6454
6455 for (op = i.operands; op-- > 0;)
6456 if (operand_type_check (i.types[op], disp))
6457 {
6458 if (i.op[op].disps->X_op == O_constant)
6459 {
6460 offsetT op_disp = i.op[op].disps->X_add_number;
6461
6462 if (!op_disp && i.types[op].bitfield.baseindex)
6463 {
6464 i.types[op] = operand_type_and_not (i.types[op], anydisp);
6465 i.op[op].disps = NULL;
6466 i.disp_operands--;
6467 continue;
6468 }
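/* E.g. for "movl 0(%eax), %ebx" the redundant zero displacement is
 dropped here, yielding the shorter "(%eax)" form. */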
6469
6470 if (i.types[op].bitfield.disp16
6471 && fits_in_unsigned_word (op_disp))
6472 {
6473 /* If this operand is at most 16 bits, convert
6474 to a signed 16 bit number and don't use 64bit
6475 displacement. */
6476 op_disp = ((op_disp ^ 0x8000) - 0x8000);
6477 i.types[op].bitfield.disp64 = 0;
6478 }
6479
6480 #ifdef BFD64
6481 /* Optimize 64-bit displacement to 32-bit for 64-bit BFD. */
6482 if ((flag_code != CODE_64BIT
6483 ? i.types[op].bitfield.disp32
6484 : want_disp32 (t)
6485 && (!t->opcode_modifier.jump
6486 || i.jumpabsolute || i.types[op].bitfield.baseindex))
6487 && fits_in_unsigned_long (op_disp))
6488 {
6489 /* If this operand is at most 32 bits, convert
6490 to a signed 32 bit number and don't use 64bit
6491 displacement. */
6492 op_disp = (op_disp ^ ((offsetT) 1 << 31)) - ((addressT) 1 << 31);
6493 i.types[op].bitfield.disp64 = 0;
6494 i.types[op].bitfield.disp32 = 1;
6495 }
6496
6497 if (flag_code == CODE_64BIT && fits_in_signed_long (op_disp))
6498 {
6499 i.types[op].bitfield.disp64 = 0;
6500 i.types[op].bitfield.disp32 = 1;
6501 }
6502 #endif
6503 if ((i.types[op].bitfield.disp32
6504 || i.types[op].bitfield.disp16)
6505 && fits_in_disp8 (op_disp))
6506 i.types[op].bitfield.disp8 = 1;
6507
6508 i.op[op].disps->X_add_number = op_disp;
6509 }
6510 else if (i.reloc[op] == BFD_RELOC_386_TLS_DESC_CALL
6511 || i.reloc[op] == BFD_RELOC_X86_64_TLSDESC_CALL)
6512 {
6513 fix_new_exp (frag_now, frag_more (0) - frag_now->fr_literal, 0,
6514 i.op[op].disps, 0, i.reloc[op]);
6515 i.types[op] = operand_type_and_not (i.types[op], anydisp);
6516 }
6517 else
6518 /* We only support 64bit displacement on constants. */
6519 i.types[op].bitfield.disp64 = 0;
6520 }
6521
6522 return true;
6523 }
6524
6525 /* Return 1 if there is a match in broadcast bytes between operand
6526 GIVEN and instruction template T. */
6527
6528 static INLINE int
6529 match_broadcast_size (const insn_template *t, unsigned int given)
6530 {
6531 return ((t->opcode_modifier.broadcast == BYTE_BROADCAST
6532 && i.types[given].bitfield.byte)
6533 || (t->opcode_modifier.broadcast == WORD_BROADCAST
6534 && i.types[given].bitfield.word)
6535 || (t->opcode_modifier.broadcast == DWORD_BROADCAST
6536 && i.types[given].bitfield.dword)
6537 || (t->opcode_modifier.broadcast == QWORD_BROADCAST
6538 && i.types[given].bitfield.qword));
6539 }
6540
6541 /* Check if operands are valid for the instruction. */
6542
6543 static int
6544 check_VecOperands (const insn_template *t)
6545 {
6546 unsigned int op;
6547 i386_cpu_flags cpu;
6548
6549 /* Templates allowing for ZMMword as well as YMMword and/or XMMword for
6550 any one operand implicitly require AVX512VL support if the actual
6551 operand size is YMMword or XMMword. Since this function runs after
6552 template matching, there's no need to check for YMMword/XMMword in
6553 the template. */
6554 cpu = cpu_flags_and (cpu_flags_from_attr (t->cpu), avx512);
6555 if (!cpu_flags_all_zero (&cpu)
6556 && !is_cpu (t, CpuAVX512VL)
6557 && !cpu_arch_flags.bitfield.cpuavx512vl
6558 && (!t->opcode_modifier.vex || need_evex_encoding ()))
6559 {
6560 for (op = 0; op < t->operands; ++op)
6561 {
6562 if (t->operand_types[op].bitfield.zmmword
6563 && (i.types[op].bitfield.ymmword
6564 || i.types[op].bitfield.xmmword))
6565 {
6566 i.error = unsupported;
6567 return 1;
6568 }
6569 }
6570 }
6571
6572 /* Somewhat similarly, templates specifying both AVX and AVX2 are
6573 requiring AVX2 support if the actual operand size is YMMword. */
6574 if (is_cpu (t, CpuAVX) && is_cpu (t, CpuAVX2)
6575 && !cpu_arch_flags.bitfield.cpuavx2)
6576 {
6577 for (op = 0; op < t->operands; ++op)
6578 {
6579 if (t->operand_types[op].bitfield.xmmword
6580 && i.types[op].bitfield.ymmword)
6581 {
6582 i.error = unsupported;
6583 return 1;
6584 }
6585 }
6586 }
6587
6588 /* Without VSIB byte, we can't have a vector register for index. */
6589 if (!t->opcode_modifier.sib
6590 && i.index_reg
6591 && (i.index_reg->reg_type.bitfield.xmmword
6592 || i.index_reg->reg_type.bitfield.ymmword
6593 || i.index_reg->reg_type.bitfield.zmmword))
6594 {
6595 i.error = unsupported_vector_index_register;
6596 return 1;
6597 }
6598
6599 /* Check if default mask is allowed. */
6600 if (t->opcode_modifier.operandconstraint == NO_DEFAULT_MASK
6601 && (!i.mask.reg || i.mask.reg->reg_num == 0))
6602 {
6603 i.error = no_default_mask;
6604 return 1;
6605 }
6606
6607 /* For VSIB byte, we need a vector register for index, and all vector
6608 registers must be distinct. */
6609 if (t->opcode_modifier.sib && t->opcode_modifier.sib != SIBMEM)
6610 {
6611 if (!i.index_reg
6612 || !((t->opcode_modifier.sib == VECSIB128
6613 && i.index_reg->reg_type.bitfield.xmmword)
6614 || (t->opcode_modifier.sib == VECSIB256
6615 && i.index_reg->reg_type.bitfield.ymmword)
6616 || (t->opcode_modifier.sib == VECSIB512
6617 && i.index_reg->reg_type.bitfield.zmmword)))
6618 {
6619 i.error = invalid_vsib_address;
6620 return 1;
6621 }
6622
6623 gas_assert (i.reg_operands == 2 || i.mask.reg);
6624 if (i.reg_operands == 2 && !i.mask.reg)
6625 {
6626 gas_assert (i.types[0].bitfield.class == RegSIMD);
6627 gas_assert (i.types[0].bitfield.xmmword
6628 || i.types[0].bitfield.ymmword);
6629 gas_assert (i.types[2].bitfield.class == RegSIMD);
6630 gas_assert (i.types[2].bitfield.xmmword
6631 || i.types[2].bitfield.ymmword);
6632 if (operand_check == check_none)
6633 return 0;
6634 if (register_number (i.op[0].regs)
6635 != register_number (i.index_reg)
6636 && register_number (i.op[2].regs)
6637 != register_number (i.index_reg)
6638 && register_number (i.op[0].regs)
6639 != register_number (i.op[2].regs))
6640 return 0;
6641 if (operand_check == check_error)
6642 {
6643 i.error = invalid_vector_register_set;
6644 return 1;
6645 }
6646 as_warn (_("mask, index, and destination registers should be distinct"));
6647 }
6648 else if (i.reg_operands == 1 && i.mask.reg)
6649 {
6650 if (i.types[1].bitfield.class == RegSIMD
6651 && (i.types[1].bitfield.xmmword
6652 || i.types[1].bitfield.ymmword
6653 || i.types[1].bitfield.zmmword)
6654 && (register_number (i.op[1].regs)
6655 == register_number (i.index_reg)))
6656 {
6657 if (operand_check == check_error)
6658 {
6659 i.error = invalid_vector_register_set;
6660 return 1;
6661 }
6662 if (operand_check != check_none)
6663 as_warn (_("index and destination registers should be distinct"));
6664 }
6665 }
6666 }
6667
6668 /* For AMX instructions with 3 TMM register operands, all operands
6669 must be distinct. */
6670 if (i.reg_operands == 3
6671 && t->operand_types[0].bitfield.tmmword
6672 && (i.op[0].regs == i.op[1].regs
6673 || i.op[0].regs == i.op[2].regs
6674 || i.op[1].regs == i.op[2].regs))
6675 {
6676 i.error = invalid_tmm_register_set;
6677 return 1;
6678 }
6679
6680 /* Some special instructions require that the destination be distinct
6681 from the source registers. */
6682 if (t->opcode_modifier.operandconstraint == DISTINCT_DEST)
6683 {
6684 unsigned int dest_reg = i.operands - 1;
6685
6686 know (i.operands >= 3);
6687
6688 /* #UD if dest_reg == src1_reg or dest_reg == src2_reg. */
6689 if (i.op[dest_reg - 1].regs == i.op[dest_reg].regs
6690 || (i.reg_operands > 2
6691 && i.op[dest_reg - 2].regs == i.op[dest_reg].regs))
6692 {
6693 i.error = invalid_dest_and_src_register_set;
6694 return 1;
6695 }
6696 }
6697
6698 /* Check if broadcast is supported by the instruction and is applied
6699 to the memory operand. */
6700 if (i.broadcast.type || i.broadcast.bytes)
6701 {
6702 i386_operand_type type, overlap;
6703
6704 /* Check if specified broadcast is supported in this instruction,
6705 and its broadcast bytes match the memory operand. */
6706 op = i.broadcast.operand;
6707 if (!t->opcode_modifier.broadcast
6708 || !(i.flags[op] & Operand_Mem)
6709 || (!i.types[op].bitfield.unspecified
6710 && !match_broadcast_size (t, op)))
6711 {
6712 bad_broadcast:
6713 i.error = unsupported_broadcast;
6714 return 1;
6715 }
6716
6717 operand_type_set (&type, 0);
6718 switch (get_broadcast_bytes (t, false))
6719 {
6720 case 2:
6721 type.bitfield.word = 1;
6722 break;
6723 case 4:
6724 type.bitfield.dword = 1;
6725 break;
6726 case 8:
6727 type.bitfield.qword = 1;
6728 break;
6729 case 16:
6730 type.bitfield.xmmword = 1;
6731 break;
6732 case 32:
6733 if (vector_size < VSZ256)
6734 goto bad_broadcast;
6735 type.bitfield.ymmword = 1;
6736 break;
6737 case 64:
6738 if (vector_size < VSZ512)
6739 goto bad_broadcast;
6740 type.bitfield.zmmword = 1;
6741 break;
6742 default:
6743 goto bad_broadcast;
6744 }
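/* E.g. (illustrative) for "vaddps (%eax){1to16}, %zmm1, %zmm2" the
 broadcast covers 16 * 4 == 64 bytes, so only type.bitfield.zmmword is
 set, to be checked against the template's operand type below. */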
6745
6746 overlap = operand_type_and (type, t->operand_types[op]);
6747 if (t->operand_types[op].bitfield.class == RegSIMD
6748 && t->operand_types[op].bitfield.byte
6749 + t->operand_types[op].bitfield.word
6750 + t->operand_types[op].bitfield.dword
6751 + t->operand_types[op].bitfield.qword > 1)
6752 {
6753 overlap.bitfield.xmmword = 0;
6754 overlap.bitfield.ymmword = 0;
6755 overlap.bitfield.zmmword = 0;
6756 }
6757 if (operand_type_all_zero (&overlap))
6758 goto bad_broadcast;
6759
6760 if (t->opcode_modifier.checkoperandsize)
6761 {
6762 unsigned int j;
6763
6764 type.bitfield.baseindex = 1;
6765 for (j = 0; j < i.operands; ++j)
6766 {
6767 if (j != op
6768 && !operand_type_register_match(i.types[j],
6769 t->operand_types[j],
6770 type,
6771 t->operand_types[op]))
6772 goto bad_broadcast;
6773 }
6774 }
6775 }
6776 /* If the instruction supports broadcast, check that a memory operand of
6777 one-element size isn't specified without broadcast. */
6778 else if (t->opcode_modifier.broadcast && i.mem_operands)
6779 {
6780 /* Find memory operand. */
6781 for (op = 0; op < i.operands; op++)
6782 if (i.flags[op] & Operand_Mem)
6783 break;
6784 gas_assert (op < i.operands);
6785 /* Check size of the memory operand. */
6786 if (match_broadcast_size (t, op))
6787 {
6788 i.error = broadcast_needed;
6789 return 1;
6790 }
6791 }
6792 else
6793 op = MAX_OPERANDS - 1; /* Avoid uninitialized variable warning. */
6794
6795 /* Check if requested masking is supported. */
6796 if (i.mask.reg)
6797 {
6798 if (!t->opcode_modifier.masking)
6799 {
6800 i.error = unsupported_masking;
6801 return 1;
6802 }
6803
6804 /* Common rules for masking:
6805 - mask register destinations permit only zeroing-masking, without
6806 that actually being expressed by a {z} operand suffix or EVEX.z,
6807 - memory destinations allow only merging-masking,
6808 - scatter/gather insns (i.e. ones using vSIB) only allow merging-
6809 masking. */
6810 if (i.mask.zeroing
6811 && (t->operand_types[t->operands - 1].bitfield.class == RegMask
6812 || (i.flags[t->operands - 1] & Operand_Mem)
6813 || t->opcode_modifier.sib))
6814 {
6815 i.error = unsupported_masking;
6816 return 1;
6817 }
6818 }
6819
6820 /* Check if masking is applied to dest operand. */
6821 if (i.mask.reg && (i.mask.operand != i.operands - 1))
6822 {
6823 i.error = mask_not_on_destination;
6824 return 1;
6825 }
6826
6827 /* Check RC/SAE. */
6828 if (i.rounding.type != rc_none)
6829 {
6830 if (!t->opcode_modifier.sae
6831 || ((i.rounding.type != saeonly) != t->opcode_modifier.staticrounding)
6832 || i.mem_operands)
6833 {
6834 i.error = unsupported_rc_sae;
6835 return 1;
6836 }
6837
6838 /* Non-EVEX.LIG forms need to have a ZMM register as at least one
6839 operand. */
6840 if (t->opcode_modifier.evex != EVEXLIG)
6841 {
6842 for (op = 0; op < t->operands; ++op)
6843 if (i.types[op].bitfield.zmmword)
6844 break;
6845 if (op >= t->operands)
6846 {
6847 i.error = operand_size_mismatch;
6848 return 1;
6849 }
6850 }
6851 }
6852
6853 /* Check the special Imm4 cases; must be the first operand. */
6854 if (is_cpu (t, CpuXOP) && t->operands == 5)
6855 {
6856 if (i.op[0].imms->X_op != O_constant
6857 || !fits_in_imm4 (i.op[0].imms->X_add_number))
6858 {
6859 i.error = bad_imm4;
6860 return 1;
6861 }
6862
6863 /* Turn off Imm<N> so that update_imm won't complain. */
6864 operand_type_set (&i.types[0], 0);
6865 }
6866
6867 /* Check vector Disp8 operand. */
6868 if (t->opcode_modifier.disp8memshift
6869 && (!t->opcode_modifier.vex
6870 || need_evex_encoding ())
6871 && i.disp_encoding <= disp_encoding_8bit)
6872 {
6873 if (i.broadcast.type || i.broadcast.bytes)
6874 i.memshift = t->opcode_modifier.broadcast - 1;
6875 else if (t->opcode_modifier.disp8memshift != DISP8_SHIFT_VL)
6876 i.memshift = t->opcode_modifier.disp8memshift;
6877 else
6878 {
6879 const i386_operand_type *type = NULL, *fallback = NULL;
6880
6881 i.memshift = 0;
6882 for (op = 0; op < i.operands; op++)
6883 if (i.flags[op] & Operand_Mem)
6884 {
6885 if (t->opcode_modifier.evex == EVEXLIG)
6886 i.memshift = 2 + (i.suffix == QWORD_MNEM_SUFFIX);
6887 else if (t->operand_types[op].bitfield.xmmword
6888 + t->operand_types[op].bitfield.ymmword
6889 + t->operand_types[op].bitfield.zmmword <= 1)
6890 type = &t->operand_types[op];
6891 else if (!i.types[op].bitfield.unspecified)
6892 type = &i.types[op];
6893 else /* Ambiguities get resolved elsewhere. */
6894 fallback = &t->operand_types[op];
6895 }
6896 else if (i.types[op].bitfield.class == RegSIMD
6897 && t->opcode_modifier.evex != EVEXLIG)
6898 {
6899 if (i.types[op].bitfield.zmmword)
6900 i.memshift = 6;
6901 else if (i.types[op].bitfield.ymmword && i.memshift < 5)
6902 i.memshift = 5;
6903 else if (i.types[op].bitfield.xmmword && i.memshift < 4)
6904 i.memshift = 4;
6905 }
6906
6907 if (!type && !i.memshift)
6908 type = fallback;
6909 if (type)
6910 {
6911 if (type->bitfield.zmmword)
6912 i.memshift = 6;
6913 else if (type->bitfield.ymmword)
6914 i.memshift = 5;
6915 else if (type->bitfield.xmmword)
6916 i.memshift = 4;
6917 }
6918
6919 /* For the check in fits_in_disp8(). */
6920 if (i.memshift == 0)
6921 i.memshift = -1;
6922 }
6923
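/* Worked example of EVEX compressed disp8*N (a sketch): with
 i.memshift == 6 (64-byte vector memory operand), a displacement of 128
 still fits in disp8 since 128 >> 6 == 2, while 96 does not, as it
 isn't a multiple of 64. */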
6924 for (op = 0; op < i.operands; op++)
6925 if (operand_type_check (i.types[op], disp)
6926 && i.op[op].disps->X_op == O_constant)
6927 {
6928 if (fits_in_disp8 (i.op[op].disps->X_add_number))
6929 {
6930 i.types[op].bitfield.disp8 = 1;
6931 return 0;
6932 }
6933 i.types[op].bitfield.disp8 = 0;
6934 }
6935 }
6936
6937 i.memshift = 0;
6938
6939 return 0;
6940 }
6941
6942 /* Check if encoding requirements are met by the instruction. */
6943
6944 static int
6945 VEX_check_encoding (const insn_template *t)
6946 {
6947 if (i.vec_encoding == vex_encoding_error)
6948 {
6949 i.error = unsupported;
6950 return 1;
6951 }
6952
6953 /* Vector size restrictions. */
6954 if ((vector_size < VSZ512
6955 && (t->opcode_modifier.evex == EVEX512
6956 || t->opcode_modifier.vsz >= VSZ512))
6957 || (vector_size < VSZ256
6958 && (t->opcode_modifier.evex == EVEX256
6959 || t->opcode_modifier.vex == VEX256
6960 || t->opcode_modifier.vsz >= VSZ256)))
6961 {
6962 i.error = unsupported;
6963 return 1;
6964 }
6965
6966 if (i.vec_encoding == vex_encoding_evex
6967 || i.vec_encoding == vex_encoding_evex512)
6968 {
6969 /* This instruction must be encoded with EVEX prefix. */
6970 if (!is_evex_encoding (t))
6971 {
6972 i.error = unsupported;
6973 return 1;
6974 }
6975 return 0;
6976 }
6977
6978 if (!t->opcode_modifier.vex)
6979 {
6980 /* This instruction template doesn't have VEX prefix. */
6981 if (i.vec_encoding != vex_encoding_default)
6982 {
6983 i.error = unsupported;
6984 return 1;
6985 }
6986 return 0;
6987 }
6988
6989 return 0;
6990 }
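/* For instance (illustrative): "{evex} vpaddd %xmm0, %xmm1, %xmm2" is
 accepted only if the template set includes an EVEX form, while a {vex}
 request against a template without VEX encoding fails the same way,
 with i.error == unsupported in both cases. */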
6991
6992 /* Helper function for the progress() macro in match_template(). */
6993 static INLINE enum i386_error progress (enum i386_error new,
6994 enum i386_error last,
6995 unsigned int line, unsigned int *line_p)
6996 {
6997 if (line <= *line_p)
6998 return last;
6999 *line_p = line;
7000 return new;
7001 }
7002
7003 static const insn_template *
7004 match_template (char mnem_suffix)
7005 {
7006 /* Points to template once we've found it. */
7007 const insn_template *t;
7008 i386_operand_type overlap0, overlap1, overlap2, overlap3;
7009 i386_operand_type overlap4;
7010 unsigned int found_reverse_match;
7011 i386_operand_type operand_types [MAX_OPERANDS];
7012 int addr_prefix_disp;
7013 unsigned int j, size_match, check_register, errline = __LINE__;
7014 enum i386_error specific_error = number_of_operands_mismatch;
7015 #define progress(err) progress (err, specific_error, __LINE__, &errline)
7016
7017 #if MAX_OPERANDS != 5
7018 # error "MAX_OPERANDS must be 5."
7019 #endif
7020
7021 found_reverse_match = 0;
7022 addr_prefix_disp = -1;
7023
7024 for (t = current_templates->start; t < current_templates->end; t++)
7025 {
7026 addr_prefix_disp = -1;
7027 found_reverse_match = 0;
7028
7029 /* Must have right number of operands. */
7030 if (i.operands != t->operands)
7031 continue;
7032
7033 /* Check processor support. */
7034 specific_error = progress (unsupported);
7035 if (cpu_flags_match (t) != CPU_FLAGS_PERFECT_MATCH)
7036 continue;
7037
7038 /* Check AT&T mnemonic. */
7039 specific_error = progress (unsupported_with_intel_mnemonic);
7040 if (intel_mnemonic && t->opcode_modifier.attmnemonic)
7041 continue;
7042
7043 /* Check AT&T/Intel syntax. */
7044 specific_error = progress (unsupported_syntax);
7045 if ((intel_syntax && t->opcode_modifier.attsyntax)
7046 || (!intel_syntax && t->opcode_modifier.intelsyntax))
7047 continue;
7048
7049 /* Check Intel64/AMD64 ISA. */
7050 switch (isa64)
7051 {
7052 default:
7053 /* Default: Don't accept Intel64. */
7054 if (t->opcode_modifier.isa64 == INTEL64)
7055 continue;
7056 break;
7057 case amd64:
7058 /* -mamd64: Don't accept Intel64 and Intel64 only. */
7059 if (t->opcode_modifier.isa64 >= INTEL64)
7060 continue;
7061 break;
7062 case intel64:
7063 /* -mintel64: Don't accept AMD64. */
7064 if (t->opcode_modifier.isa64 == AMD64 && flag_code == CODE_64BIT)
7065 continue;
7066 break;
7067 }
7068
7069 /* Check the suffix. */
7070 specific_error = progress (invalid_instruction_suffix);
7071 if ((t->opcode_modifier.no_bsuf && mnem_suffix == BYTE_MNEM_SUFFIX)
7072 || (t->opcode_modifier.no_wsuf && mnem_suffix == WORD_MNEM_SUFFIX)
7073 || (t->opcode_modifier.no_lsuf && mnem_suffix == LONG_MNEM_SUFFIX)
7074 || (t->opcode_modifier.no_ssuf && mnem_suffix == SHORT_MNEM_SUFFIX)
7075 || (t->opcode_modifier.no_qsuf && mnem_suffix == QWORD_MNEM_SUFFIX))
7076 continue;
7077
7078 specific_error = progress (operand_size_mismatch);
7079 size_match = operand_size_match (t);
7080 if (!size_match)
7081 continue;
7082
7083 /* This is intentionally not
7084
7085 if (i.jumpabsolute != (t->opcode_modifier.jump == JUMP_ABSOLUTE))
7086
7087 as the case of a missing * on the operand is accepted (perhaps with
7088 a warning, issued further down). */
7089 specific_error = progress (operand_type_mismatch);
7090 if (i.jumpabsolute && t->opcode_modifier.jump != JUMP_ABSOLUTE)
7091 continue;
7092
7093 /* In Intel syntax, normally we can check for memory operand size when
7094 there is no mnemonic suffix. But jmp and call have 2 different
7095 encodings with Dword memory operand size. Skip the "near" one
7096 (permitting a register operand) when "far" was requested. */
7097 if (i.far_branch
7098 && t->opcode_modifier.jump == JUMP_ABSOLUTE
7099 && t->operand_types[0].bitfield.class == Reg)
7100 continue;
7101
7102 for (j = 0; j < MAX_OPERANDS; j++)
7103 operand_types[j] = t->operand_types[j];
7104
7105 /* In general, don't allow 32-bit operands on pre-386. */
7106 specific_error = progress (mnem_suffix ? invalid_instruction_suffix
7107 : operand_size_mismatch);
7108 j = i.imm_operands + (t->operands > i.imm_operands + 1);
7109 if (i.suffix == LONG_MNEM_SUFFIX
7110 && !cpu_arch_flags.bitfield.cpui386
7111 && (intel_syntax
7112 ? (t->opcode_modifier.mnemonicsize != IGNORESIZE
7113 && !intel_float_operand (insn_name (t)))
7114 : intel_float_operand (insn_name (t)) != 2)
7115 && (t->operands == i.imm_operands
7116 || (operand_types[i.imm_operands].bitfield.class != RegMMX
7117 && operand_types[i.imm_operands].bitfield.class != RegSIMD
7118 && operand_types[i.imm_operands].bitfield.class != RegMask)
7119 || (operand_types[j].bitfield.class != RegMMX
7120 && operand_types[j].bitfield.class != RegSIMD
7121 && operand_types[j].bitfield.class != RegMask))
7122 && !t->opcode_modifier.sib)
7123 continue;
7124
7125 /* Do not verify operands when there are none. */
7126 if (!t->operands)
7127 {
7128 if (VEX_check_encoding (t))
7129 {
7130 specific_error = progress (i.error);
7131 continue;
7132 }
7133
7134 /* We've found a match; break out of loop. */
7135 break;
7136 }
7137
7138 if (!t->opcode_modifier.jump
7139 || t->opcode_modifier.jump == JUMP_ABSOLUTE)
7140 {
7141 /* There should be only one Disp operand. */
7142 for (j = 0; j < MAX_OPERANDS; j++)
7143 if (operand_type_check (operand_types[j], disp))
7144 break;
7145 if (j < MAX_OPERANDS)
7146 {
7147 bool override = (i.prefix[ADDR_PREFIX] != 0);
7148
7149 addr_prefix_disp = j;
7150
7151 /* An address size prefix turns a Disp64 operand into Disp32, and a
7152 Disp32/Disp16 one into Disp16/Disp32 respectively. */
7153 switch (flag_code)
7154 {
7155 case CODE_16BIT:
7156 override = !override;
7157 /* Fall through. */
7158 case CODE_32BIT:
7159 if (operand_types[j].bitfield.disp32
7160 && operand_types[j].bitfield.disp16)
7161 {
7162 operand_types[j].bitfield.disp16 = override;
7163 operand_types[j].bitfield.disp32 = !override;
7164 }
7165 gas_assert (!operand_types[j].bitfield.disp64);
7166 break;
7167
7168 case CODE_64BIT:
7169 if (operand_types[j].bitfield.disp64)
7170 {
7171 gas_assert (!operand_types[j].bitfield.disp32);
7172 operand_types[j].bitfield.disp32 = override;
7173 operand_types[j].bitfield.disp64 = !override;
7174 }
7175 operand_types[j].bitfield.disp16 = 0;
7176 break;
7177 }
7178 }
7179 }
7180
7181 /* We check register size if needed. */
7182 if (t->opcode_modifier.checkoperandsize)
7183 {
7184 check_register = (1 << t->operands) - 1;
7185 if (i.broadcast.type || i.broadcast.bytes)
7186 check_register &= ~(1 << i.broadcast.operand);
7187 }
7188 else
7189 check_register = 0;
7190
7191 overlap0 = operand_type_and (i.types[0], operand_types[0]);
7192 switch (t->operands)
7193 {
7194 case 1:
7195 if (!operand_type_match (overlap0, i.types[0]))
7196 continue;
7197
7198 /* Allow the ModR/M encoding to be requested by using the {load} or
7199 {store} pseudo prefix on an applicable insn. */
7200 if (!t->opcode_modifier.modrm
7201 && i.reg_operands == 1
7202 && ((i.dir_encoding == dir_encoding_load
7203 && t->mnem_off != MN_pop)
7204 || (i.dir_encoding == dir_encoding_store
7205 && t->mnem_off != MN_push))
7206 /* Avoid BSWAP. */
7207 && t->mnem_off != MN_bswap)
7208 continue;
7209 break;
7210
7211 case 2:
7212 /* xchg %eax, %eax is a special case. It is an alias for nop
7213 only in 32bit mode and we can use opcode 0x90. In 64bit
7214 mode, we can't use 0x90 for xchg %eax, %eax since it should
7215 zero-extend %eax to %rax. */
7216 if (t->base_opcode == 0x90
7217 && t->opcode_space == SPACE_BASE)
7218 {
7219 if (flag_code == CODE_64BIT
7220 && i.types[0].bitfield.instance == Accum
7221 && i.types[0].bitfield.dword
7222 && i.types[1].bitfield.instance == Accum)
7223 continue;
7224
7225 /* Allow the ModR/M encoding to be requested by using the
7226 {load} or {store} pseudo prefix. */
7227 if (i.dir_encoding == dir_encoding_load
7228 || i.dir_encoding == dir_encoding_store)
7229 continue;
7230 }
7231
7232 if (t->base_opcode == MOV_AX_DISP32
7233 && t->opcode_space == SPACE_BASE
7234 && t->mnem_off != MN_movabs)
7235 {
7236 /* Force 0x8b encoding for "mov foo@GOT, %eax". */
7237 if (i.reloc[0] == BFD_RELOC_386_GOT32)
7238 continue;
7239
7240 /* xrelease mov %eax, <disp> is another special case. It must not
7241 match the accumulator-only encoding of mov. */
7242 if (i.hle_prefix)
7243 continue;
7244
7245 /* Allow the ModR/M encoding to be requested by using a suitable
7246 {load} or {store} pseudo prefix. */
7247 if (i.dir_encoding == (i.types[0].bitfield.instance == Accum
7248 ? dir_encoding_store
7249 : dir_encoding_load)
7250 && !i.types[0].bitfield.disp64
7251 && !i.types[1].bitfield.disp64)
7252 continue;
7253 }
7254
7255 /* Allow the ModR/M encoding to be requested by using the {load} or
7256 {store} pseudo prefix on an applicable insn. */
7257 if (!t->opcode_modifier.modrm
7258 && i.reg_operands == 1
7259 && i.imm_operands == 1
7260 && (i.dir_encoding == dir_encoding_load
7261 || i.dir_encoding == dir_encoding_store)
7262 && t->opcode_space == SPACE_BASE)
7263 {
7264 if (t->base_opcode == 0xb0 /* mov $imm, %reg */
7265 && i.dir_encoding == dir_encoding_store)
7266 continue;
7267
7268 if ((t->base_opcode | 0x38) == 0x3c /* <alu> $imm, %acc */
7269 && (t->base_opcode != 0x3c /* cmp $imm, %acc */
7270 || i.dir_encoding == dir_encoding_load))
7271 continue;
7272
7273 if (t->base_opcode == 0xa8 /* test $imm, %acc */
7274 && i.dir_encoding == dir_encoding_load)
7275 continue;
7276 }
7277 /* Fall through. */
7278
7279 case 3:
7280 if (!(size_match & MATCH_STRAIGHT))
7281 goto check_reverse;
7282 /* Reverse direction of operands if swapping is possible in the first
7283 place (operands need to be symmetric) and
7284 - the load form is requested, and the template is a store form,
7285 - the store form is requested, and the template is a load form,
7286 - the non-default (swapped) form is requested. */
7287 overlap1 = operand_type_and (operand_types[0], operand_types[1]);
7288 if (t->opcode_modifier.d && i.reg_operands == i.operands
7289 && !operand_type_all_zero (&overlap1))
7290 switch (i.dir_encoding)
7291 {
7292 case dir_encoding_load:
7293 if (operand_type_check (operand_types[i.operands - 1], anymem)
7294 || t->opcode_modifier.regmem)
7295 goto check_reverse;
7296 break;
7297
7298 case dir_encoding_store:
7299 if (!operand_type_check (operand_types[i.operands - 1], anymem)
7300 && !t->opcode_modifier.regmem)
7301 goto check_reverse;
7302 break;
7303
7304 case dir_encoding_swap:
7305 goto check_reverse;
7306
7307 case dir_encoding_default:
7308 break;
7309 }
7310 /* If we want store form, we skip the current load. */
7311 if ((i.dir_encoding == dir_encoding_store
7312 || i.dir_encoding == dir_encoding_swap)
7313 && i.mem_operands == 0
7314 && t->opcode_modifier.load)
7315 continue;
7316 /* Fall through. */
7317 case 4:
7318 case 5:
7319 overlap1 = operand_type_and (i.types[1], operand_types[1]);
7320 if (!operand_type_match (overlap0, i.types[0])
7321 || !operand_type_match (overlap1, i.types[1])
7322 || ((check_register & 3) == 3
7323 && !operand_type_register_match (i.types[0],
7324 operand_types[0],
7325 i.types[1],
7326 operand_types[1])))
7327 {
7328 specific_error = progress (i.error);
7329
7330 /* Check if other direction is valid ... */
7331 if (!t->opcode_modifier.d)
7332 continue;
7333
7334 check_reverse:
7335 if (!(size_match & MATCH_REVERSE))
7336 continue;
7337 /* Try reversing direction of operands. */
7338 j = is_cpu (t, CpuFMA4)
7339 || is_cpu (t, CpuXOP) ? 1 : i.operands - 1;
7340 overlap0 = operand_type_and (i.types[0], operand_types[j]);
7341 overlap1 = operand_type_and (i.types[j], operand_types[0]);
7342 overlap2 = operand_type_and (i.types[1], operand_types[1]);
7343 gas_assert (t->operands != 3 || !check_register);
7344 if (!operand_type_match (overlap0, i.types[0])
7345 || !operand_type_match (overlap1, i.types[j])
7346 || (t->operands == 3
7347 && !operand_type_match (overlap2, i.types[1]))
7348 || (check_register
7349 && !operand_type_register_match (i.types[0],
7350 operand_types[j],
7351 i.types[j],
7352 operand_types[0])))
7353 {
7354 /* Does not match either direction. */
7355 specific_error = progress (i.error);
7356 continue;
7357 }
7358 /* found_reverse_match holds which variant of D
7359 we've found. */
7360 if (!t->opcode_modifier.d)
7361 found_reverse_match = 0;
7362 else if (operand_types[0].bitfield.tbyte)
7363 {
7364 if (t->opcode_modifier.operandconstraint != UGH)
7365 found_reverse_match = Opcode_FloatD;
7366 else
7367 found_reverse_match = ~0;
7368 /* FSUB{,R} and FDIV{,R} may need a 2nd bit flipped. */
7369 if ((t->extension_opcode & 4)
7370 && (intel_syntax || intel_mnemonic))
7371 found_reverse_match |= Opcode_FloatR;
7372 }
7373 else if (is_cpu (t, CpuFMA4) || is_cpu (t, CpuXOP))
7374 {
7375 found_reverse_match = Opcode_VexW;
7376 goto check_operands_345;
7377 }
7378 else if (t->opcode_space != SPACE_BASE
7379 && (t->opcode_space != SPACE_0F
7380 /* MOV to/from CR/DR/TR, as an exception, follow
7381 the base opcode space encoding model. */
7382 || (t->base_opcode | 7) != 0x27))
7383 found_reverse_match = (t->base_opcode & 0xee) != 0x6e
7384 ? Opcode_ExtD : Opcode_SIMD_IntD;
7385 else if (!t->opcode_modifier.commutative)
7386 found_reverse_match = Opcode_D;
7387 else
7388 found_reverse_match = ~0;
7389 }
7390 else
7391 {
7392 /* Found a forward 2 operand match here. */
7393 check_operands_345:
7394 switch (t->operands)
7395 {
7396 case 5:
7397 overlap4 = operand_type_and (i.types[4], operand_types[4]);
7398 if (!operand_type_match (overlap4, i.types[4])
7399 || !operand_type_register_match (i.types[3],
7400 operand_types[3],
7401 i.types[4],
7402 operand_types[4]))
7403 {
7404 specific_error = progress (i.error);
7405 continue;
7406 }
7407 /* Fall through. */
7408 case 4:
7409 overlap3 = operand_type_and (i.types[3], operand_types[3]);
7410 if (!operand_type_match (overlap3, i.types[3])
7411 || ((check_register & 0xa) == 0xa
7412 && !operand_type_register_match (i.types[1],
7413 operand_types[1],
7414 i.types[3],
7415 operand_types[3]))
7416 || ((check_register & 0xc) == 0xc
7417 && !operand_type_register_match (i.types[2],
7418 operand_types[2],
7419 i.types[3],
7420 operand_types[3])))
7421 {
7422 specific_error = progress (i.error);
7423 continue;
7424 }
7425 /* Fall through. */
7426 case 3:
7427 overlap2 = operand_type_and (i.types[2], operand_types[2]);
7428 if (!operand_type_match (overlap2, i.types[2])
7429 || ((check_register & 5) == 5
7430 && !operand_type_register_match (i.types[0],
7431 operand_types[0],
7432 i.types[2],
7433 operand_types[2]))
7434 || ((check_register & 6) == 6
7435 && !operand_type_register_match (i.types[1],
7436 operand_types[1],
7437 i.types[2],
7438 operand_types[2])))
7439 {
7440 specific_error = progress (i.error);
7441 continue;
7442 }
7443 break;
7444 }
7445 }
7446 /* Found either a forward/reverse 2-, 3-, 4- or 5-operand match here:
7447 slip through to break. */
7448 }
7449
7450 /* Check if VEX/EVEX encoding requirements can be satisfied. */
7451 if (VEX_check_encoding (t))
7452 {
7453 specific_error = progress (i.error);
7454 continue;
7455 }
7456
7457 /* Check if vector operands are valid. */
7458 if (check_VecOperands (t))
7459 {
7460 specific_error = progress (i.error);
7461 continue;
7462 }
7463
7464 /* Check whether to use the shorter VEX encoding for certain insns where
7465 the EVEX encoding comes first in the table. This requires the respective
7466 AVX-* feature to be explicitly enabled. */
7467 if (t == current_templates->start
7468 && t->opcode_modifier.disp8memshift
7469 && !t->opcode_modifier.vex
7470 && !need_evex_encoding ()
7471 && t + 1 < current_templates->end
7472 && t[1].opcode_modifier.vex)
7473 {
7474 i386_cpu_flags cpu;
7475 unsigned int memshift = i.memshift;
7476
7477 i.memshift = 0;
7478 cpu = cpu_flags_and (cpu_flags_from_attr (t[1].cpu), cpu_arch_isa_flags);
7479 if (!cpu_flags_all_zero (&cpu)
7480 && (!i.types[0].bitfield.disp8
7481 || !operand_type_check (i.types[0], disp)
7482 || i.op[0].disps->X_op != O_constant
7483 || fits_in_disp8 (i.op[0].disps->X_add_number)))
7484 {
7485 specific_error = progress (internal_error);
7486 continue;
7487 }
7488 i.memshift = memshift;
7489 }
7490
7491 /* We've found a match; break out of loop. */
7492 break;
7493 }
7494
7495 #undef progress
7496
7497 if (t == current_templates->end)
7498 {
7499 /* We found no match. */
7500 i.error = specific_error;
7501 return NULL;
7502 }
7503
7504 if (!quiet_warnings)
7505 {
7506 if (!intel_syntax
7507 && (i.jumpabsolute != (t->opcode_modifier.jump == JUMP_ABSOLUTE)))
7508 as_warn (_("indirect %s without `*'"), insn_name (t));
7509
7510 if (t->opcode_modifier.isprefix
7511 && t->opcode_modifier.mnemonicsize == IGNORESIZE)
7512 {
7513 /* Warn them that a data or address size prefix doesn't
7514 affect assembly of the next line of code. */
7515 as_warn (_("stand-alone `%s' prefix"), insn_name (t));
7516 }
7517 }
7518
7519 /* Copy the template we found. */
7520 install_template (t);
7521
7522 if (addr_prefix_disp != -1)
7523 i.tm.operand_types[addr_prefix_disp]
7524 = operand_types[addr_prefix_disp];
7525
7526 switch (found_reverse_match)
7527 {
7528 case 0:
7529 break;
7530
7531 case Opcode_FloatR:
7532 case Opcode_FloatR | Opcode_FloatD:
7533 i.tm.extension_opcode ^= Opcode_FloatR >> 3;
7534 found_reverse_match &= Opcode_FloatD;
7535
7536 /* Fall through. */
7537 default:
7538 /* If we found a reverse match we must alter the opcode direction
7539 bit and clear/flip the regmem modifier one. found_reverse_match
7540 holds bits to change (different for int & float insns). */
7541
7542 i.tm.base_opcode ^= found_reverse_match;
7543
7544 /* Certain SIMD insns have their load forms specified in the opcode
7545 table, and hence we need to _set_ RegMem instead of clearing it.
7546 We need to avoid setting the bit though on insns like KMOVW. */
7547 i.tm.opcode_modifier.regmem
7548 = i.tm.opcode_modifier.modrm && i.tm.opcode_modifier.d
7549 && i.tm.operands > 2U - i.tm.opcode_modifier.sse2avx
7550 && !i.tm.opcode_modifier.regmem;
7551
7552 /* Fall through. */
7553 case ~0:
7554 i.tm.operand_types[0] = operand_types[i.operands - 1];
7555 i.tm.operand_types[i.operands - 1] = operand_types[0];
7556 break;
7557
7558 case Opcode_VexW:
7559 /* Only the first two register operands need reversing, alongside
7560 flipping VEX.W. */
7561 i.tm.opcode_modifier.vexw ^= VEXW0 ^ VEXW1;
7562
7563 j = i.tm.operand_types[0].bitfield.imm8;
7564 i.tm.operand_types[j] = operand_types[j + 1];
7565 i.tm.operand_types[j + 1] = operand_types[j];
7566 break;
7567 }
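/* E.g. (illustrative): the opcode table carries the 0x0f28 load form of
 movaps; for "movaps %xmm0, (%eax)" the operands only match in reverse,
 so Opcode_ExtD flips the opcode to the 0x0f29 store form above and the
 two operand types have been swapped to match. */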
7568
7569 return t;
7570 }
7571
7572 static int
7573 check_string (void)
7574 {
7575 unsigned int es_op = i.tm.opcode_modifier.isstring - IS_STRING_ES_OP0;
7576 unsigned int op = i.tm.operand_types[0].bitfield.baseindex ? es_op : 0;
7577
7578 if (i.seg[op] != NULL && i.seg[op] != reg_es)
7579 {
7580 as_bad (_("`%s' operand %u must use `%ses' segment"),
7581 insn_name (&i.tm),
7582 intel_syntax ? i.tm.operands - es_op : es_op + 1,
7583 register_prefix);
7584 return 0;
7585 }
7586
7587 /* There's only ever one segment override allowed per instruction.
7588 This instruction possibly has a legal segment override on the
7589 second operand, so copy the segment to where non-string
7590 instructions store it, allowing common code. */
7591 i.seg[op] = i.seg[1];
7592
7593 return 1;
7594 }
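/* E.g. AT&T "scas %es:(%edi), %eax" passes the check above, while
 "scas %fs:(%edi), %eax" is rejected, since string insns hard-code %es
 for their %edi-based operand (a sketch; explicit-operand forms shown). */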
7595
7596 static int
7597 process_suffix (void)
7598 {
7599 bool is_movx = false;
7600
7601 /* If matched instruction specifies an explicit instruction mnemonic
7602 suffix, use it. */
7603 if (i.tm.opcode_modifier.size == SIZE16)
7604 i.suffix = WORD_MNEM_SUFFIX;
7605 else if (i.tm.opcode_modifier.size == SIZE32)
7606 i.suffix = LONG_MNEM_SUFFIX;
7607 else if (i.tm.opcode_modifier.size == SIZE64)
7608 i.suffix = QWORD_MNEM_SUFFIX;
7609 else if (i.reg_operands
7610 && (i.operands > 1 || i.types[0].bitfield.class == Reg)
7611 && i.tm.opcode_modifier.operandconstraint != ADDR_PREFIX_OP_REG)
7612 {
7613 unsigned int numop = i.operands;
7614
7615 /* MOVSX/MOVZX */
7616 is_movx = (i.tm.opcode_space == SPACE_0F
7617 && (i.tm.base_opcode | 8) == 0xbe)
7618 || (i.tm.opcode_space == SPACE_BASE
7619 && i.tm.base_opcode == 0x63
7620 && is_cpu (&i.tm, Cpu64));
7621
7622 /* movsx/movzx want only their source operand considered here, for the
7623 ambiguity checking below. The suffix will be replaced afterwards
7624 to represent the destination (register). */
7625 if (is_movx && (i.tm.opcode_modifier.w || i.tm.base_opcode == 0x63))
7626 --i.operands;
7627
7628 /* crc32 needs REX.W set regardless of suffix / source operand size. */
7629 if (i.tm.mnem_off == MN_crc32 && i.tm.operand_types[1].bitfield.qword)
7630 i.rex |= REX_W;
7631
7632 /* If there's no instruction mnemonic suffix we try to invent one
7633 based on GPR operands. */
7634 if (!i.suffix)
7635 {
7636 /* We take i.suffix from the last register operand specified. The
7637 destination register type is more significant than the source
7638 register type. crc32 in SSE4.2 prefers source register
7639 type. */
7640 unsigned int op = i.tm.mnem_off == MN_crc32 ? 1 : i.operands;
7641
7642 while (op--)
7643 if (i.tm.operand_types[op].bitfield.instance == InstanceNone
7644 || i.tm.operand_types[op].bitfield.instance == Accum)
7645 {
7646 if (i.types[op].bitfield.class != Reg)
7647 continue;
7648 if (i.types[op].bitfield.byte)
7649 i.suffix = BYTE_MNEM_SUFFIX;
7650 else if (i.types[op].bitfield.word)
7651 i.suffix = WORD_MNEM_SUFFIX;
7652 else if (i.types[op].bitfield.dword)
7653 i.suffix = LONG_MNEM_SUFFIX;
7654 else if (i.types[op].bitfield.qword)
7655 i.suffix = QWORD_MNEM_SUFFIX;
7656 else
7657 continue;
7658 break;
7659 }
7660
7661 /* As an exception, movsx/movzx silently default to a byte source
7662 in AT&T mode. */
7663 if (is_movx && i.tm.opcode_modifier.w && !i.suffix && !intel_syntax)
7664 i.suffix = BYTE_MNEM_SUFFIX;
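/* E.g. plain "movzx (%esi), %eax" is taken as if "movzbl (%esi), %eax"
 had been written (illustrative). */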
7665 }
7666 else if (i.suffix == BYTE_MNEM_SUFFIX)
7667 {
7668 if (!check_byte_reg ())
7669 return 0;
7670 }
7671 else if (i.suffix == LONG_MNEM_SUFFIX)
7672 {
7673 if (!check_long_reg ())
7674 return 0;
7675 }
7676 else if (i.suffix == QWORD_MNEM_SUFFIX)
7677 {
7678 if (!check_qword_reg ())
7679 return 0;
7680 }
7681 else if (i.suffix == WORD_MNEM_SUFFIX)
7682 {
7683 if (!check_word_reg ())
7684 return 0;
7685 }
7686 else if (intel_syntax
7687 && i.tm.opcode_modifier.mnemonicsize == IGNORESIZE)
7688 /* Do nothing if the instruction is going to ignore the prefix. */
7689 ;
7690 else
7691 abort ();
7692
7693 /* Undo the movsx/movzx change done above. */
7694 i.operands = numop;
7695 }
7696 else if (i.tm.opcode_modifier.mnemonicsize == DEFAULTSIZE
7697 && !i.suffix)
7698 {
7699 i.suffix = stackop_size;
7700 if (stackop_size == LONG_MNEM_SUFFIX)
7701 {
7702 /* stackop_size is set to LONG_MNEM_SUFFIX for the
7703 .code16gcc directive to support 16-bit mode with
7704 32-bit address. For IRET without a suffix, generate
7705 16-bit IRET (opcode 0xcf) to return from an interrupt
7706 handler. */
7707 if (i.tm.base_opcode == 0xcf)
7708 {
7709 i.suffix = WORD_MNEM_SUFFIX;
7710 as_warn (_("generating 16-bit `iret' for .code16gcc directive"));
7711 }
7712 /* Warn about changed behavior for segment register push/pop. */
7713 else if ((i.tm.base_opcode | 1) == 0x07)
7714 as_warn (_("generating 32-bit `%s', unlike earlier gas versions"),
7715 insn_name (&i.tm));
7716 }
7717 }
7718 else if (!i.suffix
7719 && (i.tm.opcode_modifier.jump == JUMP_ABSOLUTE
7720 || i.tm.opcode_modifier.jump == JUMP_BYTE
7721 || i.tm.opcode_modifier.jump == JUMP_INTERSEGMENT
7722 || (i.tm.opcode_space == SPACE_0F
7723 && i.tm.base_opcode == 0x01 /* [ls][gi]dt */
7724 && i.tm.extension_opcode <= 3)))
7725 {
7726 switch (flag_code)
7727 {
7728 case CODE_64BIT:
7729 if (!i.tm.opcode_modifier.no_qsuf)
7730 {
7731 if (i.tm.opcode_modifier.jump == JUMP_BYTE
7732 || i.tm.opcode_modifier.no_lsuf)
7733 i.suffix = QWORD_MNEM_SUFFIX;
7734 break;
7735 }
7736 /* Fall through. */
7737 case CODE_32BIT:
7738 if (!i.tm.opcode_modifier.no_lsuf)
7739 i.suffix = LONG_MNEM_SUFFIX;
7740 break;
7741 case CODE_16BIT:
7742 if (!i.tm.opcode_modifier.no_wsuf)
7743 i.suffix = WORD_MNEM_SUFFIX;
7744 break;
7745 }
7746 }
7747
7748 if (!i.suffix
7749 && (i.tm.opcode_modifier.mnemonicsize != DEFAULTSIZE
7750 /* Also cover lret/retf/iret in 64-bit mode. */
7751 || (flag_code == CODE_64BIT
7752 && !i.tm.opcode_modifier.no_lsuf
7753 && !i.tm.opcode_modifier.no_qsuf))
7754 && i.tm.opcode_modifier.mnemonicsize != IGNORESIZE
7755 /* Explicit sizing prefixes are assumed to disambiguate insns. */
7756 && !i.prefix[DATA_PREFIX] && !(i.prefix[REX_PREFIX] & REX_W)
7757 /* Accept FLDENV et al without suffix. */
7758 && (i.tm.opcode_modifier.no_ssuf || i.tm.opcode_modifier.floatmf))
7759 {
7760 unsigned int suffixes, evex = 0;
7761
7762 suffixes = !i.tm.opcode_modifier.no_bsuf;
7763 if (!i.tm.opcode_modifier.no_wsuf)
7764 suffixes |= 1 << 1;
7765 if (!i.tm.opcode_modifier.no_lsuf)
7766 suffixes |= 1 << 2;
7767 if (!i.tm.opcode_modifier.no_ssuf)
7768 suffixes |= 1 << 4;
7769 if (flag_code == CODE_64BIT && !i.tm.opcode_modifier.no_qsuf)
7770 suffixes |= 1 << 5;
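/* At this point the bits of `suffixes' stand for: bit 0 'b',
   bit 1 'w', bit 2 'l', bit 4 's', and bit 5 'q'; bits 6-8 may
   further be set below for XMMWORD/YMMWORD/ZMMWORD memory
   operands.  */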
7771
7772 /* For [XYZ]MMWORD operands inspect operand sizes. While generally
7773 also suitable for AT&T syntax mode, it was requested that this be
7774 restricted to just Intel syntax. */
7775 if (intel_syntax && is_any_vex_encoding (&i.tm)
7776 && !i.broadcast.type && !i.broadcast.bytes)
7777 {
7778 unsigned int op;
7779
7780 for (op = 0; op < i.tm.operands; ++op)
7781 {
7782 if (vector_size < VSZ512)
7783 {
7784 i.tm.operand_types[op].bitfield.zmmword = 0;
7785 if (vector_size < VSZ256)
7786 {
7787 i.tm.operand_types[op].bitfield.ymmword = 0;
7788 if (i.tm.operand_types[op].bitfield.xmmword
7789 && (i.tm.opcode_modifier.evex == EVEXDYN
7790 || (!i.tm.opcode_modifier.evex
7791 && is_evex_encoding (&i.tm))))
7792 i.tm.opcode_modifier.evex = EVEX128;
7793 }
7794 else if (i.tm.operand_types[op].bitfield.ymmword
7795 && !i.tm.operand_types[op].bitfield.xmmword
7796 && (i.tm.opcode_modifier.evex == EVEXDYN
7797 || (!i.tm.opcode_modifier.evex
7798 && is_evex_encoding (&i.tm))))
7799 i.tm.opcode_modifier.evex = EVEX256;
7800 }
7801 else if (is_evex_encoding (&i.tm)
7802 && !cpu_arch_flags.bitfield.cpuavx512vl)
7803 {
7804 if (i.tm.operand_types[op].bitfield.ymmword)
7805 i.tm.operand_types[op].bitfield.xmmword = 0;
7806 if (i.tm.operand_types[op].bitfield.zmmword)
7807 i.tm.operand_types[op].bitfield.ymmword = 0;
7808 if (!i.tm.opcode_modifier.evex
7809 || i.tm.opcode_modifier.evex == EVEXDYN)
7810 i.tm.opcode_modifier.evex = EVEX512;
7811 }
7812
7813 if (i.tm.operand_types[op].bitfield.xmmword
7814 + i.tm.operand_types[op].bitfield.ymmword
7815 + i.tm.operand_types[op].bitfield.zmmword < 2)
7816 continue;
7817
7818 /* Any properly sized operand disambiguates the insn. */
7819 if (i.types[op].bitfield.xmmword
7820 || i.types[op].bitfield.ymmword
7821 || i.types[op].bitfield.zmmword)
7822 {
7823 suffixes &= ~(7 << 6);
7824 evex = 0;
7825 break;
7826 }
7827
7828 if ((i.flags[op] & Operand_Mem)
7829 && i.tm.operand_types[op].bitfield.unspecified)
7830 {
7831 if (i.tm.operand_types[op].bitfield.xmmword)
7832 suffixes |= 1 << 6;
7833 if (i.tm.operand_types[op].bitfield.ymmword)
7834 suffixes |= 1 << 7;
7835 if (i.tm.operand_types[op].bitfield.zmmword)
7836 suffixes |= 1 << 8;
7837 if (is_evex_encoding (&i.tm))
7838 evex = EVEX512;
7839 }
7840 }
7841 }
7842
7843 /* Are multiple suffixes / operand sizes allowed? */
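/* suffixes & (suffixes - 1) is non-zero exactly when more than
   one bit is set, the usual power-of-two test.  */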
7844 if (suffixes & (suffixes - 1))
7845 {
7846 if (intel_syntax
7847 && (i.tm.opcode_modifier.mnemonicsize != DEFAULTSIZE
7848 || operand_check == check_error))
7849 {
7850 as_bad (_("ambiguous operand size for `%s'"), insn_name (&i.tm));
7851 return 0;
7852 }
7853 if (operand_check == check_error)
7854 {
7855 as_bad (_("no instruction mnemonic suffix given and "
7856 "no register operands; can't size `%s'"), insn_name (&i.tm));
7857 return 0;
7858 }
7859 if (operand_check == check_warning)
7860 as_warn (_("%s; using default for `%s'"),
7861 intel_syntax
7862 ? _("ambiguous operand size")
7863 : _("no instruction mnemonic suffix given and "
7864 "no register operands"),
7865 insn_name (&i.tm));
7866
7867 if (i.tm.opcode_modifier.floatmf)
7868 i.suffix = SHORT_MNEM_SUFFIX;
7869 else if (is_movx)
7870 /* handled below */;
7871 else if (evex)
7872 i.tm.opcode_modifier.evex = evex;
7873 else if (flag_code == CODE_16BIT)
7874 i.suffix = WORD_MNEM_SUFFIX;
7875 else if (!i.tm.opcode_modifier.no_lsuf)
7876 i.suffix = LONG_MNEM_SUFFIX;
7877 else
7878 i.suffix = QWORD_MNEM_SUFFIX;
7879 }
7880 }
7881
7882 if (is_movx)
7883 {
7884 /* In Intel syntax, movsx/movzx must have a "suffix" (checked above).
7885 In AT&T syntax, if there is no suffix (warned about above), the default
7886 will be byte extension. */
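/* E.g. setting the W bit turns the byte-source forms 0F B6 (movzx)
   and 0F BE (movsx) into their word-source forms 0F B7 / 0F BF.  */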
7887 if (i.tm.opcode_modifier.w && i.suffix && i.suffix != BYTE_MNEM_SUFFIX)
7888 i.tm.base_opcode |= 1;
7889
7890 /* For further processing, the suffix should represent the destination
7891 (register). This is already the case when one was used with
7892 mov[sz][bw]*, but we need to replace it for mov[sz]x, or if there was
7893 no suffix to begin with. */
7894 if (i.tm.opcode_modifier.w || i.tm.base_opcode == 0x63 || !i.suffix)
7895 {
7896 if (i.types[1].bitfield.word)
7897 i.suffix = WORD_MNEM_SUFFIX;
7898 else if (i.types[1].bitfield.qword)
7899 i.suffix = QWORD_MNEM_SUFFIX;
7900 else
7901 i.suffix = LONG_MNEM_SUFFIX;
7902
7903 i.tm.opcode_modifier.w = 0;
7904 }
7905 }
7906
7907 if (!i.tm.opcode_modifier.modrm && i.reg_operands && i.tm.operands < 3)
7908 i.short_form = (i.tm.operand_types[0].bitfield.class == Reg)
7909 != (i.tm.operand_types[1].bitfield.class == Reg);
7910
7911 /* Change the opcode based on the operand size given by i.suffix. */
7912 switch (i.suffix)
7913 {
7914 /* Size floating point instruction. */
7915 case LONG_MNEM_SUFFIX:
7916 if (i.tm.opcode_modifier.floatmf)
7917 {
7918 i.tm.base_opcode ^= 4;
7919 break;
7920 }
7921 /* fall through */
7922 case WORD_MNEM_SUFFIX:
7923 case QWORD_MNEM_SUFFIX:
7924 /* It's not a byte, select word/dword operation. */
7925 if (i.tm.opcode_modifier.w)
7926 {
7927 if (i.short_form)
7928 i.tm.base_opcode |= 8;
7929 else
7930 i.tm.base_opcode |= 1;
7931 }
7932 /* fall through */
7933 case SHORT_MNEM_SUFFIX:
7934 /* Now select between word & dword operations via the operand
7935 size prefix, except for instructions that will ignore this
7936 prefix anyway. */
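/* E.g. `addw %ax, %bx' in 32-bit code needs the 0x66 data size
   prefix, whereas jcxz/loop get the 0x67 address size prefix, as
   their count register is selected by the address size.  */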
7937 if (i.suffix != QWORD_MNEM_SUFFIX
7938 && i.tm.opcode_modifier.mnemonicsize != IGNORESIZE
7939 && !i.tm.opcode_modifier.floatmf
7940 && !is_any_vex_encoding (&i.tm)
7941 && ((i.suffix == LONG_MNEM_SUFFIX) == (flag_code == CODE_16BIT)
7942 || (flag_code == CODE_64BIT
7943 && i.tm.opcode_modifier.jump == JUMP_BYTE)))
7944 {
7945 unsigned int prefix = DATA_PREFIX_OPCODE;
7946
7947 if (i.tm.opcode_modifier.jump == JUMP_BYTE) /* jcxz, loop */
7948 prefix = ADDR_PREFIX_OPCODE;
7949
7950 if (!add_prefix (prefix))
7951 return 0;
7952 }
7953
7954 /* Set REX.W for a 64-bit operand.  */
7955 if (i.suffix == QWORD_MNEM_SUFFIX
7956 && flag_code == CODE_64BIT
7957 && !i.tm.opcode_modifier.norex64
7958 && !i.tm.opcode_modifier.vexw
7959 /* Special case for xchg %rax,%rax.  It is a NOP and doesn't
7960 need rex64.  */
7961 && ! (i.operands == 2
7962 && i.tm.base_opcode == 0x90
7963 && i.tm.opcode_space == SPACE_BASE
7964 && i.types[0].bitfield.instance == Accum
7965 && i.types[0].bitfield.qword
7966 && i.types[1].bitfield.instance == Accum))
7967 i.rex |= REX_W;
7968
7969 break;
7970
7971 case 0:
7972 /* Select word/dword/qword operation with explicit data sizing prefix
7973 when there are no suitable register operands. */
7974 if (i.tm.opcode_modifier.w
7975 && (i.prefix[DATA_PREFIX] || (i.prefix[REX_PREFIX] & REX_W))
7976 && (!i.reg_operands
7977 || (i.reg_operands == 1
7978 /* ShiftCount */
7979 && (i.tm.operand_types[0].bitfield.instance == RegC
7980 /* InOutPortReg */
7981 || i.tm.operand_types[0].bitfield.instance == RegD
7982 || i.tm.operand_types[1].bitfield.instance == RegD
7983 || i.tm.mnem_off == MN_crc32))))
7984 i.tm.base_opcode |= 1;
7985 break;
7986 }
7987
7988 if (i.tm.opcode_modifier.operandconstraint == ADDR_PREFIX_OP_REG)
7989 {
7990 gas_assert (!i.suffix);
7991 gas_assert (i.reg_operands);
7992
7993 if (i.tm.operand_types[0].bitfield.instance == Accum
7994 || i.operands == 1)
7995 {
7996 /* The address size override prefix changes the size of the
7997 first operand. */
7998 if (flag_code == CODE_64BIT
7999 && i.op[0].regs->reg_type.bitfield.word)
8000 {
8001 as_bad (_("16-bit addressing unavailable for `%s'"),
8002 insn_name (&i.tm));
8003 return 0;
8004 }
8005
8006 if ((flag_code == CODE_32BIT
8007 ? i.op[0].regs->reg_type.bitfield.word
8008 : i.op[0].regs->reg_type.bitfield.dword)
8009 && !add_prefix (ADDR_PREFIX_OPCODE))
8010 return 0;
8011 }
8012 else
8013 {
8014 /* Check for an invalid register operand when the address size
8015 override prefix changes the size of register operands.  */
8016 unsigned int op;
8017 enum { need_word, need_dword, need_qword } need;
8018
8019 /* Check the register operand for the address size prefix when
8020 the memory operand has no real registers, i.e. a bare symbol, a
8021 plain DISP, or a bogus (x32-only) symbol(%rip) when symbol(%eip) is meant.  */
8022 if (i.mem_operands == 1
8023 && i.reg_operands == 1
8024 && i.operands == 2
8025 && i.types[1].bitfield.class == Reg
8026 && (flag_code == CODE_32BIT
8027 ? i.op[1].regs->reg_type.bitfield.word
8028 : i.op[1].regs->reg_type.bitfield.dword)
8029 && ((i.base_reg == NULL && i.index_reg == NULL)
8030 #if defined (OBJ_MAYBE_ELF) || defined (OBJ_ELF)
8031 || (x86_elf_abi == X86_64_X32_ABI
8032 && i.base_reg
8033 && i.base_reg->reg_num == RegIP
8034 && i.base_reg->reg_type.bitfield.qword))
8035 #else
8036 || 0)
8037 #endif
8038 && !add_prefix (ADDR_PREFIX_OPCODE))
8039 return 0;
8040
8041 if (flag_code == CODE_32BIT)
8042 need = i.prefix[ADDR_PREFIX] ? need_word : need_dword;
8043 else if (i.prefix[ADDR_PREFIX])
8044 need = need_dword;
8045 else
8046 need = flag_code == CODE_64BIT ? need_qword : need_word;
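/* In other words: the register size has to match the effective
   address size, i.e. the mode's default address size unless an
   0x67 prefix flips it (16 <-> 32 outside of 64-bit mode,
   64 -> 32 in 64-bit mode).  */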
8047
8048 for (op = 0; op < i.operands; op++)
8049 {
8050 if (i.types[op].bitfield.class != Reg)
8051 continue;
8052
8053 switch (need)
8054 {
8055 case need_word:
8056 if (i.op[op].regs->reg_type.bitfield.word)
8057 continue;
8058 break;
8059 case need_dword:
8060 if (i.op[op].regs->reg_type.bitfield.dword)
8061 continue;
8062 break;
8063 case need_qword:
8064 if (i.op[op].regs->reg_type.bitfield.qword)
8065 continue;
8066 break;
8067 }
8068
8069 as_bad (_("invalid register operand size for `%s'"),
8070 insn_name (&i.tm));
8071 return 0;
8072 }
8073 }
8074 }
8075
8076 return 1;
8077 }
8078
8079 static int
8080 check_byte_reg (void)
8081 {
8082 int op;
8083
8084 for (op = i.operands; --op >= 0;)
8085 {
8086 /* Skip non-register operands. */
8087 if (i.types[op].bitfield.class != Reg)
8088 continue;
8089
8090 /* If this is an eight bit register, it's OK.  Any larger
8091 general register is rejected below, unless it falls under one
8092 of the exceptions that follow.  */
8093 if (i.types[op].bitfield.byte)
8094 continue;
8095
8096 /* I/O port address operands are OK too. */
8097 if (i.tm.operand_types[op].bitfield.instance == RegD
8098 && i.tm.operand_types[op].bitfield.word)
8099 continue;
8100
8101 /* crc32 only wants its source operand checked here. */
8102 if (i.tm.mnem_off == MN_crc32 && op != 0)
8103 continue;
8104
8105 /* Any other register is bad. */
8106 as_bad (_("`%s%s' not allowed with `%s%c'"),
8107 register_prefix, i.op[op].regs->reg_name,
8108 insn_name (&i.tm), i.suffix);
8109 return 0;
8110 }
8111 return 1;
8112 }
8113
8114 static int
8115 check_long_reg (void)
8116 {
8117 int op;
8118
8119 for (op = i.operands; --op >= 0;)
8120 /* Skip non-register operands. */
8121 if (i.types[op].bitfield.class != Reg)
8122 continue;
8123 /* Reject eight bit registers, except where the template requires
8124 them.  (e.g. movzb)  */
8125 else if (i.types[op].bitfield.byte
8126 && (i.tm.operand_types[op].bitfield.class == Reg
8127 || i.tm.operand_types[op].bitfield.instance == Accum)
8128 && (i.tm.operand_types[op].bitfield.word
8129 || i.tm.operand_types[op].bitfield.dword))
8130 {
8131 as_bad (_("`%s%s' not allowed with `%s%c'"),
8132 register_prefix,
8133 i.op[op].regs->reg_name,
8134 insn_name (&i.tm),
8135 i.suffix);
8136 return 0;
8137 }
8138 /* Error if the e prefix on a general reg is missing. */
8139 else if (i.types[op].bitfield.word
8140 && (i.tm.operand_types[op].bitfield.class == Reg
8141 || i.tm.operand_types[op].bitfield.instance == Accum)
8142 && i.tm.operand_types[op].bitfield.dword)
8143 {
8144 as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
8145 register_prefix, i.op[op].regs->reg_name,
8146 i.suffix);
8147 return 0;
8148 }
8149 /* Error if the r prefix on a general reg is present.  */
8150 else if (i.types[op].bitfield.qword
8151 && (i.tm.operand_types[op].bitfield.class == Reg
8152 || i.tm.operand_types[op].bitfield.instance == Accum)
8153 && i.tm.operand_types[op].bitfield.dword)
8154 {
8155 as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
8156 register_prefix, i.op[op].regs->reg_name, i.suffix);
8157 return 0;
8158 }
8159 return 1;
8160 }
8161
8162 static int
8163 check_qword_reg (void)
8164 {
8165 int op;
8166
8167 for (op = i.operands; --op >= 0; )
8168 /* Skip non-register operands. */
8169 if (i.types[op].bitfield.class != Reg)
8170 continue;
8171 /* Reject eight bit registers, except where the template requires
8172 them.  (e.g. movzb)  */
8173 else if (i.types[op].bitfield.byte
8174 && (i.tm.operand_types[op].bitfield.class == Reg
8175 || i.tm.operand_types[op].bitfield.instance == Accum)
8176 && (i.tm.operand_types[op].bitfield.word
8177 || i.tm.operand_types[op].bitfield.dword))
8178 {
8179 as_bad (_("`%s%s' not allowed with `%s%c'"),
8180 register_prefix,
8181 i.op[op].regs->reg_name,
8182 insn_name (&i.tm),
8183 i.suffix);
8184 return 0;
8185 }
8186 /* Error if the r prefix on a general reg is missing.  */
8187 else if ((i.types[op].bitfield.word
8188 || i.types[op].bitfield.dword)
8189 && (i.tm.operand_types[op].bitfield.class == Reg
8190 || i.tm.operand_types[op].bitfield.instance == Accum)
8191 && i.tm.operand_types[op].bitfield.qword)
8192 {
8193 /* Prohibit these changes in 64-bit mode, since the lowering
8194 is more complicated.  */
8195 as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
8196 register_prefix, i.op[op].regs->reg_name, i.suffix);
8197 return 0;
8198 }
8199 return 1;
8200 }
8201
8202 static int
8203 check_word_reg (void)
8204 {
8205 int op;
8206 for (op = i.operands; --op >= 0;)
8207 /* Skip non-register operands. */
8208 if (i.types[op].bitfield.class != Reg)
8209 continue;
8210 /* Reject eight bit registers, except where the template requires
8211 them.  (e.g. movzb)  */
8212 else if (i.types[op].bitfield.byte
8213 && (i.tm.operand_types[op].bitfield.class == Reg
8214 || i.tm.operand_types[op].bitfield.instance == Accum)
8215 && (i.tm.operand_types[op].bitfield.word
8216 || i.tm.operand_types[op].bitfield.dword))
8217 {
8218 as_bad (_("`%s%s' not allowed with `%s%c'"),
8219 register_prefix,
8220 i.op[op].regs->reg_name,
8221 insn_name (&i.tm),
8222 i.suffix);
8223 return 0;
8224 }
8225 /* Error if the e or r prefix on a general reg is present. */
8226 else if ((i.types[op].bitfield.dword
8227 || i.types[op].bitfield.qword)
8228 && (i.tm.operand_types[op].bitfield.class == Reg
8229 || i.tm.operand_types[op].bitfield.instance == Accum)
8230 && i.tm.operand_types[op].bitfield.word)
8231 {
8232 as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
8233 register_prefix, i.op[op].regs->reg_name,
8234 i.suffix);
8235 return 0;
8236 }
8237 return 1;
8238 }
8239
8240 static int
8241 update_imm (unsigned int j)
8242 {
8243 i386_operand_type overlap = i.types[j];
8244
8245 if (i.tm.operand_types[j].bitfield.imm8
8246 && i.tm.operand_types[j].bitfield.imm8s
8247 && overlap.bitfield.imm8 && overlap.bitfield.imm8s)
8248 {
8249 /* This combination is used on 8-bit immediates where e.g. $~0 is
8250 desirable to permit. We're past operand type matching, so simply
8251 put things back in the shape they were before introducing the
8252 distinction between Imm8, Imm8S, and Imm8|Imm8S. */
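/* E.g. AT&T `orb $~0, %al': as -1 the operand matches Imm8S, and
   as 0xff it matches Imm8, so both bits can be set at this point.  */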
8253 overlap.bitfield.imm8s = 0;
8254 }
8255
8256 if (overlap.bitfield.imm8
8257 + overlap.bitfield.imm8s
8258 + overlap.bitfield.imm16
8259 + overlap.bitfield.imm32
8260 + overlap.bitfield.imm32s
8261 + overlap.bitfield.imm64 > 1)
8262 {
8263 static const i386_operand_type imm16 = { .bitfield = { .imm16 = 1 } };
8264 static const i386_operand_type imm32 = { .bitfield = { .imm32 = 1 } };
8265 static const i386_operand_type imm32s = { .bitfield = { .imm32s = 1 } };
8266 static const i386_operand_type imm16_32 = { .bitfield =
8267 { .imm16 = 1, .imm32 = 1 }
8268 };
8269 static const i386_operand_type imm16_32s = { .bitfield =
8270 { .imm16 = 1, .imm32s = 1 }
8271 };
8272 static const i386_operand_type imm16_32_32s = { .bitfield =
8273 { .imm16 = 1, .imm32 = 1, .imm32s = 1 }
8274 };
8275
8276 if (i.suffix)
8277 {
8278 i386_operand_type temp;
8279
8280 operand_type_set (&temp, 0);
8281 if (i.suffix == BYTE_MNEM_SUFFIX)
8282 {
8283 temp.bitfield.imm8 = overlap.bitfield.imm8;
8284 temp.bitfield.imm8s = overlap.bitfield.imm8s;
8285 }
8286 else if (i.suffix == WORD_MNEM_SUFFIX)
8287 temp.bitfield.imm16 = overlap.bitfield.imm16;
8288 else if (i.suffix == QWORD_MNEM_SUFFIX)
8289 {
8290 temp.bitfield.imm64 = overlap.bitfield.imm64;
8291 temp.bitfield.imm32s = overlap.bitfield.imm32s;
8292 }
8293 else
8294 temp.bitfield.imm32 = overlap.bitfield.imm32;
8295 overlap = temp;
8296 }
8297 else if (operand_type_equal (&overlap, &imm16_32_32s)
8298 || operand_type_equal (&overlap, &imm16_32)
8299 || operand_type_equal (&overlap, &imm16_32s))
8300 {
8301 if ((flag_code == CODE_16BIT)
8302 ^ (i.prefix[DATA_PREFIX] != 0 && !(i.prefix[REX_PREFIX] & REX_W)))
8303 overlap = imm16;
8304 else
8305 overlap = imm32s;
8306 }
8307 else if (i.prefix[REX_PREFIX] & REX_W)
8308 overlap = operand_type_and (overlap, imm32s);
8309 else if (i.prefix[DATA_PREFIX])
8310 overlap = operand_type_and (overlap,
8311 flag_code != CODE_16BIT ? imm16 : imm32);
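/* For illustration: given no suffix and an operand matching
   Imm16|Imm32S, 32-bit code without a data size prefix narrows the
   type to Imm32S above, while 16-bit code narrows it to Imm16.  */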
8312 if (overlap.bitfield.imm8
8313 + overlap.bitfield.imm8s
8314 + overlap.bitfield.imm16
8315 + overlap.bitfield.imm32
8316 + overlap.bitfield.imm32s
8317 + overlap.bitfield.imm64 != 1)
8318 {
8319 as_bad (_("no instruction mnemonic suffix given; "
8320 "can't determine immediate size"));
8321 return 0;
8322 }
8323 }
8324 i.types[j] = overlap;
8325
8326 return 1;
8327 }
8328
8329 static int
8330 finalize_imm (void)
8331 {
8332 unsigned int j, n;
8333
8334 /* Update the first 2 immediate operands. */
8335 n = i.operands > 2 ? 2 : i.operands;
8336 if (n)
8337 {
8338 for (j = 0; j < n; j++)
8339 if (update_imm (j) == 0)
8340 return 0;
8341
8342 /* The 3rd operand can't be an immediate operand.  */
8343 gas_assert (operand_type_check (i.types[2], imm) == 0);
8344 }
8345
8346 return 1;
8347 }
8348
8349 static INLINE void set_rex_vrex (const reg_entry *r, unsigned int rex_bit,
8350 bool do_sse2avx)
8351 {
8352 if (r->reg_flags & RegRex)
8353 {
8354 if (i.rex & rex_bit)
8355 as_bad (_("same type of prefix used twice"));
8356 i.rex |= rex_bit;
8357 }
8358 else if (do_sse2avx && (i.rex & rex_bit) && i.vex.register_specifier)
8359 {
8360 gas_assert (i.vex.register_specifier == r);
8361 i.vex.register_specifier += 8;
8362 }
8363
8364 if (r->reg_flags & RegVRex)
8365 i.vrex |= rex_bit;
8366 }
8367
8368 static int
8369 process_operands (void)
8370 {
8371 /* Default segment register this instruction will use for memory
8372 accesses. 0 means unknown. This is only for optimizing out
8373 unnecessary segment overrides. */
8374 const reg_entry *default_seg = NULL;
8375
8376 /* We only need to check those implicit registers for instructions
8377 with 3 operands or less. */
8378 if (i.operands <= 3)
8379 for (unsigned int j = 0; j < i.operands; j++)
8380 if (i.types[j].bitfield.instance != InstanceNone)
8381 i.reg_operands--;
8382
8383 if (i.tm.opcode_modifier.sse2avx)
8384 {
8385 /* Legacy encoded insns allow explicit REX prefixes, so these prefixes
8386 need converting. */
8387 i.rex |= i.prefix[REX_PREFIX] & (REX_W | REX_R | REX_X | REX_B);
8388 i.prefix[REX_PREFIX] = 0;
8389 i.rex_encoding = 0;
8390 }
8391 /* ImmExt should be processed after SSE2AVX. */
8392 else if (i.tm.opcode_modifier.immext)
8393 process_immext ();
8394
8395 /* TILEZERO is unusual in that it has a single operand encoded in ModR/M.reg,
8396 not ModR/M.rm. To avoid special casing this in build_modrm_byte(), fake a
8397 new destination operand here, while converting the source one to register
8398 number 0. */
8399 if (i.tm.mnem_off == MN_tilezero)
8400 {
8401 i.op[1].regs = i.op[0].regs;
8402 i.op[0].regs -= i.op[0].regs->reg_num;
8403 i.types[1] = i.types[0];
8404 i.tm.operand_types[1] = i.tm.operand_types[0];
8405 i.flags[1] = i.flags[0];
8406 i.operands++;
8407 i.reg_operands++;
8408 i.tm.operands++;
8409 }
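/* E.g. `tilezero %tmm3' is thus processed as if it had two operands,
   with 3 going into ModR/M.reg and register number 0 into ModR/M.rm.  */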
8410
8411 if (i.tm.opcode_modifier.sse2avx && i.tm.opcode_modifier.vexvvvv)
8412 {
8413 static const i386_operand_type regxmm = {
8414 .bitfield = { .class = RegSIMD, .xmmword = 1 }
8415 };
8416 unsigned int dupl = i.operands;
8417 unsigned int dest = dupl - 1;
8418 unsigned int j;
8419
8420 /* The destination must be an xmm register. */
8421 gas_assert (i.reg_operands
8422 && MAX_OPERANDS > dupl
8423 && operand_type_equal (&i.types[dest], &regxmm));
8424
8425 if (i.tm.operand_types[0].bitfield.instance == Accum
8426 && i.tm.operand_types[0].bitfield.xmmword)
8427 {
8428 /* Keep xmm0 for instructions with VEX prefix and 3
8429 sources. */
8430 i.tm.operand_types[0].bitfield.instance = InstanceNone;
8431 i.tm.operand_types[0].bitfield.class = RegSIMD;
8432 i.reg_operands++;
8433 goto duplicate;
8434 }
8435
8436 if (i.tm.opcode_modifier.operandconstraint == IMPLICIT_1ST_XMM0)
8437 {
8438 gas_assert ((MAX_OPERANDS - 1) > dupl);
8439
8440 /* Add the implicit xmm0 for instructions with VEX prefix
8441 and 3 sources. */
8442 for (j = i.operands; j > 0; j--)
8443 {
8444 i.op[j] = i.op[j - 1];
8445 i.types[j] = i.types[j - 1];
8446 i.tm.operand_types[j] = i.tm.operand_types[j - 1];
8447 i.flags[j] = i.flags[j - 1];
8448 }
8449 i.op[0].regs
8450 = (const reg_entry *) str_hash_find (reg_hash, "xmm0");
8451 i.types[0] = regxmm;
8452 i.tm.operand_types[0] = regxmm;
8453
8454 i.operands += 2;
8455 i.reg_operands += 2;
8456 i.tm.operands += 2;
8457
8458 dupl++;
8459 dest++;
8460 i.op[dupl] = i.op[dest];
8461 i.types[dupl] = i.types[dest];
8462 i.tm.operand_types[dupl] = i.tm.operand_types[dest];
8463 i.flags[dupl] = i.flags[dest];
8464 }
8465 else
8466 {
8467 duplicate:
8468 i.operands++;
8469 i.reg_operands++;
8470 i.tm.operands++;
8471
8472 i.op[dupl] = i.op[dest];
8473 i.types[dupl] = i.types[dest];
8474 i.tm.operand_types[dupl] = i.tm.operand_types[dest];
8475 i.flags[dupl] = i.flags[dest];
8476 }
8477
8478 if (i.tm.opcode_modifier.immext)
8479 process_immext ();
8480 }
8481 else if (i.tm.operand_types[0].bitfield.instance == Accum
8482 && i.tm.opcode_modifier.modrm)
8483 {
8484 unsigned int j;
8485
8486 for (j = 1; j < i.operands; j++)
8487 {
8488 i.op[j - 1] = i.op[j];
8489 i.types[j - 1] = i.types[j];
8490
8491 /* We need to adjust fields in i.tm since they are used by
8492 build_modrm_byte. */
8493 i.tm.operand_types [j - 1] = i.tm.operand_types [j];
8494
8495 i.flags[j - 1] = i.flags[j];
8496 }
8497
8498 /* No adjustment to i.reg_operands: This was already done at the top
8499 of the function. */
8500 i.operands--;
8501 i.tm.operands--;
8502 }
8503 else if (i.tm.opcode_modifier.operandconstraint == IMPLICIT_QUAD_GROUP)
8504 {
8505 unsigned int regnum, first_reg_in_group, last_reg_in_group;
8506
8507 /* The second operand must be {x,y,z}mmN, where N is a multiple of 4. */
8508 gas_assert (i.operands >= 2 && i.types[1].bitfield.class == RegSIMD);
8509 regnum = register_number (i.op[1].regs);
8510 first_reg_in_group = regnum & ~3;
8511 last_reg_in_group = first_reg_in_group + 3;
8512 if (regnum != first_reg_in_group)
8513 as_warn (_("source register `%s%s' implicitly denotes"
8514 " `%s%.3s%u' to `%s%.3s%u' source group in `%s'"),
8515 register_prefix, i.op[1].regs->reg_name,
8516 register_prefix, i.op[1].regs->reg_name, first_reg_in_group,
8517 register_prefix, i.op[1].regs->reg_name, last_reg_in_group,
8518 insn_name (&i.tm));
8519 }
8520 else if (i.tm.opcode_modifier.operandconstraint == REG_KLUDGE)
8521 {
8522 /* The imul $imm, %reg instruction is converted into
8523 imul $imm, %reg, %reg, and the clr %reg instruction
8524 is converted into xor %reg, %reg. */
8525
8526 unsigned int first_reg_op;
8527
8528 if (operand_type_check (i.types[0], reg))
8529 first_reg_op = 0;
8530 else
8531 first_reg_op = 1;
8532 /* Pretend we saw the extra register operand. */
8533 gas_assert (i.reg_operands == 1
8534 && i.op[first_reg_op + 1].regs == 0);
8535 i.op[first_reg_op + 1].regs = i.op[first_reg_op].regs;
8536 i.types[first_reg_op + 1] = i.types[first_reg_op];
8537 i.operands++;
8538 i.reg_operands++;
8539 }
8540
8541 if (i.tm.opcode_modifier.modrm)
8542 {
8543 /* The opcode is completed (modulo i.tm.extension_opcode which
8544 must be put into the ModR/M byte).  Now, we build the ModR/M
8545 and SIB bytes based on all the info we've collected.  */
8546
8547 default_seg = build_modrm_byte ();
8548
8549 if (!quiet_warnings && i.tm.opcode_modifier.operandconstraint == UGH)
8550 {
8551 /* Warn about some common errors, but press on regardless. */
8552 if (i.operands == 2)
8553 {
8554 /* Reversed arguments on faddp or fmulp. */
8555 as_warn (_("translating to `%s %s%s,%s%s'"), insn_name (&i.tm),
8556 register_prefix, i.op[!intel_syntax].regs->reg_name,
8557 register_prefix, i.op[intel_syntax].regs->reg_name);
8558 }
8559 else if (i.tm.opcode_modifier.mnemonicsize == IGNORESIZE)
8560 {
8561 /* Extraneous `l' suffix on fp insn. */
8562 as_warn (_("translating to `%s %s%s'"), insn_name (&i.tm),
8563 register_prefix, i.op[0].regs->reg_name);
8564 }
8565 }
8566 }
8567 else if (i.types[0].bitfield.class == SReg && !dot_insn ())
8568 {
8569 if (flag_code != CODE_64BIT
8570 ? i.tm.base_opcode == POP_SEG_SHORT
8571 && i.op[0].regs->reg_num == 1
8572 : (i.tm.base_opcode | 1) == (POP_SEG386_SHORT & 0xff)
8573 && i.op[0].regs->reg_num < 4)
8574 {
8575 as_bad (_("you can't `%s %s%s'"),
8576 insn_name (&i.tm), register_prefix, i.op[0].regs->reg_name);
8577 return 0;
8578 }
8579 if (i.op[0].regs->reg_num > 3
8580 && i.tm.opcode_space == SPACE_BASE )
8581 {
8582 i.tm.base_opcode ^= (POP_SEG_SHORT ^ POP_SEG386_SHORT) & 0xff;
8583 i.tm.opcode_space = SPACE_0F;
8584 }
8585 i.tm.base_opcode |= (i.op[0].regs->reg_num << 3);
8586 }
8587 else if (i.tm.opcode_space == SPACE_BASE
8588 && (i.tm.base_opcode & ~3) == MOV_AX_DISP32)
8589 {
8590 default_seg = reg_ds;
8591 }
8592 else if (i.tm.opcode_modifier.isstring)
8593 {
8594 /* For the string instructions that allow a segment override
8595 on one of their operands, the default segment is ds. */
8596 default_seg = reg_ds;
8597 }
8598 else if (i.short_form)
8599 {
8600 /* The register operand is in the 1st or 2nd non-immediate operand. */
8601 const reg_entry *r = i.op[i.imm_operands].regs;
8602
8603 if (!dot_insn ()
8604 && r->reg_type.bitfield.instance == Accum
8605 && i.op[i.imm_operands + 1].regs)
8606 r = i.op[i.imm_operands + 1].regs;
8607 /* Register goes in low 3 bits of opcode. */
8608 i.tm.base_opcode |= r->reg_num;
8609 set_rex_vrex (r, REX_B, false);
8610
8611 if (dot_insn () && i.reg_operands == 2)
8612 {
8613 gas_assert (is_any_vex_encoding (&i.tm)
8614 || i.vec_encoding != vex_encoding_default);
8615 i.vex.register_specifier = i.op[i.operands - 1].regs;
8616 }
8617 }
8618 else if (i.reg_operands == 1
8619 && !i.flags[i.operands - 1]
8620 && i.tm.operand_types[i.operands - 1].bitfield.instance
8621 == InstanceNone)
8622 {
8623 gas_assert (is_any_vex_encoding (&i.tm)
8624 || i.vec_encoding != vex_encoding_default);
8625 i.vex.register_specifier = i.op[i.operands - 1].regs;
8626 }
8627
8628 if ((i.seg[0] || i.prefix[SEG_PREFIX])
8629 && i.tm.mnem_off == MN_lea)
8630 {
8631 if (!quiet_warnings)
8632 as_warn (_("segment override on `%s' is ineffectual"), insn_name (&i.tm));
8633 if (optimize && !i.no_optimize)
8634 {
8635 i.seg[0] = NULL;
8636 i.prefix[SEG_PREFIX] = 0;
8637 }
8638 }
8639
8640 /* If a segment was explicitly specified, and the specified segment
8641 is neither the default nor the one already recorded from a prefix,
8642 use an opcode prefix to select it. If we never figured out what
8643 the default segment is, then default_seg will be zero at this
8644 point, and the specified segment prefix will always be used. */
8645 if (i.seg[0]
8646 && i.seg[0] != default_seg
8647 && i386_seg_prefixes[i.seg[0]->reg_num] != i.prefix[SEG_PREFIX])
8648 {
8649 if (!add_prefix (i386_seg_prefixes[i.seg[0]->reg_num]))
8650 return 0;
8651 }
8652 return 1;
8653 }
8654
8655 static const reg_entry *
8656 build_modrm_byte (void)
8657 {
8658 const reg_entry *default_seg = NULL;
8659 unsigned int source = i.imm_operands - i.tm.opcode_modifier.immext
8660 /* Compensate for kludge in md_assemble(). */
8661 + i.tm.operand_types[0].bitfield.imm1;
8662 unsigned int dest = i.operands - 1 - i.tm.opcode_modifier.immext;
8663 unsigned int v, op, reg_slot = ~0;
8664
8665 /* Accumulator (in particular %st), shift count (%cl), and the like
8666 need to be skipped just like immediate operands do.  */
8667 if (i.tm.operand_types[source].bitfield.instance)
8668 ++source;
8669 while (i.tm.operand_types[dest].bitfield.instance)
8670 --dest;
8671
8672 for (op = source; op < i.operands; ++op)
8673 if (i.tm.operand_types[op].bitfield.baseindex)
8674 break;
8675
8676 if (i.reg_operands + i.mem_operands + (i.tm.extension_opcode != None) == 4)
8677 {
8678 expressionS *exp;
8679
8680 /* There are 3 kinds of instructions:
8681 1. 5 operands: 4 register operands or 3 register operands
8682 plus 1 memory operand plus one Imm4 operand, VexXDS, and
8683 VexW0 or VexW1.  The destination must be either an XMM, YMM or
8684 ZMM register.
8685 2. 4 operands: 4 register operands or 3 register operands
8686 plus 1 memory operand, with VexXDS.
8687 3. Other equivalent combinations when coming from s_insn ().  */
8688 gas_assert (i.tm.opcode_modifier.vexvvvv
8689 && i.tm.opcode_modifier.vexw);
8690 gas_assert (dot_insn ()
8691 || i.tm.operand_types[dest].bitfield.class == RegSIMD);
8692
8693 /* Of the first two non-immediate operands, the one whose template
8694 doesn't allow a memory operand is encoded in the immediate operand.  */
8695 if (source == op)
8696 reg_slot = source + 1;
8697 else
8698 reg_slot = source++;
8699
8700 if (!dot_insn ())
8701 {
8702 gas_assert (i.tm.operand_types[reg_slot].bitfield.class == RegSIMD);
8703 gas_assert (!(i.op[reg_slot].regs->reg_flags & RegVRex));
8704 }
8705 else
8706 gas_assert (i.tm.operand_types[reg_slot].bitfield.class != ClassNone);
8707
8708 if (i.imm_operands == 0)
8709 {
8710 /* When there is no immediate operand, generate an 8bit
8711 immediate operand to encode the first operand. */
8712 exp = &im_expressions[i.imm_operands++];
8713 i.op[i.operands].imms = exp;
8714 i.types[i.operands].bitfield.imm8 = 1;
8715 i.operands++;
8716
8717 exp->X_op = O_constant;
8718 }
8719 else
8720 {
8721 gas_assert (i.imm_operands == 1);
8722 gas_assert (fits_in_imm4 (i.op[0].imms->X_add_number));
8723 gas_assert (!i.tm.opcode_modifier.immext);
8724
8725 /* Turn on Imm8 again so that output_imm will generate it. */
8726 i.types[0].bitfield.imm8 = 1;
8727
8728 exp = i.op[0].imms;
8729 }
8730 exp->X_add_number |= register_number (i.op[reg_slot].regs)
8731 << (3 + !(is_evex_encoding (&i.tm)
8732 || i.vec_encoding == vex_encoding_evex));
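/* I.e. the extra register number lands in imm8[7:4] for VEX
   encodings; EVEX register numbers can reach 31, so imm8[7:3] is
   used there instead.  */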
8733 }
8734
8735 for (v = source + 1; v < dest; ++v)
8736 if (v != reg_slot)
8737 break;
8738 if (v >= dest)
8739 v = ~0;
8740 if (i.tm.extension_opcode != None)
8741 {
8742 if (dest != source)
8743 v = dest;
8744 dest = ~0;
8745 }
8746 gas_assert (source < dest);
8747 if (i.tm.opcode_modifier.operandconstraint == SWAP_SOURCES
8748 && source != op)
8749 {
8750 unsigned int tmp = source;
8751
8752 source = v;
8753 v = tmp;
8754 }
8755
8756 if (v < MAX_OPERANDS)
8757 {
8758 gas_assert (i.tm.opcode_modifier.vexvvvv);
8759 i.vex.register_specifier = i.op[v].regs;
8760 }
8761
8762 if (op < i.operands)
8763 {
8764 if (i.mem_operands)
8765 {
8766 unsigned int fake_zero_displacement = 0;
8767
8768 gas_assert (i.flags[op] & Operand_Mem);
8769
8770 if (i.tm.opcode_modifier.sib)
8771 {
8772 /* The index register of VSIB shouldn't be RegIZ. */
8773 if (i.tm.opcode_modifier.sib != SIBMEM
8774 && i.index_reg->reg_num == RegIZ)
8775 abort ();
8776
8777 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
8778 if (!i.base_reg)
8779 {
8780 i.sib.base = NO_BASE_REGISTER;
8781 i.sib.scale = i.log2_scale_factor;
8782 i.types[op] = operand_type_and_not (i.types[op], anydisp);
8783 i.types[op].bitfield.disp32 = 1;
8784 }
8785
8786 /* Since the mandatory SIB always has an index register, the
8787 code logic remains unchanged here.  A non-mandatory SIB
8788 without an index register is allowed and will be handled
8789 later.  */
8790 if (i.index_reg)
8791 {
8792 if (i.index_reg->reg_num == RegIZ)
8793 i.sib.index = NO_INDEX_REGISTER;
8794 else
8795 i.sib.index = i.index_reg->reg_num;
8796 set_rex_vrex (i.index_reg, REX_X, false);
8797 }
8798 }
8799
8800 default_seg = reg_ds;
8801
8802 if (i.base_reg == 0)
8803 {
8804 i.rm.mode = 0;
8805 if (!i.disp_operands)
8806 fake_zero_displacement = 1;
8807 if (i.index_reg == 0)
8808 {
8809 /* Both check for VSIB and mandatory non-vector SIB. */
8810 gas_assert (!i.tm.opcode_modifier.sib
8811 || i.tm.opcode_modifier.sib == SIBMEM);
8812 /* Operand is just <disp> */
8813 i.types[op] = operand_type_and_not (i.types[op], anydisp);
8814 if (flag_code == CODE_64BIT)
8815 {
8816 /* In 64-bit mode the short form of 32-bit absolute
8817 addressing is replaced by RIP-relative addressing, so
8818 absolute addressing has to be encoded by one of the
8819 redundant SIB forms.  */
8820 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
8821 i.sib.base = NO_BASE_REGISTER;
8822 i.sib.index = NO_INDEX_REGISTER;
8823 i.types[op].bitfield.disp32 = 1;
8824 }
8825 else if ((flag_code == CODE_16BIT)
8826 ^ (i.prefix[ADDR_PREFIX] != 0))
8827 {
8828 i.rm.regmem = NO_BASE_REGISTER_16;
8829 i.types[op].bitfield.disp16 = 1;
8830 }
8831 else
8832 {
8833 i.rm.regmem = NO_BASE_REGISTER;
8834 i.types[op].bitfield.disp32 = 1;
8835 }
8836 }
8837 else if (!i.tm.opcode_modifier.sib)
8838 {
8839 /* !i.base_reg && i.index_reg */
8840 if (i.index_reg->reg_num == RegIZ)
8841 i.sib.index = NO_INDEX_REGISTER;
8842 else
8843 i.sib.index = i.index_reg->reg_num;
8844 i.sib.base = NO_BASE_REGISTER;
8845 i.sib.scale = i.log2_scale_factor;
8846 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
8847 i.types[op] = operand_type_and_not (i.types[op], anydisp);
8848 i.types[op].bitfield.disp32 = 1;
8849 if ((i.index_reg->reg_flags & RegRex) != 0)
8850 i.rex |= REX_X;
8851 }
8852 }
8853 /* RIP addressing for 64bit mode. */
8854 else if (i.base_reg->reg_num == RegIP)
8855 {
8856 gas_assert (!i.tm.opcode_modifier.sib);
8857 i.rm.regmem = NO_BASE_REGISTER;
8858 i.types[op].bitfield.disp8 = 0;
8859 i.types[op].bitfield.disp16 = 0;
8860 i.types[op].bitfield.disp32 = 1;
8861 i.types[op].bitfield.disp64 = 0;
8862 i.flags[op] |= Operand_PCrel;
8863 if (! i.disp_operands)
8864 fake_zero_displacement = 1;
8865 }
8866 else if (i.base_reg->reg_type.bitfield.word)
8867 {
8868 gas_assert (!i.tm.opcode_modifier.sib);
8869 switch (i.base_reg->reg_num)
8870 {
8871 case 3: /* (%bx) */
8872 if (i.index_reg == 0)
8873 i.rm.regmem = 7;
8874 else /* (%bx,%si) -> 0, or (%bx,%di) -> 1 */
8875 i.rm.regmem = i.index_reg->reg_num - 6;
8876 break;
8877 case 5: /* (%bp) */
8878 default_seg = reg_ss;
8879 if (i.index_reg == 0)
8880 {
8881 i.rm.regmem = 6;
8882 if (operand_type_check (i.types[op], disp) == 0)
8883 {
8884 /* fake (%bp) into 0(%bp) */
8885 if (i.disp_encoding == disp_encoding_16bit)
8886 i.types[op].bitfield.disp16 = 1;
8887 else
8888 i.types[op].bitfield.disp8 = 1;
8889 fake_zero_displacement = 1;
8890 }
8891 }
8892 else /* (%bp,%si) -> 2, or (%bp,%di) -> 3 */
8893 i.rm.regmem = i.index_reg->reg_num - 6 + 2;
8894 break;
8895 default: /* (%si) -> 4 or (%di) -> 5 */
8896 i.rm.regmem = i.base_reg->reg_num - 6 + 4;
8897 }
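/* The regmem values used above follow the architectural 16-bit r/m
   table: 0 (%bx,%si), 1 (%bx,%di), 2 (%bp,%si), 3 (%bp,%di),
   4 (%si), 5 (%di), 6 (%bp) (or bare disp16), 7 (%bx).  */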
8898 if (!fake_zero_displacement
8899 && !i.disp_operands
8900 && i.disp_encoding)
8901 {
8902 fake_zero_displacement = 1;
8903 if (i.disp_encoding == disp_encoding_8bit)
8904 i.types[op].bitfield.disp8 = 1;
8905 else
8906 i.types[op].bitfield.disp16 = 1;
8907 }
8908 i.rm.mode = mode_from_disp_size (i.types[op]);
8909 }
8910 else /* i.base_reg and 32/64 bit mode */
8911 {
8912 if (operand_type_check (i.types[op], disp))
8913 {
8914 i.types[op].bitfield.disp16 = 0;
8915 i.types[op].bitfield.disp64 = 0;
8916 i.types[op].bitfield.disp32 = 1;
8917 }
8918
8919 if (!i.tm.opcode_modifier.sib)
8920 i.rm.regmem = i.base_reg->reg_num;
8921 if ((i.base_reg->reg_flags & RegRex) != 0)
8922 i.rex |= REX_B;
8923 i.sib.base = i.base_reg->reg_num;
8924 /* x86-64 ignores REX prefix bit here to avoid decoder
8925 complications. */
8926 if (!(i.base_reg->reg_flags & RegRex)
8927 && (i.base_reg->reg_num == EBP_REG_NUM
8928 || i.base_reg->reg_num == ESP_REG_NUM))
8929 default_seg = reg_ss;
8930 if (i.base_reg->reg_num == 5 && i.disp_operands == 0)
8931 {
8932 fake_zero_displacement = 1;
8933 if (i.disp_encoding == disp_encoding_32bit)
8934 i.types[op].bitfield.disp32 = 1;
8935 else
8936 i.types[op].bitfield.disp8 = 1;
8937 }
8938 i.sib.scale = i.log2_scale_factor;
8939 if (i.index_reg == 0)
8940 {
8941 /* Only check for VSIB. */
8942 gas_assert (i.tm.opcode_modifier.sib != VECSIB128
8943 && i.tm.opcode_modifier.sib != VECSIB256
8944 && i.tm.opcode_modifier.sib != VECSIB512);
8945
8946 /* <disp>(%esp) becomes a two-byte ModR/M with no index
8947 register.  We've already stored the code for %esp
8948 in i.rm.regmem, i.e. ESCAPE_TO_TWO_BYTE_ADDRESSING.
8949 Any base register besides %esp will not use the
8950 extra (SIB) byte.  */
8951 i.sib.index = NO_INDEX_REGISTER;
8952 }
8953 else if (!i.tm.opcode_modifier.sib)
8954 {
8955 if (i.index_reg->reg_num == RegIZ)
8956 i.sib.index = NO_INDEX_REGISTER;
8957 else
8958 i.sib.index = i.index_reg->reg_num;
8959 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
8960 if ((i.index_reg->reg_flags & RegRex) != 0)
8961 i.rex |= REX_X;
8962 }
8963
8964 if (i.disp_operands
8965 && (i.reloc[op] == BFD_RELOC_386_TLS_DESC_CALL
8966 || i.reloc[op] == BFD_RELOC_X86_64_TLSDESC_CALL))
8967 i.rm.mode = 0;
8968 else
8969 {
8970 if (!fake_zero_displacement
8971 && !i.disp_operands
8972 && i.disp_encoding)
8973 {
8974 fake_zero_displacement = 1;
8975 if (i.disp_encoding == disp_encoding_8bit)
8976 i.types[op].bitfield.disp8 = 1;
8977 else
8978 i.types[op].bitfield.disp32 = 1;
8979 }
8980 i.rm.mode = mode_from_disp_size (i.types[op]);
8981 }
8982 }
8983
8984 if (fake_zero_displacement)
8985 {
8986 /* Fakes a zero displacement assuming that i.types[op]
8987 holds the correct displacement size. */
8988 expressionS *exp;
8989
8990 gas_assert (i.op[op].disps == 0);
8991 exp = &disp_expressions[i.disp_operands++];
8992 i.op[op].disps = exp;
8993 exp->X_op = O_constant;
8994 exp->X_add_number = 0;
8995 exp->X_add_symbol = (symbolS *) 0;
8996 exp->X_op_symbol = (symbolS *) 0;
8997 }
8998 }
8999 else
9000 {
9001 i.rm.mode = 3;
9002 i.rm.regmem = i.op[op].regs->reg_num;
9003 set_rex_vrex (i.op[op].regs, REX_B, false);
9004 }
9005
9006 if (op == dest)
9007 dest = ~0;
9008 if (op == source)
9009 source = ~0;
9010 }
9011 else
9012 {
9013 i.rm.mode = 3;
9014 if (!i.tm.opcode_modifier.regmem)
9015 {
9016 gas_assert (source < MAX_OPERANDS);
9017 i.rm.regmem = i.op[source].regs->reg_num;
9018 set_rex_vrex (i.op[source].regs, REX_B,
9019 dest >= MAX_OPERANDS && i.tm.opcode_modifier.sse2avx);
9020 source = ~0;
9021 }
9022 else
9023 {
9024 gas_assert (dest < MAX_OPERANDS);
9025 i.rm.regmem = i.op[dest].regs->reg_num;
9026 set_rex_vrex (i.op[dest].regs, REX_B, i.tm.opcode_modifier.sse2avx);
9027 dest = ~0;
9028 }
9029 }
9030
9031 /* Fill in i.rm.reg field with extension opcode (if any) or the
9032 appropriate register. */
9033 if (i.tm.extension_opcode != None)
9034 i.rm.reg = i.tm.extension_opcode;
9035 else if (!i.tm.opcode_modifier.regmem && dest < MAX_OPERANDS)
9036 {
9037 i.rm.reg = i.op[dest].regs->reg_num;
9038 set_rex_vrex (i.op[dest].regs, REX_R, i.tm.opcode_modifier.sse2avx);
9039 }
9040 else
9041 {
9042 gas_assert (source < MAX_OPERANDS);
9043 i.rm.reg = i.op[source].regs->reg_num;
9044 set_rex_vrex (i.op[source].regs, REX_R, false);
9045 }
9046
9047 if (flag_code != CODE_64BIT && (i.rex & REX_R))
9048 {
9049 gas_assert (i.types[!i.tm.opcode_modifier.regmem].bitfield.class == RegCR);
9050 i.rex &= ~REX_R;
9051 add_prefix (LOCK_PREFIX_OPCODE);
9052 }
9053
9054 return default_seg;
9055 }
9056
9057 static INLINE void
9058 frag_opcode_byte (unsigned char byte)
9059 {
9060 if (now_seg != absolute_section)
9061 FRAG_APPEND_1_CHAR (byte);
9062 else
9063 ++abs_section_offset;
9064 }
9065
9066 static unsigned int
9067 flip_code16 (unsigned int code16)
9068 {
9069 gas_assert (i.tm.operands == 1);
9070
9071 return !(i.prefix[REX_PREFIX] & REX_W)
9072 && (code16 ? i.tm.operand_types[0].bitfield.disp32
9073 : i.tm.operand_types[0].bitfield.disp16)
9074 ? CODE16 : 0;
9075 }
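/* I.e. a data size prefix flips the branch displacement size only
   when REX.W doesn't pin the operand size and the template actually
   allows a displacement of the flipped size.  */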
9076
9077 static void
9078 output_branch (void)
9079 {
9080 char *p;
9081 int size;
9082 int code16;
9083 int prefix;
9084 relax_substateT subtype;
9085 symbolS *sym;
9086 offsetT off;
9087
9088 if (now_seg == absolute_section)
9089 {
9090 as_bad (_("relaxable branches not supported in absolute section"));
9091 return;
9092 }
9093
9094 code16 = flag_code == CODE_16BIT ? CODE16 : 0;
9095 size = i.disp_encoding > disp_encoding_8bit ? BIG : SMALL;
9096
9097 prefix = 0;
9098 if (i.prefix[DATA_PREFIX] != 0)
9099 {
9100 prefix = 1;
9101 i.prefixes -= 1;
9102 code16 ^= flip_code16(code16);
9103 }
9104 /* Pentium4 branch hints. */
9105 if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE /* not taken */
9106 || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE /* taken */)
9107 {
9108 prefix++;
9109 i.prefixes--;
9110 }
9111 if (i.prefix[REX_PREFIX] != 0)
9112 {
9113 prefix++;
9114 i.prefixes--;
9115 }
9116
9117 /* BND prefixed jump. */
9118 if (i.prefix[BND_PREFIX] != 0)
9119 {
9120 prefix++;
9121 i.prefixes--;
9122 }
9123
9124 if (i.prefixes != 0)
9125 as_warn (_("skipping prefixes on `%s'"), insn_name (&i.tm));
9126
9127 /* It's always a symbol; end the frag and set up for relaxation.
9128 Make sure there is enough room in this frag for the largest
9129 instruction we may generate in md_convert_frag.  This is 2
9130 bytes for the opcode and room for the prefix and largest
9131 displacement.  */
9132 frag_grow (prefix + 2 + 4);
9133 /* Prefix and 1 opcode byte go in fr_fix. */
9134 p = frag_more (prefix + 1);
9135 if (i.prefix[DATA_PREFIX] != 0)
9136 *p++ = DATA_PREFIX_OPCODE;
9137 if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE
9138 || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE)
9139 *p++ = i.prefix[SEG_PREFIX];
9140 if (i.prefix[BND_PREFIX] != 0)
9141 *p++ = BND_PREFIX_OPCODE;
9142 if (i.prefix[REX_PREFIX] != 0)
9143 *p++ = i.prefix[REX_PREFIX];
9144 *p = i.tm.base_opcode;
9145
9146 if ((unsigned char) *p == JUMP_PC_RELATIVE)
9147 subtype = ENCODE_RELAX_STATE (UNCOND_JUMP, size);
9148 else if (cpu_arch_flags.bitfield.cpui386)
9149 subtype = ENCODE_RELAX_STATE (COND_JUMP, size);
9150 else
9151 subtype = ENCODE_RELAX_STATE (COND_JUMP86, size);
9152 subtype |= code16;
9153
9154 sym = i.op[0].disps->X_add_symbol;
9155 off = i.op[0].disps->X_add_number;
9156
9157 if (i.op[0].disps->X_op != O_constant
9158 && i.op[0].disps->X_op != O_symbol)
9159 {
9160 /* Handle complex expressions. */
9161 sym = make_expr_symbol (i.op[0].disps);
9162 off = 0;
9163 }
9164
9165 frag_now->tc_frag_data.code64 = flag_code == CODE_64BIT;
9166
9167 /* 1 possible extra opcode + 4 byte displacement go in var part.
9168 Pass reloc in fr_var. */
9169 frag_var (rs_machine_dependent, 5, i.reloc[0], subtype, sym, off, p);
9170 }
9171
9172 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
9173 /* Return TRUE iff PLT32 relocation should be used for branching to
9174 symbol S. */
9175
9176 static bool
9177 need_plt32_p (symbolS *s)
9178 {
9179 /* PLT32 relocation is ELF only. */
9180 if (!IS_ELF)
9181 return false;
9182
9183 #ifdef TE_SOLARIS
9184 /* Don't emit PLT32 relocation on Solaris: neither the native
9185 linker nor krtld supports it.  */
9186 return false;
9187 #endif
9188
9189 /* Since there is no need to prepare for a PLT branch on x86-64, we
9190 can generate R_X86_64_PLT32, instead of R_X86_64_PC32, which can
9191 be used as a marker for 32-bit PC-relative branches.  */
9192 if (!object_64bit)
9193 return false;
9194
9195 if (s == NULL)
9196 return false;
9197
9198 /* Weak or undefined symbols need PLT32 relocation.  */
9199 if (S_IS_WEAK (s) || !S_IS_DEFINED (s))
9200 return true;
9201
9202 /* A non-global symbol doesn't need PLT32 relocation.  */
9203 if (! S_IS_EXTERNAL (s))
9204 return false;
9205
9206 /* Other global symbols need PLT32 relocation.  NB: Symbols with
9207 non-default visibility are treated as normal global symbols
9208 so that PLT32 relocation can be used as a marker for 32-bit
9209 PC-relative branches.  It is useful for linker relaxation.  */
9210 return true;
9211 }
9212 #endif
9213
9214 static void
9215 output_jump (void)
9216 {
9217 char *p;
9218 int size;
9219 fixS *fixP;
9220 bfd_reloc_code_real_type jump_reloc = i.reloc[0];
9221
9222 if (i.tm.opcode_modifier.jump == JUMP_BYTE)
9223 {
9224 /* This is a loop or jecxz type instruction. */
9225 size = 1;
9226 if (i.prefix[ADDR_PREFIX] != 0)
9227 {
9228 frag_opcode_byte (ADDR_PREFIX_OPCODE);
9229 i.prefixes -= 1;
9230 }
9231 /* Pentium4 branch hints. */
9232 if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE /* not taken */
9233 || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE /* taken */)
9234 {
9235 frag_opcode_byte (i.prefix[SEG_PREFIX]);
9236 i.prefixes--;
9237 }
9238 }
9239 else
9240 {
9241 int code16;
9242
9243 code16 = 0;
9244 if (flag_code == CODE_16BIT)
9245 code16 = CODE16;
9246
9247 if (i.prefix[DATA_PREFIX] != 0)
9248 {
9249 frag_opcode_byte (DATA_PREFIX_OPCODE);
9250 i.prefixes -= 1;
9251 code16 ^= flip_code16(code16);
9252 }
9253
9254 size = 4;
9255 if (code16)
9256 size = 2;
9257 }
9258
9259 /* BND prefixed jump. */
9260 if (i.prefix[BND_PREFIX] != 0)
9261 {
9262 frag_opcode_byte (i.prefix[BND_PREFIX]);
9263 i.prefixes -= 1;
9264 }
9265
9266 if (i.prefix[REX_PREFIX] != 0)
9267 {
9268 frag_opcode_byte (i.prefix[REX_PREFIX]);
9269 i.prefixes -= 1;
9270 }
9271
9272 if (i.prefixes != 0)
9273 as_warn (_("skipping prefixes on `%s'"), insn_name (&i.tm));
9274
9275 if (now_seg == absolute_section)
9276 {
9277 abs_section_offset += i.opcode_length + size;
9278 return;
9279 }
9280
9281 p = frag_more (i.opcode_length + size);
9282 switch (i.opcode_length)
9283 {
9284 case 2:
9285 *p++ = i.tm.base_opcode >> 8;
9286 /* Fall through. */
9287 case 1:
9288 *p++ = i.tm.base_opcode;
9289 break;
9290 default:
9291 abort ();
9292 }
9293
9294 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
9295 if (flag_code == CODE_64BIT && size == 4
9296 && jump_reloc == NO_RELOC && i.op[0].disps->X_add_number == 0
9297 && need_plt32_p (i.op[0].disps->X_add_symbol))
9298 jump_reloc = BFD_RELOC_X86_64_PLT32;
9299 #endif
9300
9301 jump_reloc = reloc (size, 1, 1, jump_reloc);
9302
9303 fixP = fix_new_exp (frag_now, p - frag_now->fr_literal, size,
9304 i.op[0].disps, 1, jump_reloc);
9305
9306 /* All jumps handled here are signed, but don't unconditionally use a
9307 signed limit check for 32 and 16 bit jumps as we want to allow wrap
9308 around at 4G (outside of 64-bit mode) and 64k (except for XBEGIN)
9309 respectively. */
9310 switch (size)
9311 {
9312 case 1:
9313 fixP->fx_signed = 1;
9314 break;
9315
9316 case 2:
9317 if (i.tm.mnem_off == MN_xbegin)
9318 fixP->fx_signed = 1;
9319 break;
9320
9321 case 4:
9322 if (flag_code == CODE_64BIT)
9323 fixP->fx_signed = 1;
9324 break;
9325 }
9326 }
9327
9328 static void
9329 output_interseg_jump (void)
9330 {
9331 char *p;
9332 int size;
9333 int prefix;
9334 int code16;
9335
9336 code16 = 0;
9337 if (flag_code == CODE_16BIT)
9338 code16 = CODE16;
9339
9340 prefix = 0;
9341 if (i.prefix[DATA_PREFIX] != 0)
9342 {
9343 prefix = 1;
9344 i.prefixes -= 1;
9345 code16 ^= CODE16;
9346 }
9347
9348 gas_assert (!i.prefix[REX_PREFIX]);
9349
9350 size = 4;
9351 if (code16)
9352 size = 2;
9353
9354 if (i.prefixes != 0)
9355 as_warn (_("skipping prefixes on `%s'"), insn_name (&i.tm));
9356
9357 if (now_seg == absolute_section)
9358 {
9359 abs_section_offset += prefix + 1 + 2 + size;
9360 return;
9361 }
9362
9363 /* 1 opcode; 2 segment; offset */
9364 p = frag_more (prefix + 1 + 2 + size);
9365
9366 if (i.prefix[DATA_PREFIX] != 0)
9367 *p++ = DATA_PREFIX_OPCODE;
9368
9369 if (i.prefix[REX_PREFIX] != 0)
9370 *p++ = i.prefix[REX_PREFIX];
9371
9372 *p++ = i.tm.base_opcode;
9373 if (i.op[1].imms->X_op == O_constant)
9374 {
9375 offsetT n = i.op[1].imms->X_add_number;
9376
9377 if (size == 2
9378 && !fits_in_unsigned_word (n)
9379 && !fits_in_signed_word (n))
9380 {
9381 as_bad (_("16-bit jump out of range"));
9382 return;
9383 }
9384 md_number_to_chars (p, n, size);
9385 }
9386 else
9387 fix_new_exp (frag_now, p - frag_now->fr_literal, size,
9388 i.op[1].imms, 0, reloc (size, 0, 0, i.reloc[1]));
9389
9390 p += size;
9391 if (i.op[0].imms->X_op == O_constant)
9392 md_number_to_chars (p, (valueT) i.op[0].imms->X_add_number, 2);
9393 else
9394 fix_new_exp (frag_now, p - frag_now->fr_literal, 2,
9395 i.op[0].imms, 0, reloc (2, 0, 0, i.reloc[0]));
9396 }
9397
9398 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
9399 void
9400 x86_cleanup (void)
9401 {
9402 char *p;
9403 asection *seg = now_seg;
9404 subsegT subseg = now_subseg;
9405 asection *sec;
9406 unsigned int alignment, align_size_1;
9407 unsigned int isa_1_descsz, feature_2_descsz, descsz;
9408 unsigned int isa_1_descsz_raw, feature_2_descsz_raw;
9409 unsigned int padding;
9410
9411 if (!IS_ELF || !x86_used_note)
9412 return;
9413
9414 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_X86;
9415
9416 /* The .note.gnu.property section layout:
9417
9418 Field Length Contents
9419 ---- ---- ----
9420 n_namsz 4 4
9421 n_descsz 4 The note descriptor size
9422 n_type 4 NT_GNU_PROPERTY_TYPE_0
9423 n_name 4 "GNU"
9424 n_desc n_descsz The program property array
9425 .... .... ....
9426 */
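/* For example, with ELFCLASS64 (8-byte alignment) each of the two
   12-byte property entries below pads to 16 bytes, giving
   n_descsz == 32 and a section size of 16 + 32 == 48 bytes; with
   ELFCLASS32 (4-byte alignment) no padding is needed and the
   section is 16 + 24 == 40 bytes.  */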
9427
9428 /* Create the .note.gnu.property section. */
9429 sec = subseg_new (NOTE_GNU_PROPERTY_SECTION_NAME, 0);
9430 bfd_set_section_flags (sec,
9431 (SEC_ALLOC
9432 | SEC_LOAD
9433 | SEC_DATA
9434 | SEC_HAS_CONTENTS
9435 | SEC_READONLY));
9436
9437 if (get_elf_backend_data (stdoutput)->s->elfclass == ELFCLASS64)
9438 {
9439 align_size_1 = 7;
9440 alignment = 3;
9441 }
9442 else
9443 {
9444 align_size_1 = 3;
9445 alignment = 2;
9446 }
9447
9448 bfd_set_section_alignment (sec, alignment);
9449 elf_section_type (sec) = SHT_NOTE;
9450
9451 /* GNU_PROPERTY_X86_ISA_1_USED: 4-byte type + 4-byte data size
9452 + 4-byte data */
9453 isa_1_descsz_raw = 4 + 4 + 4;
9454 /* Align GNU_PROPERTY_X86_ISA_1_USED. */
9455 isa_1_descsz = (isa_1_descsz_raw + align_size_1) & ~align_size_1;
9456
9457 feature_2_descsz_raw = isa_1_descsz;
9458 /* GNU_PROPERTY_X86_FEATURE_2_USED: 4-byte type + 4-byte data size
9459 + 4-byte data */
9460 feature_2_descsz_raw += 4 + 4 + 4;
9461 /* Align GNU_PROPERTY_X86_FEATURE_2_USED. */
9462 feature_2_descsz = ((feature_2_descsz_raw + align_size_1)
9463 & ~align_size_1);
9464
9465 descsz = feature_2_descsz;
9466 /* Section size: n_namsz (4) + n_descsz (4) + n_type (4) + n_name (4) + descsz.  */
9467 p = frag_more (4 + 4 + 4 + 4 + descsz);
9468
9469 /* Write n_namsz. */
9470 md_number_to_chars (p, (valueT) 4, 4);
9471
9472 /* Write n_descsz. */
9473 md_number_to_chars (p + 4, (valueT) descsz, 4);
9474
9475 /* Write n_type. */
9476 md_number_to_chars (p + 4 * 2, (valueT) NT_GNU_PROPERTY_TYPE_0, 4);
9477
9478 /* Write n_name. */
9479 memcpy (p + 4 * 3, "GNU", 4);
9480
9481 /* Write 4-byte type. */
9482 md_number_to_chars (p + 4 * 4,
9483 (valueT) GNU_PROPERTY_X86_ISA_1_USED, 4);
9484
9485 /* Write 4-byte data size. */
9486 md_number_to_chars (p + 4 * 5, (valueT) 4, 4);
9487
9488 /* Write 4-byte data. */
9489 md_number_to_chars (p + 4 * 6, (valueT) x86_isa_1_used, 4);
9490
9491 /* Zero out the padding.  */
9492 padding = isa_1_descsz - isa_1_descsz_raw;
9493 if (padding)
9494 memset (p + 4 * 7, 0, padding);
9495
9496 /* Write 4-byte type. */
9497 md_number_to_chars (p + isa_1_descsz + 4 * 4,
9498 (valueT) GNU_PROPERTY_X86_FEATURE_2_USED, 4);
9499
9500 /* Write 4-byte data size. */
9501 md_number_to_chars (p + isa_1_descsz + 4 * 5, (valueT) 4, 4);
9502
9503 /* Write 4-byte data. */
9504 md_number_to_chars (p + isa_1_descsz + 4 * 6,
9505 (valueT) x86_feature_2_used, 4);
9506
9507 /* Zero out the padding.  */
9508 padding = feature_2_descsz - feature_2_descsz_raw;
9509 if (padding)
9510 memset (p + isa_1_descsz + 4 * 7, 0, padding);
9511
9512 /* We probably can't restore the current segment, for there likely
9513 isn't one yet... */
9514 if (seg && subseg)
9515 subseg_set (seg, subseg);
9516 }
9517
9518 bool
9519 x86_support_sframe_p (void)
9520 {
9521 /* At this time, SFrame stack trace is supported for AMD64 ABI only. */
9522 return (x86_elf_abi == X86_64_ABI);
9523 }
9524
9525 bool
9526 x86_sframe_ra_tracking_p (void)
9527 {
9528 /* In AMD64, the return address is always stored on the stack at a
9529 fixed offset from the CFA (provided via x86_sframe_cfa_ra_offset ()),
9530 so do not track it explicitly via an SFrame Frame Row Entry.  */
9531 return false;
9532 }
9533
9534 offsetT
9535 x86_sframe_cfa_ra_offset (void)
9536 {
9537 gas_assert (x86_elf_abi == X86_64_ABI);
9538 return (offsetT) -8;
9539 }
9540
9541 unsigned char
9542 x86_sframe_get_abi_arch (void)
9543 {
9544 unsigned char sframe_abi_arch = 0;
9545
9546 if (x86_support_sframe_p ())
9547 {
9548 gas_assert (!target_big_endian);
9549 sframe_abi_arch = SFRAME_ABI_AMD64_ENDIAN_LITTLE;
9550 }
9551
9552 return sframe_abi_arch;
9553 }
9554
9555 #endif
9556
9557 static unsigned int
9558 encoding_length (const fragS *start_frag, offsetT start_off,
9559 const char *frag_now_ptr)
9560 {
9561 unsigned int len = 0;
9562
9563 if (start_frag != frag_now)
9564 {
9565 const fragS *fr = start_frag;
9566
9567 do {
9568 len += fr->fr_fix;
9569 fr = fr->fr_next;
9570 } while (fr && fr != frag_now);
9571 }
9572
9573 return len - start_off + (frag_now_ptr - frag_now->fr_literal);
9574 }
9575
9576 /* Return 1 for test, and, cmp, add, sub, inc and dec which may
9577 be macro-fused with conditional jumps.
9578 NB: If TEST/AND/CMP/ADD/SUB/INC/DEC uses a RIP-relative address,
9579 or has one of the following forms:
9580
9581 cmp m, imm
9582 add m, imm
9583 sub m, imm
9584 test m, imm
9585 and m, imm
9586 inc m
9587 dec m
9588
9589 it cannot be fused.  */
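/* E.g. `cmp %eax, %ebx; je 1f' is a fusible pair, whereas
   `cmpl $1, (%ebx); je 1f' is not, being cmp m, imm.  */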
9590
9591 static int
9592 maybe_fused_with_jcc_p (enum mf_cmp_kind* mf_cmp_p)
9593 {
9594 /* No RIP address. */
9595 if (i.base_reg && i.base_reg->reg_num == RegIP)
9596 return 0;
9597
9598 /* No opcodes outside of base encoding space. */
9599 if (i.tm.opcode_space != SPACE_BASE)
9600 return 0;
9601
9602 /* add, sub without add/sub m, imm. */
9603 if (i.tm.base_opcode <= 5
9604 || (i.tm.base_opcode >= 0x28 && i.tm.base_opcode <= 0x2d)
9605 || ((i.tm.base_opcode | 3) == 0x83
9606 && (i.tm.extension_opcode == 0x5
9607 || i.tm.extension_opcode == 0x0)))
9608 {
9609 *mf_cmp_p = mf_cmp_alu_cmp;
9610 return !(i.mem_operands && i.imm_operands);
9611 }
9612
9613 /* and without and m, imm. */
9614 if ((i.tm.base_opcode >= 0x20 && i.tm.base_opcode <= 0x25)
9615 || ((i.tm.base_opcode | 3) == 0x83
9616 && i.tm.extension_opcode == 0x4))
9617 {
9618 *mf_cmp_p = mf_cmp_test_and;
9619 return !(i.mem_operands && i.imm_operands);
9620 }
9621
9622 /* test without test m, imm.  */
9623 if ((i.tm.base_opcode | 1) == 0x85
9624 || (i.tm.base_opcode | 1) == 0xa9
9625 || ((i.tm.base_opcode | 1) == 0xf7
9626 && i.tm.extension_opcode == 0))
9627 {
9628 *mf_cmp_p = mf_cmp_test_and;
9629 return !(i.mem_operands && i.imm_operands);
9630 }
9631
9632 /* cmp without cmp m, imm. */
9633 if ((i.tm.base_opcode >= 0x38 && i.tm.base_opcode <= 0x3d)
9634 || ((i.tm.base_opcode | 3) == 0x83
9635 && (i.tm.extension_opcode == 0x7)))
9636 {
9637 *mf_cmp_p = mf_cmp_alu_cmp;
9638 return !(i.mem_operands && i.imm_operands);
9639 }
9640
9641 /* inc, dec without inc/dec m. */
9642 if ((is_cpu (&i.tm, CpuNo64)
9643 && (i.tm.base_opcode | 0xf) == 0x4f)
9644 || ((i.tm.base_opcode | 1) == 0xff
9645 && i.tm.extension_opcode <= 0x1))
9646 {
9647 *mf_cmp_p = mf_cmp_incdec;
9648 return !i.mem_operands;
9649 }
9650
9651 return 0;
9652 }
9653
9654 /* Return 1 if a FUSED_JCC_PADDING frag should be generated. */
9655
9656 static int
9657 add_fused_jcc_padding_frag_p (enum mf_cmp_kind* mf_cmp_p)
9658 {
9659 /* NB: This doesn't work with COND_JUMP86 without i386.  */
9660 if (!align_branch_power
9661 || now_seg == absolute_section
9662 || !cpu_arch_flags.bitfield.cpui386
9663 || !(align_branch & align_branch_fused_bit))
9664 return 0;
9665
9666 if (maybe_fused_with_jcc_p (mf_cmp_p))
9667 {
9668 if (last_insn.kind == last_insn_other
9669 || last_insn.seg != now_seg)
9670 return 1;
9671 if (flag_debug)
9672 as_warn_where (last_insn.file, last_insn.line,
9673 _("`%s` skips -malign-branch-boundary on `%s`"),
9674 last_insn.name, insn_name (&i.tm));
9675 }
9676
9677 return 0;
9678 }
9679
9680 /* Return 1 if a BRANCH_PREFIX frag should be generated. */
9681
9682 static int
9683 add_branch_prefix_frag_p (void)
9684 {
  /* NB: Doesn't work with COND_JUMP86 without i386.  Don't add a prefix
     to PadLock instructions, since they include prefixes in their opcode.  */
9687 if (!align_branch_power
9688 || !align_branch_prefix_size
9689 || now_seg == absolute_section
9690 || is_cpu (&i.tm, CpuPadLock)
9691 || !cpu_arch_flags.bitfield.cpui386)
9692 return 0;
9693
  /* Don't add a prefix if the insn is itself a prefix or has no
     operands, since a segment prefix would then be special.  */
9696 if (!i.operands || i.tm.opcode_modifier.isprefix)
9697 return 0;
9698
9699 if (last_insn.kind == last_insn_other
9700 || last_insn.seg != now_seg)
9701 return 1;
9702
9703 if (flag_debug)
9704 as_warn_where (last_insn.file, last_insn.line,
9705 _("`%s` skips -malign-branch-boundary on `%s`"),
9706 last_insn.name, insn_name (&i.tm));
9707
9708 return 0;
9709 }
9710
9711 /* Return 1 if a BRANCH_PADDING frag should be generated. */
9712
9713 static int
9714 add_branch_padding_frag_p (enum align_branch_kind *branch_p,
9715 enum mf_jcc_kind *mf_jcc_p)
9716 {
9717 int add_padding;
9718
  /* NB: Doesn't work with COND_JUMP86 without i386.  */
9720 if (!align_branch_power
9721 || now_seg == absolute_section
9722 || !cpu_arch_flags.bitfield.cpui386
9723 || i.tm.opcode_space != SPACE_BASE)
9724 return 0;
9725
9726 add_padding = 0;
9727
9728 /* Check for jcc and direct jmp. */
9729 if (i.tm.opcode_modifier.jump == JUMP)
9730 {
9731 if (i.tm.base_opcode == JUMP_PC_RELATIVE)
9732 {
9733 *branch_p = align_branch_jmp;
9734 add_padding = align_branch & align_branch_jmp_bit;
9735 }
9736 else
9737 {
	  /* Because J<cc> and JN<cc> share the same group in the
	     macro-fusible table, ignore the lowest bit.  */
9740 *mf_jcc_p = (i.tm.base_opcode & 0x0e) >> 1;
9741 *branch_p = align_branch_jcc;
9742 if ((align_branch & align_branch_jcc_bit))
9743 add_padding = 1;
9744 }
9745 }
9746 else if ((i.tm.base_opcode | 1) == 0xc3)
9747 {
9748 /* Near ret. */
9749 *branch_p = align_branch_ret;
9750 if ((align_branch & align_branch_ret_bit))
9751 add_padding = 1;
9752 }
9753 else
9754 {
9755 /* Check for indirect jmp, direct and indirect calls. */
9756 if (i.tm.base_opcode == 0xe8)
9757 {
9758 /* Direct call. */
9759 *branch_p = align_branch_call;
9760 if ((align_branch & align_branch_call_bit))
9761 add_padding = 1;
9762 }
9763 else if (i.tm.base_opcode == 0xff
9764 && (i.tm.extension_opcode == 2
9765 || i.tm.extension_opcode == 4))
9766 {
9767 /* Indirect call and jmp. */
9768 *branch_p = align_branch_indirect;
9769 if ((align_branch & align_branch_indirect_bit))
9770 add_padding = 1;
9771 }
9772
9773 if (add_padding
9774 && i.disp_operands
9775 && tls_get_addr
9776 && (i.op[0].disps->X_op == O_symbol
9777 || (i.op[0].disps->X_op == O_subtract
9778 && i.op[0].disps->X_op_symbol == GOT_symbol)))
9779 {
9780 symbolS *s = i.op[0].disps->X_add_symbol;
	    /* No padding for a call to a global or undefined tls_get_addr.  */
9782 if ((S_IS_EXTERNAL (s) || !S_IS_DEFINED (s))
9783 && strcmp (S_GET_NAME (s), tls_get_addr) == 0)
9784 return 0;
9785 }
9786 }
9787
9788 if (add_padding
9789 && last_insn.kind != last_insn_other
9790 && last_insn.seg == now_seg)
9791 {
9792 if (flag_debug)
9793 as_warn_where (last_insn.file, last_insn.line,
9794 _("`%s` skips -malign-branch-boundary on `%s`"),
9795 last_insn.name, insn_name (&i.tm));
9796 return 0;
9797 }
9798
9799 return add_padding;
9800 }
9801
9802 static void
9803 output_insn (void)
9804 {
9805 fragS *insn_start_frag;
9806 offsetT insn_start_off;
9807 fragS *fragP = NULL;
9808 enum align_branch_kind branch = align_branch_none;
  /* The initializer is arbitrary, merely to avoid an uninitialized-use
     warning.  It is actually either assigned in add_branch_padding_frag_p
     or never used.  */
9812 enum mf_jcc_kind mf_jcc = mf_jcc_jo;
9813
9814 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
9815 if (IS_ELF && x86_used_note && now_seg != absolute_section)
9816 {
9817 if ((i.xstate & xstate_tmm) == xstate_tmm
9818 || is_cpu (&i.tm, CpuAMX_TILE))
9819 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_TMM;
9820
9821 if (is_cpu (&i.tm, Cpu8087)
9822 || is_cpu (&i.tm, Cpu287)
9823 || is_cpu (&i.tm, Cpu387)
9824 || is_cpu (&i.tm, Cpu687)
9825 || is_cpu (&i.tm, CpuFISTTP))
9826 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_X87;
9827
9828 if ((i.xstate & xstate_mmx)
9829 || i.tm.mnem_off == MN_emms
9830 || i.tm.mnem_off == MN_femms)
9831 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_MMX;
9832
9833 if (i.index_reg)
9834 {
9835 if (i.index_reg->reg_type.bitfield.zmmword)
9836 i.xstate |= xstate_zmm;
9837 else if (i.index_reg->reg_type.bitfield.ymmword)
9838 i.xstate |= xstate_ymm;
9839 else if (i.index_reg->reg_type.bitfield.xmmword)
9840 i.xstate |= xstate_xmm;
9841 }
9842
9843 /* vzeroall / vzeroupper */
9844 if (i.tm.base_opcode == 0x77 && is_cpu (&i.tm, CpuAVX))
9845 i.xstate |= xstate_ymm;
9846
9847 if ((i.xstate & xstate_xmm)
9848 /* ldmxcsr / stmxcsr / vldmxcsr / vstmxcsr */
9849 || (i.tm.base_opcode == 0xae
9850 && (is_cpu (&i.tm, CpuSSE)
9851 || is_cpu (&i.tm, CpuAVX)))
9852 || is_cpu (&i.tm, CpuWideKL)
9853 || is_cpu (&i.tm, CpuKL))
9854 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XMM;
9855
9856 if ((i.xstate & xstate_ymm) == xstate_ymm)
9857 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_YMM;
9858 if ((i.xstate & xstate_zmm) == xstate_zmm)
9859 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_ZMM;
9860 if (i.mask.reg || (i.xstate & xstate_mask) == xstate_mask)
9861 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_MASK;
9862 if (is_cpu (&i.tm, CpuFXSR))
9863 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_FXSR;
9864 if (is_cpu (&i.tm, CpuXsave))
9865 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XSAVE;
9866 if (is_cpu (&i.tm, CpuXsaveopt))
9867 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XSAVEOPT;
9868 if (is_cpu (&i.tm, CpuXSAVEC))
9869 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XSAVEC;
9870
9871 if (x86_feature_2_used
9872 || is_cpu (&i.tm, CpuCMOV)
9873 || is_cpu (&i.tm, CpuSYSCALL)
9874 || i.tm.mnem_off == MN_cmpxchg8b)
9875 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_BASELINE;
9876 if (is_cpu (&i.tm, CpuSSE3)
9877 || is_cpu (&i.tm, CpuSSSE3)
9878 || is_cpu (&i.tm, CpuSSE4_1)
9879 || is_cpu (&i.tm, CpuSSE4_2)
9880 || is_cpu (&i.tm, CpuCX16)
9881 || is_cpu (&i.tm, CpuPOPCNT)
9882 /* LAHF-SAHF insns in 64-bit mode. */
9883 || (flag_code == CODE_64BIT
9884 && (i.tm.base_opcode | 1) == 0x9f
9885 && i.tm.opcode_space == SPACE_BASE))
9886 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_V2;
9887 if (is_cpu (&i.tm, CpuAVX)
9888 || is_cpu (&i.tm, CpuAVX2)
	  /* Any VEX encoded insns except for AVX512F, AVX512BW, AVX512DQ,
	     XOP, FMA4, LWP, TBM, and AMX.  */
9891 || (i.tm.opcode_modifier.vex
9892 && !is_cpu (&i.tm, CpuAVX512F)
9893 && !is_cpu (&i.tm, CpuAVX512BW)
9894 && !is_cpu (&i.tm, CpuAVX512DQ)
9895 && !is_cpu (&i.tm, CpuXOP)
9896 && !is_cpu (&i.tm, CpuFMA4)
9897 && !is_cpu (&i.tm, CpuLWP)
9898 && !is_cpu (&i.tm, CpuTBM)
9899 && !(x86_feature_2_used & GNU_PROPERTY_X86_FEATURE_2_TMM))
9900 || is_cpu (&i.tm, CpuF16C)
9901 || is_cpu (&i.tm, CpuFMA)
9902 || is_cpu (&i.tm, CpuLZCNT)
9903 || is_cpu (&i.tm, CpuMovbe)
9904 || is_cpu (&i.tm, CpuXSAVES)
9905 || (x86_feature_2_used
9906 & (GNU_PROPERTY_X86_FEATURE_2_XSAVE
9907 | GNU_PROPERTY_X86_FEATURE_2_XSAVEOPT
9908 | GNU_PROPERTY_X86_FEATURE_2_XSAVEC)) != 0)
9909 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_V3;
9910 if (is_cpu (&i.tm, CpuAVX512F)
9911 || is_cpu (&i.tm, CpuAVX512BW)
9912 || is_cpu (&i.tm, CpuAVX512DQ)
9913 || is_cpu (&i.tm, CpuAVX512VL)
9914 /* Any EVEX encoded insns except for AVX512ER, AVX512PF,
9915 AVX512-4FMAPS, and AVX512-4VNNIW. */
9916 || (i.tm.opcode_modifier.evex
9917 && !is_cpu (&i.tm, CpuAVX512ER)
9918 && !is_cpu (&i.tm, CpuAVX512PF)
9919 && !is_cpu (&i.tm, CpuAVX512_4FMAPS)
9920 && !is_cpu (&i.tm, CpuAVX512_4VNNIW)))
9921 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_V4;
9922 }
9923 #endif
9924
9925 /* Tie dwarf2 debug info to the address at the start of the insn.
9926 We can't do this after the insn has been output as the current
     frag may have been closed off, e.g. by frag_var.  */
9928 dwarf2_emit_insn (0);
9929
9930 insn_start_frag = frag_now;
9931 insn_start_off = frag_now_fix ();
9932
9933 if (add_branch_padding_frag_p (&branch, &mf_jcc))
9934 {
9935 char *p;
9936 /* Branch can be 8 bytes. Leave some room for prefixes. */
9937 unsigned int max_branch_padding_size = 14;
9938
9939 /* Align section to boundary. */
9940 record_alignment (now_seg, align_branch_power);
9941
9942 /* Make room for padding. */
9943 frag_grow (max_branch_padding_size);
9944
9945 /* Start of the padding. */
9946 p = frag_more (0);
9947
9948 fragP = frag_now;
9949
9950 frag_var (rs_machine_dependent, max_branch_padding_size, 0,
9951 ENCODE_RELAX_STATE (BRANCH_PADDING, 0),
9952 NULL, 0, p);
9953
9954 fragP->tc_frag_data.mf_type = mf_jcc;
9955 fragP->tc_frag_data.branch_type = branch;
9956 fragP->tc_frag_data.max_bytes = max_branch_padding_size;
9957 }
9958
9959 if (!cpu_arch_flags.bitfield.cpui386 && (flag_code != CODE_16BIT)
9960 && !pre_386_16bit_warned)
9961 {
9962 as_warn (_("use .code16 to ensure correct addressing mode"));
9963 pre_386_16bit_warned = true;
9964 }
9965
9966 /* Output jumps. */
9967 if (i.tm.opcode_modifier.jump == JUMP)
9968 output_branch ();
9969 else if (i.tm.opcode_modifier.jump == JUMP_BYTE
9970 || i.tm.opcode_modifier.jump == JUMP_DWORD)
9971 output_jump ();
9972 else if (i.tm.opcode_modifier.jump == JUMP_INTERSEGMENT)
9973 output_interseg_jump ();
9974 else
9975 {
9976 /* Output normal instructions here. */
9977 char *p;
9978 unsigned char *q;
9979 unsigned int j;
9980 enum mf_cmp_kind mf_cmp;
9981
9982 if (avoid_fence
9983 && (i.tm.base_opcode == 0xaee8
9984 || i.tm.base_opcode == 0xaef0
9985 || i.tm.base_opcode == 0xaef8))
9986 {
9987 /* Encode lfence, mfence, and sfence as
9988 f0 83 04 24 00 lock addl $0x0, (%{re}sp). */
9989 if (flag_code == CODE_16BIT)
9990 as_bad (_("Cannot convert `%s' in 16-bit mode"), insn_name (&i.tm));
9991 else if (omit_lock_prefix)
9992 as_bad (_("Cannot convert `%s' with `-momit-lock-prefix=yes' in effect"),
9993 insn_name (&i.tm));
9994 else if (now_seg != absolute_section)
9995 {
9996 offsetT val = 0x240483f0ULL;
9997
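	      /* Stored little-endian by md_number_to_chars, this yields
		 the byte sequence f0 83 04 24 00.  */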
9998 p = frag_more (5);
9999 md_number_to_chars (p, val, 5);
10000 }
10001 else
10002 abs_section_offset += 5;
10003 return;
10004 }
10005
      /* Some processors fail on the LOCK prefix.  This option makes the
	 assembler ignore the LOCK prefix and serves as a workaround.  */
10008 if (omit_lock_prefix)
10009 {
10010 if (i.tm.base_opcode == LOCK_PREFIX_OPCODE
10011 && i.tm.opcode_modifier.isprefix)
10012 return;
10013 i.prefix[LOCK_PREFIX] = 0;
10014 }
10015
10016 if (branch)
10017 /* Skip if this is a branch. */
10018 ;
10019 else if (add_fused_jcc_padding_frag_p (&mf_cmp))
10020 {
10021 /* Make room for padding. */
10022 frag_grow (MAX_FUSED_JCC_PADDING_SIZE);
10023 p = frag_more (0);
10024
10025 fragP = frag_now;
10026
10027 frag_var (rs_machine_dependent, MAX_FUSED_JCC_PADDING_SIZE, 0,
10028 ENCODE_RELAX_STATE (FUSED_JCC_PADDING, 0),
10029 NULL, 0, p);
10030
10031 fragP->tc_frag_data.mf_type = mf_cmp;
10032 fragP->tc_frag_data.branch_type = align_branch_fused;
10033 fragP->tc_frag_data.max_bytes = MAX_FUSED_JCC_PADDING_SIZE;
10034 }
10035 else if (add_branch_prefix_frag_p ())
10036 {
10037 unsigned int max_prefix_size = align_branch_prefix_size;
10038
10039 /* Make room for padding. */
10040 frag_grow (max_prefix_size);
10041 p = frag_more (0);
10042
10043 fragP = frag_now;
10044
10045 frag_var (rs_machine_dependent, max_prefix_size, 0,
10046 ENCODE_RELAX_STATE (BRANCH_PREFIX, 0),
10047 NULL, 0, p);
10048
10049 fragP->tc_frag_data.max_bytes = max_prefix_size;
10050 }
10051
10052 /* Since the VEX/EVEX prefix contains the implicit prefix, we
10053 don't need the explicit prefix. */
10054 if (!is_any_vex_encoding (&i.tm))
10055 {
10056 switch (i.tm.opcode_modifier.opcodeprefix)
10057 {
10058 case PREFIX_0X66:
10059 add_prefix (0x66);
10060 break;
10061 case PREFIX_0XF2:
10062 add_prefix (0xf2);
10063 break;
10064 case PREFIX_0XF3:
10065 if (!is_cpu (&i.tm, CpuPadLock)
10066 || (i.prefix[REP_PREFIX] != 0xf3))
10067 add_prefix (0xf3);
10068 break;
10069 case PREFIX_NONE:
10070 switch (i.opcode_length)
10071 {
10072 case 2:
10073 break;
10074 case 1:
10075 /* Check for pseudo prefixes. */
10076 if (!i.tm.opcode_modifier.isprefix || i.tm.base_opcode)
10077 break;
10078 as_bad_where (insn_start_frag->fr_file,
10079 insn_start_frag->fr_line,
10080 _("pseudo prefix without instruction"));
10081 return;
10082 default:
10083 abort ();
10084 }
10085 break;
10086 default:
10087 abort ();
10088 }
10089
10090 #if defined (OBJ_MAYBE_ELF) || defined (OBJ_ELF)
10091 /* For x32, add a dummy REX_OPCODE prefix for mov/add with
10092 R_X86_64_GOTTPOFF relocation so that linker can safely
10093 perform IE->LE optimization. A dummy REX_OPCODE prefix
10094 is also needed for lea with R_X86_64_GOTPC32_TLSDESC
10095 relocation for GDesc -> IE/LE optimization. */
10096 if (x86_elf_abi == X86_64_X32_ABI
10097 && i.operands == 2
10098 && (i.reloc[0] == BFD_RELOC_X86_64_GOTTPOFF
10099 || i.reloc[0] == BFD_RELOC_X86_64_GOTPC32_TLSDESC)
10100 && i.prefix[REX_PREFIX] == 0)
10101 add_prefix (REX_OPCODE);
10102 #endif
10103
10104 /* The prefix bytes. */
10105 for (j = ARRAY_SIZE (i.prefix), q = i.prefix; j > 0; j--, q++)
10106 if (*q)
10107 frag_opcode_byte (*q);
10108 }
10109 else
10110 {
10111 for (j = 0, q = i.prefix; j < ARRAY_SIZE (i.prefix); j++, q++)
10112 if (*q)
10113 switch (j)
10114 {
10115 case SEG_PREFIX:
10116 case ADDR_PREFIX:
10117 frag_opcode_byte (*q);
10118 break;
10119 default:
10120 /* There should be no other prefixes for instructions
10121 with VEX prefix. */
10122 abort ();
10123 }
10124
10125 /* For EVEX instructions i.vrex should become 0 after
10126 build_evex_prefix. For VEX instructions upper 16 registers
10127 aren't available, so VREX should be 0. */
10128 if (i.vrex)
10129 abort ();
10130 /* Now the VEX prefix. */
10131 if (now_seg != absolute_section)
10132 {
10133 p = frag_more (i.vex.length);
10134 for (j = 0; j < i.vex.length; j++)
10135 p[j] = i.vex.bytes[j];
10136 }
10137 else
10138 abs_section_offset += i.vex.length;
10139 }
10140
10141 /* Now the opcode; be careful about word order here! */
10142 j = i.opcode_length;
10143 if (!i.vex.length)
10144 switch (i.tm.opcode_space)
10145 {
10146 case SPACE_BASE:
10147 break;
10148 case SPACE_0F:
10149 ++j;
10150 break;
10151 case SPACE_0F38:
10152 case SPACE_0F3A:
10153 j += 2;
10154 break;
10155 default:
10156 abort ();
10157 }
10158
10159 if (now_seg == absolute_section)
10160 abs_section_offset += j;
10161 else if (j == 1)
10162 {
10163 FRAG_APPEND_1_CHAR (i.tm.base_opcode);
10164 }
10165 else
10166 {
10167 p = frag_more (j);
10168 if (!i.vex.length
10169 && i.tm.opcode_space != SPACE_BASE)
10170 {
10171 *p++ = 0x0f;
10172 if (i.tm.opcode_space != SPACE_0F)
10173 *p++ = i.tm.opcode_space == SPACE_0F38
10174 ? 0x38 : 0x3a;
10175 }
10176
10177 switch (i.opcode_length)
10178 {
10179 case 2:
	      /* Put out the high byte first: can't use md_number_to_chars,
		 which would emit the bytes in little-endian order.  */
10181 *p++ = (i.tm.base_opcode >> 8) & 0xff;
10182 /* Fall through. */
10183 case 1:
10184 *p = i.tm.base_opcode & 0xff;
10185 break;
10186 default:
10187 abort ();
10188 break;
10189 }
10191 }
10192
10193 /* Now the modrm byte and sib byte (if present). */
10194 if (i.tm.opcode_modifier.modrm)
10195 {
10196 frag_opcode_byte ((i.rm.regmem << 0)
10197 | (i.rm.reg << 3)
10198 | (i.rm.mode << 6));
	  /* If i.rm.regmem == ESP (4)
	     && i.rm.mode != (Register mode)
	     && not 16 bit
	     ==> need a SIB byte.  */
10203 if (i.rm.regmem == ESCAPE_TO_TWO_BYTE_ADDRESSING
10204 && i.rm.mode != 3
10205 && !(i.base_reg && i.base_reg->reg_type.bitfield.word))
10206 frag_opcode_byte ((i.sib.base << 0)
10207 | (i.sib.index << 3)
10208 | (i.sib.scale << 6));
10209 }
10210
10211 if (i.disp_operands)
10212 output_disp (insn_start_frag, insn_start_off);
10213
10214 if (i.imm_operands)
10215 output_imm (insn_start_frag, insn_start_off);
10216
10217 /*
10218 * frag_now_fix () returning plain abs_section_offset when we're in the
10219 * absolute section, and abs_section_offset not getting updated as data
10220 * gets added to the frag breaks the logic below.
10221 */
10222 if (now_seg != absolute_section)
10223 {
10224 j = encoding_length (insn_start_frag, insn_start_off, frag_more (0));
10225 if (j > 15)
10226 as_warn (_("instruction length of %u bytes exceeds the limit of 15"),
10227 j);
10228 else if (fragP)
10229 {
10230 /* NB: Don't add prefix with GOTPC relocation since
10231 output_disp() above depends on the fixed encoding
10232 length. Can't add prefix with TLS relocation since
10233 it breaks TLS linker optimization. */
10234 unsigned int max = i.has_gotpc_tls_reloc ? 0 : 15 - j;
10235 /* Prefix count on the current instruction. */
10236 unsigned int count = i.vex.length;
10237 unsigned int k;
10238 for (k = 0; k < ARRAY_SIZE (i.prefix); k++)
10239 /* REX byte is encoded in VEX/EVEX prefix. */
10240 if (i.prefix[k] && (k != REX_PREFIX || !i.vex.length))
10241 count++;
10242
10243 /* Count prefixes for extended opcode maps. */
10244 if (!i.vex.length)
10245 switch (i.tm.opcode_space)
10246 {
10247 case SPACE_BASE:
10248 break;
10249 case SPACE_0F:
10250 count++;
10251 break;
10252 case SPACE_0F38:
10253 case SPACE_0F3A:
10254 count += 2;
10255 break;
10256 default:
10257 abort ();
10258 }
10259
10260 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype)
10261 == BRANCH_PREFIX)
10262 {
10263 /* Set the maximum prefix size in BRANCH_PREFIX
10264 frag. */
10265 if (fragP->tc_frag_data.max_bytes > max)
10266 fragP->tc_frag_data.max_bytes = max;
10267 if (fragP->tc_frag_data.max_bytes > count)
10268 fragP->tc_frag_data.max_bytes -= count;
10269 else
10270 fragP->tc_frag_data.max_bytes = 0;
10271 }
10272 else
10273 {
10274 /* Remember the maximum prefix size in FUSED_JCC_PADDING
10275 frag. */
10276 unsigned int max_prefix_size;
10277 if (align_branch_prefix_size > max)
10278 max_prefix_size = max;
10279 else
10280 max_prefix_size = align_branch_prefix_size;
10281 if (max_prefix_size > count)
10282 fragP->tc_frag_data.max_prefix_length
10283 = max_prefix_size - count;
10284 }
10285
10286 /* Use existing segment prefix if possible. Use CS
10287 segment prefix in 64-bit mode. In 32-bit mode, use SS
10288 segment prefix with ESP/EBP base register and use DS
10289 segment prefix without ESP/EBP base register. */
10290 if (i.prefix[SEG_PREFIX])
10291 fragP->tc_frag_data.default_prefix = i.prefix[SEG_PREFIX];
10292 else if (flag_code == CODE_64BIT)
10293 fragP->tc_frag_data.default_prefix = CS_PREFIX_OPCODE;
10294 else if (i.base_reg
10295 && (i.base_reg->reg_num == 4
10296 || i.base_reg->reg_num == 5))
10297 fragP->tc_frag_data.default_prefix = SS_PREFIX_OPCODE;
10298 else
10299 fragP->tc_frag_data.default_prefix = DS_PREFIX_OPCODE;
10300 }
10301 }
10302 }
10303
10304 /* NB: Don't work with COND_JUMP86 without i386. */
10305 if (align_branch_power
10306 && now_seg != absolute_section
10307 && cpu_arch_flags.bitfield.cpui386)
10308 {
10309 /* Terminate each frag so that we can add prefix and check for
10310 fused jcc. */
10311 frag_wane (frag_now);
10312 frag_new (0);
10313 }
10314
10315 #ifdef DEBUG386
10316 if (flag_debug)
10317 {
10318 pi ("" /*line*/, &i);
10319 }
10320 #endif /* DEBUG386 */
10321 }
10322
10323 /* Return the size of the displacement operand N. */
10324
10325 static int
10326 disp_size (unsigned int n)
10327 {
10328 int size = 4;
10329
10330 if (i.types[n].bitfield.disp64)
10331 size = 8;
10332 else if (i.types[n].bitfield.disp8)
10333 size = 1;
10334 else if (i.types[n].bitfield.disp16)
10335 size = 2;
10336 return size;
10337 }
10338
10339 /* Return the size of the immediate operand N. */
10340
10341 static int
10342 imm_size (unsigned int n)
10343 {
10344 int size = 4;
10345 if (i.types[n].bitfield.imm64)
10346 size = 8;
10347 else if (i.types[n].bitfield.imm8 || i.types[n].bitfield.imm8s)
10348 size = 1;
10349 else if (i.types[n].bitfield.imm16)
10350 size = 2;
10351 return size;
10352 }
10353
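/* Emit displacement bytes, or the fixups standing in for them, for every
   displacement operand of the current insn.  */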
10354 static void
10355 output_disp (fragS *insn_start_frag, offsetT insn_start_off)
10356 {
10357 char *p;
10358 unsigned int n;
10359
10360 for (n = 0; n < i.operands; n++)
10361 {
10362 if (operand_type_check (i.types[n], disp))
10363 {
10364 int size = disp_size (n);
10365
10366 if (now_seg == absolute_section)
10367 abs_section_offset += size;
10368 else if (i.op[n].disps->X_op == O_constant)
10369 {
10370 offsetT val = i.op[n].disps->X_add_number;
10371
10372 val = offset_in_range (val >> (size == 1 ? i.memshift : 0),
10373 size);
10374 p = frag_more (size);
10375 md_number_to_chars (p, val, size);
10376 }
10377 else
10378 {
10379 enum bfd_reloc_code_real reloc_type;
10380 bool pcrel = (i.flags[n] & Operand_PCrel) != 0;
10381 bool sign = (flag_code == CODE_64BIT && size == 4
10382 && (!want_disp32 (&i.tm)
10383 || (i.tm.opcode_modifier.jump && !i.jumpabsolute
10384 && !i.types[n].bitfield.baseindex)))
10385 || pcrel;
10386 fixS *fixP;
10387
10388 /* We can't have 8 bit displacement here. */
10389 gas_assert (!i.types[n].bitfield.disp8);
10390
	      /* The PC relative address is computed relative
		 to the instruction boundary, so if immediate
		 fields follow, we need to adjust the value.  */
10394 if (pcrel && i.imm_operands)
10395 {
10396 unsigned int n1;
10397 int sz = 0;
10398
10399 for (n1 = 0; n1 < i.operands; n1++)
10400 if (operand_type_check (i.types[n1], imm))
10401 {
10402 /* Only one immediate is allowed for PC
10403 relative address, except with .insn. */
10404 gas_assert (sz == 0 || dot_insn ());
10405 sz += imm_size (n1);
10406 }
10407 /* We should find at least one immediate. */
10408 gas_assert (sz != 0);
10409 i.op[n].disps->X_add_number -= sz;
10410 }
10411
10412 p = frag_more (size);
10413 reloc_type = reloc (size, pcrel, sign, i.reloc[n]);
10414 if (GOT_symbol
10415 && GOT_symbol == i.op[n].disps->X_add_symbol
10416 && (((reloc_type == BFD_RELOC_32
10417 || reloc_type == BFD_RELOC_X86_64_32S
10418 || (reloc_type == BFD_RELOC_64
10419 && object_64bit))
10420 && (i.op[n].disps->X_op == O_symbol
10421 || (i.op[n].disps->X_op == O_add
10422 && ((symbol_get_value_expression
10423 (i.op[n].disps->X_op_symbol)->X_op)
10424 == O_subtract))))
10425 || reloc_type == BFD_RELOC_32_PCREL))
10426 {
10427 if (!object_64bit)
10428 {
10429 reloc_type = BFD_RELOC_386_GOTPC;
10430 i.has_gotpc_tls_reloc = true;
10431 i.op[n].disps->X_add_number +=
10432 encoding_length (insn_start_frag, insn_start_off, p);
10433 }
10434 else if (reloc_type == BFD_RELOC_64)
10435 reloc_type = BFD_RELOC_X86_64_GOTPC64;
10436 else
10437 /* Don't do the adjustment for x86-64, as there
10438 the pcrel addressing is relative to the _next_
10439 insn, and that is taken care of in other code. */
10440 reloc_type = BFD_RELOC_X86_64_GOTPC32;
10441 }
10442 else if (align_branch_power)
10443 {
10444 switch (reloc_type)
10445 {
10446 case BFD_RELOC_386_TLS_GD:
10447 case BFD_RELOC_386_TLS_LDM:
10448 case BFD_RELOC_386_TLS_IE:
10449 case BFD_RELOC_386_TLS_IE_32:
10450 case BFD_RELOC_386_TLS_GOTIE:
10451 case BFD_RELOC_386_TLS_GOTDESC:
10452 case BFD_RELOC_386_TLS_DESC_CALL:
10453 case BFD_RELOC_X86_64_TLSGD:
10454 case BFD_RELOC_X86_64_TLSLD:
10455 case BFD_RELOC_X86_64_GOTTPOFF:
10456 case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
10457 case BFD_RELOC_X86_64_TLSDESC_CALL:
10458 i.has_gotpc_tls_reloc = true;
10459 default:
10460 break;
10461 }
10462 }
10463 fixP = fix_new_exp (frag_now, p - frag_now->fr_literal,
10464 size, i.op[n].disps, pcrel,
10465 reloc_type);
10466
10467 if (flag_code == CODE_64BIT && size == 4 && pcrel
10468 && !i.prefix[ADDR_PREFIX])
10469 fixP->fx_signed = 1;
10470
10471 /* Check for "call/jmp *mem", "mov mem, %reg",
10472 "test %reg, mem" and "binop mem, %reg" where binop
10473 is one of adc, add, and, cmp, or, sbb, sub, xor
10474 instructions without data prefix. Always generate
10475 R_386_GOT32X for "sym*GOT" operand in 32-bit mode. */
10476 if (i.prefix[DATA_PREFIX] == 0
10477 && (generate_relax_relocations
10478 || (!object_64bit
10479 && i.rm.mode == 0
10480 && i.rm.regmem == 5))
10481 && (i.rm.mode == 2
10482 || (i.rm.mode == 0 && i.rm.regmem == 5))
10483 && i.tm.opcode_space == SPACE_BASE
10484 && ((i.operands == 1
10485 && i.tm.base_opcode == 0xff
10486 && (i.rm.reg == 2 || i.rm.reg == 4))
10487 || (i.operands == 2
10488 && (i.tm.base_opcode == 0x8b
10489 || i.tm.base_opcode == 0x85
10490 || (i.tm.base_opcode & ~0x38) == 0x03))))
10491 {
10492 if (object_64bit)
10493 {
10494 fixP->fx_tcbit = i.rex != 0;
10495 if (i.base_reg
10496 && (i.base_reg->reg_num == RegIP))
10497 fixP->fx_tcbit2 = 1;
10498 }
10499 else
10500 fixP->fx_tcbit2 = 1;
10501 }
10502 }
10503 }
10504 }
10505 }
10506
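/* Emit immediate bytes, or the fixups standing in for them, for every
   immediate operand of the current insn.  */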
10507 static void
10508 output_imm (fragS *insn_start_frag, offsetT insn_start_off)
10509 {
10510 char *p;
10511 unsigned int n;
10512
10513 for (n = 0; n < i.operands; n++)
10514 {
10515 if (operand_type_check (i.types[n], imm))
10516 {
10517 int size = imm_size (n);
10518
10519 if (now_seg == absolute_section)
10520 abs_section_offset += size;
10521 else if (i.op[n].imms->X_op == O_constant)
10522 {
10523 offsetT val;
10524
10525 val = offset_in_range (i.op[n].imms->X_add_number,
10526 size);
10527 p = frag_more (size);
10528 md_number_to_chars (p, val, size);
10529 }
10530 else
10531 {
	      /* Not absolute_section.
		 Need a 32-bit fixup (don't support 8-bit
		 non-absolute immediates).  Try to support other
		 sizes ...  */
10536 enum bfd_reloc_code_real reloc_type;
10537 int sign;
10538
10539 if (i.types[n].bitfield.imm32s
10540 && (i.suffix == QWORD_MNEM_SUFFIX
10541 || (!i.suffix && i.tm.opcode_modifier.no_lsuf)
10542 || (i.prefix[REX_PREFIX] & REX_W)
10543 || dot_insn ()))
10544 sign = 1;
10545 else
10546 sign = 0;
10547
10548 p = frag_more (size);
10549 reloc_type = reloc (size, 0, sign, i.reloc[n]);
10550
10551 /* This is tough to explain. We end up with this one if we
10552 * have operands that look like
10553 * "_GLOBAL_OFFSET_TABLE_+[.-.L284]". The goal here is to
10554 * obtain the absolute address of the GOT, and it is strongly
10555 * preferable from a performance point of view to avoid using
10556 * a runtime relocation for this. The actual sequence of
	       * instructions often looks something like:
10558 *
10559 * call .L66
10560 * .L66:
10561 * popl %ebx
10562 * addl $_GLOBAL_OFFSET_TABLE_+[.-.L66],%ebx
10563 *
10564 * The call and pop essentially return the absolute address
10565 * of the label .L66 and store it in %ebx. The linker itself
10566 * will ultimately change the first operand of the addl so
10567 * that %ebx points to the GOT, but to keep things simple, the
10568 * .o file must have this operand set so that it generates not
10569 * the absolute address of .L66, but the absolute address of
	       * itself.  This allows the linker to simply treat a GOTPC
	       * relocation as asking for a pcrel offset to the GOT to be
10572 * added in, and the addend of the relocation is stored in the
10573 * operand field for the instruction itself.
10574 *
10575 * Our job here is to fix the operand so that it would add
10576 * the correct offset so that %ebx would point to itself. The
10577 * thing that is tricky is that .-.L66 will point to the
10578 * beginning of the instruction, so we need to further modify
10579 * the operand so that it will point to itself. There are
10580 * other cases where you have something like:
10581 *
10582 * .long $_GLOBAL_OFFSET_TABLE_+[.-.L66]
10583 *
10584 * and here no correction would be required. Internally in
10585 * the assembler we treat operands of this form as not being
10586 * pcrel since the '.' is explicitly mentioned, and I wonder
10587 * whether it would simplify matters to do it this way. Who
10588 * knows. In earlier versions of the PIC patches, the
10589 * pcrel_adjust field was used to store the correction, but
10590 * since the expression is not pcrel, I felt it would be
10591 * confusing to do it this way. */
10592
10593 if ((reloc_type == BFD_RELOC_32
10594 || reloc_type == BFD_RELOC_X86_64_32S
10595 || reloc_type == BFD_RELOC_64)
10596 && GOT_symbol
10597 && GOT_symbol == i.op[n].imms->X_add_symbol
10598 && (i.op[n].imms->X_op == O_symbol
10599 || (i.op[n].imms->X_op == O_add
10600 && ((symbol_get_value_expression
10601 (i.op[n].imms->X_op_symbol)->X_op)
10602 == O_subtract))))
10603 {
10604 if (!object_64bit)
10605 reloc_type = BFD_RELOC_386_GOTPC;
10606 else if (size == 4)
10607 reloc_type = BFD_RELOC_X86_64_GOTPC32;
10608 else if (size == 8)
10609 reloc_type = BFD_RELOC_X86_64_GOTPC64;
10610 i.has_gotpc_tls_reloc = true;
10611 i.op[n].imms->X_add_number +=
10612 encoding_length (insn_start_frag, insn_start_off, p);
10613 }
10614 fix_new_exp (frag_now, p - frag_now->fr_literal, size,
10615 i.op[n].imms, 0, reloc_type);
10616 }
10617 }
10618 }
10619 }
10620 \f
10621 /* x86_cons_fix_new is called via the expression parsing code when a
10622 reloc is needed. We use this hook to get the correct .got reloc. */
10623 static int cons_sign = -1;
10624
10625 void
10626 x86_cons_fix_new (fragS *frag, unsigned int off, unsigned int len,
10627 expressionS *exp, bfd_reloc_code_real_type r)
10628 {
10629 r = reloc (len, 0, cons_sign, r);
10630
10631 #ifdef TE_PE
10632 if (exp->X_op == O_secrel)
10633 {
10634 exp->X_op = O_symbol;
10635 r = BFD_RELOC_32_SECREL;
10636 }
10637 else if (exp->X_op == O_secidx)
10638 r = BFD_RELOC_16_SECIDX;
10639 #endif
10640
10641 fix_new_exp (frag, off, len, exp, 0, r);
10642 }
10643
10644 /* Export the ABI address size for use by TC_ADDRESS_BYTES for the
10645 purpose of the `.dc.a' internal pseudo-op. */
10646
10647 int
10648 x86_address_bytes (void)
10649 {
10650 if ((stdoutput->arch_info->mach & bfd_mach_x64_32))
10651 return 4;
10652 return stdoutput->arch_info->bits_per_address / 8;
10653 }
10654
10655 #if (!(defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) || defined (OBJ_MACH_O)) \
10656 || defined (LEX_AT)) && !defined (TE_PE)
10657 # define lex_got(reloc, adjust, types) NULL
10658 #else
10659 /* Parse operands of the form
10660 <symbol>@GOTOFF+<nnn>
10661 and similar .plt or .got references.
10662
10663 If we find one, set up the correct relocation in RELOC and copy the
10664 input string, minus the `@GOTOFF' into a malloc'd buffer for
10665 parsing by the calling routine. Return this buffer, and if ADJUST
10666 is non-null set it to the length of the string we removed from the
10667 input line. Otherwise return NULL. */
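/* For example, given the input "foo@GOTOFF+4" the returned buffer holds
   "foo +4" (the reloc token replaced by a blank), *REL is set to the
   matching GOTOFF relocation, and *ADJUST to 6, the net number of input
   characters removed.  */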
10668 static char *
10669 lex_got (enum bfd_reloc_code_real *rel,
10670 int *adjust,
10671 i386_operand_type *types)
10672 {
10673 /* Some of the relocations depend on the size of what field is to
10674 be relocated. But in our callers i386_immediate and i386_displacement
10675 we don't yet know the operand size (this will be set by insn
10676 matching). Hence we record the word32 relocation here,
10677 and adjust the reloc according to the real size in reloc(). */
10678 static const struct
10679 {
10680 const char *str;
10681 int len;
10682 const enum bfd_reloc_code_real rel[2];
10683 const i386_operand_type types64;
10684 bool need_GOT_symbol;
10685 }
10686 gotrel[] =
10687 {
10688
10689 #define OPERAND_TYPE_IMM32_32S_DISP32 { .bitfield = \
10690 { .imm32 = 1, .imm32s = 1, .disp32 = 1 } }
10691 #define OPERAND_TYPE_IMM32_32S_64_DISP32 { .bitfield = \
10692 { .imm32 = 1, .imm32s = 1, .imm64 = 1, .disp32 = 1 } }
10693 #define OPERAND_TYPE_IMM32_32S_64_DISP32_64 { .bitfield = \
10694 { .imm32 = 1, .imm32s = 1, .imm64 = 1, .disp32 = 1, .disp64 = 1 } }
10695 #define OPERAND_TYPE_IMM64_DISP64 { .bitfield = \
10696 { .imm64 = 1, .disp64 = 1 } }
10697
10698 #ifndef TE_PE
10699 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
10700 { STRING_COMMA_LEN ("SIZE"), { BFD_RELOC_SIZE32,
10701 BFD_RELOC_SIZE32 },
10702 { .bitfield = { .imm32 = 1, .imm64 = 1 } }, false },
10703 #endif
10704 { STRING_COMMA_LEN ("PLTOFF"), { _dummy_first_bfd_reloc_code_real,
10705 BFD_RELOC_X86_64_PLTOFF64 },
10706 { .bitfield = { .imm64 = 1 } }, true },
10707 { STRING_COMMA_LEN ("PLT"), { BFD_RELOC_386_PLT32,
10708 BFD_RELOC_X86_64_PLT32 },
10709 OPERAND_TYPE_IMM32_32S_DISP32, false },
10710 { STRING_COMMA_LEN ("GOTPLT"), { _dummy_first_bfd_reloc_code_real,
10711 BFD_RELOC_X86_64_GOTPLT64 },
10712 OPERAND_TYPE_IMM64_DISP64, true },
10713 { STRING_COMMA_LEN ("GOTOFF"), { BFD_RELOC_386_GOTOFF,
10714 BFD_RELOC_X86_64_GOTOFF64 },
10715 OPERAND_TYPE_IMM64_DISP64, true },
10716 { STRING_COMMA_LEN ("GOTPCREL"), { _dummy_first_bfd_reloc_code_real,
10717 BFD_RELOC_X86_64_GOTPCREL },
10718 OPERAND_TYPE_IMM32_32S_DISP32, true },
10719 { STRING_COMMA_LEN ("TLSGD"), { BFD_RELOC_386_TLS_GD,
10720 BFD_RELOC_X86_64_TLSGD },
10721 OPERAND_TYPE_IMM32_32S_DISP32, true },
10722 { STRING_COMMA_LEN ("TLSLDM"), { BFD_RELOC_386_TLS_LDM,
10723 _dummy_first_bfd_reloc_code_real },
10724 OPERAND_TYPE_NONE, true },
10725 { STRING_COMMA_LEN ("TLSLD"), { _dummy_first_bfd_reloc_code_real,
10726 BFD_RELOC_X86_64_TLSLD },
10727 OPERAND_TYPE_IMM32_32S_DISP32, true },
10728 { STRING_COMMA_LEN ("GOTTPOFF"), { BFD_RELOC_386_TLS_IE_32,
10729 BFD_RELOC_X86_64_GOTTPOFF },
10730 OPERAND_TYPE_IMM32_32S_DISP32, true },
10731 { STRING_COMMA_LEN ("TPOFF"), { BFD_RELOC_386_TLS_LE_32,
10732 BFD_RELOC_X86_64_TPOFF32 },
10733 OPERAND_TYPE_IMM32_32S_64_DISP32_64, true },
10734 { STRING_COMMA_LEN ("NTPOFF"), { BFD_RELOC_386_TLS_LE,
10735 _dummy_first_bfd_reloc_code_real },
10736 OPERAND_TYPE_NONE, true },
10737 { STRING_COMMA_LEN ("DTPOFF"), { BFD_RELOC_386_TLS_LDO_32,
10738 BFD_RELOC_X86_64_DTPOFF32 },
10739 OPERAND_TYPE_IMM32_32S_64_DISP32_64, true },
10740 { STRING_COMMA_LEN ("GOTNTPOFF"),{ BFD_RELOC_386_TLS_GOTIE,
10741 _dummy_first_bfd_reloc_code_real },
10742 OPERAND_TYPE_NONE, true },
10743 { STRING_COMMA_LEN ("INDNTPOFF"),{ BFD_RELOC_386_TLS_IE,
10744 _dummy_first_bfd_reloc_code_real },
10745 OPERAND_TYPE_NONE, true },
10746 { STRING_COMMA_LEN ("GOT"), { BFD_RELOC_386_GOT32,
10747 BFD_RELOC_X86_64_GOT32 },
10748 OPERAND_TYPE_IMM32_32S_64_DISP32, true },
10749 { STRING_COMMA_LEN ("TLSDESC"), { BFD_RELOC_386_TLS_GOTDESC,
10750 BFD_RELOC_X86_64_GOTPC32_TLSDESC },
10751 OPERAND_TYPE_IMM32_32S_DISP32, true },
10752 { STRING_COMMA_LEN ("TLSCALL"), { BFD_RELOC_386_TLS_DESC_CALL,
10753 BFD_RELOC_X86_64_TLSDESC_CALL },
10754 OPERAND_TYPE_IMM32_32S_DISP32, true },
10755 #else /* TE_PE */
10756 { STRING_COMMA_LEN ("SECREL32"), { BFD_RELOC_32_SECREL,
10757 BFD_RELOC_32_SECREL },
10758 OPERAND_TYPE_IMM32_32S_64_DISP32_64, false },
10759 #endif
10760
10761 #undef OPERAND_TYPE_IMM32_32S_DISP32
10762 #undef OPERAND_TYPE_IMM32_32S_64_DISP32
10763 #undef OPERAND_TYPE_IMM32_32S_64_DISP32_64
10764 #undef OPERAND_TYPE_IMM64_DISP64
10765
10766 };
10767 char *cp;
10768 unsigned int j;
10769
10770 #if defined (OBJ_MAYBE_ELF) && !defined (TE_PE)
10771 if (!IS_ELF)
10772 return NULL;
10773 #endif
10774
10775 for (cp = input_line_pointer; *cp != '@'; cp++)
10776 if (is_end_of_line[(unsigned char) *cp] || *cp == ',')
10777 return NULL;
10778
10779 for (j = 0; j < ARRAY_SIZE (gotrel); j++)
10780 {
10781 int len = gotrel[j].len;
10782 if (strncasecmp (cp + 1, gotrel[j].str, len) == 0)
10783 {
10784 if (gotrel[j].rel[object_64bit] != 0)
10785 {
10786 int first, second;
10787 char *tmpbuf, *past_reloc;
10788
10789 *rel = gotrel[j].rel[object_64bit];
10790
10791 if (types)
10792 {
10793 if (flag_code != CODE_64BIT)
10794 {
10795 types->bitfield.imm32 = 1;
10796 types->bitfield.disp32 = 1;
10797 }
10798 else
10799 *types = gotrel[j].types64;
10800 }
10801
10802 if (gotrel[j].need_GOT_symbol && GOT_symbol == NULL)
10803 GOT_symbol = symbol_find_or_make (GLOBAL_OFFSET_TABLE_NAME);
10804
10805 /* The length of the first part of our input line. */
10806 first = cp - input_line_pointer;
10807
10808 /* The second part goes from after the reloc token until
10809 (and including) an end_of_line char or comma. */
10810 past_reloc = cp + 1 + len;
10811 cp = past_reloc;
10812 while (!is_end_of_line[(unsigned char) *cp] && *cp != ',')
10813 ++cp;
10814 second = cp + 1 - past_reloc;
10815
10816 /* Allocate and copy string. The trailing NUL shouldn't
10817 be necessary, but be safe. */
10818 tmpbuf = XNEWVEC (char, first + second + 2);
10819 memcpy (tmpbuf, input_line_pointer, first);
10820 if (second != 0 && *past_reloc != ' ')
10821 /* Replace the relocation token with ' ', so that
10822 errors like foo@GOTOFF1 will be detected. */
10823 tmpbuf[first++] = ' ';
10824 else
10825 /* Increment length by 1 if the relocation token is
10826 removed. */
10827 len++;
10828 if (adjust)
10829 *adjust = len;
10830 memcpy (tmpbuf + first, past_reloc, second);
10831 tmpbuf[first + second] = '\0';
10832 return tmpbuf;
10833 }
10834
10835 as_bad (_("@%s reloc is not supported with %d-bit output format"),
10836 gotrel[j].str, 1 << (5 + object_64bit));
10837 return NULL;
10838 }
10839 }
10840
10841 /* Might be a symbol version string. Don't as_bad here. */
10842 return NULL;
10843 }
10844 #endif
10845
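/* Parse the expression of a data directive (e.g. ".long foo@GOTOFF"),
   returning the relocation implied by any @-suffix, or NO_RELOC.  */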
10846 bfd_reloc_code_real_type
10847 x86_cons (expressionS *exp, int size)
10848 {
10849 bfd_reloc_code_real_type got_reloc = NO_RELOC;
10850
10851 intel_syntax = -intel_syntax;
10852 exp->X_md = 0;
10853 expr_mode = expr_operator_none;
10854
10855 #if ((defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)) \
10856 && !defined (LEX_AT)) \
10857 || defined (TE_PE)
10858 if (size == 4 || (object_64bit && size == 8))
10859 {
10860 /* Handle @GOTOFF and the like in an expression. */
10861 char *save;
10862 char *gotfree_input_line;
10863 int adjust = 0;
10864
10865 save = input_line_pointer;
10866 gotfree_input_line = lex_got (&got_reloc, &adjust, NULL);
10867 if (gotfree_input_line)
10868 input_line_pointer = gotfree_input_line;
10869
10870 expression (exp);
10871
10872 if (gotfree_input_line)
10873 {
10874 /* expression () has merrily parsed up to the end of line,
10875 or a comma - in the wrong buffer. Transfer how far
10876 input_line_pointer has moved to the right buffer. */
10877 input_line_pointer = (save
10878 + (input_line_pointer - gotfree_input_line)
10879 + adjust);
10880 free (gotfree_input_line);
10881 if (exp->X_op == O_constant
10882 || exp->X_op == O_absent
10883 || exp->X_op == O_illegal
10884 || exp->X_op == O_register
10885 || exp->X_op == O_big)
10886 {
10887 char c = *input_line_pointer;
10888 *input_line_pointer = 0;
10889 as_bad (_("missing or invalid expression `%s'"), save);
10890 *input_line_pointer = c;
10891 }
10892 else if ((got_reloc == BFD_RELOC_386_PLT32
10893 || got_reloc == BFD_RELOC_X86_64_PLT32)
10894 && exp->X_op != O_symbol)
10895 {
10896 char c = *input_line_pointer;
10897 *input_line_pointer = 0;
10898 as_bad (_("invalid PLT expression `%s'"), save);
10899 *input_line_pointer = c;
10900 }
10901 }
10902 }
10903 else
10904 #endif
10905 expression (exp);
10906
10907 intel_syntax = -intel_syntax;
10908
10909 if (intel_syntax)
10910 i386_intel_simplify (exp);
10911
10912 /* If not 64bit, massage value, to account for wraparound when !BFD64. */
10913 if (size <= 4 && expr_mode == expr_operator_present
10914 && exp->X_op == O_constant && !object_64bit)
10915 exp->X_add_number = extend_to_32bit_address (exp->X_add_number);
10916
10917 return got_reloc;
10918 }
10919
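/* Variant of cons() which, for 64-bit object files, requests signed
   relocations; presumably used by pseudo-ops like "slong".  */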
10920 static void
10921 signed_cons (int size)
10922 {
10923 if (object_64bit)
10924 cons_sign = 1;
10925 cons (size);
10926 cons_sign = -1;
10927 }
10928
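/* Handler for the .insn directive, assembling an instruction from an
   explicit encoding specification.  As a rough sketch (examples not
   taken from the testsuite): ".insn 0xc3" emits a lone RET opcode byte,
   while for ".insn 0x0fa2" (CPUID) the leading 0x0f is recognized below
   as an encoding-space byte and re-emitted via the opcode space.  */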
10929 static void
10930 s_insn (int dummy ATTRIBUTE_UNUSED)
10931 {
10932 char mnemonic[MAX_MNEM_SIZE], *line = input_line_pointer, *ptr;
10933 char *saved_ilp = find_end_of_line (line, false), saved_char;
10934 const char *end;
10935 unsigned int j;
10936 valueT val;
10937 bool vex = false, xop = false, evex = false;
10938 static const templates tt = { &i.tm, &i.tm + 1 };
10939
10940 init_globals ();
10941
10942 saved_char = *saved_ilp;
10943 *saved_ilp = 0;
10944
10945 end = parse_insn (line, mnemonic, true);
10946 if (end == NULL)
10947 {
10948 bad:
10949 *saved_ilp = saved_char;
10950 ignore_rest_of_line ();
10951 i.tm.mnem_off = 0;
10952 return;
10953 }
10954 line += end - line;
10955
10956 current_templates = &tt;
10957 i.tm.mnem_off = MN__insn;
10958 i.tm.extension_opcode = None;
10959
10960 if (startswith (line, "VEX")
10961 && (line[3] == '.' || is_space_char (line[3])))
10962 {
10963 vex = true;
10964 line += 3;
10965 }
10966 else if (startswith (line, "XOP") && ISDIGIT (line[3]))
10967 {
10968 char *e;
10969 unsigned long n = strtoul (line + 3, &e, 16);
10970
10971 if (e == line + 5 && n >= 0x08 && n <= 0x1f
10972 && (*e == '.' || is_space_char (*e)))
10973 {
10974 xop = true;
10975 /* Arrange for build_vex_prefix() to emit 0x8f. */
10976 i.tm.opcode_space = SPACE_XOP08;
10977 i.insn_opcode_space = n;
10978 line = e;
10979 }
10980 }
10981 else if (startswith (line, "EVEX")
10982 && (line[4] == '.' || is_space_char (line[4])))
10983 {
10984 evex = true;
10985 line += 4;
10986 }
10987
10988 if (vex || xop
10989 ? i.vec_encoding == vex_encoding_evex
10990 : evex
10991 ? i.vec_encoding == vex_encoding_vex
10992 || i.vec_encoding == vex_encoding_vex3
10993 : i.vec_encoding != vex_encoding_default)
10994 {
10995 as_bad (_("pseudo-prefix conflicts with encoding specifier"));
10996 goto bad;
10997 }
10998
10999 if (line > end && i.vec_encoding == vex_encoding_default)
11000 i.vec_encoding = evex ? vex_encoding_evex : vex_encoding_vex;
11001
11002 if (i.vec_encoding != vex_encoding_default)
11003 {
11004 /* Only address size and segment override prefixes are permitted with
11005 VEX/XOP/EVEX encodings. */
11006 const unsigned char *p = i.prefix;
11007
11008 for (j = 0; j < ARRAY_SIZE (i.prefix); ++j, ++p)
11009 {
11010 if (!*p)
11011 continue;
11012
11013 switch (j)
11014 {
11015 case SEG_PREFIX:
11016 case ADDR_PREFIX:
11017 break;
11018 default:
11019 as_bad (_("illegal prefix used with VEX/XOP/EVEX"));
11020 goto bad;
11021 }
11022 }
11023 }
11024
11025 if (line > end && *line == '.')
11026 {
11027 /* Length specifier (VEX.L, XOP.L, EVEX.L'L). */
11028 switch (line[1])
11029 {
11030 case 'L':
11031 switch (line[2])
11032 {
11033 case '0':
11034 if (evex)
11035 i.tm.opcode_modifier.evex = EVEX128;
11036 else
11037 i.tm.opcode_modifier.vex = VEX128;
11038 break;
11039
11040 case '1':
11041 if (evex)
11042 i.tm.opcode_modifier.evex = EVEX256;
11043 else
11044 i.tm.opcode_modifier.vex = VEX256;
11045 break;
11046
11047 case '2':
11048 if (evex)
11049 i.tm.opcode_modifier.evex = EVEX512;
11050 break;
11051
11052 case '3':
11053 if (evex)
11054 i.tm.opcode_modifier.evex = EVEX_L3;
11055 break;
11056
11057 case 'I':
11058 if (line[3] == 'G')
11059 {
11060 if (evex)
11061 i.tm.opcode_modifier.evex = EVEXLIG;
11062 else
11063 i.tm.opcode_modifier.vex = VEXScalar; /* LIG */
11064 ++line;
11065 }
11066 break;
11067 }
11068
11069 if (i.tm.opcode_modifier.vex || i.tm.opcode_modifier.evex)
11070 line += 3;
11071 break;
11072
11073 case '1':
11074 if (line[2] == '2' && line[3] == '8')
11075 {
11076 if (evex)
11077 i.tm.opcode_modifier.evex = EVEX128;
11078 else
11079 i.tm.opcode_modifier.vex = VEX128;
11080 line += 4;
11081 }
11082 break;
11083
11084 case '2':
11085 if (line[2] == '5' && line[3] == '6')
11086 {
11087 if (evex)
11088 i.tm.opcode_modifier.evex = EVEX256;
11089 else
11090 i.tm.opcode_modifier.vex = VEX256;
11091 line += 4;
11092 }
11093 break;
11094
11095 case '5':
11096 if (evex && line[2] == '1' && line[3] == '2')
11097 {
11098 i.tm.opcode_modifier.evex = EVEX512;
11099 line += 4;
11100 }
11101 break;
11102 }
11103 }
11104
11105 if (line > end && *line == '.')
11106 {
      /* Embedded prefix (VEX.pp, XOP.pp, EVEX.pp).  */
11108 switch (line[1])
11109 {
11110 case 'N':
11111 if (line[2] == 'P')
11112 line += 3;
11113 break;
11114
11115 case '6':
11116 if (line[2] == '6')
11117 {
11118 i.tm.opcode_modifier.opcodeprefix = PREFIX_0X66;
11119 line += 3;
11120 }
11121 break;
11122
11123 case 'F': case 'f':
11124 if (line[2] == '3')
11125 {
11126 i.tm.opcode_modifier.opcodeprefix = PREFIX_0XF3;
11127 line += 3;
11128 }
11129 else if (line[2] == '2')
11130 {
11131 i.tm.opcode_modifier.opcodeprefix = PREFIX_0XF2;
11132 line += 3;
11133 }
11134 break;
11135 }
11136 }
11137
11138 if (line > end && !xop && *line == '.')
11139 {
11140 /* Encoding space (VEX.mmmmm, EVEX.mmmm). */
11141 switch (line[1])
11142 {
11143 case '0':
11144 if (TOUPPER (line[2]) != 'F')
11145 break;
11146 if (line[3] == '.' || is_space_char (line[3]))
11147 {
11148 i.insn_opcode_space = SPACE_0F;
11149 line += 3;
11150 }
11151 else if (line[3] == '3'
11152 && (line[4] == '8' || TOUPPER (line[4]) == 'A')
11153 && (line[5] == '.' || is_space_char (line[5])))
11154 {
11155 i.insn_opcode_space = line[4] == '8' ? SPACE_0F38 : SPACE_0F3A;
11156 line += 5;
11157 }
11158 break;
11159
11160 case 'M':
11161 if (ISDIGIT (line[2]) && line[2] != '0')
11162 {
11163 char *e;
11164 unsigned long n = strtoul (line + 2, &e, 10);
11165
11166 if (n <= (evex ? 15 : 31)
11167 && (*e == '.' || is_space_char (*e)))
11168 {
11169 i.insn_opcode_space = n;
11170 line = e;
11171 }
11172 }
11173 break;
11174 }
11175 }
11176
11177 if (line > end && *line == '.' && line[1] == 'W')
11178 {
11179 /* VEX.W, XOP.W, EVEX.W */
11180 switch (line[2])
11181 {
11182 case '0':
11183 i.tm.opcode_modifier.vexw = VEXW0;
11184 break;
11185
11186 case '1':
11187 i.tm.opcode_modifier.vexw = VEXW1;
11188 break;
11189
11190 case 'I':
11191 if (line[3] == 'G')
11192 {
11193 i.tm.opcode_modifier.vexw = VEXWIG;
11194 ++line;
11195 }
11196 break;
11197 }
11198
11199 if (i.tm.opcode_modifier.vexw)
11200 line += 3;
11201 }
11202
11203 if (line > end && *line && !is_space_char (*line))
11204 {
11205 /* Improve diagnostic a little. */
11206 if (*line == '.' && line[1] && !is_space_char (line[1]))
11207 ++line;
11208 goto done;
11209 }
11210
11211 /* Before processing the opcode expression, find trailing "+r" or
11212 "/<digit>" specifiers. */
11213 for (ptr = line; ; ++ptr)
11214 {
11215 unsigned long n;
11216 char *e;
11217
11218 ptr = strpbrk (ptr, "+/,");
11219 if (ptr == NULL || *ptr == ',')
11220 break;
11221
11222 if (*ptr == '+' && ptr[1] == 'r'
11223 && (ptr[2] == ',' || (is_space_char (ptr[2]) && ptr[3] == ',')))
11224 {
11225 *ptr = ' ';
11226 ptr[1] = ' ';
11227 i.short_form = true;
11228 break;
11229 }
11230
11231 if (*ptr == '/' && ISDIGIT (ptr[1])
11232 && (n = strtoul (ptr + 1, &e, 8)) < 8
11233 && e == ptr + 2
11234 && (ptr[2] == ',' || (is_space_char (ptr[2]) && ptr[3] == ',')))
11235 {
11236 *ptr = ' ';
11237 ptr[1] = ' ';
11238 i.tm.extension_opcode = n;
11239 i.tm.opcode_modifier.modrm = 1;
11240 break;
11241 }
11242 }
11243
11244 input_line_pointer = line;
11245 val = get_absolute_expression ();
11246 line = input_line_pointer;
11247
11248 if (i.short_form && (val & 7))
    as_warn (_("`+r' assumes low three opcode bits to be clear"));
11250
11251 for (j = 1; j < sizeof(val); ++j)
11252 if (!(val >> (j * 8)))
11253 break;
11254
11255 /* Trim off a prefix if present. */
11256 if (j > 1 && !vex && !xop && !evex)
11257 {
11258 uint8_t byte = val >> ((j - 1) * 8);
11259
11260 switch (byte)
11261 {
11262 case DATA_PREFIX_OPCODE:
11263 case REPE_PREFIX_OPCODE:
11264 case REPNE_PREFIX_OPCODE:
11265 if (!add_prefix (byte))
11266 goto bad;
11267 val &= ((uint64_t)1 << (--j * 8)) - 1;
11268 break;
11269 }
11270 }
11271
11272 /* Trim off encoding space. */
11273 if (j > 1 && !i.insn_opcode_space && (val >> ((j - 1) * 8)) == 0x0f)
11274 {
11275 uint8_t byte = val >> ((--j - 1) * 8);
11276
11277 i.insn_opcode_space = SPACE_0F;
11278 switch (byte & -(j > 1))
11279 {
11280 case 0x38:
11281 i.insn_opcode_space = SPACE_0F38;
11282 --j;
11283 break;
11284 case 0x3a:
11285 i.insn_opcode_space = SPACE_0F3A;
11286 --j;
11287 break;
11288 }
11289 i.tm.opcode_space = i.insn_opcode_space;
11290 val &= ((uint64_t)1 << (j * 8)) - 1;
11291 }
11292 if (!i.tm.opcode_space && (vex || evex))
11293 /* Arrange for build_vex_prefix() to properly emit 0xC4/0xC5.
11294 Also avoid hitting abort() there or in build_evex_prefix(). */
11295 i.tm.opcode_space = i.insn_opcode_space == SPACE_0F ? SPACE_0F
11296 : SPACE_0F38;
11297
11298 if (j > 2)
11299 {
11300 as_bad (_("opcode residual (%#"PRIx64") too wide"), (uint64_t) val);
11301 goto bad;
11302 }
11303 i.opcode_length = j;
11304
11305 /* Handle operands, if any. */
11306 if (*line == ',')
11307 {
11308 i386_operand_type combined;
11309 expressionS *disp_exp = NULL;
11310 bool changed;
11311
11312 i.memshift = -1;
11313
11314 ptr = parse_operands (line + 1, &i386_mnemonics[MN__insn]);
11315 this_operand = -1;
11316 if (!ptr)
11317 goto bad;
11318 line = ptr;
11319
11320 if (!i.operands)
11321 {
11322 as_bad (_("expecting operand after ','; got nothing"));
11323 goto done;
11324 }
11325
11326 if (i.mem_operands > 1)
11327 {
11328 as_bad (_("too many memory references for `%s'"),
11329 &i386_mnemonics[MN__insn]);
11330 goto done;
11331 }
11332
11333 /* No need to distinguish vex_encoding_evex and vex_encoding_evex512. */
11334 if (i.vec_encoding == vex_encoding_evex512)
11335 i.vec_encoding = vex_encoding_evex;
11336
11337 /* Are we to emit ModR/M encoding? */
11338 if (!i.short_form
11339 && (i.mem_operands
11340 || i.reg_operands > (i.vec_encoding != vex_encoding_default)
11341 || i.tm.extension_opcode != None))
11342 i.tm.opcode_modifier.modrm = 1;
11343
11344 if (!i.tm.opcode_modifier.modrm
11345 && (i.reg_operands
11346 > i.short_form + 0U + (i.vec_encoding != vex_encoding_default)
11347 || i.mem_operands))
11348 {
11349 as_bad (_("too many register/memory operands"));
11350 goto done;
11351 }
11352
11353 /* Enforce certain constraints on operands. */
11354 switch (i.reg_operands + i.mem_operands
11355 + (i.tm.extension_opcode != None))
11356 {
11357 case 0:
11358 if (i.short_form)
11359 {
11360 as_bad (_("too few register/memory operands"));
11361 goto done;
11362 }
11363 /* Fall through. */
11364 case 1:
11365 if (i.tm.opcode_modifier.modrm)
11366 {
11367 as_bad (_("too few register/memory operands"));
11368 goto done;
11369 }
11370 break;
11371
11372 case 2:
11373 break;
11374
11375 case 4:
11376 if (i.imm_operands
11377 && (i.op[0].imms->X_op != O_constant
11378 || !fits_in_imm4 (i.op[0].imms->X_add_number)))
11379 {
11380 as_bad (_("constant doesn't fit in %d bits"), evex ? 3 : 4);
11381 goto done;
11382 }
11383 /* Fall through. */
11384 case 3:
11385 if (i.vec_encoding != vex_encoding_default)
11386 {
11387 i.tm.opcode_modifier.vexvvvv = 1;
11388 break;
11389 }
11390 /* Fall through. */
11391 default:
11392 as_bad (_("too many register/memory operands"));
11393 goto done;
11394 }
11395
11396 /* Bring operands into canonical order (imm, mem, reg). */
11397 do
11398 {
11399 changed = false;
11400
11401 for (j = 1; j < i.operands; ++j)
11402 {
11403 if ((!operand_type_check (i.types[j - 1], imm)
11404 && operand_type_check (i.types[j], imm))
11405 || (i.types[j - 1].bitfield.class != ClassNone
11406 && i.types[j].bitfield.class == ClassNone))
11407 {
11408 swap_2_operands (j - 1, j);
11409 changed = true;
11410 }
11411 }
11412 }
11413 while (changed);
11414
11415 /* For Intel syntax swap the order of register operands. */
11416 if (intel_syntax)
11417 switch (i.reg_operands)
11418 {
11419 case 0:
11420 case 1:
11421 break;
11422
11423 case 4:
11424 swap_2_operands (i.imm_operands + i.mem_operands + 1, i.operands - 2);
11425 /* Fall through. */
11426 case 3:
11427 case 2:
11428 swap_2_operands (i.imm_operands + i.mem_operands, i.operands - 1);
11429 break;
11430
11431 default:
11432 abort ();
11433 }
11434
11435 /* Enforce constraints when using VSIB. */
11436 if (i.index_reg
11437 && (i.index_reg->reg_type.bitfield.xmmword
11438 || i.index_reg->reg_type.bitfield.ymmword
11439 || i.index_reg->reg_type.bitfield.zmmword))
11440 {
11441 if (i.vec_encoding == vex_encoding_default)
11442 {
11443 as_bad (_("VSIB unavailable with legacy encoding"));
11444 goto done;
11445 }
11446
11447 if (i.vec_encoding == vex_encoding_evex
11448 && i.reg_operands > 1)
11449 {
11450 /* We could allow two register operands, encoding the 2nd one in
11451 an 8-bit immediate like for 4-register-operand insns, but that
11452 would require ugly fiddling with process_operands() and/or
11453 build_modrm_byte(). */
11454 as_bad (_("too many register operands with VSIB"));
11455 goto done;
11456 }
11457
11458 i.tm.opcode_modifier.sib = 1;
11459 }
11460
11461 /* Establish operand size encoding. */
11462 operand_type_set (&combined, 0);
11463
11464 for (j = i.imm_operands; j < i.operands; ++j)
11465 {
11466 i.types[j].bitfield.instance = InstanceNone;
11467
11468 if (operand_type_check (i.types[j], disp))
11469 {
11470 i.types[j].bitfield.baseindex = 1;
11471 disp_exp = i.op[j].disps;
11472 }
11473
11474 if (evex && i.types[j].bitfield.baseindex)
11475 {
11476 unsigned int n = i.memshift;
11477
11478 if (i.types[j].bitfield.byte)
11479 n = 0;
11480 else if (i.types[j].bitfield.word)
11481 n = 1;
11482 else if (i.types[j].bitfield.dword)
11483 n = 2;
11484 else if (i.types[j].bitfield.qword)
11485 n = 3;
11486 else if (i.types[j].bitfield.xmmword)
11487 n = 4;
11488 else if (i.types[j].bitfield.ymmword)
11489 n = 5;
11490 else if (i.types[j].bitfield.zmmword)
11491 n = 6;
11492
11493 if (i.memshift < 32 && n != i.memshift)
	    as_warn (_("conflicting memory operand size specifiers"));
11495 i.memshift = n;
11496 }
11497
11498 if ((i.broadcast.type || i.broadcast.bytes)
11499 && j == i.broadcast.operand)
11500 continue;
11501
11502 combined = operand_type_or (combined, i.types[j]);
11503 combined.bitfield.class = ClassNone;
11504 }
11505
11506 switch ((i.broadcast.type ? i.broadcast.type : 1)
11507 << (i.memshift < 32 ? i.memshift : 0))
11508 {
11509 case 64: combined.bitfield.zmmword = 1; break;
11510 case 32: combined.bitfield.ymmword = 1; break;
11511 case 16: combined.bitfield.xmmword = 1; break;
11512 case 8: combined.bitfield.qword = 1; break;
11513 case 4: combined.bitfield.dword = 1; break;
11514 }
11515
11516 if (i.vec_encoding == vex_encoding_default)
11517 {
11518 if (flag_code == CODE_64BIT && combined.bitfield.qword)
11519 i.rex |= REX_W;
11520 else if ((flag_code == CODE_16BIT ? combined.bitfield.dword
11521 : combined.bitfield.word)
11522 && !add_prefix (DATA_PREFIX_OPCODE))
11523 goto done;
11524 }
11525 else if (!i.tm.opcode_modifier.vexw)
11526 {
11527 if (flag_code == CODE_64BIT)
11528 {
11529 if (combined.bitfield.qword)
11530 i.tm.opcode_modifier.vexw = VEXW1;
11531 else if (combined.bitfield.dword)
11532 i.tm.opcode_modifier.vexw = VEXW0;
11533 }
11534
11535 if (!i.tm.opcode_modifier.vexw)
11536 i.tm.opcode_modifier.vexw = VEXWIG;
11537 }
11538
11539 if (vex || xop)
11540 {
11541 if (!i.tm.opcode_modifier.vex)
11542 {
11543 if (combined.bitfield.ymmword)
11544 i.tm.opcode_modifier.vex = VEX256;
11545 else if (combined.bitfield.xmmword)
11546 i.tm.opcode_modifier.vex = VEX128;
11547 }
11548 }
11549 else if (evex)
11550 {
11551 if (!i.tm.opcode_modifier.evex)
11552 {
11553 /* Do _not_ consider AVX512VL here. */
11554 if (i.rounding.type != rc_none || combined.bitfield.zmmword)
11555 i.tm.opcode_modifier.evex = EVEX512;
11556 else if (combined.bitfield.ymmword)
11557 i.tm.opcode_modifier.evex = EVEX256;
11558 else if (combined.bitfield.xmmword)
11559 i.tm.opcode_modifier.evex = EVEX128;
11560 }
11561
11562 if (i.memshift >= 32)
11563 {
11564 unsigned int n = 0;
11565
11566 switch (i.tm.opcode_modifier.evex)
11567 {
11568 case EVEX512: n = 64; break;
11569 case EVEX256: n = 32; break;
11570 case EVEX128: n = 16; break;
11571 }
11572
11573 if (i.broadcast.type)
11574 n /= i.broadcast.type;
11575
11576 if (n > 0)
11577 for (i.memshift = 0; !(n & 1); n >>= 1)
11578 ++i.memshift;
11579 else if (disp_exp != NULL && disp_exp->X_op == O_constant
11580 && disp_exp->X_add_number != 0
11581 && i.disp_encoding != disp_encoding_32bit)
11582 {
11583 if (!quiet_warnings)
		  as_warn (_("cannot determine memory operand size"));
11585 i.disp_encoding = disp_encoding_32bit;
11586 }
11587 }
11588 }
11589
11590 if (i.memshift >= 32)
11591 i.memshift = 0;
11592 else if (!evex)
11593 i.vec_encoding = vex_encoding_error;
11594
11595 if (i.disp_operands && !optimize_disp (&i.tm))
11596 goto done;
11597
11598 /* Establish size for immediate operands. */
11599 for (j = 0; j < i.imm_operands; ++j)
11600 {
11601 expressionS *expP = i.op[j].imms;
11602
11603 gas_assert (operand_type_check (i.types[j], imm));
11604 operand_type_set (&i.types[j], 0);
11605
11606 if (i.imm_bits[j] > 32)
11607 i.types[j].bitfield.imm64 = 1;
11608 else if (i.imm_bits[j] > 16)
11609 {
11610 if (flag_code == CODE_64BIT && (i.flags[j] & Operand_Signed))
11611 i.types[j].bitfield.imm32s = 1;
11612 else
11613 i.types[j].bitfield.imm32 = 1;
11614 }
11615 else if (i.imm_bits[j] > 8)
11616 i.types[j].bitfield.imm16 = 1;
11617 else if (i.imm_bits[j] > 0)
11618 {
11619 if (i.flags[j] & Operand_Signed)
11620 i.types[j].bitfield.imm8s = 1;
11621 else
11622 i.types[j].bitfield.imm8 = 1;
11623 }
11624 else if (expP->X_op == O_constant)
11625 {
11626 i.types[j] = smallest_imm_type (expP->X_add_number);
11627 i.types[j].bitfield.imm1 = 0;
11628 /* Oddly enough imm_size() checks imm64 first, so the bit needs
11629 zapping since smallest_imm_type() sets it unconditionally. */
11630 if (flag_code != CODE_64BIT)
11631 {
11632 i.types[j].bitfield.imm64 = 0;
11633 i.types[j].bitfield.imm32s = 0;
11634 i.types[j].bitfield.imm32 = 1;
11635 }
11636 else if (i.types[j].bitfield.imm32 || i.types[j].bitfield.imm32s)
11637 i.types[j].bitfield.imm64 = 0;
11638 }
11639 else
11640 /* Non-constant expressions are sized heuristically. */
11641 switch (flag_code)
11642 {
11643 case CODE_64BIT: i.types[j].bitfield.imm32s = 1; break;
11644 case CODE_32BIT: i.types[j].bitfield.imm32 = 1; break;
11645 case CODE_16BIT: i.types[j].bitfield.imm16 = 1; break;
11646 }
11647 }
11648
11649 for (j = 0; j < i.operands; ++j)
11650 i.tm.operand_types[j] = i.types[j];
11651
11652 process_operands ();
11653 }
11654
11655 /* Don't set opcode until after processing operands, to avoid any
11656 potential special casing there. */
11657 i.tm.base_opcode |= val;
11658
11659 if (i.vec_encoding == vex_encoding_error
11660 || (i.vec_encoding != vex_encoding_evex
11661 ? i.broadcast.type || i.broadcast.bytes
11662 || i.rounding.type != rc_none
11663 || i.mask.reg
11664 : (i.mem_operands && i.rounding.type != rc_none)
11665 || ((i.broadcast.type || i.broadcast.bytes)
11666 && !(i.flags[i.broadcast.operand] & Operand_Mem))))
11667 {
11668 as_bad (_("conflicting .insn operands"));
11669 goto done;
11670 }
11671
11672 if (vex || xop)
11673 {
11674 if (!i.tm.opcode_modifier.vex)
11675 i.tm.opcode_modifier.vex = VEXScalar; /* LIG */
11676
11677 build_vex_prefix (NULL);
11678 i.rex &= REX_OPCODE;
11679 }
11680 else if (evex)
11681 {
11682 if (!i.tm.opcode_modifier.evex)
11683 i.tm.opcode_modifier.evex = EVEXLIG;
11684
11685 build_evex_prefix ();
11686 i.rex &= REX_OPCODE;
11687 }
11688 else if (i.rex != 0)
11689 add_prefix (REX_OPCODE | i.rex);
11690
11691 output_insn ();
11692
11693 done:
11694 *saved_ilp = saved_char;
11695 input_line_pointer = line;
11696
11697 demand_empty_rest_of_line ();
11698
11699 /* Make sure dot_insn() won't yield "true" anymore. */
11700 i.tm.mnem_off = 0;
11701 }
11702
11703 #ifdef TE_PE
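/* ".secrel32 expr[, expr...]" emits 32-bit section-relative values; its
   companion ".secidx" below emits 16-bit section indices.  Both are
   PE-only (names as registered in md_pseudo_table).  */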
11704 static void
11705 pe_directive_secrel (int dummy ATTRIBUTE_UNUSED)
11706 {
11707 expressionS exp;
11708
11709 do
11710 {
11711 expression (&exp);
11712 if (exp.X_op == O_symbol)
11713 exp.X_op = O_secrel;
11714
11715 emit_expr (&exp, 4);
11716 }
11717 while (*input_line_pointer++ == ',');
11718
11719 input_line_pointer--;
11720 demand_empty_rest_of_line ();
11721 }
11722
11723 static void
11724 pe_directive_secidx (int dummy ATTRIBUTE_UNUSED)
11725 {
11726 expressionS exp;
11727
11728 do
11729 {
11730 expression (&exp);
11731 if (exp.X_op == O_symbol)
11732 exp.X_op = O_secidx;
11733
11734 emit_expr (&exp, 2);
11735 }
11736 while (*input_line_pointer++ == ',');
11737
11738 input_line_pointer--;
11739 demand_empty_rest_of_line ();
11740 }
11741 #endif
11742
11743 /* Handle Rounding Control / SAE specifiers. */
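/* A sketch of the Intel-syntax forms accepted (the authoritative
   spellings live in RC_NamesTable):
     vaddps zmm0, zmm1, zmm2, {rn-sae}
     vdivps zmm0, zmm1, zmm2, {rz-sae}
     vmaxps zmm0, zmm1, zmm2, {sae}
   In AT&T syntax the specifier instead precedes the register operands,
   e.g. "vaddps {rd-sae}, %zmm2, %zmm1, %zmm0".  */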
11744
11745 static char *
11746 RC_SAE_specifier (const char *pstr)
11747 {
11748 unsigned int j;
11749
11750 for (j = 0; j < ARRAY_SIZE (RC_NamesTable); j++)
11751 {
11752 if (!strncmp (pstr, RC_NamesTable[j].name, RC_NamesTable[j].len))
11753 {
11754 if (i.rounding.type != rc_none)
11755 {
11756 as_bad (_("duplicated `{%s}'"), RC_NamesTable[j].name);
11757 return NULL;
11758 }
11759
11760 if (i.vec_encoding == vex_encoding_default)
11761 i.vec_encoding = vex_encoding_evex512;
11762 else if (i.vec_encoding != vex_encoding_evex
11763 && i.vec_encoding != vex_encoding_evex512)
11764 return NULL;
11765
11766 i.rounding.type = RC_NamesTable[j].type;
11767
11768 return (char *)(pstr + RC_NamesTable[j].len);
11769 }
11770 }
11771
11772 return NULL;
11773 }
11774
11775 /* Handle Vector operations. */
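/* A sketch of the brace-delimited specifiers parsed below (AT&T syntax;
   Intel syntax differs mainly in operand order):
     vaddps (%rax){1to16}, %zmm1, %zmm2    broadcast one dword to 16
     vmovaps %zmm1, %zmm2{%k3}             merging write mask
     vmovaps %zmm1, %zmm2{%k3}{z}          zeroing write mask
   For .insn, size modifiers of the form {:d<N>} (and, in Intel syntax,
   {:s<N>}/{:u<N>}) are also recognized here.  */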
11776
11777 static char *
11778 check_VecOperations (char *op_string)
11779 {
11780 const reg_entry *mask;
11781 const char *saved;
11782 char *end_op;
11783
11784 while (*op_string)
11785 {
11786 saved = op_string;
11787 if (*op_string == '{')
11788 {
11789 op_string++;
11790
11791 /* Check broadcasts. */
11792 if (startswith (op_string, "1to"))
11793 {
11794 unsigned int bcst_type;
11795
11796 if (i.broadcast.type)
11797 goto duplicated_vec_op;
11798
11799 op_string += 3;
11800 if (*op_string == '8')
11801 bcst_type = 8;
11802 else if (*op_string == '4')
11803 bcst_type = 4;
11804 else if (*op_string == '2')
11805 bcst_type = 2;
11806 else if (*op_string == '1'
11807 && *(op_string+1) == '6')
11808 {
11809 bcst_type = 16;
11810 op_string++;
11811 }
11812 else if (*op_string == '3'
11813 && *(op_string+1) == '2')
11814 {
11815 bcst_type = 32;
11816 op_string++;
11817 }
11818 else
11819 {
11820 as_bad (_("Unsupported broadcast: `%s'"), saved);
11821 return NULL;
11822 }
11823 op_string++;
11824
11825 if (i.vec_encoding == vex_encoding_default)
11826 i.vec_encoding = vex_encoding_evex;
11827 else if (i.vec_encoding != vex_encoding_evex
11828 && i.vec_encoding != vex_encoding_evex512)
11829 goto unknown_vec_op;
11830
11831 i.broadcast.type = bcst_type;
11832 i.broadcast.operand = this_operand;
11833
11834 /* For .insn a data size specifier may be appended. */
11835 if (dot_insn () && *op_string == ':')
11836 goto dot_insn_modifier;
11837 }
11838 /* Check .insn special cases. */
11839 else if (dot_insn () && *op_string == ':')
11840 {
11841 dot_insn_modifier:
11842 switch (op_string[1])
11843 {
11844 unsigned long n;
11845
11846 case 'd':
11847 if (i.memshift < 32)
11848 goto duplicated_vec_op;
11849
11850 n = strtoul (op_string + 2, &end_op, 0);
11851 if (n)
11852 for (i.memshift = 0; !(n & 1); n >>= 1)
11853 ++i.memshift;
11854 if (i.memshift < 32 && n == 1)
11855 op_string = end_op;
11856 break;
11857
11858 case 's': case 'u':
11859 /* This isn't really a "vector" operation, but a sign/size
11860 specifier for immediate operands of .insn. Note that the same
11861 is handled for AT&T syntax in i386_immediate(). */
11862 if (!intel_syntax)
11863 break;
11864
11865 if (i.imm_bits[this_operand])
11866 goto duplicated_vec_op;
11867
11868 n = strtoul (op_string + 2, &end_op, 0);
11869 if (n && n <= (flag_code == CODE_64BIT ? 64 : 32))
11870 {
11871 i.imm_bits[this_operand] = n;
11872 if (op_string[1] == 's')
11873 i.flags[this_operand] |= Operand_Signed;
11874 op_string = end_op;
11875 }
11876 break;
11877 }
11878 }
11879 /* Check masking operation. */
11880 else if ((mask = parse_register (op_string, &end_op)) != NULL)
11881 {
11882 if (mask == &bad_reg)
11883 return NULL;
11884
11885 /* k0 can't be used for write mask. */
11886 if (mask->reg_type.bitfield.class != RegMask || !mask->reg_num)
11887 {
11888 as_bad (_("`%s%s' can't be used for write mask"),
11889 register_prefix, mask->reg_name);
11890 return NULL;
11891 }
11892
11893 if (!i.mask.reg)
11894 {
11895 i.mask.reg = mask;
11896 i.mask.operand = this_operand;
11897 }
11898 else if (i.mask.reg->reg_num)
11899 goto duplicated_vec_op;
11900 else
11901 {
11902 i.mask.reg = mask;
11903
11904 /* Only "{z}" is allowed here. No need to check
11905 zeroing mask explicitly. */
11906 if (i.mask.operand != (unsigned int) this_operand)
11907 {
11908 as_bad (_("invalid write mask `%s'"), saved);
11909 return NULL;
11910 }
11911 }
11912
11913 op_string = end_op;
11914 }
11915 /* Check zeroing-flag for masking operation. */
11916 else if (*op_string == 'z')
11917 {
11918 if (!i.mask.reg)
11919 {
11920 i.mask.reg = reg_k0;
11921 i.mask.zeroing = 1;
11922 i.mask.operand = this_operand;
11923 }
11924 else
11925 {
11926 if (i.mask.zeroing)
11927 {
11928 duplicated_vec_op:
11929 as_bad (_("duplicated `%s'"), saved);
11930 return NULL;
11931 }
11932
11933 i.mask.zeroing = 1;
11934
11935 /* Only "{%k}" is allowed here. No need to check mask
11936 register explicitly. */
11937 if (i.mask.operand != (unsigned int) this_operand)
11938 {
11939 as_bad (_("invalid zeroing-masking `%s'"),
11940 saved);
11941 return NULL;
11942 }
11943 }
11944
11945 op_string++;
11946 }
11947 else if (intel_syntax
11948 && (op_string = RC_SAE_specifier (op_string)) != NULL)
11949 i.rounding.modifier = true;
11950 else
11951 goto unknown_vec_op;
11952
11953 if (*op_string != '}')
11954 {
11955 as_bad (_("missing `}' in `%s'"), saved);
11956 return NULL;
11957 }
11958 op_string++;
11959
11960 /* Strip whitespace since the addition of pseudo prefixes
11961 changed how the scrubber treats '{'. */
11962 if (is_space_char (*op_string))
11963 ++op_string;
11964
11965 continue;
11966 }
11967 unknown_vec_op:
11968 /* We don't know this one. */
11969 as_bad (_("unknown vector operation: `%s'"), saved);
11970 return NULL;
11971 }
11972
11973 if (i.mask.reg && i.mask.zeroing && !i.mask.reg->reg_num)
11974 {
11975 as_bad (_("zeroing-masking only allowed with write mask"));
11976 return NULL;
11977 }
11978
11979 return op_string;
11980 }
11981
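/* Parse an immediate operand whose '$' (in AT&T syntax) has already been
   consumed.  A sketch of accepted forms:
     $42, $0x2a, $(2 + 40), $sym, $sym+8
   plus, for .insn only, a trailing size/signedness specifier:
     $-1{:s8}     8-bit signed
     $255{:u8}    8-bit unsigned  */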
11982 static int
11983 i386_immediate (char *imm_start)
11984 {
11985 char *save_input_line_pointer;
11986 char *gotfree_input_line;
11987 segT exp_seg = 0;
11988 expressionS *exp;
11989 i386_operand_type types;
11990
11991 operand_type_set (&types, ~0);
11992
11993 if (i.imm_operands == MAX_IMMEDIATE_OPERANDS)
11994 {
11995 as_bad (_("at most %d immediate operands are allowed"),
11996 MAX_IMMEDIATE_OPERANDS);
11997 return 0;
11998 }
11999
12000 exp = &im_expressions[i.imm_operands++];
12001 i.op[this_operand].imms = exp;
12002
12003 if (is_space_char (*imm_start))
12004 ++imm_start;
12005
12006 save_input_line_pointer = input_line_pointer;
12007 input_line_pointer = imm_start;
12008
12009 gotfree_input_line = lex_got (&i.reloc[this_operand], NULL, &types);
12010 if (gotfree_input_line)
12011 input_line_pointer = gotfree_input_line;
12012
12013 expr_mode = expr_operator_none;
12014 exp_seg = expression (exp);
12015
12016 /* For .insn immediates there may be a size specifier. */
12017 if (dot_insn () && *input_line_pointer == '{' && input_line_pointer[1] == ':'
12018 && (input_line_pointer[2] == 's' || input_line_pointer[2] == 'u'))
12019 {
12020 char *e;
12021 unsigned long n = strtoul (input_line_pointer + 3, &e, 0);
12022
12023 if (*e == '}' && n && n <= (flag_code == CODE_64BIT ? 64 : 32))
12024 {
12025 i.imm_bits[this_operand] = n;
12026 if (input_line_pointer[2] == 's')
12027 i.flags[this_operand] |= Operand_Signed;
12028 input_line_pointer = e + 1;
12029 }
12030 }
12031
12032 SKIP_WHITESPACE ();
12033 if (*input_line_pointer)
12034 as_bad (_("junk `%s' after expression"), input_line_pointer);
12035
12036 input_line_pointer = save_input_line_pointer;
12037 if (gotfree_input_line)
12038 {
12039 free (gotfree_input_line);
12040
12041 if (exp->X_op == O_constant)
12042 exp->X_op = O_illegal;
12043 }
12044
12045 if (exp_seg == reg_section)
12046 {
12047 as_bad (_("illegal immediate register operand %s"), imm_start);
12048 return 0;
12049 }
12050
12051 return i386_finalize_immediate (exp_seg, exp, types, imm_start);
12052 }
12053
12054 static int
12055 i386_finalize_immediate (segT exp_seg ATTRIBUTE_UNUSED, expressionS *exp,
12056 i386_operand_type types, const char *imm_start)
12057 {
12058 if (exp->X_op == O_absent || exp->X_op == O_illegal || exp->X_op == O_big)
12059 {
12060 if (imm_start)
12061 as_bad (_("missing or invalid immediate expression `%s'"),
12062 imm_start);
12063 return 0;
12064 }
12065 else if (exp->X_op == O_constant)
12066 {
12067 /* Size it properly later. */
12068 i.types[this_operand].bitfield.imm64 = 1;
12069
12070 /* If not 64bit, sign/zero extend val, to account for wraparound
12071 when !BFD64. */
12072 if (expr_mode == expr_operator_present
12073 && flag_code != CODE_64BIT && !object_64bit)
12074 exp->X_add_number = extend_to_32bit_address (exp->X_add_number);
12075 }
12076 #if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
12077 else if (OUTPUT_FLAVOR == bfd_target_aout_flavour
12078 && exp_seg != absolute_section
12079 && exp_seg != text_section
12080 && exp_seg != data_section
12081 && exp_seg != bss_section
12082 && exp_seg != undefined_section
12083 && !bfd_is_com_section (exp_seg))
12084 {
12085 as_bad (_("unimplemented segment %s in operand"), exp_seg->name);
12086 return 0;
12087 }
12088 #endif
12089 else
12090 {
12091 /* This is an address. The size of the address will be
12092 determined later, depending on destination register,
12093 suffix, or the default for the section. */
12094 i.types[this_operand].bitfield.imm8 = 1;
12095 i.types[this_operand].bitfield.imm16 = 1;
12096 i.types[this_operand].bitfield.imm32 = 1;
12097 i.types[this_operand].bitfield.imm32s = 1;
12098 i.types[this_operand].bitfield.imm64 = 1;
12099 i.types[this_operand] = operand_type_and (i.types[this_operand],
12100 types);
12101 }
12102
12103 return 1;
12104 }
12105
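/* Parse a scale factor into i.log2_scale_factor; e.g. the "4" in
   "movl (%ebx,%ecx,4), %eax" yields a log2 value of 2.  Only 1, 2, 4
   and 8 are accepted.  Returns the updated scan position, or NULL on
   error.  */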
12106 static char *
12107 i386_scale (char *scale)
12108 {
12109 offsetT val;
12110 char *save = input_line_pointer;
12111
12112 input_line_pointer = scale;
12113 val = get_absolute_expression ();
12114
12115 switch (val)
12116 {
12117 case 1:
12118 i.log2_scale_factor = 0;
12119 break;
12120 case 2:
12121 i.log2_scale_factor = 1;
12122 break;
12123 case 4:
12124 i.log2_scale_factor = 2;
12125 break;
12126 case 8:
12127 i.log2_scale_factor = 3;
12128 break;
12129 default:
12130 {
12131 char sep = *input_line_pointer;
12132
12133 *input_line_pointer = '\0';
12134 as_bad (_("expecting scale factor of 1, 2, 4, or 8: got `%s'"),
12135 scale);
12136 *input_line_pointer = sep;
12137 input_line_pointer = save;
12138 return NULL;
12139 }
12140 }
12141 if (i.log2_scale_factor != 0 && i.index_reg == 0)
12142 {
12143 as_warn (_("scale factor of %d without an index register"),
12144 1 << i.log2_scale_factor);
12145 i.log2_scale_factor = 0;
12146 }
12147 scale = input_line_pointer;
12148 input_line_pointer = save;
12149 return scale;
12150 }
12151
12152 static int
12153 i386_displacement (char *disp_start, char *disp_end)
12154 {
12155 expressionS *exp;
12156 segT exp_seg = 0;
12157 char *save_input_line_pointer;
12158 char *gotfree_input_line;
12159 int override;
12160 i386_operand_type bigdisp, types = anydisp;
12161 int ret;
12162
12163 if (i.disp_operands == MAX_MEMORY_OPERANDS)
12164 {
12165 as_bad (_("at most %d displacement operands are allowed"),
12166 MAX_MEMORY_OPERANDS);
12167 return 0;
12168 }
12169
12170 operand_type_set (&bigdisp, 0);
12171 if (i.jumpabsolute
12172 || i.types[this_operand].bitfield.baseindex
12173 || (current_templates->start->opcode_modifier.jump != JUMP
12174 && current_templates->start->opcode_modifier.jump != JUMP_DWORD))
12175 {
12176 i386_addressing_mode ();
12177 override = (i.prefix[ADDR_PREFIX] != 0);
12178 if (flag_code == CODE_64BIT)
12179 {
12180 bigdisp.bitfield.disp32 = 1;
12181 if (!override)
12182 bigdisp.bitfield.disp64 = 1;
12183 }
12184 else if ((flag_code == CODE_16BIT) ^ override)
12185 bigdisp.bitfield.disp16 = 1;
12186 else
12187 bigdisp.bitfield.disp32 = 1;
12188 }
12189 else
12190 {
12191 /* For PC-relative branches, the width of the displacement may be
12192 dependent upon data size, but is never dependent upon address size.
12193 Also make sure to not unintentionally match against a non-PC-relative
12194 branch template. */
12195 static templates aux_templates;
12196 const insn_template *t = current_templates->start;
12197 bool has_intel64 = false;
12198
12199 aux_templates.start = t;
12200 while (++t < current_templates->end)
12201 {
12202 if (t->opcode_modifier.jump
12203 != current_templates->start->opcode_modifier.jump)
12204 break;
12205 if ((t->opcode_modifier.isa64 >= INTEL64))
12206 has_intel64 = true;
12207 }
12208 if (t < current_templates->end)
12209 {
12210 aux_templates.end = t;
12211 current_templates = &aux_templates;
12212 }
12213
12214 override = (i.prefix[DATA_PREFIX] != 0);
12215 if (flag_code == CODE_64BIT)
12216 {
12217 if ((override || i.suffix == WORD_MNEM_SUFFIX)
12218 && (!intel64 || !has_intel64))
12219 bigdisp.bitfield.disp16 = 1;
12220 else
12221 bigdisp.bitfield.disp32 = 1;
12222 }
12223 else
12224 {
12225 if (!override)
12226 override = (i.suffix == (flag_code != CODE_16BIT
12227 ? WORD_MNEM_SUFFIX
12228 : LONG_MNEM_SUFFIX));
12229 bigdisp.bitfield.disp32 = 1;
12230 if ((flag_code == CODE_16BIT) ^ override)
12231 {
12232 bigdisp.bitfield.disp32 = 0;
12233 bigdisp.bitfield.disp16 = 1;
12234 }
12235 }
12236 }
12237 i.types[this_operand] = operand_type_or (i.types[this_operand],
12238 bigdisp);
12239
12240 exp = &disp_expressions[i.disp_operands];
12241 i.op[this_operand].disps = exp;
12242 i.disp_operands++;
12243 save_input_line_pointer = input_line_pointer;
12244 input_line_pointer = disp_start;
12245 END_STRING_AND_SAVE (disp_end);
12246
12247 #ifndef GCC_ASM_O_HACK
12248 #define GCC_ASM_O_HACK 0
12249 #endif
12250 #if GCC_ASM_O_HACK
12251 END_STRING_AND_SAVE (disp_end + 1);
12252 if (i.types[this_operand].bitfield.baseindex
12253 && disp_end[-1] == '+')
12254 {
12255 /* This hack is to avoid a warning when using the "o"
12256 constraint within gcc asm statements.
12257 For instance:
12258
12259 #define _set_tssldt_desc(n,addr,limit,type) \
12260 __asm__ __volatile__ ( \
12261 "movw %w2,%0\n\t" \
12262 "movw %w1,2+%0\n\t" \
12263 "rorl $16,%1\n\t" \
12264 "movb %b1,4+%0\n\t" \
12265 "movb %4,5+%0\n\t" \
12266 "movb $0,6+%0\n\t" \
12267 "movb %h1,7+%0\n\t" \
12268 "rorl $16,%1" \
12269 : "=o"(*(n)) : "q" (addr), "ri"(limit), "i"(type))
12270
12271 This works great except that the output assembler ends
12272 up looking a bit weird if it turns out that there is
12273 no offset. You end up producing code that looks like:
12274
12275 #APP
12276 movw $235,(%eax)
12277 movw %dx,2+(%eax)
12278 rorl $16,%edx
12279 movb %dl,4+(%eax)
12280 movb $137,5+(%eax)
12281 movb $0,6+(%eax)
12282 movb %dh,7+(%eax)
12283 rorl $16,%edx
12284 #NO_APP
12285
12286 So here we provide the missing zero. */
12287
12288 *disp_end = '0';
12289 }
12290 #endif
12291 gotfree_input_line = lex_got (&i.reloc[this_operand], NULL, &types);
12292 if (gotfree_input_line)
12293 input_line_pointer = gotfree_input_line;
12294
12295 expr_mode = expr_operator_none;
12296 exp_seg = expression (exp);
12297
12298 SKIP_WHITESPACE ();
12299 if (*input_line_pointer)
12300 as_bad (_("junk `%s' after expression"), input_line_pointer);
12301 #if GCC_ASM_O_HACK
12302 RESTORE_END_STRING (disp_end + 1);
12303 #endif
12304 input_line_pointer = save_input_line_pointer;
12305 if (gotfree_input_line)
12306 {
12307 free (gotfree_input_line);
12308
12309 if (exp->X_op == O_constant || exp->X_op == O_register)
12310 exp->X_op = O_illegal;
12311 }
12312
12313 ret = i386_finalize_displacement (exp_seg, exp, types, disp_start);
12314
12315 RESTORE_END_STRING (disp_end);
12316
12317 return ret;
12318 }
12319
12320 static int
12321 i386_finalize_displacement (segT exp_seg ATTRIBUTE_UNUSED, expressionS *exp,
12322 i386_operand_type types, const char *disp_start)
12323 {
12324 int ret = 1;
12325
12326 /* We do this to make sure that the section symbol is in
12327 the symbol table. We will ultimately change the relocation
12328 to be relative to the beginning of the section. */
12329 if (i.reloc[this_operand] == BFD_RELOC_386_GOTOFF
12330 || i.reloc[this_operand] == BFD_RELOC_X86_64_GOTPCREL
12331 || i.reloc[this_operand] == BFD_RELOC_X86_64_GOTOFF64)
12332 {
12333 if (exp->X_op != O_symbol)
12334 goto inv_disp;
12335
12336 if (S_IS_LOCAL (exp->X_add_symbol)
12337 && S_GET_SEGMENT (exp->X_add_symbol) != undefined_section
12338 && S_GET_SEGMENT (exp->X_add_symbol) != expr_section)
12339 section_symbol (S_GET_SEGMENT (exp->X_add_symbol));
12340 exp->X_op = O_subtract;
12341 exp->X_op_symbol = GOT_symbol;
12342 if (i.reloc[this_operand] == BFD_RELOC_X86_64_GOTPCREL)
12343 i.reloc[this_operand] = BFD_RELOC_32_PCREL;
12344 else if (i.reloc[this_operand] == BFD_RELOC_X86_64_GOTOFF64)
12345 i.reloc[this_operand] = BFD_RELOC_64;
12346 else
12347 i.reloc[this_operand] = BFD_RELOC_32;
12348 }
12349
12350 else if (exp->X_op == O_absent
12351 || exp->X_op == O_illegal
12352 || exp->X_op == O_big)
12353 {
12354 inv_disp:
12355 as_bad (_("missing or invalid displacement expression `%s'"),
12356 disp_start);
12357 ret = 0;
12358 }
12359
12360 else if (exp->X_op == O_constant)
12361 {
12362 /* Sizing gets taken care of by optimize_disp().
12363
12364 If not 64bit, sign/zero extend val, to account for wraparound
12365 when !BFD64. */
12366 if (expr_mode == expr_operator_present
12367 && flag_code != CODE_64BIT && !object_64bit)
12368 exp->X_add_number = extend_to_32bit_address (exp->X_add_number);
12369 }
12370
12371 #if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
12372 else if (OUTPUT_FLAVOR == bfd_target_aout_flavour
12373 && exp_seg != absolute_section
12374 && exp_seg != text_section
12375 && exp_seg != data_section
12376 && exp_seg != bss_section
12377 && exp_seg != undefined_section
12378 && !bfd_is_com_section (exp_seg))
12379 {
12380 as_bad (_("unimplemented segment %s in operand"), exp_seg->name);
12381 ret = 0;
12382 }
12383 #endif
12384
12385 else if (current_templates->start->opcode_modifier.jump == JUMP_BYTE)
12386 i.types[this_operand].bitfield.disp8 = 1;
12387
12388 /* Check if this is a displacement only operand. */
12389 if (!i.types[this_operand].bitfield.baseindex)
12390 i.types[this_operand] =
12391 operand_type_or (operand_type_and_not (i.types[this_operand], anydisp),
12392 operand_type_and (i.types[this_operand], types));
12393
12394 return ret;
12395 }
12396
12397 /* Return the active addressing mode, taking address override and
12398 registers forming the address into consideration. Update the
12399 address override prefix if necessary. */
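/* E.g. in 32-bit code "mov (%si), %ax" makes the logic below infer
   16-bit addressing and emit the 0x67 address-size prefix; an explicit
   override prefix flips the mode directly.  */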
12400
12401 static enum flag_code
12402 i386_addressing_mode (void)
12403 {
12404 enum flag_code addr_mode;
12405
12406 if (i.prefix[ADDR_PREFIX])
12407 addr_mode = flag_code == CODE_32BIT ? CODE_16BIT : CODE_32BIT;
12408 else if (flag_code == CODE_16BIT
12409 && is_cpu (current_templates->start, CpuMPX)
12410 /* Avoid replacing the "16-bit addressing not allowed" diagnostic
12411 from md_assemble() by "is not a valid base/index expression"
12412 when there is a base and/or index. */
12413 && !i.types[this_operand].bitfield.baseindex)
12414 {
12415 /* MPX insn memory operands with neither base nor index must be forced
12416 to use 32-bit addressing in 16-bit mode. */
12417 addr_mode = CODE_32BIT;
12418 i.prefix[ADDR_PREFIX] = ADDR_PREFIX_OPCODE;
12419 ++i.prefixes;
12420 gas_assert (!i.types[this_operand].bitfield.disp16);
12421 gas_assert (!i.types[this_operand].bitfield.disp32);
12422 }
12423 else
12424 {
12425 addr_mode = flag_code;
12426
12427 #if INFER_ADDR_PREFIX
12428 if (i.mem_operands == 0)
12429 {
12430 /* Infer address prefix from the first memory operand. */
12431 const reg_entry *addr_reg = i.base_reg;
12432
12433 if (addr_reg == NULL)
12434 addr_reg = i.index_reg;
12435
12436 if (addr_reg)
12437 {
12438 if (addr_reg->reg_type.bitfield.dword)
12439 addr_mode = CODE_32BIT;
12440 else if (flag_code != CODE_64BIT
12441 && addr_reg->reg_type.bitfield.word)
12442 addr_mode = CODE_16BIT;
12443
12444 if (addr_mode != flag_code)
12445 {
12446 i.prefix[ADDR_PREFIX] = ADDR_PREFIX_OPCODE;
12447 i.prefixes += 1;
12448 /* Change the size of any displacement too. At most one
12449 of Disp16 or Disp32 is set.
12450 FIXME. There doesn't seem to be any real need for
12451 separate Disp16 and Disp32 flags. The same goes for
12452 Imm16 and Imm32. Removing them would probably clean
12453 up the code quite a lot. */
12454 if (flag_code != CODE_64BIT
12455 && (i.types[this_operand].bitfield.disp16
12456 || i.types[this_operand].bitfield.disp32))
12457 {
12458 static const i386_operand_type disp16_32 = {
12459 .bitfield = { .disp16 = 1, .disp32 = 1 }
12460 };
12461
12462 i.types[this_operand]
12463 = operand_type_xor (i.types[this_operand], disp16_32);
12464 }
12465 }
12466 }
12467 }
12468 #endif
12469 }
12470
12471 return addr_mode;
12472 }
12473
12474 /* Make sure the memory operand we've been dealt is valid.
12475 Return 1 on success, 0 on a failure. */
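/* For instance, "movsw" in 16-bit addressing only allows the operand
   pair %ds:(%si),%es:(%di), and "xlat" only (%bx), while ordinary insns
   accept any base/index combination valid for the address size.  */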
12476
12477 static int
12478 i386_index_check (const char *operand_string)
12479 {
12480 const char *kind = "base/index";
12481 enum flag_code addr_mode = i386_addressing_mode ();
12482 const insn_template *t = current_templates->end - 1;
12483
12484 if (t->opcode_modifier.isstring)
12485 {
12486 /* Memory operands of string insns are special in that they only allow
12487 a single register (rDI, rSI, or rBX) as their memory address. */
12488 const reg_entry *expected_reg;
12489 static const char di_si[][2][4] =
12490 {
12491 { "esi", "edi" },
12492 { "si", "di" },
12493 { "rsi", "rdi" }
12494 };
12495 static const char bx[][4] = { "ebx", "bx", "rbx" };
12496
12497 kind = "string address";
12498
12499 if (t->opcode_modifier.prefixok == PrefixRep)
12500 {
12501 int es_op = t->opcode_modifier.isstring - IS_STRING_ES_OP0;
12502 int op = 0;
12503
12504 if (!t->operand_types[0].bitfield.baseindex
12505 || ((!i.mem_operands != !intel_syntax)
12506 && t->operand_types[1].bitfield.baseindex))
12507 op = 1;
12508 expected_reg
12509 = (const reg_entry *) str_hash_find (reg_hash,
12510 di_si[addr_mode][op == es_op]);
12511 }
12512 else
12513 expected_reg
12514 = (const reg_entry *)str_hash_find (reg_hash, bx[addr_mode]);
12515
12516 if (i.base_reg != expected_reg
12517 || i.index_reg
12518 || operand_type_check (i.types[this_operand], disp))
12519 {
12520 /* The second memory operand must have the same size as
12521 the first one. */
12522 if (i.mem_operands
12523 && i.base_reg
12524 && !((addr_mode == CODE_64BIT
12525 && i.base_reg->reg_type.bitfield.qword)
12526 || (addr_mode == CODE_32BIT
12527 ? i.base_reg->reg_type.bitfield.dword
12528 : i.base_reg->reg_type.bitfield.word)))
12529 goto bad_address;
12530
12531 as_warn (_("`%s' is not valid here (expected `%c%s%s%c')"),
12532 operand_string,
12533 intel_syntax ? '[' : '(',
12534 register_prefix,
12535 expected_reg->reg_name,
12536 intel_syntax ? ']' : ')');
12537 return 1;
12538 }
12539 else
12540 return 1;
12541
12542 bad_address:
12543 as_bad (_("`%s' is not a valid %s expression"),
12544 operand_string, kind);
12545 return 0;
12546 }
12547 else
12548 {
12549 t = current_templates->start;
12550
12551 if (addr_mode != CODE_16BIT)
12552 {
12553 /* 32-bit/64-bit checks. */
12554 if (i.disp_encoding == disp_encoding_16bit)
12555 {
12556 bad_disp:
12557 as_bad (_("invalid `%s' prefix"),
12558 addr_mode == CODE_16BIT ? "{disp32}" : "{disp16}");
12559 return 0;
12560 }
12561
12562 if ((i.base_reg
12563 && ((addr_mode == CODE_64BIT
12564 ? !i.base_reg->reg_type.bitfield.qword
12565 : !i.base_reg->reg_type.bitfield.dword)
12566 || (i.index_reg && i.base_reg->reg_num == RegIP)
12567 || i.base_reg->reg_num == RegIZ))
12568 || (i.index_reg
12569 && !i.index_reg->reg_type.bitfield.xmmword
12570 && !i.index_reg->reg_type.bitfield.ymmword
12571 && !i.index_reg->reg_type.bitfield.zmmword
12572 && ((addr_mode == CODE_64BIT
12573 ? !i.index_reg->reg_type.bitfield.qword
12574 : !i.index_reg->reg_type.bitfield.dword)
12575 || !i.index_reg->reg_type.bitfield.baseindex)))
12576 goto bad_address;
12577
12578 /* bndmk, bndldx, bndstx and mandatory non-vector SIB have special restrictions. */
12579 if (t->mnem_off == MN_bndmk
12580 || t->mnem_off == MN_bndldx
12581 || t->mnem_off == MN_bndstx
12582 || t->opcode_modifier.sib == SIBMEM)
12583 {
12584 /* They cannot use RIP-relative addressing. */
12585 if (i.base_reg && i.base_reg->reg_num == RegIP)
12586 {
12587 as_bad (_("`%s' cannot be used here"), operand_string);
12588 return 0;
12589 }
12590
12591 /* bndldx and bndstx ignore their scale factor. */
12592 if ((t->mnem_off == MN_bndldx || t->mnem_off == MN_bndstx)
12593 && i.log2_scale_factor)
12594 as_warn (_("register scaling is being ignored here"));
12595 }
12596 }
12597 else
12598 {
12599 /* 16-bit checks. */
12600 if (i.disp_encoding == disp_encoding_32bit)
12601 goto bad_disp;
12602
12603 if ((i.base_reg
12604 && (!i.base_reg->reg_type.bitfield.word
12605 || !i.base_reg->reg_type.bitfield.baseindex))
12606 || (i.index_reg
12607 && (!i.index_reg->reg_type.bitfield.word
12608 || !i.index_reg->reg_type.bitfield.baseindex
12609 || !(i.base_reg
12610 && i.base_reg->reg_num < 6
12611 && i.index_reg->reg_num >= 6
12612 && i.log2_scale_factor == 0))))
12613 goto bad_address;
12614 }
12615 }
12616 return 1;
12617 }
12618
12619 /* Handle vector immediates. */
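/* I.e. an RC/SAE specifier standing in an operand position of its own,
   as in AT&T "vcmpps $1, {sae}, %zmm2, %zmm1, %k2" (a sketch; the
   specifier is consumed without counting as an operand).  */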
12620
12621 static int
12622 RC_SAE_immediate (const char *imm_start)
12623 {
12624 const char *pstr = imm_start;
12625
12626 if (*pstr != '{')
12627 return 0;
12628
12629 pstr = RC_SAE_specifier (pstr + 1);
12630 if (pstr == NULL)
12631 return 0;
12632
12633 if (*pstr++ != '}')
12634 {
12635 as_bad (_("missing '}': '%s'"), imm_start);
12636 return 0;
12637 }
12638 /* RC/SAE immediate string should contain nothing more. */
12639 if (*pstr != 0)
12640 {
12641 as_bad (_("junk after '}': '%s'"), imm_start);
12642 return 0;
12643 }
12644
12645 /* Internally this doesn't count as an operand. */
12646 --i.operands;
12647
12648 return 1;
12649 }
12650
12651 static INLINE bool starts_memory_operand (char c)
12652 {
12653 return ISDIGIT (c)
12654 || is_name_beginner (c)
12655 || strchr ("([\"+-!~", c);
12656 }
12657
12658 /* Parse OPERAND_STRING into the i386_insn structure I. Returns zero
12659 on error. */
12660
12661 static int
12662 i386_att_operand (char *operand_string)
12663 {
12664 const reg_entry *r;
12665 char *end_op;
12666 char *op_string = operand_string;
12667
12668 if (is_space_char (*op_string))
12669 ++op_string;
12670
12671 /* We check for an absolute prefix (differentiating,
12672 for example, 'jmp pc_relative_label' from 'jmp *absolute_label'). */
12673 if (*op_string == ABSOLUTE_PREFIX
12674 && current_templates->start->opcode_modifier.jump)
12675 {
12676 ++op_string;
12677 if (is_space_char (*op_string))
12678 ++op_string;
12679 i.jumpabsolute = true;
12680 }
12681
12682 /* Check if operand is a register. */
12683 if ((r = parse_register (op_string, &end_op)) != NULL)
12684 {
12685 i386_operand_type temp;
12686
12687 if (r == &bad_reg)
12688 return 0;
12689
12690 /* Check for a segment override by searching for ':' after a
12691 segment register. */
12692 op_string = end_op;
12693 if (is_space_char (*op_string))
12694 ++op_string;
12695 if (*op_string == ':' && r->reg_type.bitfield.class == SReg)
12696 {
12697 i.seg[i.mem_operands] = r;
12698
12699 /* Skip the ':' and whitespace. */
12700 ++op_string;
12701 if (is_space_char (*op_string))
12702 ++op_string;
12703
12704 /* Handle case of %es:*foo. */
12705 if (!i.jumpabsolute && *op_string == ABSOLUTE_PREFIX
12706 && current_templates->start->opcode_modifier.jump)
12707 {
12708 ++op_string;
12709 if (is_space_char (*op_string))
12710 ++op_string;
12711 i.jumpabsolute = true;
12712 }
12713
12714 if (!starts_memory_operand (*op_string))
12715 {
12716 as_bad (_("bad memory operand `%s'"), op_string);
12717 return 0;
12718 }
12719 goto do_memory_reference;
12720 }
12721
12722 /* Handle vector operations. */
12723 if (*op_string == '{')
12724 {
12725 op_string = check_VecOperations (op_string);
12726 if (op_string == NULL)
12727 return 0;
12728 }
12729
12730 if (*op_string)
12731 {
12732 as_bad (_("junk `%s' after register"), op_string);
12733 return 0;
12734 }
12735
12736 /* Reject pseudo registers for .insn. */
12737 if (dot_insn () && r->reg_type.bitfield.class == ClassNone)
12738 {
12739 as_bad (_("`%s%s' cannot be used here"),
12740 register_prefix, r->reg_name);
12741 return 0;
12742 }
12743
12744 temp = r->reg_type;
12745 temp.bitfield.baseindex = 0;
12746 i.types[this_operand] = operand_type_or (i.types[this_operand],
12747 temp);
12748 i.types[this_operand].bitfield.unspecified = 0;
12749 i.op[this_operand].regs = r;
12750 i.reg_operands++;
12751
12752 /* A GPR may follow an RC or SAE immediate only if a (vector) register
12753 operand was also present earlier on. */
12754 if (i.rounding.type != rc_none && temp.bitfield.class == Reg
12755 && i.reg_operands == 1)
12756 {
12757 unsigned int j;
12758
12759 for (j = 0; j < ARRAY_SIZE (RC_NamesTable); ++j)
12760 if (i.rounding.type == RC_NamesTable[j].type)
12761 break;
12762 as_bad (_("`%s': misplaced `{%s}'"),
12763 insn_name (current_templates->start), RC_NamesTable[j].name);
12764 return 0;
12765 }
12766 }
12767 else if (*op_string == REGISTER_PREFIX)
12768 {
12769 as_bad (_("bad register name `%s'"), op_string);
12770 return 0;
12771 }
12772 else if (*op_string == IMMEDIATE_PREFIX)
12773 {
12774 ++op_string;
12775 if (i.jumpabsolute)
12776 {
12777 as_bad (_("immediate operand illegal with absolute jump"));
12778 return 0;
12779 }
12780 if (!i386_immediate (op_string))
12781 return 0;
12782 if (i.rounding.type != rc_none)
12783 {
12784 as_bad (_("`%s': RC/SAE operand must follow immediate operands"),
12785 insn_name (current_templates->start));
12786 return 0;
12787 }
12788 }
12789 else if (RC_SAE_immediate (operand_string))
12790 {
12791 /* If it is a RC or SAE immediate, do the necessary placement check:
12792 Only another immediate or a GPR may precede it. */
12793 if (i.mem_operands || i.reg_operands + i.imm_operands > 1
12794 || (i.reg_operands == 1
12795 && i.op[0].regs->reg_type.bitfield.class != Reg))
12796 {
12797 as_bad (_("`%s': misplaced `%s'"),
12798 insn_name (current_templates->start), operand_string);
12799 return 0;
12800 }
12801 }
12802 else if (starts_memory_operand (*op_string))
12803 {
12804 /* This is a memory reference of some sort. */
12805 char *base_string;
12806
12807 /* Start and end of displacement string expression (if found). */
12808 char *displacement_string_start;
12809 char *displacement_string_end;
12810
12811 do_memory_reference:
12812 /* Check for base index form. We detect the base index form by
12813 looking for an ')' at the end of the operand, searching
12814 for the '(' matching it, and finding a REGISTER_PREFIX or ','
12815 after the '('. */
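/* I.e. AT&T's "disp(base, index, scale)", e.g. "-4(%ebp,%eax,4)"; each
   component is optional, as in "(%eax)", "(,%eax,4)" or "-4(%ebp)".  */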
12816 base_string = op_string + strlen (op_string);
12817
12818 /* Handle vector operations. */
12819 --base_string;
12820 if (is_space_char (*base_string))
12821 --base_string;
12822
12823 if (*base_string == '}')
12824 {
12825 char *vop_start = NULL;
12826
12827 while (base_string-- > op_string)
12828 {
12829 if (*base_string == '"')
12830 break;
12831 if (*base_string != '{')
12832 continue;
12833
12834 vop_start = base_string;
12835
12836 --base_string;
12837 if (is_space_char (*base_string))
12838 --base_string;
12839
12840 if (*base_string != '}')
12841 break;
12842
12843 vop_start = NULL;
12844 }
12845
12846 if (!vop_start)
12847 {
12848 as_bad (_("unbalanced curly braces"));
12849 return 0;
12850 }
12851
12852 if (check_VecOperations (vop_start) == NULL)
12853 return 0;
12854 }
12855
12856 /* If we only have a displacement, set up for it to be parsed later. */
12857 displacement_string_start = op_string;
12858 displacement_string_end = base_string + 1;
12859
12860 if (*base_string == ')')
12861 {
12862 char *temp_string;
12863 unsigned int parens_not_balanced = 0;
12864 bool in_quotes = false;
12865
12866 /* We've already checked that the numbers of left & right ()'s
12867 match, and that there's a matching set of double quotes. */
12868 end_op = base_string;
12869 for (temp_string = op_string; temp_string < end_op; temp_string++)
12870 {
12871 if (*temp_string == '\\' && temp_string[1] == '"')
12872 ++temp_string;
12873 else if (*temp_string == '"')
12874 in_quotes = !in_quotes;
12875 else if (!in_quotes)
12876 {
12877 if (*temp_string == '(' && !parens_not_balanced++)
12878 base_string = temp_string;
12879 if (*temp_string == ')')
12880 --parens_not_balanced;
12881 }
12882 }
12883
12884 temp_string = base_string;
12885
12886 /* Skip past '(' and whitespace. */
12887 gas_assert (*base_string == '(');
12888 ++base_string;
12889 if (is_space_char (*base_string))
12890 ++base_string;
12891
12892 if (*base_string == ','
12893 || ((i.base_reg = parse_register (base_string, &end_op))
12894 != NULL))
12895 {
12896 displacement_string_end = temp_string;
12897
12898 i.types[this_operand].bitfield.baseindex = 1;
12899
12900 if (i.base_reg)
12901 {
12902 if (i.base_reg == &bad_reg)
12903 return 0;
12904 base_string = end_op;
12905 if (is_space_char (*base_string))
12906 ++base_string;
12907 }
12908
12909 /* There may be an index reg or scale factor here. */
12910 if (*base_string == ',')
12911 {
12912 ++base_string;
12913 if (is_space_char (*base_string))
12914 ++base_string;
12915
12916 if ((i.index_reg = parse_register (base_string, &end_op))
12917 != NULL)
12918 {
12919 if (i.index_reg == &bad_reg)
12920 return 0;
12921 base_string = end_op;
12922 if (is_space_char (*base_string))
12923 ++base_string;
12924 if (*base_string == ',')
12925 {
12926 ++base_string;
12927 if (is_space_char (*base_string))
12928 ++base_string;
12929 }
12930 else if (*base_string != ')')
12931 {
12932 as_bad (_("expecting `,' or `)' "
12933 "after index register in `%s'"),
12934 operand_string);
12935 return 0;
12936 }
12937 }
12938 else if (*base_string == REGISTER_PREFIX)
12939 {
12940 end_op = strchr (base_string, ',');
12941 if (end_op)
12942 *end_op = '\0';
12943 as_bad (_("bad register name `%s'"), base_string);
12944 return 0;
12945 }
12946
12947 /* Check for scale factor. */
12948 if (*base_string != ')')
12949 {
12950 char *end_scale = i386_scale (base_string);
12951
12952 if (!end_scale)
12953 return 0;
12954
12955 base_string = end_scale;
12956 if (is_space_char (*base_string))
12957 ++base_string;
12958 if (*base_string != ')')
12959 {
12960 as_bad (_("expecting `)' "
12961 "after scale factor in `%s'"),
12962 operand_string);
12963 return 0;
12964 }
12965 }
12966 else if (!i.index_reg)
12967 {
12968 as_bad (_("expecting index register or scale factor "
12969 "after `,'; got '%c'"),
12970 *base_string);
12971 return 0;
12972 }
12973 }
12974 else if (*base_string != ')')
12975 {
12976 as_bad (_("expecting `,' or `)' "
12977 "after base register in `%s'"),
12978 operand_string);
12979 return 0;
12980 }
12981 }
12982 else if (*base_string == REGISTER_PREFIX)
12983 {
12984 end_op = strchr (base_string, ',');
12985 if (end_op)
12986 *end_op = '\0';
12987 as_bad (_("bad register name `%s'"), base_string);
12988 return 0;
12989 }
12990 }
12991
12992 /* If there's an expression beginning the operand, parse it,
12993 assuming displacement_string_start and
12994 displacement_string_end are meaningful. */
12995 if (displacement_string_start != displacement_string_end)
12996 {
12997 if (!i386_displacement (displacement_string_start,
12998 displacement_string_end))
12999 return 0;
13000 }
13001
13002 /* Special case for (%dx) while doing input/output op. */
13003 if (i.base_reg
13004 && i.base_reg->reg_type.bitfield.instance == RegD
13005 && i.base_reg->reg_type.bitfield.word
13006 && i.index_reg == 0
13007 && i.log2_scale_factor == 0
13008 && i.seg[i.mem_operands] == 0
13009 && !operand_type_check (i.types[this_operand], disp))
13010 {
13011 i.types[this_operand] = i.base_reg->reg_type;
13012 i.input_output_operand = true;
13013 return 1;
13014 }
13015
13016 if (i386_index_check (operand_string) == 0)
13017 return 0;
13018 i.flags[this_operand] |= Operand_Mem;
13019 i.mem_operands++;
13020 }
13021 else
13022 {
13023 /* It's not a memory operand; argh! */
13024 as_bad (_("invalid char %s beginning operand %d `%s'"),
13025 output_invalid (*op_string),
13026 this_operand + 1,
13027 op_string);
13028 return 0;
13029 }
13030 return 1; /* Normal return. */
13031 }
13032 \f
13033 /* Calculate the maximum variable size (i.e., excluding fr_fix)
13034 that an rs_machine_dependent frag may reach. */
13035
13036 unsigned int
13037 i386_frag_max_var (fragS *frag)
13038 {
13039 /* The only relaxable frags are for jumps.
13040 Unconditional jumps can grow by 4 bytes and others by 5 bytes. */
13041 gas_assert (frag->fr_type == rs_machine_dependent);
13042 return TYPE_FROM_RELAX_STATE (frag->fr_subtype) == UNCOND_JUMP ? 4 : 5;
13043 }
13044
13045 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13046 static int
13047 elf_symbol_resolved_in_segment_p (symbolS *fr_symbol, offsetT fr_var)
13048 {
13049 /* STT_GNU_IFUNC symbol must go through PLT. */
13050 if ((symbol_get_bfdsym (fr_symbol)->flags
13051 & BSF_GNU_INDIRECT_FUNCTION) != 0)
13052 return 0;
13053
13054 if (!S_IS_EXTERNAL (fr_symbol))
13055 /* Symbol may be weak or local. */
13056 return !S_IS_WEAK (fr_symbol);
13057
13058 /* Global symbols with non-default visibility can't be preempted. */
13059 if (ELF_ST_VISIBILITY (S_GET_OTHER (fr_symbol)) != STV_DEFAULT)
13060 return 1;
13061
13062 if (fr_var != NO_RELOC)
13063 switch ((enum bfd_reloc_code_real) fr_var)
13064 {
13065 case BFD_RELOC_386_PLT32:
13066 case BFD_RELOC_X86_64_PLT32:
13067 /* Symbol with PLT relocation may be preempted. */
13068 return 0;
13069 default:
13070 abort ();
13071 }
13072
13073 /* Global symbols with default visibility in a shared library may be
13074 preempted by another definition. */
13075 return !shared;
13076 }
13077 #endif
13078
13079 /* Table 3-2. Macro-Fusible Instructions in Haswell Microarchitecture
13080 Note: this also works for Skylake and Cascade Lake.
13081 ---------------------------------------------------------------------
13082 | JCC | ADD/SUB/CMP | INC/DEC | TEST/AND |
13083 | ------ | ----------- | ------- | -------- |
13084 | Jo | N | N | Y |
13085 | Jno | N | N | Y |
13086 | Jc/Jb | Y | N | Y |
13087 | Jae/Jnb | Y | N | Y |
13088 | Je/Jz | Y | Y | Y |
13089 | Jne/Jnz | Y | Y | Y |
13090 | Jna/Jbe | Y | N | Y |
13091 | Ja/Jnbe | Y | N | Y |
13092 | Js | N | N | Y |
13093 | Jns | N | N | Y |
13094 | Jp/Jpe | N | N | Y |
13095 | Jnp/Jpo | N | N | Y |
13096 | Jl/Jnge | Y | Y | Y |
13097 | Jge/Jnl | Y | Y | Y |
13098 | Jle/Jng | Y | Y | Y |
13099 | Jg/Jnle | Y | Y | Y |
13100 --------------------------------------------------------------------- */
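/* E.g. "cmp %eax, %ebx; je 1f" is fusible (mf_cmp_alu_cmp with Je),
   while "inc %eax; ja 1f" is not: per the table above, INC/DEC only
   fuse with the Je/Jne/Jl/Jge/Jle/Jg group.  */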
13101 static int
13102 i386_macro_fusible_p (enum mf_cmp_kind mf_cmp, enum mf_jcc_kind mf_jcc)
13103 {
13104 if (mf_cmp == mf_cmp_alu_cmp)
13105 return ((mf_jcc >= mf_jcc_jc && mf_jcc <= mf_jcc_jna)
13106 || mf_jcc == mf_jcc_jl || mf_jcc == mf_jcc_jle);
13107 if (mf_cmp == mf_cmp_incdec)
13108 return (mf_jcc == mf_jcc_je || mf_jcc == mf_jcc_jl
13109 || mf_jcc == mf_jcc_jle);
13110 if (mf_cmp == mf_cmp_test_and)
13111 return 1;
13112 return 0;
13113 }
13114
13115 /* Return the next non-empty frag. */
13116
13117 static fragS *
13118 i386_next_non_empty_frag (fragS *fragP)
13119 {
13120 /* There may be a frag with a ".fill 0" when there is no room in
13121 the current frag for frag_grow in output_insn. */
13122 for (fragP = fragP->fr_next;
13123 (fragP != NULL
13124 && fragP->fr_type == rs_fill
13125 && fragP->fr_fix == 0);
13126 fragP = fragP->fr_next)
13127 ;
13128 return fragP;
13129 }
13130
13131 /* Return the next jcc frag after BRANCH_PADDING. */
13132
13133 static fragS *
13134 i386_next_fusible_jcc_frag (fragS *maybe_cmp_fragP, fragS *pad_fragP)
13135 {
13136 fragS *branch_fragP;
13137 if (!pad_fragP)
13138 return NULL;
13139
13140 if (pad_fragP->fr_type == rs_machine_dependent
13141 && (TYPE_FROM_RELAX_STATE (pad_fragP->fr_subtype)
13142 == BRANCH_PADDING))
13143 {
13144 branch_fragP = i386_next_non_empty_frag (pad_fragP);
13145 if (branch_fragP->fr_type != rs_machine_dependent)
13146 return NULL;
13147 if (TYPE_FROM_RELAX_STATE (branch_fragP->fr_subtype) == COND_JUMP
13148 && i386_macro_fusible_p (maybe_cmp_fragP->tc_frag_data.mf_type,
13149 pad_fragP->tc_frag_data.mf_type))
13150 return branch_fragP;
13151 }
13152
13153 return NULL;
13154 }
13155
13156 /* Classify BRANCH_PADDING, BRANCH_PREFIX and FUSED_JCC_PADDING frags. */
13157
13158 static void
13159 i386_classify_machine_dependent_frag (fragS *fragP)
13160 {
13161 fragS *cmp_fragP;
13162 fragS *pad_fragP;
13163 fragS *branch_fragP;
13164 fragS *next_fragP;
13165 unsigned int max_prefix_length;
13166
13167 if (fragP->tc_frag_data.classified)
13168 return;
13169
13170 /* First scan for BRANCH_PADDING and FUSED_JCC_PADDING. Convert
13171 FUSED_JCC_PADDING and merge BRANCH_PADDING. */
13172 for (next_fragP = fragP;
13173 next_fragP != NULL;
13174 next_fragP = next_fragP->fr_next)
13175 {
13176 next_fragP->tc_frag_data.classified = 1;
13177 if (next_fragP->fr_type == rs_machine_dependent)
13178 switch (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype))
13179 {
13180 case BRANCH_PADDING:
13181 /* The BRANCH_PADDING frag must be followed by a branch
13182 frag. */
13183 branch_fragP = i386_next_non_empty_frag (next_fragP);
13184 next_fragP->tc_frag_data.u.branch_fragP = branch_fragP;
13185 break;
13186 case FUSED_JCC_PADDING:
13187 /* Check if this is a fused jcc:
13188 FUSED_JCC_PADDING
13189 CMP-like instruction
13190 BRANCH_PADDING
13191 COND_JUMP
13192 */
13193 cmp_fragP = i386_next_non_empty_frag (next_fragP);
13194 pad_fragP = i386_next_non_empty_frag (cmp_fragP);
13195 branch_fragP = i386_next_fusible_jcc_frag (next_fragP, pad_fragP);
13196 if (branch_fragP)
13197 {
13198 /* The BRANCH_PADDING frag is merged with the
13199 FUSED_JCC_PADDING frag. */
13200 next_fragP->tc_frag_data.u.branch_fragP = branch_fragP;
13201 /* CMP-like instruction size. */
13202 next_fragP->tc_frag_data.cmp_size = cmp_fragP->fr_fix;
13203 frag_wane (pad_fragP);
13204 /* Skip to branch_fragP. */
13205 next_fragP = branch_fragP;
13206 }
13207 else if (next_fragP->tc_frag_data.max_prefix_length)
13208 {
13209 /* Turn FUSED_JCC_PADDING into BRANCH_PREFIX if it isn't
13210 a fused jcc. */
13211 next_fragP->fr_subtype
13212 = ENCODE_RELAX_STATE (BRANCH_PREFIX, 0);
13213 next_fragP->tc_frag_data.max_bytes
13214 = next_fragP->tc_frag_data.max_prefix_length;
13215 /* This will be updated in the BRANCH_PREFIX scan. */
13216 next_fragP->tc_frag_data.max_prefix_length = 0;
13217 }
13218 else
13219 frag_wane (next_fragP);
13220 break;
13221 }
13222 }
13223
13224 /* Stop if there is no BRANCH_PREFIX. */
13225 if (!align_branch_prefix_size)
13226 return;
13227
13228 /* Scan for BRANCH_PREFIX. */
13229 for (; fragP != NULL; fragP = fragP->fr_next)
13230 {
13231 if (fragP->fr_type != rs_machine_dependent
13232 || (TYPE_FROM_RELAX_STATE (fragP->fr_subtype)
13233 != BRANCH_PREFIX))
13234 continue;
13235
13236 /* Count all BRANCH_PREFIX frags before BRANCH_PADDING and
13237 COND_JUMP_PREFIX. */
13238 max_prefix_length = 0;
13239 for (next_fragP = fragP;
13240 next_fragP != NULL;
13241 next_fragP = next_fragP->fr_next)
13242 {
13243 if (next_fragP->fr_type == rs_fill)
13244 /* Skip rs_fill frags. */
13245 continue;
13246 else if (next_fragP->fr_type != rs_machine_dependent)
13247 /* Stop for all other frags. */
13248 break;
13249
13250 /* rs_machine_dependent frags. */
13251 if (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
13252 == BRANCH_PREFIX)
13253 {
13254 /* Count BRANCH_PREFIX frags. */
13255 if (max_prefix_length >= MAX_FUSED_JCC_PADDING_SIZE)
13256 {
13257 max_prefix_length = MAX_FUSED_JCC_PADDING_SIZE;
13258 frag_wane (next_fragP);
13259 }
13260 else
13261 max_prefix_length
13262 += next_fragP->tc_frag_data.max_bytes;
13263 }
13264 else if ((TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
13265 == BRANCH_PADDING)
13266 || (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
13267 == FUSED_JCC_PADDING))
13268 {
13269 /* Stop at BRANCH_PADDING and FUSED_JCC_PADDING. */
13270 fragP->tc_frag_data.u.padding_fragP = next_fragP;
13271 break;
13272 }
13273 else
13274 /* Stop for other rs_machine_dependent frags. */
13275 break;
13276 }
13277
13278 fragP->tc_frag_data.max_prefix_length = max_prefix_length;
13279
13280 /* Skip to the next frag. */
13281 fragP = next_fragP;
13282 }
13283 }
13284
13285 /* Compute padding size for
13286
13287 FUSED_JCC_PADDING
13288 CMP-like instruction
13289 BRANCH_PADDING
13290 COND_JUMP/UNCOND_JUMP
13291
13292 or
13293
13294 BRANCH_PADDING
13295 COND_JUMP/UNCOND_JUMP
13296 */
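/* A worked example, assuming align_branch_power == 5 (32-byte
   boundaries): if the sequence starts at offset 30 within its 32-byte
   chunk and cmp + jcc together take 5 bytes, then 30 + 5 >= 32, so
   32 - 30 = 2 padding bytes are needed to push the pair fully past the
   boundary.  */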
13297
13298 static int
13299 i386_branch_padding_size (fragS *fragP, offsetT address)
13300 {
13301 unsigned int offset, size, padding_size;
13302 fragS *branch_fragP = fragP->tc_frag_data.u.branch_fragP;
13303
13304 /* The start address of the BRANCH_PADDING or FUSED_JCC_PADDING frag. */
13305 if (!address)
13306 address = fragP->fr_address;
13307 address += fragP->fr_fix;
13308
13309 /* CMP-like instruction size. */
13310 size = fragP->tc_frag_data.cmp_size;
13311
13312 /* The base size of the branch frag. */
13313 size += branch_fragP->fr_fix;
13314
13315 /* Add opcode and displacement bytes for the rs_machine_dependent
13316 branch frag. */
13317 if (branch_fragP->fr_type == rs_machine_dependent)
13318 size += md_relax_table[branch_fragP->fr_subtype].rlx_length;
13319
13320 /* Check if branch is within boundary and doesn't end at the last
13321 byte. */
13322 offset = address & ((1U << align_branch_power) - 1);
13323 if ((offset + size) >= (1U << align_branch_power))
13324 /* Padding needed to avoid crossing boundary. */
13325 padding_size = (1U << align_branch_power) - offset;
13326 else
13327 /* No padding needed. */
13328 padding_size = 0;
13329
13330 /* The return value may be saved in tc_frag_data.length which is
13331 unsigned byte. */
13332 if (!fits_in_unsigned_byte (padding_size))
13333 abort ();
13334
13335 return padding_size;
13336 }
13337
13338 /* i386_generic_table_relax_frag()
13339
13340 Handle BRANCH_PADDING, BRANCH_PREFIX and FUSED_JCC_PADDING frags to
13341 grow/shrink padding to align branch frags. Hand others to
13342 relax_frag(). */
13343
13344 long
13345 i386_generic_table_relax_frag (segT segment, fragS *fragP, long stretch)
13346 {
13347 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PADDING
13348 || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == FUSED_JCC_PADDING)
13349 {
13350 long padding_size = i386_branch_padding_size (fragP, 0);
13351 long grow = padding_size - fragP->tc_frag_data.length;
13352
13353 /* When the BRANCH_PREFIX frag is used, the computed address
13354 must match the actual address and there should be no padding. */
13355 if (fragP->tc_frag_data.padding_address
13356 && (fragP->tc_frag_data.padding_address != fragP->fr_address
13357 || padding_size))
13358 abort ();
13359
13360 /* Update the padding size. */
13361 if (grow)
13362 fragP->tc_frag_data.length = padding_size;
13363
13364 return grow;
13365 }
13366 else if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PREFIX)
13367 {
13368 fragS *padding_fragP, *next_fragP;
13369 long padding_size, left_size, last_size;
13370
13371 padding_fragP = fragP->tc_frag_data.u.padding_fragP;
13372 if (!padding_fragP)
13373 /* Use the padding set by the leading BRANCH_PREFIX frag. */
13374 return (fragP->tc_frag_data.length
13375 - fragP->tc_frag_data.last_length);
13376
13377 /* Compute the relative address of the padding frag for the very
13378 first time, when the BRANCH_PREFIX frag sizes are zero. */
13379 if (!fragP->tc_frag_data.padding_address)
13380 fragP->tc_frag_data.padding_address
13381 = padding_fragP->fr_address - (fragP->fr_address - stretch);
13382
13383 /* First update the last length from the previous iteration. */
13384 left_size = fragP->tc_frag_data.prefix_length;
13385 for (next_fragP = fragP;
13386 next_fragP != padding_fragP;
13387 next_fragP = next_fragP->fr_next)
13388 if (next_fragP->fr_type == rs_machine_dependent
13389 && (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
13390 == BRANCH_PREFIX))
13391 {
13392 if (left_size)
13393 {
13394 int max = next_fragP->tc_frag_data.max_bytes;
13395 if (max)
13396 {
13397 int size;
13398 if (max > left_size)
13399 size = left_size;
13400 else
13401 size = max;
13402 left_size -= size;
13403 next_fragP->tc_frag_data.last_length = size;
13404 }
13405 }
13406 else
13407 next_fragP->tc_frag_data.last_length = 0;
13408 }
13409
13410 /* Check the padding size for the padding frag. */
13411 padding_size = i386_branch_padding_size
13412 (padding_fragP, (fragP->fr_address
13413 + fragP->tc_frag_data.padding_address));
13414
13415 last_size = fragP->tc_frag_data.prefix_length;
13416 /* Check if there is a change from the last iteration. */
13417 if (padding_size == last_size)
13418 {
13419 /* Update the expected address of the padding frag. */
13420 padding_fragP->tc_frag_data.padding_address
13421 = (fragP->fr_address + padding_size
13422 + fragP->tc_frag_data.padding_address);
13423 return 0;
13424 }
13425
13426 if (padding_size > fragP->tc_frag_data.max_prefix_length)
13427 {
13428 /* No padding if there is insufficient room. Clear the
13429 expected address of the padding frag. */
13430 padding_fragP->tc_frag_data.padding_address = 0;
13431 padding_size = 0;
13432 }
13433 else
13434 /* Store the expected address of the padding frag. */
13435 padding_fragP->tc_frag_data.padding_address
13436 = (fragP->fr_address + padding_size
13437 + fragP->tc_frag_data.padding_address);
13438
13439 fragP->tc_frag_data.prefix_length = padding_size;
13440
13441 /* Update the length for the current iteration. */
13442 left_size = padding_size;
13443 for (next_fragP = fragP;
13444 next_fragP != padding_fragP;
13445 next_fragP = next_fragP->fr_next)
13446 if (next_fragP->fr_type == rs_machine_dependent
13447 && (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
13448 == BRANCH_PREFIX))
13449 {
13450 if (left_size)
13451 {
13452 int max = next_fragP->tc_frag_data.max_bytes;
13453 if (max)
13454 {
13455 int size;
13456 if (max > left_size)
13457 size = left_size;
13458 else
13459 size = max;
13460 left_size -= size;
13461 next_fragP->tc_frag_data.length = size;
13462 }
13463 }
13464 else
13465 next_fragP->tc_frag_data.length = 0;
13466 }
13467
13468 return (fragP->tc_frag_data.length
13469 - fragP->tc_frag_data.last_length);
13470 }
13471 return relax_frag (segment, fragP, stretch);
13472 }
13473
13474 /* md_estimate_size_before_relax()
13475
13476 Called just before relax() for rs_machine_dependent frags. The x86
13477 assembler uses these frags to handle variable size jump
13478 instructions.
13479
13480 Any symbol that is now undefined will not become defined.
13481 Return the correct fr_subtype in the frag.
13482 Return the initial "guess for variable size of frag" to caller.
13483 The guess is actually the growth beyond the fixed part. Whatever
13484 we do to grow the fixed or variable part contributes to our
13485 returned value. */
13486
13487 int
13488 md_estimate_size_before_relax (fragS *fragP, segT segment)
13489 {
13490 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PADDING
13491 || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PREFIX
13492 || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == FUSED_JCC_PADDING)
13493 {
13494 i386_classify_machine_dependent_frag (fragP);
13495 return fragP->tc_frag_data.length;
13496 }
13497
13498 /* We've already got fragP->fr_subtype right; all we have to do is
13499 check for un-relaxable symbols. On an ELF system, we can't relax
13500 an externally visible symbol, because it may be overridden by a
13501 shared library. */
13502 if (S_GET_SEGMENT (fragP->fr_symbol) != segment
13503 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13504 || (IS_ELF
13505 && !elf_symbol_resolved_in_segment_p (fragP->fr_symbol,
13506 fragP->fr_var))
13507 #endif
13508 #if defined (OBJ_COFF) && defined (TE_PE)
13509 || (OUTPUT_FLAVOR == bfd_target_coff_flavour
13510 && S_IS_WEAK (fragP->fr_symbol))
13511 #endif
13512 )
13513 {
13514 /* Symbol is undefined in this segment, or we need to keep a
13515 reloc so that weak symbols can be overridden. */
13516 int size = (fragP->fr_subtype & CODE16) ? 2 : 4;
13517 enum bfd_reloc_code_real reloc_type;
13518 unsigned char *opcode;
13519 int old_fr_fix;
13520 fixS *fixP = NULL;
13521
13522 if (fragP->fr_var != NO_RELOC)
13523 reloc_type = (enum bfd_reloc_code_real) fragP->fr_var;
13524 else if (size == 2)
13525 reloc_type = BFD_RELOC_16_PCREL;
13526 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13527 else if (fragP->tc_frag_data.code64 && fragP->fr_offset == 0
13528 && need_plt32_p (fragP->fr_symbol))
13529 reloc_type = BFD_RELOC_X86_64_PLT32;
13530 #endif
13531 else
13532 reloc_type = BFD_RELOC_32_PCREL;
13533
13534 old_fr_fix = fragP->fr_fix;
13535 opcode = (unsigned char *) fragP->fr_opcode;
13536
13537 switch (TYPE_FROM_RELAX_STATE (fragP->fr_subtype))
13538 {
13539 case UNCOND_JUMP:
13540 /* Make jmp (0xeb) a (d)word displacement jump. */
13541 opcode[0] = 0xe9;
13542 fragP->fr_fix += size;
13543 fixP = fix_new (fragP, old_fr_fix, size,
13544 fragP->fr_symbol,
13545 fragP->fr_offset, 1,
13546 reloc_type);
13547 break;
13548
13549 case COND_JUMP86:
13550 if (size == 2
13551 && (!no_cond_jump_promotion || fragP->fr_var != NO_RELOC))
13552 {
13553 /* Negate the condition, and branch past an
13554 unconditional jump. */
13555 opcode[0] ^= 1;
13556 opcode[1] = 3;
13557 /* Insert an unconditional jump. */
13558 opcode[2] = 0xe9;
13559 /* We added two extra opcode bytes, and have a two byte
13560 offset. */
13561 fragP->fr_fix += 2 + 2;
13562 fix_new (fragP, old_fr_fix + 2, 2,
13563 fragP->fr_symbol,
13564 fragP->fr_offset, 1,
13565 reloc_type);
13566 break;
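	      /* For illustration: a 16-bit "je target" (0x74, disp8)
		 becomes 0x75 0x03 ("jne .+3") followed by 0xe9 and a
		 2-byte displacement ("jmp target").  */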
13567 }
13568 /* Fall through. */
13569
13570 case COND_JUMP:
13571 if (no_cond_jump_promotion && fragP->fr_var == NO_RELOC)
13572 {
13573 fragP->fr_fix += 1;
13574 fixP = fix_new (fragP, old_fr_fix, 1,
13575 fragP->fr_symbol,
13576 fragP->fr_offset, 1,
13577 BFD_RELOC_8_PCREL);
13578 fixP->fx_signed = 1;
13579 break;
13580 }
13581
13582 /* This changes the byte-displacement jump 0x7N
13583 to the (d)word-displacement jump 0x0f,0x8N. */
13584 opcode[1] = opcode[0] + 0x10;
13585 opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
13586 /* We've added an opcode byte. */
13587 fragP->fr_fix += 1 + size;
13588 fixP = fix_new (fragP, old_fr_fix + 1, size,
13589 fragP->fr_symbol,
13590 fragP->fr_offset, 1,
13591 reloc_type);
13592 break;
13593
13594 default:
13595 BAD_CASE (fragP->fr_subtype);
13596 break;
13597 }
13598
13599 /* All jumps handled here are signed, but don't unconditionally use a
13600 signed limit check for 32 and 16 bit jumps as we want to allow wrap
13601 around at 4G (outside of 64-bit mode) and 64k. */
13602 if (size == 4 && flag_code == CODE_64BIT)
13603 fixP->fx_signed = 1;
13604
13605 frag_wane (fragP);
13606 return fragP->fr_fix - old_fr_fix;
13607 }
13608
13609 /* Guess size depending on current relax state. Initially the relax
13610 state will correspond to a short jump and we return 1, because
13611 the variable part of the frag (the branch offset) is one byte
13612 long. However, we can relax a section more than once and in that
13613 case we must either set fr_subtype back to the unrelaxed state,
13614 or return the value for the appropriate branch. */
13615 return md_relax_table[fragP->fr_subtype].rlx_length;
13616 }
13617
13618 /* Called after relax() is finished.
13619
13620 In: Address of frag.
13621 fr_type == rs_machine_dependent.
13622 fr_subtype is what the address relaxed to.
13623
13624 Out: Any fixSs and constants are set up.
13625 Caller will turn frag into a ".space 0". */
13626
13627 void
13628 md_convert_frag (bfd *abfd ATTRIBUTE_UNUSED, segT sec ATTRIBUTE_UNUSED,
13629 fragS *fragP)
13630 {
13631 unsigned char *opcode;
13632 unsigned char *where_to_put_displacement = NULL;
13633 offsetT target_address;
13634 offsetT opcode_address;
13635 unsigned int extension = 0;
13636 offsetT displacement_from_opcode_start;
13637
13638 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PADDING
13639 || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == FUSED_JCC_PADDING
13640 || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PREFIX)
13641 {
13642 /* Generate nop padding. */
13643 unsigned int size = fragP->tc_frag_data.length;
13644 if (size)
13645 {
13646 if (size > fragP->tc_frag_data.max_bytes)
13647 abort ();
13648
13649 if (flag_debug)
13650 {
13651 const char *msg;
13652 const char *branch = "branch";
13653 const char *prefix = "";
13654 fragS *padding_fragP;
13655 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype)
13656 == BRANCH_PREFIX)
13657 {
13658 padding_fragP = fragP->tc_frag_data.u.padding_fragP;
13659 switch (fragP->tc_frag_data.default_prefix)
13660 {
13661 default:
13662 abort ();
13663 break;
13664 case CS_PREFIX_OPCODE:
13665 prefix = " cs";
13666 break;
13667 case DS_PREFIX_OPCODE:
13668 prefix = " ds";
13669 break;
13670 case ES_PREFIX_OPCODE:
13671 prefix = " es";
13672 break;
13673 case FS_PREFIX_OPCODE:
13674 prefix = " fs";
13675 break;
13676 case GS_PREFIX_OPCODE:
13677 prefix = " gs";
13678 break;
13679 case SS_PREFIX_OPCODE:
13680 prefix = " ss";
13681 break;
13682 }
13683 if (padding_fragP)
13684 msg = _("%s:%u: add %d%s at 0x%llx to align "
13685 "%s within %d-byte boundary\n");
13686 else
13687 msg = _("%s:%u: add additional %d%s at 0x%llx to "
13688 "align %s within %d-byte boundary\n");
13689 }
13690 else
13691 {
13692 padding_fragP = fragP;
13693 msg = _("%s:%u: add %d%s-byte nop at 0x%llx to align "
13694 "%s within %d-byte boundary\n");
13695 }
13696
13697 if (padding_fragP)
13698 switch (padding_fragP->tc_frag_data.branch_type)
13699 {
13700 case align_branch_jcc:
13701 branch = "jcc";
13702 break;
13703 case align_branch_fused:
13704 branch = "fused jcc";
13705 break;
13706 case align_branch_jmp:
13707 branch = "jmp";
13708 break;
13709 case align_branch_call:
13710 branch = "call";
13711 break;
13712 case align_branch_indirect:
13713 branch = "indiret branch";
13714 break;
13715 case align_branch_ret:
13716 branch = "ret";
13717 break;
13718 default:
13719 break;
13720 }
13721
13722 fprintf (stdout, msg,
13723 fragP->fr_file, fragP->fr_line, size, prefix,
13724 (long long) fragP->fr_address, branch,
13725 1 << align_branch_power);
13726 }
13727 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PREFIX)
13728 memset (fragP->fr_opcode,
13729 fragP->tc_frag_data.default_prefix, size);
13730 else
13731 i386_generate_nops (fragP, (char *) fragP->fr_opcode,
13732 size, 0);
13733 fragP->fr_fix += size;
13734 }
13735 return;
13736 }
13737
13738 opcode = (unsigned char *) fragP->fr_opcode;
13739
13740 /* Address we want to reach in file space. */
13741 target_address = S_GET_VALUE (fragP->fr_symbol) + fragP->fr_offset;
13742
13743 /* Address opcode resides at in file space. */
13744 opcode_address = fragP->fr_address + fragP->fr_fix;
13745
13746 /* Displacement from opcode start to fill into instruction. */
13747 displacement_from_opcode_start = target_address - opcode_address;
13748
13749 if ((fragP->fr_subtype & BIG) == 0)
13750 {
13751 /* Don't have to change opcode. */
13752 extension = 1; /* 1 opcode + 1 displacement */
13753 where_to_put_displacement = &opcode[1];
13754 }
13755 else
13756 {
13757 if (no_cond_jump_promotion
13758 && TYPE_FROM_RELAX_STATE (fragP->fr_subtype) != UNCOND_JUMP)
13759 as_warn_where (fragP->fr_file, fragP->fr_line,
13760 _("long jump required"));
13761
13762 switch (fragP->fr_subtype)
13763 {
13764 case ENCODE_RELAX_STATE (UNCOND_JUMP, BIG):
13765 extension = 4; /* 1 opcode + 4 displacement */
13766 opcode[0] = 0xe9;
13767 where_to_put_displacement = &opcode[1];
13768 break;
13769
13770 case ENCODE_RELAX_STATE (UNCOND_JUMP, BIG16):
13771 extension = 2; /* 1 opcode + 2 displacement */
13772 opcode[0] = 0xe9;
13773 where_to_put_displacement = &opcode[1];
13774 break;
13775
13776 case ENCODE_RELAX_STATE (COND_JUMP, BIG):
13777 case ENCODE_RELAX_STATE (COND_JUMP86, BIG):
13778 extension = 5; /* 2 opcode + 4 displacement */
13779 opcode[1] = opcode[0] + 0x10;
13780 opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
13781 where_to_put_displacement = &opcode[2];
13782 break;
13783
13784 case ENCODE_RELAX_STATE (COND_JUMP, BIG16):
13785 extension = 3; /* 2 opcode + 2 displacement */
13786 opcode[1] = opcode[0] + 0x10;
13787 opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
13788 where_to_put_displacement = &opcode[2];
13789 break;
13790
13791 case ENCODE_RELAX_STATE (COND_JUMP86, BIG16):
13792 extension = 4;
13793 opcode[0] ^= 1;
13794 opcode[1] = 3;
13795 opcode[2] = 0xe9;
13796 where_to_put_displacement = &opcode[3];
13797 break;
13798
13799 default:
13800 BAD_CASE (fragP->fr_subtype);
13801 break;
13802 }
13803 }
13804
13805 /* If the size is less than four we are sure that the operand fits,
13806 but if it's 4, then it could be that the displacement is larger
13807 than -/+ 2GB. */
13808 if (DISP_SIZE_FROM_RELAX_STATE (fragP->fr_subtype) == 4
13809 && object_64bit
13810 && ((addressT) (displacement_from_opcode_start - extension
13811 + ((addressT) 1 << 31))
13812 > (((addressT) 2 << 31) - 1)))
13813 {
13814 as_bad_where (fragP->fr_file, fragP->fr_line,
13815 _("jump target out of range"));
13816 /* Make us emit 0. */
13817 displacement_from_opcode_start = extension;
13818 }
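  /* Spelled out: with disp = displacement_from_opcode_start - extension,
     the unsigned test "disp + 2^31 > 2^32 - 1" above is equivalent to
     "disp < -2^31 || disp > 2^31 - 1", i.e. the displacement does not
     fit in a signed 32-bit field.  */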
13819 /* Now put displacement after opcode. */
13820 md_number_to_chars ((char *) where_to_put_displacement,
13821 (valueT) (displacement_from_opcode_start - extension),
13822 DISP_SIZE_FROM_RELAX_STATE (fragP->fr_subtype));
13823 fragP->fr_fix += extension;
13824 }
13825 \f
13826 /* Apply a fixup (fixP) to segment data, once it has been determined
13827 by our caller that we have all the info we need to fix it up.
13828
13829 Parameter valP is the pointer to the value of the bits.
13830
13831 On the 386, immediates, displacements, and data pointers are all in
13832 the same (little-endian) format, so we don't need to care about which
13833 we are handling. */
13834
13835 void
13836 md_apply_fix (fixS *fixP, valueT *valP, segT seg ATTRIBUTE_UNUSED)
13837 {
13838 char *p = fixP->fx_where + fixP->fx_frag->fr_literal;
13839 valueT value = *valP;
13840
13841 #if !defined (TE_Mach)
13842 if (fixP->fx_pcrel)
13843 {
13844 switch (fixP->fx_r_type)
13845 {
13846 default:
13847 break;
13848
13849 case BFD_RELOC_64:
13850 fixP->fx_r_type = BFD_RELOC_64_PCREL;
13851 break;
13852 case BFD_RELOC_32:
13853 case BFD_RELOC_X86_64_32S:
13854 fixP->fx_r_type = BFD_RELOC_32_PCREL;
13855 break;
13856 case BFD_RELOC_16:
13857 fixP->fx_r_type = BFD_RELOC_16_PCREL;
13858 break;
13859 case BFD_RELOC_8:
13860 fixP->fx_r_type = BFD_RELOC_8_PCREL;
13861 break;
13862 }
13863 }
13864
13865 if (fixP->fx_addsy != NULL
13866 && (fixP->fx_r_type == BFD_RELOC_32_PCREL
13867 || fixP->fx_r_type == BFD_RELOC_64_PCREL
13868 || fixP->fx_r_type == BFD_RELOC_16_PCREL
13869 || fixP->fx_r_type == BFD_RELOC_8_PCREL)
13870 && !use_rela_relocations)
13871 {
13872 /* This is a hack. There should be a better way to handle this.
13873 This covers for the fact that bfd_install_relocation will
13874 subtract the current location (for partial_inplace, PC relative
13875 relocations); see more below. */
13876 #ifndef OBJ_AOUT
13877 if (IS_ELF
13878 #ifdef TE_PE
13879 || OUTPUT_FLAVOR == bfd_target_coff_flavour
13880 #endif
13881 )
13882 value += fixP->fx_where + fixP->fx_frag->fr_address;
13883 #endif
13884 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13885 if (IS_ELF)
13886 {
13887 segT sym_seg = S_GET_SEGMENT (fixP->fx_addsy);
13888
13889 if ((sym_seg == seg
13890 || (symbol_section_p (fixP->fx_addsy)
13891 && sym_seg != absolute_section))
13892 && !generic_force_reloc (fixP))
13893 {
13894 /* Yes, we add the values in twice. This is because
13895 bfd_install_relocation subtracts them out again. I think
13896 bfd_install_relocation is broken, but I don't dare change
13897 it. FIXME. */
13898 value += fixP->fx_where + fixP->fx_frag->fr_address;
13899 }
13900 }
13901 #endif
13902 #if defined (OBJ_COFF) && defined (TE_PE)
13903 /* For some reason, the PE format does not store a
13904 section address offset for a PC relative symbol. */
13905 if (S_GET_SEGMENT (fixP->fx_addsy) != seg
13906 || S_IS_WEAK (fixP->fx_addsy))
13907 value += md_pcrel_from (fixP);
13908 #endif
13909 }
13910 #if defined (OBJ_COFF) && defined (TE_PE)
13911 if (fixP->fx_addsy != NULL
13912 && S_IS_WEAK (fixP->fx_addsy)
13913 /* PR 16858: Do not modify weak function references. */
13914 && ! fixP->fx_pcrel)
13915 {
13916 #if !defined (TE_PEP)
13917 /* For x86 PE weak function symbols are neither PC-relative
13918 nor do they set S_IS_FUNCTION. So the only reliable way
13919 to detect them is to check the flags of their containing
13920 section. */
13921 if (S_GET_SEGMENT (fixP->fx_addsy) != NULL
13922 && S_GET_SEGMENT (fixP->fx_addsy)->flags & SEC_CODE)
13923 ;
13924 else
13925 #endif
13926 value -= S_GET_VALUE (fixP->fx_addsy);
13927 }
13928 #endif
13929
13930 /* Fix a few things - the dynamic linker expects certain values here,
13931 and we must not disappoint it. */
13932 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13933 if (IS_ELF && fixP->fx_addsy)
13934 switch (fixP->fx_r_type)
13935 {
13936 case BFD_RELOC_386_PLT32:
13937 case BFD_RELOC_X86_64_PLT32:
13938 /* Make the jump instruction point to the address of the operand.
13939 At runtime we merely add the offset to the actual PLT entry.
13940 NB: Subtract the offset size only for jump instructions. */
13941 if (fixP->fx_pcrel)
13942 value = -4;
13943 break;
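      /* For example, "call foo@PLT" assembles to e8 fc ff ff ff: the
	 linker resolves S + A - P relative to the start of the 4-byte
	 field, while the CPU adds the displacement to the end of the
	 instruction, so the addend of -4 bridges the difference.  */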
13944
13945 case BFD_RELOC_386_TLS_GD:
13946 case BFD_RELOC_386_TLS_LDM:
13947 case BFD_RELOC_386_TLS_IE_32:
13948 case BFD_RELOC_386_TLS_IE:
13949 case BFD_RELOC_386_TLS_GOTIE:
13950 case BFD_RELOC_386_TLS_GOTDESC:
13951 case BFD_RELOC_X86_64_TLSGD:
13952 case BFD_RELOC_X86_64_TLSLD:
13953 case BFD_RELOC_X86_64_GOTTPOFF:
13954 case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
13955 value = 0; /* Fully resolved at runtime. No addend. */
13956 /* Fallthrough */
13957 case BFD_RELOC_386_TLS_LE:
13958 case BFD_RELOC_386_TLS_LDO_32:
13959 case BFD_RELOC_386_TLS_LE_32:
13960 case BFD_RELOC_X86_64_DTPOFF32:
13961 case BFD_RELOC_X86_64_DTPOFF64:
13962 case BFD_RELOC_X86_64_TPOFF32:
13963 case BFD_RELOC_X86_64_TPOFF64:
13964 S_SET_THREAD_LOCAL (fixP->fx_addsy);
13965 break;
13966
13967 case BFD_RELOC_386_TLS_DESC_CALL:
13968 case BFD_RELOC_X86_64_TLSDESC_CALL:
13969 value = 0; /* Fully resolved at runtime. No addend. */
13970 S_SET_THREAD_LOCAL (fixP->fx_addsy);
13971 fixP->fx_done = 0;
13972 return;
13973
13974 case BFD_RELOC_VTABLE_INHERIT:
13975 case BFD_RELOC_VTABLE_ENTRY:
13976 fixP->fx_done = 0;
13977 return;
13978
13979 default:
13980 break;
13981 }
13982 #endif /* defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) */
13983
13984 /* If not 64bit, massage the value to account for wraparound when !BFD64. */
13985 if (!object_64bit)
13986 value = extend_to_32bit_address (value);
13987
13988 *valP = value;
13989 #endif /* !defined (TE_Mach) */
13990
13991 /* Are we finished with this relocation now? */
13992 if (fixP->fx_addsy == NULL)
13993 {
13994 fixP->fx_done = 1;
13995 switch (fixP->fx_r_type)
13996 {
13997 case BFD_RELOC_X86_64_32S:
13998 fixP->fx_signed = 1;
13999 break;
14000
14001 default:
14002 break;
14003 }
14004 }
14005 #if defined (OBJ_COFF) && defined (TE_PE)
14006 else if (fixP->fx_addsy != NULL && S_IS_WEAK (fixP->fx_addsy))
14007 {
14008 fixP->fx_done = 0;
14009 /* Remember value for tc_gen_reloc. */
14010 fixP->fx_addnumber = value;
14011 /* Clear out the frag for now. */
14012 value = 0;
14013 }
14014 #endif
14015 else if (use_rela_relocations)
14016 {
14017 if (!disallow_64bit_reloc || fixP->fx_r_type == NO_RELOC)
14018 fixP->fx_no_overflow = 1;
14019 /* Remember value for tc_gen_reloc. */
14020 fixP->fx_addnumber = value;
14021 value = 0;
14022 }
14023
14024 md_number_to_chars (p, value, fixP->fx_size);
14025 }
14026 \f
14027 const char *
14028 md_atof (int type, char *litP, int *sizeP)
14029 {
14030 /* This outputs the LITTLENUMs in REVERSE order;
14031 in accord with the little-endian 386. */
14032 return ieee_md_atof (type, litP, sizeP, false);
14033 }
14034 \f
14035 static char output_invalid_buf[sizeof (unsigned char) * 2 + 6];
14036
14037 static char *
14038 output_invalid (int c)
14039 {
14040 if (ISPRINT (c))
14041 snprintf (output_invalid_buf, sizeof (output_invalid_buf),
14042 "'%c'", c);
14043 else
14044 snprintf (output_invalid_buf, sizeof (output_invalid_buf),
14045 "(0x%x)", (unsigned char) c);
14046 return output_invalid_buf;
14047 }
14048
14049 /* Verify that @r can be used in the current context. */
14050
14051 static bool check_register (const reg_entry *r)
14052 {
14053 if (allow_pseudo_reg)
14054 return true;
14055
14056 if (operand_type_all_zero (&r->reg_type))
14057 return false;
14058
14059 if ((r->reg_type.bitfield.dword
14060 || (r->reg_type.bitfield.class == SReg && r->reg_num > 3)
14061 || r->reg_type.bitfield.class == RegCR
14062 || r->reg_type.bitfield.class == RegDR)
14063 && !cpu_arch_flags.bitfield.cpui386)
14064 return false;
14065
14066 if (r->reg_type.bitfield.class == RegTR
14067 && (flag_code == CODE_64BIT
14068 || !cpu_arch_flags.bitfield.cpui386
14069 || cpu_arch_isa_flags.bitfield.cpui586
14070 || cpu_arch_isa_flags.bitfield.cpui686))
14071 return false;
14072
14073 if (r->reg_type.bitfield.class == RegMMX && !cpu_arch_flags.bitfield.cpummx)
14074 return false;
14075
14076 if (!cpu_arch_flags.bitfield.cpuavx512f)
14077 {
14078 if (r->reg_type.bitfield.zmmword
14079 || r->reg_type.bitfield.class == RegMask)
14080 return false;
14081
14082 if (!cpu_arch_flags.bitfield.cpuavx)
14083 {
14084 if (r->reg_type.bitfield.ymmword)
14085 return false;
14086
14087 if (!cpu_arch_flags.bitfield.cpusse && r->reg_type.bitfield.xmmword)
14088 return false;
14089 }
14090 }
14091
14092 if (r->reg_type.bitfield.zmmword)
14093 {
14094 if (vector_size < VSZ512)
14095 return false;
14096
14097 if (i.vec_encoding == vex_encoding_default)
14098 i.vec_encoding = vex_encoding_evex512;
14099 else if (i.vec_encoding != vex_encoding_evex
14100 && i.vec_encoding != vex_encoding_evex512)
14101 i.vec_encoding = vex_encoding_error;
14102 }
14103
14104 if (vector_size < VSZ256 && r->reg_type.bitfield.ymmword)
14105 return false;
14106
14107 if (r->reg_type.bitfield.tmmword
14108 && (!cpu_arch_flags.bitfield.cpuamx_tile
14109 || flag_code != CODE_64BIT))
14110 return false;
14111
14112 if (r->reg_type.bitfield.class == RegBND && !cpu_arch_flags.bitfield.cpumpx)
14113 return false;
14114
14115 /* Don't allow the fake index register unless allow_index_reg is nonzero. */
14116 if (!allow_index_reg && r->reg_num == RegIZ)
14117 return false;
14118
14119 /* Upper 16 vector registers are only available with VREX in 64bit
14120 mode, and require EVEX encoding. */
14121 if (r->reg_flags & RegVRex)
14122 {
14123 if (!cpu_arch_flags.bitfield.cpuavx512f
14124 || flag_code != CODE_64BIT)
14125 return false;
14126
14127 if (i.vec_encoding == vex_encoding_default
14128 || i.vec_encoding == vex_encoding_evex512)
14129 i.vec_encoding = vex_encoding_evex;
14130 else if (i.vec_encoding != vex_encoding_evex)
14131 i.vec_encoding = vex_encoding_error;
14132 }
14133
14134 if (((r->reg_flags & (RegRex64 | RegRex)) || r->reg_type.bitfield.qword)
14135 && (!cpu_arch_flags.bitfield.cpu64
14136 || r->reg_type.bitfield.class != RegCR
14137 || dot_insn ())
14138 && flag_code != CODE_64BIT)
14139 return false;
14140
14141 if (r->reg_type.bitfield.class == SReg && r->reg_num == RegFlat
14142 && !intel_syntax)
14143 return false;
14144
14145 return true;
14146 }
14147
14148 /* REG_STRING starts *before* REGISTER_PREFIX. */
14149
14150 static const reg_entry *
14151 parse_real_register (const char *reg_string, char **end_op)
14152 {
14153 const char *s = reg_string;
14154 char *p;
14155 char reg_name_given[MAX_REG_NAME_SIZE + 1];
14156 const reg_entry *r;
14157
14158 /* Skip possible REGISTER_PREFIX and possible whitespace. */
14159 if (*s == REGISTER_PREFIX)
14160 ++s;
14161
14162 if (is_space_char (*s))
14163 ++s;
14164
14165 p = reg_name_given;
14166 while ((*p++ = register_chars[(unsigned char) *s]) != '\0')
14167 {
14168 if (p >= reg_name_given + MAX_REG_NAME_SIZE)
14169 return (const reg_entry *) NULL;
14170 s++;
14171 }
14172
14173 if (is_part_of_name (*s))
14174 return (const reg_entry *) NULL;
14175
14176 *end_op = (char *) s;
14177
14178 r = (const reg_entry *) str_hash_find (reg_hash, reg_name_given);
14179
14180 /* Handle floating point regs, allowing spaces in the (i) part. */
14181 if (r == reg_st0)
14182 {
14183 if (!cpu_arch_flags.bitfield.cpu8087
14184 && !cpu_arch_flags.bitfield.cpu287
14185 && !cpu_arch_flags.bitfield.cpu387
14186 && !allow_pseudo_reg)
14187 return (const reg_entry *) NULL;
14188
14189 if (is_space_char (*s))
14190 ++s;
14191 if (*s == '(')
14192 {
14193 ++s;
14194 if (is_space_char (*s))
14195 ++s;
14196 if (*s >= '0' && *s <= '7')
14197 {
14198 int fpr = *s - '0';
14199 ++s;
14200 if (is_space_char (*s))
14201 ++s;
14202 if (*s == ')')
14203 {
14204 *end_op = (char *) s + 1;
14205 know (r[fpr].reg_num == fpr);
14206 return r + fpr;
14207 }
14208 }
14209 /* We have "%st(" then garbage. */
14210 return (const reg_entry *) NULL;
14211 }
14212 }
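  /* E.g. "%st ( 3 )" resolves to st(3); the st(i) entries follow
     reg_st0 consecutively in i386_regtab, hence the "r + fpr" above.  */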
14213
14214 return r && check_register (r) ? r : NULL;
14215 }
14216
14217 /* REG_STRING starts *before* REGISTER_PREFIX. */
14218
14219 static const reg_entry *
14220 parse_register (const char *reg_string, char **end_op)
14221 {
14222 const reg_entry *r;
14223
14224 if (*reg_string == REGISTER_PREFIX || allow_naked_reg)
14225 r = parse_real_register (reg_string, end_op);
14226 else
14227 r = NULL;
14228 if (!r)
14229 {
14230 char *save = input_line_pointer;
14231 char *buf = xstrdup (reg_string), *name;
14232 symbolS *symbolP;
14233
14234 input_line_pointer = buf;
14235 get_symbol_name (&name);
14236 symbolP = symbol_find (name);
14237 while (symbolP && symbol_equated_p (symbolP))
14238 {
14239 const expressionS *e = symbol_get_value_expression(symbolP);
14240
14241 if (e->X_add_number)
14242 break;
14243 symbolP = e->X_add_symbol;
14244 }
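      /* E.g. after ".set myreg, %eax", looking up "myreg" here walks
	 the zero-offset equation chain down to the %eax register
	 entry.  */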
14245 if (symbolP && S_GET_SEGMENT (symbolP) == reg_section)
14246 {
14247 const expressionS *e = symbol_get_value_expression (symbolP);
14248
14249 if (e->X_op == O_register)
14250 {
14251 know (e->X_add_number >= 0
14252 && (valueT) e->X_add_number < i386_regtab_size);
14253 r = i386_regtab + e->X_add_number;
14254 *end_op = (char *) reg_string + (input_line_pointer - buf);
14255 }
14256 if (r && !check_register (r))
14257 {
14258 as_bad (_("register '%s%s' cannot be used here"),
14259 register_prefix, r->reg_name);
14260 r = &bad_reg;
14261 }
14262 }
14263 input_line_pointer = save;
14264 free (buf);
14265 }
14266 return r;
14267 }
14268
14269 int
14270 i386_parse_name (char *name, expressionS *e, char *nextcharP)
14271 {
14272 const reg_entry *r = NULL;
14273 char *end = input_line_pointer;
14274
14275 /* We only know the terminating character here. If it is a double quote, it
14276 could be the closing one of a quoted symbol name, or the opening one of a
14277 following string (or of another quoted symbol name). Since the latter can't
14278 be valid syntax for anything, bailing in either case is good enough. */
14279 if (*nextcharP == '"')
14280 return 0;
14281
14282 *end = *nextcharP;
14283 if (*name == REGISTER_PREFIX || allow_naked_reg)
14284 r = parse_real_register (name, &input_line_pointer);
14285 if (r && end <= input_line_pointer)
14286 {
14287 *nextcharP = *input_line_pointer;
14288 *input_line_pointer = 0;
14289 e->X_op = O_register;
14290 e->X_add_number = r - i386_regtab;
14291 return 1;
14292 }
14293 input_line_pointer = end;
14294 *end = 0;
14295 return intel_syntax ? i386_intel_parse_name (name, e) : 0;
14296 }
14297
14298 void
14299 md_operand (expressionS *e)
14300 {
14301 char *end;
14302 const reg_entry *r;
14303
14304 switch (*input_line_pointer)
14305 {
14306 case REGISTER_PREFIX:
14307 r = parse_real_register (input_line_pointer, &end);
14308 if (r)
14309 {
14310 e->X_op = O_register;
14311 e->X_add_number = r - i386_regtab;
14312 input_line_pointer = end;
14313 }
14314 break;
14315
14316 case '[':
14317 gas_assert (intel_syntax);
14318 end = input_line_pointer++;
14319 expression (e);
14320 if (*input_line_pointer == ']')
14321 {
14322 ++input_line_pointer;
14323 e->X_op_symbol = make_expr_symbol (e);
14324 e->X_add_symbol = NULL;
14325 e->X_add_number = 0;
14326 e->X_op = O_index;
14327 }
14328 else
14329 {
14330 e->X_op = O_absent;
14331 input_line_pointer = end;
14332 }
14333 break;
14334 }
14335 }
14336
14337 #ifdef BFD64
14338 /* To maintain consistency with !BFD64 builds of gas, record whether any
14339 (binary) operator was involved in an expression. As expressions are
14340 evaluated in only 32 bits when !BFD64, we use this to decide whether to
14341 truncate results. */
14342 bool i386_record_operator (operatorT op,
14343 const expressionS *left,
14344 const expressionS *right)
14345 {
14346 if (op == O_absent)
14347 return false;
14348
14349 if (!left)
14350 {
14351 /* Since the expression parser applies unary operators to bignum
14352 operands just fine, we don't need to be concerned about such
14353 operands not fitting in 32 bits. */
14354 if (right->X_op == O_constant && right->X_unsigned
14355 && !fits_in_unsigned_long (right->X_add_number))
14356 return false;
14357 }
14358 /* This isn't entirely right: The pattern can also result when constant
14359 expressions are folded (e.g. 0xffffffff + 1). */
14360 else if ((left->X_op == O_constant && left->X_unsigned
14361 && !fits_in_unsigned_long (left->X_add_number))
14362 || (right->X_op == O_constant && right->X_unsigned
14363 && !fits_in_unsigned_long (right->X_add_number)))
14364 expr_mode = expr_large_value;
14365
14366 if (expr_mode != expr_large_value)
14367 expr_mode = expr_operator_present;
14368
14369 return false;
14370 }
14371 #endif
14372 \f
14373 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
14374 const char *md_shortopts = "kVQ:sqnO::";
14375 #else
14376 const char *md_shortopts = "qnO::";
14377 #endif
14378
14379 #define OPTION_32 (OPTION_MD_BASE + 0)
14380 #define OPTION_64 (OPTION_MD_BASE + 1)
14381 #define OPTION_DIVIDE (OPTION_MD_BASE + 2)
14382 #define OPTION_MARCH (OPTION_MD_BASE + 3)
14383 #define OPTION_MTUNE (OPTION_MD_BASE + 4)
14384 #define OPTION_MMNEMONIC (OPTION_MD_BASE + 5)
14385 #define OPTION_MSYNTAX (OPTION_MD_BASE + 6)
14386 #define OPTION_MINDEX_REG (OPTION_MD_BASE + 7)
14387 #define OPTION_MNAKED_REG (OPTION_MD_BASE + 8)
14388 #define OPTION_MRELAX_RELOCATIONS (OPTION_MD_BASE + 9)
14389 #define OPTION_MSSE2AVX (OPTION_MD_BASE + 10)
14390 #define OPTION_MSSE_CHECK (OPTION_MD_BASE + 11)
14391 #define OPTION_MOPERAND_CHECK (OPTION_MD_BASE + 12)
14392 #define OPTION_MAVXSCALAR (OPTION_MD_BASE + 13)
14393 #define OPTION_X32 (OPTION_MD_BASE + 14)
14394 #define OPTION_MADD_BND_PREFIX (OPTION_MD_BASE + 15)
14395 #define OPTION_MEVEXLIG (OPTION_MD_BASE + 16)
14396 #define OPTION_MEVEXWIG (OPTION_MD_BASE + 17)
14397 #define OPTION_MBIG_OBJ (OPTION_MD_BASE + 18)
14398 #define OPTION_MOMIT_LOCK_PREFIX (OPTION_MD_BASE + 19)
14399 #define OPTION_MEVEXRCIG (OPTION_MD_BASE + 20)
14400 #define OPTION_MSHARED (OPTION_MD_BASE + 21)
14401 #define OPTION_MAMD64 (OPTION_MD_BASE + 22)
14402 #define OPTION_MINTEL64 (OPTION_MD_BASE + 23)
14403 #define OPTION_MFENCE_AS_LOCK_ADD (OPTION_MD_BASE + 24)
14404 #define OPTION_X86_USED_NOTE (OPTION_MD_BASE + 25)
14405 #define OPTION_MVEXWIG (OPTION_MD_BASE + 26)
14406 #define OPTION_MALIGN_BRANCH_BOUNDARY (OPTION_MD_BASE + 27)
14407 #define OPTION_MALIGN_BRANCH_PREFIX_SIZE (OPTION_MD_BASE + 28)
14408 #define OPTION_MALIGN_BRANCH (OPTION_MD_BASE + 29)
14409 #define OPTION_MBRANCHES_WITH_32B_BOUNDARIES (OPTION_MD_BASE + 30)
14410 #define OPTION_MLFENCE_AFTER_LOAD (OPTION_MD_BASE + 31)
14411 #define OPTION_MLFENCE_BEFORE_INDIRECT_BRANCH (OPTION_MD_BASE + 32)
14412 #define OPTION_MLFENCE_BEFORE_RET (OPTION_MD_BASE + 33)
14413 #define OPTION_MUSE_UNALIGNED_VECTOR_MOVE (OPTION_MD_BASE + 34)
14414
14415 struct option md_longopts[] =
14416 {
14417 {"32", no_argument, NULL, OPTION_32},
14418 #if (defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
14419 || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
14420 {"64", no_argument, NULL, OPTION_64},
14421 #endif
14422 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
14423 {"x32", no_argument, NULL, OPTION_X32},
14424 {"mshared", no_argument, NULL, OPTION_MSHARED},
14425 {"mx86-used-note", required_argument, NULL, OPTION_X86_USED_NOTE},
14426 #endif
14427 {"divide", no_argument, NULL, OPTION_DIVIDE},
14428 {"march", required_argument, NULL, OPTION_MARCH},
14429 {"mtune", required_argument, NULL, OPTION_MTUNE},
14430 {"mmnemonic", required_argument, NULL, OPTION_MMNEMONIC},
14431 {"msyntax", required_argument, NULL, OPTION_MSYNTAX},
14432 {"mindex-reg", no_argument, NULL, OPTION_MINDEX_REG},
14433 {"mnaked-reg", no_argument, NULL, OPTION_MNAKED_REG},
14434 {"msse2avx", no_argument, NULL, OPTION_MSSE2AVX},
14435 {"muse-unaligned-vector-move", no_argument, NULL, OPTION_MUSE_UNALIGNED_VECTOR_MOVE},
14436 {"msse-check", required_argument, NULL, OPTION_MSSE_CHECK},
14437 {"moperand-check", required_argument, NULL, OPTION_MOPERAND_CHECK},
14438 {"mavxscalar", required_argument, NULL, OPTION_MAVXSCALAR},
14439 {"mvexwig", required_argument, NULL, OPTION_MVEXWIG},
14440 {"madd-bnd-prefix", no_argument, NULL, OPTION_MADD_BND_PREFIX},
14441 {"mevexlig", required_argument, NULL, OPTION_MEVEXLIG},
14442 {"mevexwig", required_argument, NULL, OPTION_MEVEXWIG},
14443 # if defined (TE_PE) || defined (TE_PEP)
14444 {"mbig-obj", no_argument, NULL, OPTION_MBIG_OBJ},
14445 #endif
14446 {"momit-lock-prefix", required_argument, NULL, OPTION_MOMIT_LOCK_PREFIX},
14447 {"mfence-as-lock-add", required_argument, NULL, OPTION_MFENCE_AS_LOCK_ADD},
14448 {"mrelax-relocations", required_argument, NULL, OPTION_MRELAX_RELOCATIONS},
14449 {"mevexrcig", required_argument, NULL, OPTION_MEVEXRCIG},
14450 {"malign-branch-boundary", required_argument, NULL, OPTION_MALIGN_BRANCH_BOUNDARY},
14451 {"malign-branch-prefix-size", required_argument, NULL, OPTION_MALIGN_BRANCH_PREFIX_SIZE},
14452 {"malign-branch", required_argument, NULL, OPTION_MALIGN_BRANCH},
14453 {"mbranches-within-32B-boundaries", no_argument, NULL, OPTION_MBRANCHES_WITH_32B_BOUNDARIES},
14454 {"mlfence-after-load", required_argument, NULL, OPTION_MLFENCE_AFTER_LOAD},
14455 {"mlfence-before-indirect-branch", required_argument, NULL,
14456 OPTION_MLFENCE_BEFORE_INDIRECT_BRANCH},
14457 {"mlfence-before-ret", required_argument, NULL, OPTION_MLFENCE_BEFORE_RET},
14458 {"mamd64", no_argument, NULL, OPTION_MAMD64},
14459 {"mintel64", no_argument, NULL, OPTION_MINTEL64},
14460 {NULL, no_argument, NULL, 0}
14461 };
14462 size_t md_longopts_size = sizeof (md_longopts);
14463
14464 int
14465 md_parse_option (int c, const char *arg)
14466 {
14467 unsigned int j;
14468 char *arch, *next, *saved, *type;
14469
14470 switch (c)
14471 {
14472 case 'n':
14473 optimize_align_code = 0;
14474 break;
14475
14476 case 'q':
14477 quiet_warnings = 1;
14478 break;
14479
14480 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
14481 /* -Qy, -Qn: SVR4 arguments controlling whether a .comment section
14482 should be emitted or not. FIXME: Not implemented. */
14483 case 'Q':
14484 if ((arg[0] != 'y' && arg[0] != 'n') || arg[1])
14485 return 0;
14486 break;
14487
14488 /* -V: SVR4 argument to print version ID. */
14489 case 'V':
14490 print_version_id ();
14491 break;
14492
14493 /* -k: Ignore for FreeBSD compatibility. */
14494 case 'k':
14495 break;
14496
14497 case 's':
14498 /* -s: On i386 Solaris, this tells the native assembler to use
14499 .stab instead of .stab.excl. We always use .stab anyhow. */
14500 break;
14501
14502 case OPTION_MSHARED:
14503 shared = 1;
14504 break;
14505
14506 case OPTION_X86_USED_NOTE:
14507 if (strcasecmp (arg, "yes") == 0)
14508 x86_used_note = 1;
14509 else if (strcasecmp (arg, "no") == 0)
14510 x86_used_note = 0;
14511 else
14512 as_fatal (_("invalid -mx86-used-note= option: `%s'"), arg);
14513 break;
14514
14515
14516 #endif
14517 #if (defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
14518 || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
14519 case OPTION_64:
14520 {
14521 const char **list, **l;
14522
14523 list = bfd_target_list ();
14524 for (l = list; *l != NULL; l++)
14525 if (startswith (*l, "elf64-x86-64")
14526 || strcmp (*l, "coff-x86-64") == 0
14527 || strcmp (*l, "pe-x86-64") == 0
14528 || strcmp (*l, "pei-x86-64") == 0
14529 || strcmp (*l, "mach-o-x86-64") == 0)
14530 {
14531 default_arch = "x86_64";
14532 break;
14533 }
14534 if (*l == NULL)
14535 as_fatal (_("no compiled in support for x86_64"));
14536 free (list);
14537 }
14538 break;
14539 #endif
14540
14541 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
14542 case OPTION_X32:
14543 if (IS_ELF)
14544 {
14545 const char **list, **l;
14546
14547 list = bfd_target_list ();
14548 for (l = list; *l != NULL; l++)
14549 if (startswith (*l, "elf32-x86-64"))
14550 {
14551 default_arch = "x86_64:32";
14552 break;
14553 }
14554 if (*l == NULL)
14555 as_fatal (_("no compiled in support for 32bit x86_64"));
14556 free (list);
14557 }
14558 else
14559 as_fatal (_("32bit x86_64 is only supported for ELF"));
14560 break;
14561 #endif
14562
14563 case OPTION_32:
14564 {
14565 const char **list, **l;
14566
14567 list = bfd_target_list ();
14568 for (l = list; *l != NULL; l++)
14569 if (strstr (*l, "-i386")
14570 || strstr (*l, "-go32"))
14571 {
14572 default_arch = "i386";
14573 break;
14574 }
14575 if (*l == NULL)
14576 as_fatal (_("no compiled in support for ix86"));
14577 free (list);
14578 }
14579 break;
14580
14581 case OPTION_DIVIDE:
14582 #ifdef SVR4_COMMENT_CHARS
14583 {
14584 char *n, *t;
14585 const char *s;
14586
14587 n = XNEWVEC (char, strlen (i386_comment_chars) + 1);
14588 t = n;
14589 for (s = i386_comment_chars; *s != '\0'; s++)
14590 if (*s != '/')
14591 *t++ = *s;
14592 *t = '\0';
14593 i386_comment_chars = n;
14594 }
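    /* A sketch of the effect (assuming i386_comment_chars is "#/"): the
       copy drops the '/', leaving "#", so '/' can act as the division
       operator in expressions instead of starting a comment.  */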
14595 #endif
14596 break;
14597
14598 case OPTION_MARCH:
14599 saved = xstrdup (arg);
14600 arch = saved;
14601 /* Allow -march=+nosse. */
14602 if (*arch == '+')
14603 arch++;
14604 do
14605 {
14606 char *vsz;
14607
14608 if (*arch == '.')
14609 as_fatal (_("invalid -march= option: `%s'"), arg);
14610 next = strchr (arch, '+');
14611 if (next)
14612 *next++ = '\0';
14613 vsz = strchr (arch, '/');
14614 if (vsz)
14615 *vsz++ = '\0';
14616 for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
14617 {
14618 if (vsz && cpu_arch[j].vsz != vsz_set)
14619 continue;
14620
14621 if (arch == saved && cpu_arch[j].type != PROCESSOR_NONE
14622 && strcmp (arch, cpu_arch[j].name) == 0)
14623 {
14624 /* Processor. */
14625 if (! cpu_arch[j].enable.bitfield.cpui386)
14626 continue;
14627
14628 cpu_arch_name = cpu_arch[j].name;
14629 free (cpu_sub_arch_name);
14630 cpu_sub_arch_name = NULL;
14631 cpu_arch_flags = cpu_arch[j].enable;
14632 cpu_arch_isa = cpu_arch[j].type;
14633 cpu_arch_isa_flags = cpu_arch[j].enable;
14634 if (!cpu_arch_tune_set)
14635 cpu_arch_tune = cpu_arch_isa;
14636 vector_size = VSZ_DEFAULT;
14637 break;
14638 }
14639 else if (cpu_arch[j].type == PROCESSOR_NONE
14640 && strcmp (arch, cpu_arch[j].name) == 0
14641 && !cpu_flags_all_zero (&cpu_arch[j].enable))
14642 {
14643 /* ISA extension. */
14644 isa_enable (j);
14645
14646 switch (cpu_arch[j].vsz)
14647 {
14648 default:
14649 break;
14650
14651 case vsz_set:
14652 if (vsz)
14653 {
14654 char *end;
14655 unsigned long val = strtoul (vsz, &end, 0);
14656
14657 if (*end)
14658 val = 0;
14659 switch (val)
14660 {
14661 case 512: vector_size = VSZ512; break;
14662 case 256: vector_size = VSZ256; break;
14663 case 128: vector_size = VSZ128; break;
14664 default:
14665 as_warn (_("Unrecognized vector size specifier ignored"));
14666 break;
14667 }
14668 break;
14669 }
14670 /* Fall through. */
14671 case vsz_reset:
14672 vector_size = VSZ_DEFAULT;
14673 break;
14674 }
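		  /* For example (assuming an extension marked vsz_set,
		     such as avx10.1), "-march=+avx10.1/256" enables the
		     extension and sets vector_size to VSZ256, while a
		     bare "+avx10.1" falls through and resets it to
		     VSZ_DEFAULT.  */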
14675
14676 break;
14677 }
14678 }
14679
14680 if (j >= ARRAY_SIZE (cpu_arch) && startswith (arch, "no"))
14681 {
14682 /* Disable an ISA extension. */
14683 for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
14684 if (cpu_arch[j].type == PROCESSOR_NONE
14685 && strcmp (arch + 2, cpu_arch[j].name) == 0)
14686 {
14687 isa_disable (j);
14688 if (cpu_arch[j].vsz == vsz_set)
14689 vector_size = VSZ_DEFAULT;
14690 break;
14691 }
14692 }
14693
14694 if (j >= ARRAY_SIZE (cpu_arch))
14695 as_fatal (_("invalid -march= option: `%s'"), arg);
14696
14697 arch = next;
14698 }
14699 while (next != NULL);
14700 free (saved);
14701 break;
14702
14703 case OPTION_MTUNE:
14704 if (*arg == '.')
14705 as_fatal (_("invalid -mtune= option: `%s'"), arg);
14706 for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
14707 {
14708 if (cpu_arch[j].type != PROCESSOR_NONE
14709 && strcmp (arg, cpu_arch[j].name) == 0)
14710 {
14711 cpu_arch_tune_set = 1;
14712 cpu_arch_tune = cpu_arch [j].type;
14713 break;
14714 }
14715 }
14716 if (j >= ARRAY_SIZE (cpu_arch))
14717 as_fatal (_("invalid -mtune= option: `%s'"), arg);
14718 break;
14719
14720 case OPTION_MMNEMONIC:
14721 if (strcasecmp (arg, "att") == 0)
14722 intel_mnemonic = 0;
14723 else if (strcasecmp (arg, "intel") == 0)
14724 intel_mnemonic = 1;
14725 else
14726 as_fatal (_("invalid -mmnemonic= option: `%s'"), arg);
14727 break;
14728
14729 case OPTION_MSYNTAX:
14730 if (strcasecmp (arg, "att") == 0)
14731 intel_syntax = 0;
14732 else if (strcasecmp (arg, "intel") == 0)
14733 intel_syntax = 1;
14734 else
14735 as_fatal (_("invalid -msyntax= option: `%s'"), arg);
14736 break;
14737
14738 case OPTION_MINDEX_REG:
14739 allow_index_reg = 1;
14740 break;
14741
14742 case OPTION_MNAKED_REG:
14743 allow_naked_reg = 1;
14744 break;
14745
14746 case OPTION_MSSE2AVX:
14747 sse2avx = 1;
14748 break;
14749
14750 case OPTION_MUSE_UNALIGNED_VECTOR_MOVE:
14751 use_unaligned_vector_move = 1;
14752 break;
14753
14754 case OPTION_MSSE_CHECK:
14755 if (strcasecmp (arg, "error") == 0)
14756 sse_check = check_error;
14757 else if (strcasecmp (arg, "warning") == 0)
14758 sse_check = check_warning;
14759 else if (strcasecmp (arg, "none") == 0)
14760 sse_check = check_none;
14761 else
14762 as_fatal (_("invalid -msse-check= option: `%s'"), arg);
14763 break;
14764
14765 case OPTION_MOPERAND_CHECK:
14766 if (strcasecmp (arg, "error") == 0)
14767 operand_check = check_error;
14768 else if (strcasecmp (arg, "warning") == 0)
14769 operand_check = check_warning;
14770 else if (strcasecmp (arg, "none") == 0)
14771 operand_check = check_none;
14772 else
14773 as_fatal (_("invalid -moperand-check= option: `%s'"), arg);
14774 break;
14775
14776 case OPTION_MAVXSCALAR:
14777 if (strcasecmp (arg, "128") == 0)
14778 avxscalar = vex128;
14779 else if (strcasecmp (arg, "256") == 0)
14780 avxscalar = vex256;
14781 else
14782 as_fatal (_("invalid -mavxscalar= option: `%s'"), arg);
14783 break;
14784
14785 case OPTION_MVEXWIG:
14786 if (strcmp (arg, "0") == 0)
14787 vexwig = vexw0;
14788 else if (strcmp (arg, "1") == 0)
14789 vexwig = vexw1;
14790 else
14791 as_fatal (_("invalid -mvexwig= option: `%s'"), arg);
14792 break;
14793
14794 case OPTION_MADD_BND_PREFIX:
14795 add_bnd_prefix = 1;
14796 break;
14797
14798 case OPTION_MEVEXLIG:
14799 if (strcmp (arg, "128") == 0)
14800 evexlig = evexl128;
14801 else if (strcmp (arg, "256") == 0)
14802 evexlig = evexl256;
14803 else if (strcmp (arg, "512") == 0)
14804 evexlig = evexl512;
14805 else
14806 as_fatal (_("invalid -mevexlig= option: `%s'"), arg);
14807 break;
14808
14809 case OPTION_MEVEXRCIG:
14810 if (strcmp (arg, "rne") == 0)
14811 evexrcig = rne;
14812 else if (strcmp (arg, "rd") == 0)
14813 evexrcig = rd;
14814 else if (strcmp (arg, "ru") == 0)
14815 evexrcig = ru;
14816 else if (strcmp (arg, "rz") == 0)
14817 evexrcig = rz;
14818 else
14819 as_fatal (_("invalid -mevexrcig= option: `%s'"), arg);
14820 break;
14821
14822 case OPTION_MEVEXWIG:
14823 if (strcmp (arg, "0") == 0)
14824 evexwig = evexw0;
14825 else if (strcmp (arg, "1") == 0)
14826 evexwig = evexw1;
14827 else
14828 as_fatal (_("invalid -mevexwig= option: `%s'"), arg);
14829 break;
14830
14831 # if defined (TE_PE) || defined (TE_PEP)
14832 case OPTION_MBIG_OBJ:
14833 use_big_obj = 1;
14834 break;
14835 #endif
14836
14837 case OPTION_MOMIT_LOCK_PREFIX:
14838 if (strcasecmp (arg, "yes") == 0)
14839 omit_lock_prefix = 1;
14840 else if (strcasecmp (arg, "no") == 0)
14841 omit_lock_prefix = 0;
14842 else
14843 as_fatal (_("invalid -momit-lock-prefix= option: `%s'"), arg);
14844 break;
14845
14846 case OPTION_MFENCE_AS_LOCK_ADD:
14847 if (strcasecmp (arg, "yes") == 0)
14848 avoid_fence = 1;
14849 else if (strcasecmp (arg, "no") == 0)
14850 avoid_fence = 0;
14851 else
14852 as_fatal (_("invalid -mfence-as-lock-add= option: `%s'"), arg);
14853 break;
14854
14855 case OPTION_MLFENCE_AFTER_LOAD:
14856 if (strcasecmp (arg, "yes") == 0)
14857 lfence_after_load = 1;
14858 else if (strcasecmp (arg, "no") == 0)
14859 lfence_after_load = 0;
14860 else
14861 as_fatal (_("invalid -mlfence-after-load= option: `%s'"), arg);
14862 break;
14863
14864 case OPTION_MLFENCE_BEFORE_INDIRECT_BRANCH:
14865 if (strcasecmp (arg, "all") == 0)
14866 {
14867 lfence_before_indirect_branch = lfence_branch_all;
14868 if (lfence_before_ret == lfence_before_ret_none)
14869 lfence_before_ret = lfence_before_ret_shl;
14870 }
14871 else if (strcasecmp (arg, "memory") == 0)
14872 lfence_before_indirect_branch = lfence_branch_memory;
14873 else if (strcasecmp (arg, "register") == 0)
14874 lfence_before_indirect_branch = lfence_branch_register;
14875 else if (strcasecmp (arg, "none") == 0)
14876 lfence_before_indirect_branch = lfence_branch_none;
14877 else
14878 as_fatal (_("invalid -mlfence-before-indirect-branch= option: `%s'"),
14879 arg);
14880 break;
14881
14882 case OPTION_MLFENCE_BEFORE_RET:
14883 if (strcasecmp (arg, "or") == 0)
14884 lfence_before_ret = lfence_before_ret_or;
14885 else if (strcasecmp (arg, "not") == 0)
14886 lfence_before_ret = lfence_before_ret_not;
14887 else if (strcasecmp (arg, "shl") == 0 || strcasecmp (arg, "yes") == 0)
14888 lfence_before_ret = lfence_before_ret_shl;
14889 else if (strcasecmp (arg, "none") == 0)
14890 lfence_before_ret = lfence_before_ret_none;
14891 else
14892 as_fatal (_("invalid -mlfence-before-ret= option: `%s'"),
14893 arg);
14894 break;
14895
14896 case OPTION_MRELAX_RELOCATIONS:
14897 if (strcasecmp (arg, "yes") == 0)
14898 generate_relax_relocations = 1;
14899 else if (strcasecmp (arg, "no") == 0)
14900 generate_relax_relocations = 0;
14901 else
14902 as_fatal (_("invalid -mrelax-relocations= option: `%s'"), arg);
14903 break;
14904
14905 case OPTION_MALIGN_BRANCH_BOUNDARY:
14906 {
14907 char *end;
14908 long int align = strtoul (arg, &end, 0);
14909 if (*end == '\0')
14910 {
14911 if (align == 0)
14912 {
14913 align_branch_power = 0;
14914 break;
14915 }
14916 else if (align >= 16)
14917 {
14918 int align_power;
14919 for (align_power = 0;
14920 (align & 1) == 0;
14921 align >>= 1, align_power++)
14922 continue;
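	      /* E.g. align == 32 shifts right five times, leaving
		 align == 1 and align_power == 5, i.e. a 32-byte
		 boundary.  */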
14923 /* Limit alignment power to 31. */
14924 if (align == 1 && align_power < 32)
14925 {
14926 align_branch_power = align_power;
14927 break;
14928 }
14929 }
14930 }
14931 as_fatal (_("invalid -malign-branch-boundary= value: %s"), arg);
14932 }
14933 break;
14934
14935 case OPTION_MALIGN_BRANCH_PREFIX_SIZE:
14936 {
14937 char *end;
14938 int align = strtoul (arg, &end, 0);
14939 /* Some processors only support 5 prefixes. */
14940 if (*end == '\0' && align >= 0 && align < 6)
14941 {
14942 align_branch_prefix_size = align;
14943 break;
14944 }
14945 as_fatal (_("invalid -malign-branch-prefix-size= value: %s"),
14946 arg);
14947 }
14948 break;
14949
14950 case OPTION_MALIGN_BRANCH:
14951 align_branch = 0;
14952 saved = xstrdup (arg);
14953 type = saved;
14954 do
14955 {
14956 next = strchr (type, '+');
14957 if (next)
14958 *next++ = '\0';
14959 if (strcasecmp (type, "jcc") == 0)
14960 align_branch |= align_branch_jcc_bit;
14961 else if (strcasecmp (type, "fused") == 0)
14962 align_branch |= align_branch_fused_bit;
14963 else if (strcasecmp (type, "jmp") == 0)
14964 align_branch |= align_branch_jmp_bit;
14965 else if (strcasecmp (type, "call") == 0)
14966 align_branch |= align_branch_call_bit;
14967 else if (strcasecmp (type, "ret") == 0)
14968 align_branch |= align_branch_ret_bit;
14969 else if (strcasecmp (type, "indirect") == 0)
14970 align_branch |= align_branch_indirect_bit;
14971 else
14972 as_fatal (_("invalid -malign-branch= option: `%s'"), arg);
14973 type = next;
14974 }
14975 while (next != NULL);
14976 free (saved);
14977 break;
14978
14979 case OPTION_MBRANCHES_WITH_32B_BOUNDARIES:
14980 align_branch_power = 5;
14981 align_branch_prefix_size = 5;
14982 align_branch = (align_branch_jcc_bit
14983 | align_branch_fused_bit
14984 | align_branch_jmp_bit);
14985 break;
14986
14987 case OPTION_MAMD64:
14988 isa64 = amd64;
14989 break;
14990
14991 case OPTION_MINTEL64:
14992 isa64 = intel64;
14993 break;
14994
14995 case 'O':
14996 if (arg == NULL)
14997 {
14998 optimize = 1;
14999 /* Turn off -Os. */
15000 optimize_for_space = 0;
15001 }
15002 else if (*arg == 's')
15003 {
15004 optimize_for_space = 1;
15005 /* Turn on all encoding optimizations. */
15006 optimize = INT_MAX;
15007 }
15008 else
15009 {
15010 optimize = atoi (arg);
15011 /* Turn off -Os. */
15012 optimize_for_space = 0;
15013 }
15014 break;
15015
15016 default:
15017 return 0;
15018 }
15019 return 1;
15020 }
15021
15022 #define MESSAGE_TEMPLATE \
15023 " "
15024
15025 static char *
15026 output_message (FILE *stream, char *p, char *message, char *start,
15027 int *left_p, const char *name, int len)
15028 {
15029 int size = sizeof (MESSAGE_TEMPLATE);
15030 int left = *left_p;
15031
15032 /* Reserve 2 spaces for ", " or ",\0" */
15033 left -= len + 2;
15034
15035 /* Check if there is any room. */
15036 if (left >= 0)
15037 {
15038 if (p != start)
15039 {
15040 *p++ = ',';
15041 *p++ = ' ';
15042 }
15043 p = mempcpy (p, name, len);
15044 }
15045 else
15046 {
15047 /* Output the current message now and start a new one. */
15048 *p++ = ',';
15049 *p = '\0';
15050 fprintf (stream, "%s\n", message);
15051 p = start;
15052 left = size - (start - message) - len - 2;
15053
15054 gas_assert (left >= 0);
15055
15056 p = mempcpy (p, name, len);
15057 }
15058
15059 *left_p = left;
15060 return p;
15061 }
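/* Usage sketch: show_arch () below calls this once per name; names are
   appended as ", name" while they still fit within the MESSAGE_TEMPLATE
   width, and a filled line is flushed (ending in a comma) before the
   next name starts a fresh one.  */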
15062
15063 static void
15064 show_arch (FILE *stream, int ext, int check)
15065 {
15066 static char message[] = MESSAGE_TEMPLATE;
15067 char *start = message + 27;
15068 char *p;
15069 int size = sizeof (MESSAGE_TEMPLATE);
15070 int left;
15071 const char *name;
15072 int len;
15073 unsigned int j;
15074
15075 p = start;
15076 left = size - (start - message);
15077
15078 if (!ext && check)
15079 {
15080 p = output_message (stream, p, message, start, &left,
15081 STRING_COMMA_LEN ("default"));
15082 p = output_message (stream, p, message, start, &left,
15083 STRING_COMMA_LEN ("push"));
15084 p = output_message (stream, p, message, start, &left,
15085 STRING_COMMA_LEN ("pop"));
15086 }
15087
15088 for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
15089 {
15090 /* Should it be skipped? */
15091 if (cpu_arch [j].skip)
15092 continue;
15093
15094 name = cpu_arch [j].name;
15095 len = cpu_arch [j].len;
15096 if (cpu_arch[j].type == PROCESSOR_NONE)
15097 {
15098 /* It is an extension. Skip if we aren't asked to show it. */
15099 if (!ext || cpu_flags_all_zero (&cpu_arch[j].enable))
15100 continue;
15101 }
15102 else if (ext)
15103 {
15104 /* It is a processor. Skip if we only show extensions. */
15105 continue;
15106 }
15107 else if (check && ! cpu_arch[j].enable.bitfield.cpui386)
15108 {
15109 /* It is an impossible processor - skip. */
15110 continue;
15111 }
15112
15113 p = output_message (stream, p, message, start, &left, name, len);
15114 }
15115
15116 /* Display disabled extensions. */
15117 if (ext)
15118 for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
15119 {
15120 char *str;
15121
15122 if (cpu_arch[j].type != PROCESSOR_NONE
15123 || !cpu_flags_all_zero (&cpu_arch[j].enable))
15124 continue;
15125 str = xasprintf ("no%s", cpu_arch[j].name);
15126 p = output_message (stream, p, message, start, &left, str,
15127 strlen (str));
15128 free (str);
15129 }
15130
15131 *p = '\0';
15132 fprintf (stream, "%s\n", message);
15133 }
15134
15135 void
15136 md_show_usage (FILE *stream)
15137 {
15138 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
15139 fprintf (stream, _("\
15140 -Qy, -Qn ignored\n\
15141 -V print assembler version number\n\
15142 -k ignored\n"));
15143 #endif
15144 fprintf (stream, _("\
15145 -n do not optimize code alignment\n\
15146 -O{012s} attempt some code optimizations\n\
15147 -q quieten some warnings\n"));
15148 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
15149 fprintf (stream, _("\
15150 -s ignored\n"));
15151 #endif
15152 #ifdef BFD64
15153 # if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
15154 fprintf (stream, _("\
15155 --32/--64/--x32 generate 32bit/64bit/x32 object\n"));
15156 # elif defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O)
15157 fprintf (stream, _("\
15158 --32/--64 generate 32bit/64bit object\n"));
15159 # endif
15160 #endif
15161 #ifdef SVR4_COMMENT_CHARS
15162 fprintf (stream, _("\
15163 --divide do not treat `/' as a comment character\n"));
15164 #else
15165 fprintf (stream, _("\
15166 --divide ignored\n"));
15167 #endif
15168 fprintf (stream, _("\
15169 -march=CPU[,+EXTENSION...]\n\
15170 generate code for CPU and EXTENSION, CPU is one of:\n"));
15171 show_arch (stream, 0, 1);
15172 fprintf (stream, _("\
15173 EXTENSION is combination of (possibly \"no\"-prefixed):\n"));
15174 show_arch (stream, 1, 0);
15175 fprintf (stream, _("\
15176 -mtune=CPU optimize for CPU, CPU is one of:\n"));
15177 show_arch (stream, 0, 0);
15178 fprintf (stream, _("\
15179 -msse2avx encode SSE instructions with VEX prefix\n"));
15180 fprintf (stream, _("\
15181 -muse-unaligned-vector-move\n\
15182 encode aligned vector move as unaligned vector move\n"));
15183 fprintf (stream, _("\
15184 -msse-check=[none|error|warning] (default: warning)\n\
15185 check SSE instructions\n"));
15186 fprintf (stream, _("\
15187 -moperand-check=[none|error|warning] (default: warning)\n\
15188 check operand combinations for validity\n"));
15189 fprintf (stream, _("\
15190 -mavxscalar=[128|256] (default: 128)\n\
15191 encode scalar AVX instructions with specific vector\n\
15192 length\n"));
15193 fprintf (stream, _("\
15194 -mvexwig=[0|1] (default: 0)\n\
15195 encode VEX instructions with specific VEX.W value\n\
15196 for VEX.W bit ignored instructions\n"));
15197 fprintf (stream, _("\
15198 -mevexlig=[128|256|512] (default: 128)\n\
15199 encode scalar EVEX instructions with specific vector\n\
15200 length\n"));
15201 fprintf (stream, _("\
15202 -mevexwig=[0|1] (default: 0)\n\
15203 encode EVEX instructions with specific EVEX.W value\n\
15204 for EVEX.W bit ignored instructions\n"));
15205 fprintf (stream, _("\
15206 -mevexrcig=[rne|rd|ru|rz] (default: rne)\n\
15207 encode EVEX instructions with specific EVEX.RC value\n\
15208 for SAE-only ignored instructions\n"));
15209 fprintf (stream, _("\
15210 -mmnemonic=[att|intel] "));
15211 if (SYSV386_COMPAT)
15212 fprintf (stream, _("(default: att)\n"));
15213 else
15214 fprintf (stream, _("(default: intel)\n"));
15215 fprintf (stream, _("\
15216 use AT&T/Intel mnemonic\n"));
15217 fprintf (stream, _("\
15218 -msyntax=[att|intel] (default: att)\n\
15219 use AT&T/Intel syntax\n"));
15220 fprintf (stream, _("\
15221 -mindex-reg support pseudo index registers\n"));
15222 fprintf (stream, _("\
15223 -mnaked-reg don't require `%%' prefix for registers\n"));
15224 fprintf (stream, _("\
15225 -madd-bnd-prefix add BND prefix for all valid branches\n"));
15226 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
15227 fprintf (stream, _("\
15228 -mshared disable branch optimization for shared code\n"));
15229 fprintf (stream, _("\
15230 -mx86-used-note=[no|yes] "));
15231 if (DEFAULT_X86_USED_NOTE)
15232 fprintf (stream, _("(default: yes)\n"));
15233 else
15234 fprintf (stream, _("(default: no)\n"));
15235 fprintf (stream, _("\
15236 generate x86 used ISA and feature properties\n"));
15237 #endif
15238 #if defined (TE_PE) || defined (TE_PEP)
15239 fprintf (stream, _("\
15240 -mbig-obj generate big object files\n"));
15241 #endif
15242 fprintf (stream, _("\
15243 -momit-lock-prefix=[no|yes] (default: no)\n\
15244 strip all lock prefixes\n"));
15245 fprintf (stream, _("\
15246 -mfence-as-lock-add=[no|yes] (default: no)\n\
15247 encode lfence, mfence and sfence as\n\
15248 lock addl $0x0, (%%{re}sp)\n"));
15249 fprintf (stream, _("\
15250 -mrelax-relocations=[no|yes] "));
15251 if (DEFAULT_GENERATE_X86_RELAX_RELOCATIONS)
15252 fprintf (stream, _("(default: yes)\n"));
15253 else
15254 fprintf (stream, _("(default: no)\n"));
15255 fprintf (stream, _("\
15256 generate relax relocations\n"));
15257 fprintf (stream, _("\
15258 -malign-branch-boundary=NUM (default: 0)\n\
15259 align branches within NUM byte boundary\n"));
15260 fprintf (stream, _("\
15261 -malign-branch=TYPE[+TYPE...] (default: jcc+fused+jmp)\n\
15262 TYPE is combination of jcc, fused, jmp, call, ret,\n\
15263 indirect\n\
15264 specify types of branches to align\n"));
15265 fprintf (stream, _("\
15266 -malign-branch-prefix-size=NUM (default: 5)\n\
15267 align branches with NUM prefixes per instruction\n"));
15268 fprintf (stream, _("\
15269 -mbranches-within-32B-boundaries\n\
15270 align branches within 32 byte boundary\n"));
15271 fprintf (stream, _("\
15272 -mlfence-after-load=[no|yes] (default: no)\n\
15273 generate lfence after load\n"));
15274 fprintf (stream, _("\
15275 -mlfence-before-indirect-branch=[none|all|register|memory] (default: none)\n\
15276 generate lfence before indirect near branch\n"));
15277 fprintf (stream, _("\
15278 -mlfence-before-ret=[none|or|not|shl|yes] (default: none)\n\
15279 generate lfence before ret\n"));
15280 fprintf (stream, _("\
15281 -mamd64 accept only AMD64 ISA [default]\n"));
15282 fprintf (stream, _("\
15283 -mintel64 accept only Intel64 ISA\n"));
15284 }
15285
15286 #if ((defined (OBJ_MAYBE_COFF) && defined (OBJ_MAYBE_AOUT)) \
15287 || defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
15288 || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
15289
15290 /* Pick the target format to use. */
15291
15292 const char *
15293 i386_target_format (void)
15294 {
15295 if (startswith (default_arch, "x86_64"))
15296 {
15297 update_code_flag (CODE_64BIT, 1);
15298 if (default_arch[6] == '\0')
15299 x86_elf_abi = X86_64_ABI;
15300 else
15301 x86_elf_abi = X86_64_X32_ABI;
15302 }
15303 else if (!strcmp (default_arch, "i386"))
15304 update_code_flag (CODE_32BIT, 1);
15305 else if (!strcmp (default_arch, "iamcu"))
15306 {
15307 update_code_flag (CODE_32BIT, 1);
15308 if (cpu_arch_isa == PROCESSOR_UNKNOWN)
15309 {
15310 static const i386_cpu_flags iamcu_flags = CPU_IAMCU_FLAGS;
15311 cpu_arch_name = "iamcu";
15312 free (cpu_sub_arch_name);
15313 cpu_sub_arch_name = NULL;
15314 cpu_arch_flags = iamcu_flags;
15315 cpu_arch_isa = PROCESSOR_IAMCU;
15316 cpu_arch_isa_flags = iamcu_flags;
15317 if (!cpu_arch_tune_set)
15318 cpu_arch_tune = PROCESSOR_IAMCU;
15319 }
15320 else if (cpu_arch_isa != PROCESSOR_IAMCU)
15321 as_fatal (_("Intel MCU doesn't support `%s' architecture"),
15322 cpu_arch_name);
15323 }
15324 else
15325 as_fatal (_("unknown architecture"));
15326
15327 if (cpu_flags_all_zero (&cpu_arch_isa_flags))
15328 cpu_arch_isa_flags = cpu_arch[flag_code == CODE_64BIT].enable;
15329
15330 switch (OUTPUT_FLAVOR)
15331 {
15332 #if defined (OBJ_MAYBE_AOUT) || defined (OBJ_AOUT)
15333 case bfd_target_aout_flavour:
15334 return AOUT_TARGET_FORMAT;
15335 #endif
15336 #if defined (OBJ_MAYBE_COFF) || defined (OBJ_COFF)
15337 # if defined (TE_PE) || defined (TE_PEP)
15338 case bfd_target_coff_flavour:
15339 if (flag_code == CODE_64BIT)
15340 {
15341 object_64bit = 1;
15342 return use_big_obj ? "pe-bigobj-x86-64" : "pe-x86-64";
15343 }
15344 return use_big_obj ? "pe-bigobj-i386" : "pe-i386";
15345 # elif defined (TE_GO32)
15346 case bfd_target_coff_flavour:
15347 return "coff-go32";
15348 # else
15349 case bfd_target_coff_flavour:
15350 return "coff-i386";
15351 # endif
15352 #endif
15353 #if defined (OBJ_MAYBE_ELF) || defined (OBJ_ELF)
15354 case bfd_target_elf_flavour:
15355 {
15356 const char *format;
15357
15358 switch (x86_elf_abi)
15359 {
15360 default:
15361 format = ELF_TARGET_FORMAT;
15362 #ifndef TE_SOLARIS
15363 tls_get_addr = "___tls_get_addr";
15364 #endif
15365 break;
15366 case X86_64_ABI:
15367 use_rela_relocations = 1;
15368 object_64bit = 1;
15369 #ifndef TE_SOLARIS
15370 tls_get_addr = "__tls_get_addr";
15371 #endif
15372 format = ELF_TARGET_FORMAT64;
15373 break;
15374 case X86_64_X32_ABI:
15375 use_rela_relocations = 1;
15376 object_64bit = 1;
15377 #ifndef TE_SOLARIS
15378 tls_get_addr = "__tls_get_addr";
15379 #endif
15380 disallow_64bit_reloc = 1;
15381 format = ELF_TARGET_FORMAT32;
15382 break;
15383 }
15384 if (cpu_arch_isa == PROCESSOR_IAMCU)
15385 {
15386 if (x86_elf_abi != I386_ABI)
15387 as_fatal (_("Intel MCU is 32bit only"));
15388 return ELF_TARGET_IAMCU_FORMAT;
15389 }
15390 else
15391 return format;
15392 }
15393 #endif
15394 #if defined (OBJ_MACH_O)
15395 case bfd_target_mach_o_flavour:
15396 if (flag_code == CODE_64BIT)
15397 {
15398 use_rela_relocations = 1;
15399 object_64bit = 1;
15400 return "mach-o-x86-64";
15401 }
15402 else
15403 return "mach-o-i386";
15404 #endif
15405 default:
15406 abort ();
15407 return NULL;
15408 }
15409 }
15410
15411 #endif /* OBJ_MAYBE_ more than one */
15412 \f
15413 symbolS *
15414 md_undefined_symbol (char *name)
15415 {
15416 if (name[0] == GLOBAL_OFFSET_TABLE_NAME[0]
15417 && name[1] == GLOBAL_OFFSET_TABLE_NAME[1]
15418 && name[2] == GLOBAL_OFFSET_TABLE_NAME[2]
15419 && strcmp (name, GLOBAL_OFFSET_TABLE_NAME) == 0)
15420 {
15421 if (!GOT_symbol)
15422 {
15423 if (symbol_find (name))
15424 as_bad (_("GOT already in symbol table"));
15425 GOT_symbol = symbol_new (name, undefined_section,
15426 &zero_address_frag, 0);
15427 }
15428 return GOT_symbol;
15429 }
15430 return 0;
15431 }
15432
15433 /* Round up a section size to the appropriate boundary. */
15434
15435 valueT
15436 md_section_align (segT segment ATTRIBUTE_UNUSED, valueT size)
15437 {
15438 #if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
15439 if (OUTPUT_FLAVOR == bfd_target_aout_flavour)
15440 {
15441 /* For a.out, force the section size to be aligned. If we don't do
15442 this, BFD will align it for us, but it will not write out the
15443 final bytes of the section. This may be a bug in BFD, but it is
15444 easier to fix it here since that is how the other a.out targets
15445 work. */
15446 int align;
15447
15448 align = bfd_section_alignment (segment);
15449 size = ((size + (1 << align) - 1) & (-((valueT) 1 << align)));
15450 }
15451 #endif
15452
15453 return size;
15454 }
15455
15456 /* On the i386, PC-relative offsets are relative to the start of the
15457 next instruction. That is, the address of the offset, plus its
15458 size, since the offset is always the last part of the insn. */
15459
15460 long
15461 md_pcrel_from (fixS *fixP)
15462 {
15463 return fixP->fx_size + fixP->fx_where + fixP->fx_frag->fr_address;
15464 }
15465
15466 #ifndef I386COFF
15467
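/* Handler for the .bss pseudo-op: switch to (a subsection of) the bss
   section, taking an optional absolute expression as the subsection
   number.  */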
static void
s_bss (int ignore ATTRIBUTE_UNUSED)
{
  int temp;

#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
  if (IS_ELF)
    obj_elf_section_change_hook ();
#endif
  temp = get_absolute_expression ();
  subseg_set (bss_section, (subsegT) temp);
  demand_empty_rest_of_line ();
}

#endif

/* Remember a constant directive that appears in a code section, since
   such data defeats the -mlfence-before-ret and
   -mlfence-before-indirect-branch transformations.  */

void
i386_cons_align (int ignore ATTRIBUTE_UNUSED)
{
  if (last_insn.kind != last_insn_directive
      && (bfd_section_flags (now_seg) & SEC_CODE))
    {
      last_insn.seg = now_seg;
      last_insn.kind = last_insn_directive;
      last_insn.name = "constant directive";
      last_insn.file = as_where (&last_insn.line);
      if (lfence_before_ret != lfence_before_ret_none)
	{
	  if (lfence_before_indirect_branch != lfence_branch_none)
	    as_warn (_("constant directive skips -mlfence-before-ret "
		       "and -mlfence-before-indirect-branch"));
	  else
	    as_warn (_("constant directive skips -mlfence-before-ret"));
	}
      else if (lfence_before_indirect_branch != lfence_branch_none)
	as_warn (_("constant directive skips -mlfence-before-indirect-branch"));
    }
}

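/* Validate and canonicalize a fixup before a relocation is generated
   from it: reject relocations against registers, decide whether
   BFD_RELOC_SIZE{32,64} must survive into the object file, and rewrite
   GOT-/PLT-related relocation types where needed.  A zero return tells
   the caller to skip the fixup.  */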
int
i386_validate_fix (fixS *fixp)
{
  if (fixp->fx_addsy && S_GET_SEGMENT (fixp->fx_addsy) == reg_section)
    {
      reloc_howto_type *howto;

      howto = bfd_reloc_type_lookup (stdoutput, fixp->fx_r_type);
      as_bad_where (fixp->fx_file, fixp->fx_line,
		    _("invalid %s relocation against register"),
		    howto ? howto->name : "<unknown>");
      return 0;
    }

#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
  if (fixp->fx_r_type == BFD_RELOC_SIZE32
      || fixp->fx_r_type == BFD_RELOC_SIZE64)
    return IS_ELF && fixp->fx_addsy
	   && (!S_IS_DEFINED (fixp->fx_addsy)
	       || S_IS_EXTERNAL (fixp->fx_addsy));
#endif

  if (fixp->fx_subsy)
    {
      if (fixp->fx_subsy == GOT_symbol)
	{
	  if (fixp->fx_r_type == BFD_RELOC_32_PCREL)
	    {
	      if (!object_64bit)
		abort ();
#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
	      if (fixp->fx_tcbit2)
		fixp->fx_r_type = (fixp->fx_tcbit
				   ? BFD_RELOC_X86_64_REX_GOTPCRELX
				   : BFD_RELOC_X86_64_GOTPCRELX);
	      else
#endif
		fixp->fx_r_type = BFD_RELOC_X86_64_GOTPCREL;
	    }
	  else
	    {
	      if (!object_64bit)
		fixp->fx_r_type = BFD_RELOC_386_GOTOFF;
	      else
		fixp->fx_r_type = BFD_RELOC_X86_64_GOTOFF64;
	    }
	  fixp->fx_subsy = 0;
	}
    }
#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
  else
    {
      /* NB: Commit 292676c1 resolved PLT32 relocs against local symbols
	 to their sections.  Since a PLT32 relocation must be against a
	 symbol, turn such a PLT32 relocation into a PC32 relocation.  */
      if (fixp->fx_addsy
	  && (fixp->fx_r_type == BFD_RELOC_386_PLT32
	      || fixp->fx_r_type == BFD_RELOC_X86_64_PLT32)
	  && symbol_section_p (fixp->fx_addsy))
	fixp->fx_r_type = BFD_RELOC_32_PCREL;
      if (!object_64bit)
	{
	  if (fixp->fx_r_type == BFD_RELOC_386_GOT32
	      && fixp->fx_tcbit2)
	    fixp->fx_r_type = BFD_RELOC_386_GOT32X;
	}
    }
#endif

  return 1;
}

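/* Translate an internal fixup into a BFD relocation (arelent).  Size
   relocations against defined non-external symbols are resolved here
   directly and yield no relocation, in which case NULL is returned.  */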
arelent *
tc_gen_reloc (asection *section ATTRIBUTE_UNUSED, fixS *fixp)
{
  arelent *rel;
  bfd_reloc_code_real_type code;

  switch (fixp->fx_r_type)
    {
#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
      symbolS *sym;

    case BFD_RELOC_SIZE32:
    case BFD_RELOC_SIZE64:
      if (fixp->fx_addsy
	  && !bfd_is_abs_section (S_GET_SEGMENT (fixp->fx_addsy))
	  && (!fixp->fx_subsy
	      || bfd_is_abs_section (S_GET_SEGMENT (fixp->fx_subsy))))
	sym = fixp->fx_addsy;
      else if (fixp->fx_subsy
	       && !bfd_is_abs_section (S_GET_SEGMENT (fixp->fx_subsy))
	       && (!fixp->fx_addsy
		   || bfd_is_abs_section (S_GET_SEGMENT (fixp->fx_addsy))))
	sym = fixp->fx_subsy;
      else
	sym = NULL;
      if (IS_ELF && sym && S_IS_DEFINED (sym) && !S_IS_EXTERNAL (sym))
	{
	  /* Resolve size relocation against local symbol to size of
	     the symbol plus addend.  */
	  valueT value = S_GET_SIZE (sym);

	  if (symbol_get_bfdsym (sym)->flags & BSF_SECTION_SYM)
	    value = bfd_section_size (S_GET_SEGMENT (sym));
	  if (sym == fixp->fx_subsy)
	    {
	      value = -value;
	      if (fixp->fx_addsy)
		value += S_GET_VALUE (fixp->fx_addsy);
	    }
	  else if (fixp->fx_subsy)
	    value -= S_GET_VALUE (fixp->fx_subsy);
	  value += fixp->fx_offset;
	  if (fixp->fx_r_type == BFD_RELOC_SIZE32
	      && object_64bit
	      && !fits_in_unsigned_long (value))
	    as_bad_where (fixp->fx_file, fixp->fx_line,
			  _("symbol size computation overflow"));
	  fixp->fx_addsy = NULL;
	  fixp->fx_subsy = NULL;
	  md_apply_fix (fixp, (valueT *) &value, NULL);
	  return NULL;
	}
      if (!fixp->fx_addsy || fixp->fx_subsy)
	{
	  as_bad_where (fixp->fx_file, fixp->fx_line,
			_("unsupported expression involving @size"));
	  return NULL;
	}
#endif
      /* Fall through.  */

    case BFD_RELOC_X86_64_PLT32:
    case BFD_RELOC_X86_64_GOT32:
    case BFD_RELOC_X86_64_GOTPCREL:
    case BFD_RELOC_X86_64_GOTPCRELX:
    case BFD_RELOC_X86_64_REX_GOTPCRELX:
    case BFD_RELOC_386_PLT32:
    case BFD_RELOC_386_GOT32:
    case BFD_RELOC_386_GOT32X:
    case BFD_RELOC_386_GOTOFF:
    case BFD_RELOC_386_GOTPC:
    case BFD_RELOC_386_TLS_GD:
    case BFD_RELOC_386_TLS_LDM:
    case BFD_RELOC_386_TLS_LDO_32:
    case BFD_RELOC_386_TLS_IE_32:
    case BFD_RELOC_386_TLS_IE:
    case BFD_RELOC_386_TLS_GOTIE:
    case BFD_RELOC_386_TLS_LE_32:
    case BFD_RELOC_386_TLS_LE:
    case BFD_RELOC_386_TLS_GOTDESC:
    case BFD_RELOC_386_TLS_DESC_CALL:
    case BFD_RELOC_X86_64_TLSGD:
    case BFD_RELOC_X86_64_TLSLD:
    case BFD_RELOC_X86_64_DTPOFF32:
    case BFD_RELOC_X86_64_DTPOFF64:
    case BFD_RELOC_X86_64_GOTTPOFF:
    case BFD_RELOC_X86_64_TPOFF32:
    case BFD_RELOC_X86_64_TPOFF64:
    case BFD_RELOC_X86_64_GOTOFF64:
    case BFD_RELOC_X86_64_GOTPC32:
    case BFD_RELOC_X86_64_GOT64:
    case BFD_RELOC_X86_64_GOTPCREL64:
    case BFD_RELOC_X86_64_GOTPC64:
    case BFD_RELOC_X86_64_GOTPLT64:
    case BFD_RELOC_X86_64_PLTOFF64:
    case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
    case BFD_RELOC_X86_64_TLSDESC_CALL:
    case BFD_RELOC_RVA:
    case BFD_RELOC_VTABLE_ENTRY:
    case BFD_RELOC_VTABLE_INHERIT:
#ifdef TE_PE
    case BFD_RELOC_32_SECREL:
    case BFD_RELOC_16_SECIDX:
#endif
      code = fixp->fx_r_type;
      break;
    case BFD_RELOC_X86_64_32S:
      if (!fixp->fx_pcrel)
	{
	  /* Don't turn BFD_RELOC_X86_64_32S into BFD_RELOC_32.  */
	  code = fixp->fx_r_type;
	  break;
	}
      /* Fall through.  */
    default:
      if (fixp->fx_pcrel)
	{
	  switch (fixp->fx_size)
	    {
	    default:
	      as_bad_where (fixp->fx_file, fixp->fx_line,
			    _("can not do %d byte pc-relative relocation"),
			    fixp->fx_size);
	      code = BFD_RELOC_32_PCREL;
	      break;
	    case 1: code = BFD_RELOC_8_PCREL; break;
	    case 2: code = BFD_RELOC_16_PCREL; break;
	    case 4: code = BFD_RELOC_32_PCREL; break;
#ifdef BFD64
	    case 8: code = BFD_RELOC_64_PCREL; break;
#endif
	    }
	}
      else
	{
	  switch (fixp->fx_size)
	    {
	    default:
	      as_bad_where (fixp->fx_file, fixp->fx_line,
			    _("can not do %d byte relocation"),
			    fixp->fx_size);
	      code = BFD_RELOC_32;
	      break;
	    case 1: code = BFD_RELOC_8; break;
	    case 2: code = BFD_RELOC_16; break;
	    case 4: code = BFD_RELOC_32; break;
#ifdef BFD64
	    case 8: code = BFD_RELOC_64; break;
#endif
	    }
	}
      break;
    }

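  /* A 32- or 64-bit reference to the GOT symbol itself denotes the
     distance to the GOT, so substitute the matching GOT-PC relocation
     type.  */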
  if ((code == BFD_RELOC_32
       || code == BFD_RELOC_32_PCREL
       || code == BFD_RELOC_X86_64_32S)
      && GOT_symbol
      && fixp->fx_addsy == GOT_symbol)
    {
      if (!object_64bit)
	code = BFD_RELOC_386_GOTPC;
      else
	code = BFD_RELOC_X86_64_GOTPC32;
    }
  if ((code == BFD_RELOC_64 || code == BFD_RELOC_64_PCREL)
      && GOT_symbol
      && fixp->fx_addsy == GOT_symbol)
    {
      code = BFD_RELOC_X86_64_GOTPC64;
    }

  rel = XNEW (arelent);
  rel->sym_ptr_ptr = XNEW (asymbol *);
  *rel->sym_ptr_ptr = symbol_get_bfdsym (fixp->fx_addsy);

  rel->address = fixp->fx_frag->fr_address + fixp->fx_where;

  if (!use_rela_relocations)
    {
      /* HACK: Since i386 ELF uses Rel instead of Rela, encode the
	 vtable entry to be used in the relocation's section offset.  */
      if (fixp->fx_r_type == BFD_RELOC_VTABLE_ENTRY)
	rel->address = fixp->fx_offset;
#if defined (OBJ_COFF) && defined (TE_PE)
      else if (fixp->fx_addsy && S_IS_WEAK (fixp->fx_addsy))
	rel->addend = fixp->fx_addnumber - (S_GET_VALUE (fixp->fx_addsy) * 2);
      else
#endif
	rel->addend = 0;
    }
  /* Use RELA relocations in 64-bit mode.  */
  else
    {
      if (disallow_64bit_reloc)
	switch (code)
	  {
	  case BFD_RELOC_X86_64_DTPOFF64:
	  case BFD_RELOC_X86_64_TPOFF64:
	  case BFD_RELOC_64_PCREL:
	  case BFD_RELOC_X86_64_GOTOFF64:
	  case BFD_RELOC_X86_64_GOT64:
	  case BFD_RELOC_X86_64_GOTPCREL64:
	  case BFD_RELOC_X86_64_GOTPC64:
	  case BFD_RELOC_X86_64_GOTPLT64:
	  case BFD_RELOC_X86_64_PLTOFF64:
	    as_bad_where (fixp->fx_file, fixp->fx_line,
			  _("cannot represent relocation type %s in x32 mode"),
			  bfd_get_reloc_code_name (code));
	    break;
	  default:
	    break;
	  }

      if (!fixp->fx_pcrel)
	rel->addend = fixp->fx_offset;
      else
	switch (code)
	  {
	  case BFD_RELOC_X86_64_PLT32:
	  case BFD_RELOC_X86_64_GOT32:
	  case BFD_RELOC_X86_64_GOTPCREL:
	  case BFD_RELOC_X86_64_GOTPCRELX:
	  case BFD_RELOC_X86_64_REX_GOTPCRELX:
	  case BFD_RELOC_X86_64_TLSGD:
	  case BFD_RELOC_X86_64_TLSLD:
	  case BFD_RELOC_X86_64_GOTTPOFF:
	  case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
	  case BFD_RELOC_X86_64_TLSDESC_CALL:
	    rel->addend = fixp->fx_offset - fixp->fx_size;
	    break;
	  default:
	    rel->addend = (section->vma
			   - fixp->fx_size
			   + fixp->fx_addnumber
			   + md_pcrel_from (fixp));
	    break;
	  }
    }

  rel->howto = bfd_reloc_type_lookup (stdoutput, code);
  if (rel->howto == NULL)
    {
      as_bad_where (fixp->fx_file, fixp->fx_line,
		    _("cannot represent relocation type %s"),
		    bfd_get_reloc_code_name (code));
      /* Set howto to a garbage value so that we can keep going.  */
      rel->howto = bfd_reloc_type_lookup (stdoutput, BFD_RELOC_32);
      gas_assert (rel->howto != NULL);
    }

  return rel;
}

#include "tc-i386-intel.c"

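/* Parse a register name from the input line and replace EXP with its
   DWARF2 register number, for the benefit of the .cfi_* directives;
   e.g. %rsp maps to DWARF register 7 in 64-bit mode.  On failure the
   expression is marked O_illegal.  */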
void
tc_x86_parse_to_dw2regnum (expressionS *exp)
{
  int saved_naked_reg;
  char saved_register_dot;

  saved_naked_reg = allow_naked_reg;
  allow_naked_reg = 1;
  saved_register_dot = register_chars['.'];
  register_chars['.'] = '.';
  allow_pseudo_reg = 1;
  expression_and_evaluate (exp);
  allow_pseudo_reg = 0;
  register_chars['.'] = saved_register_dot;
  allow_naked_reg = saved_naked_reg;

  if (exp->X_op == O_register && exp->X_add_number >= 0)
    {
      if ((addressT) exp->X_add_number < i386_regtab_size)
	{
	  exp->X_op = O_constant;
	  exp->X_add_number = i386_regtab[exp->X_add_number]
			      .dw2_regnum[flag_code >> 1];
	}
      else
	exp->X_op = O_illegal;
    }
}

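/* Emit the initial CFI instructions of a frame: the CFA is the stack
   pointer plus the address size (the slot consumed by the return
   address), and the return address itself is stored just below the
   CFA.  The stack pointer's DWARF register number is computed once
   per mode and cached.  */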
void
tc_x86_frame_initial_instructions (void)
{
  static unsigned int sp_regno[2];

  if (!sp_regno[flag_code >> 1])
    {
      char *saved_input = input_line_pointer;
      char sp[][4] = {"esp", "rsp"};
      expressionS exp;

      input_line_pointer = sp[flag_code >> 1];
      tc_x86_parse_to_dw2regnum (&exp);
      gas_assert (exp.X_op == O_constant);
      sp_regno[flag_code >> 1] = exp.X_add_number;
      input_line_pointer = saved_input;
    }

  cfi_add_CFA_def_cfa (sp_regno[flag_code >> 1], -x86_cie_data_alignment);
  cfi_add_CFA_offset (x86_dwarf2_return_column, x86_cie_data_alignment);
}

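/* Return the size of a DWARF2 address in bytes: 4 for the x32 ABI,
   otherwise whatever the target's bits-per-address implies (4 for
   i386, 8 for x86-64).  */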
int
x86_dwarf2_addr_size (void)
{
#if defined (OBJ_MAYBE_ELF) || defined (OBJ_ELF)
  if (x86_elf_abi == X86_64_X32_ABI)
    return 4;
#endif
  return bfd_arch_bits_per_address (stdoutput) / 8;
}

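/* Map the section type name "unwind" to SHT_X86_64_UNWIND in 64-bit
   mode; return -1 for anything else so the generic code takes over.  */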
int
i386_elf_section_type (const char *str, size_t len)
{
  if (flag_code == CODE_64BIT
      && len == sizeof ("unwind") - 1
      && startswith (str, "unwind"))
    return SHT_X86_64_UNWIND;

  return -1;
}

#ifdef TE_SOLARIS
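/* On Solaris, tag .eh_frame sections as SHT_X86_64_UNWIND when
   assembling 64-bit code.  */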
void
i386_solaris_fix_up_eh_frame (segT sec)
{
  if (flag_code == CODE_64BIT)
    elf_section_type (sec) = SHT_X86_64_UNWIND;
}
#endif

#ifdef TE_PE
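/* For PE targets, emit a DWARF2 offset of the given size as a
   section-relative (O_secrel) expression.  */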
void
tc_pe_dwarf2_emit_offset (symbolS *symbol, unsigned int size)
{
  expressionS exp;

  exp.X_op = O_secrel;
  exp.X_add_symbol = symbol;
  exp.X_add_number = 0;
  emit_expr (&exp, size);
}
#endif

#if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
/* For ELF on x86-64, add support for SHF_X86_64_LARGE.  */

bfd_vma
x86_64_section_letter (int letter, const char **ptr_msg)
{
  if (flag_code == CODE_64BIT)
    {
      if (letter == 'l')
	return SHF_X86_64_LARGE;

      *ptr_msg = _("bad .section directive: want a,l,w,x,M,S,G,T in string");
    }
  else
    *ptr_msg = _("bad .section directive: want a,w,x,M,S,G,T in string");
  return -1;
}

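/* Handler for the .largecomm directive: in 64-bit mode, run the
   generic common-symbol parsing with the large common section and a
   lazily created .lbss section substituted for the regular common and
   bss sections; in 32-bit mode, warn and degrade to a plain .comm.  */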
static void
handle_large_common (int small ATTRIBUTE_UNUSED)
{
  if (flag_code != CODE_64BIT)
    {
      s_comm_internal (0, elf_common_parse);
      as_warn (_(".largecomm supported only in 64bit mode, producing .comm"));
    }
  else
    {
      static segT lbss_section;
      asection *saved_com_section_ptr = elf_com_section_ptr;
      asection *saved_bss_section = bss_section;

      if (lbss_section == NULL)
	{
	  flagword applicable;
	  segT seg = now_seg;
	  subsegT subseg = now_subseg;

	  /* The .lbss section is for local .largecomm symbols.  */
	  lbss_section = subseg_new (".lbss", 0);
	  applicable = bfd_applicable_section_flags (stdoutput);
	  bfd_set_section_flags (lbss_section, applicable & SEC_ALLOC);
	  seg_info (lbss_section)->bss = 1;

	  subseg_set (seg, subseg);
	}

      elf_com_section_ptr = &_bfd_elf_large_com_section;
      bss_section = lbss_section;

      s_comm_internal (0, elf_common_parse);

      elf_com_section_ptr = saved_com_section_ptr;
      bss_section = saved_bss_section;
    }
}
#endif /* OBJ_ELF || OBJ_MAYBE_ELF */