gas/config/tc-i386.c

   1 /* tc-i386.c -- Assemble code for the Intel 80386
   2    Copyright (C) 1989-2021 Free Software Foundation, Inc.
   3
   4    This file is part of GAS, the GNU Assembler.
   5
   6    GAS is free software; you can redistribute it and/or modify
   7    it under the terms of the GNU General Public License as published by
   8    the Free Software Foundation; either version 3, or (at your option)
   9    any later version.
  10
  11    GAS is distributed in the hope that it will be useful,
  12    but WITHOUT ANY WARRANTY; without even the implied warranty of
  13    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
  14    GNU General Public License for more details.
  15
  16    You should have received a copy of the GNU General Public License
  17    along with GAS; see the file COPYING.  If not, write to the Free
  18    Software Foundation, 51 Franklin Street - Fifth Floor, Boston, MA
  19    02110-1301, USA.  */
  20
  21 /* Intel 80386 machine specific gas.
  22    Written by Eliot Dresselhaus (eliot@mgm.mit.edu).
  23    x86_64 support by Jan Hubicka (jh@suse.cz)
  24    VIA PadLock support by Michal Ludvig (mludvig@suse.cz)
  25    Bugs & suggestions are completely welcome.  This is free software.
  26    Please help us make it better.  */
  27
  28 #include "as.h"
  29 #include "safe-ctype.h"
  30 #include "subsegs.h"
  31 #include "dwarf2dbg.h"
  32 #include "dw2gencfi.h"
  33 #include "elf/x86-64.h"
  34 #include "opcodes/i386-init.h"
  35 #include <limits.h>
  36
  37 #ifndef INFER_ADDR_PREFIX
  38 #define INFER_ADDR_PREFIX 1
  39 #endif
  40
  41 #ifndef DEFAULT_ARCH
  42 #define DEFAULT_ARCH "i386"
  43 #endif
  44
  45 #ifndef INLINE
  46 #if __GNUC__ >= 2
  47 #define INLINE __inline__
  48 #else
  49 #define INLINE
  50 #endif
  51 #endif
  52
  53 /* Prefixes will be emitted in the order defined below.
  54    WAIT_PREFIX must be the first prefix since FWAIT is really is an
  55    instruction, and so must come before any prefixes.
  56    The preferred prefix order is SEG_PREFIX, ADDR_PREFIX, DATA_PREFIX,
  57    REP_PREFIX/HLE_PREFIX, LOCK_PREFIX.  */
  58 #define WAIT_PREFIX     0
  59 #define SEG_PREFIX      1
  60 #define ADDR_PREFIX     2
  61 #define DATA_PREFIX     3
  62 #define REP_PREFIX      4
  63 #define HLE_PREFIX      REP_PREFIX
  64 #define BND_PREFIX      REP_PREFIX
  65 #define LOCK_PREFIX     5
  66 #define REX_PREFIX      6       /* must come last.  */
  67 #define MAX_PREFIXES    7       /* max prefixes per opcode */
  68
  69 /* we define the syntax here (modulo base,index,scale syntax) */
  70 #define REGISTER_PREFIX '%'
  71 #define IMMEDIATE_PREFIX '$'
  72 #define ABSOLUTE_PREFIX '*'
  73
  74 /* these are the instruction mnemonic suffixes in AT&T syntax or
  75    memory operand size in Intel syntax.  */
  76 #define WORD_MNEM_SUFFIX  'w'
  77 #define BYTE_MNEM_SUFFIX  'b'
  78 #define SHORT_MNEM_SUFFIX 's'
  79 #define LONG_MNEM_SUFFIX  'l'
  80 #define QWORD_MNEM_SUFFIX  'q'
  81 /* Intel Syntax.  Use a non-ascii letter since since it never appears
  82    in instructions.  */
  83 #define LONG_DOUBLE_MNEM_SUFFIX '\1'
  84
  85 #define END_OF_INSN '\0'
  86
  87 /* This matches the C -> StaticRounding alias in the opcode table.  */
  88 #define commutative staticrounding
  89
  90 /*
  91   'templates' is for grouping together 'template' structures for opcodes
  92   of the same name.  This is only used for storing the insns in the grand
  93   ole hash table of insns.
  94   The templates themselves start at START and range up to (but not including)
  95   END.
  96   */
  97 typedef struct
  98 {
  99   const insn_template *start;
 100   const insn_template *end;
 101 }
 102 templates;
 103
 104 /* 386 operand encoding bytes:  see 386 book for details of this.  */
 105 typedef struct
 106 {
 107   unsigned int regmem;  /* codes register or memory operand */
 108   unsigned int reg;     /* codes register operand (or extended opcode) */
 109   unsigned int mode;    /* how to interpret regmem & reg */
 110 }
 111 modrm_byte;
 112
 113 /* x86-64 extension prefix.  */
 114 typedef int rex_byte;
 115
 116 /* 386 opcode byte to code indirect addressing.  */
 117 typedef struct
 118 {
 119   unsigned base;
 120   unsigned index;
 121   unsigned scale;
 122 }
 123 sib_byte;
 124
 125 /* x86 arch names, types and features */
 126 typedef struct
 127 {
 128   const char *name;             /* arch name */
 129   unsigned int len;             /* arch string length */
 130   enum processor_type type;     /* arch type */
 131   i386_cpu_flags flags;         /* cpu feature flags */
 132   unsigned int skip;            /* show_arch should skip this. */
 133 }
 134 arch_entry;
 135
 136 /* Used to turn off indicated flags.  */
 137 typedef struct
 138 {
 139   const char *name;             /* arch name */
 140   unsigned int len;             /* arch string length */
 141   i386_cpu_flags flags;         /* cpu feature flags */
 142 }
 143 noarch_entry;
 144
 145 static void update_code_flag (int, int);
 146 static void set_code_flag (int);
 147 static void set_16bit_gcc_code_flag (int);
 148 static void set_intel_syntax (int);
 149 static void set_intel_mnemonic (int);
 150 static void set_allow_index_reg (int);
 151 static void set_check (int);
 152 static void set_cpu_arch (int);
 153 #ifdef TE_PE
 154 static void pe_directive_secrel (int);
 155 #endif
 156 static void signed_cons (int);
 157 static char *output_invalid (int c);
 158 static int i386_finalize_immediate (segT, expressionS *, i386_operand_type,
 159                                     const char *);
 160 static int i386_finalize_displacement (segT, expressionS *, i386_operand_type,
 161                                        const char *);
 162 static int i386_att_operand (char *);
 163 static int i386_intel_operand (char *, int);
 164 static int i386_intel_simplify (expressionS *);
 165 static int i386_intel_parse_name (const char *, expressionS *);
 166 static const reg_entry *parse_register (char *, char **);
 167 static char *parse_insn (char *, char *);
 168 static char *parse_operands (char *, const char *);
 169 static void swap_operands (void);
 170 static void swap_2_operands (unsigned int, unsigned int);
 171 static enum flag_code i386_addressing_mode (void);
 172 static void optimize_imm (void);
 173 static void optimize_disp (void);
 174 static const insn_template *match_template (char);
 175 static int check_string (void);
 176 static int process_suffix (void);
 177 static int check_byte_reg (void);
 178 static int check_long_reg (void);
 179 static int check_qword_reg (void);
 180 static int check_word_reg (void);
 181 static int finalize_imm (void);
 182 static int process_operands (void);
 183 static const reg_entry *build_modrm_byte (void);
 184 static void output_insn (void);
 185 static void output_imm (fragS *, offsetT);
 186 static void output_disp (fragS *, offsetT);
 187 #ifndef I386COFF
 188 static void s_bss (int);
 189 #endif
 190 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
 191 static void handle_large_common (int small ATTRIBUTE_UNUSED);
 192
 193 /* GNU_PROPERTY_X86_ISA_1_USED.  */
 194 static unsigned int x86_isa_1_used;
 195 /* GNU_PROPERTY_X86_FEATURE_2_USED.  */
 196 static unsigned int x86_feature_2_used;
 197 /* Generate x86 used ISA and feature properties.  */
 198 static unsigned int x86_used_note = DEFAULT_X86_USED_NOTE;
 199 #endif
 200
 201 static const char *default_arch = DEFAULT_ARCH;
 202
 203 /* parse_register() returns this when a register alias cannot be used.  */
 204 static const reg_entry bad_reg = { "<bad>", OPERAND_TYPE_NONE, 0, 0,
 205                                    { Dw2Inval, Dw2Inval } };
 206
 207 static const reg_entry *reg_eax;
 208 static const reg_entry *reg_ds;
 209 static const reg_entry *reg_es;
 210 static const reg_entry *reg_ss;
 211 static const reg_entry *reg_st0;
 212 static const reg_entry *reg_k0;
 213
 214 /* VEX prefix.  */
 215 typedef struct
 216 {
 217   /* VEX prefix is either 2 byte or 3 byte.  EVEX is 4 byte.  */
 218   unsigned char bytes[4];
 219   unsigned int length;
 220   /* Destination or source register specifier.  */
 221   const reg_entry *register_specifier;
 222 } vex_prefix;
 223
 224 /* 'md_assemble ()' gathers together information and puts it into a
 225    i386_insn.  */
 226
 227 union i386_op
 228   {
 229     expressionS *disps;
 230     expressionS *imms;
 231     const reg_entry *regs;
 232   };
 233
 234 enum i386_error
 235   {
 236     operand_size_mismatch,
 237     operand_type_mismatch,
 238     register_type_mismatch,
 239     number_of_operands_mismatch,
 240     invalid_instruction_suffix,
 241     bad_imm4,
 242     unsupported_with_intel_mnemonic,
 243     unsupported_syntax,
 244     unsupported,
 245     invalid_sib_address,
 246     invalid_vsib_address,
 247     invalid_vector_register_set,
 248     invalid_tmm_register_set,
 249     unsupported_vector_index_register,
 250     unsupported_broadcast,
 251     broadcast_needed,
 252     unsupported_masking,
 253     mask_not_on_destination,
 254     no_default_mask,
 255     unsupported_rc_sae,
 256     rc_sae_operand_not_last_imm,
 257     invalid_register_operand,
 258   };
 259
 260 struct _i386_insn
 261   {
 262     /* TM holds the template for the insn were currently assembling.  */
 263     insn_template tm;
 264
 265     /* SUFFIX holds the instruction size suffix for byte, word, dword
 266        or qword, if given.  */
 267     char suffix;
 268
 269     /* OPCODE_LENGTH holds the number of base opcode bytes.  */
 270     unsigned char opcode_length;
 271
 272     /* OPERANDS gives the number of given operands.  */
 273     unsigned int operands;
 274
 275     /* REG_OPERANDS, DISP_OPERANDS, MEM_OPERANDS, IMM_OPERANDS give the number
 276        of given register, displacement, memory operands and immediate
 277        operands.  */
 278     unsigned int reg_operands, disp_operands, mem_operands, imm_operands;
 279
 280     /* TYPES [i] is the type (see above #defines) which tells us how to
 281        use OP[i] for the corresponding operand.  */
 282     i386_operand_type types[MAX_OPERANDS];
 283
 284     /* Displacement expression, immediate expression, or register for each
 285        operand.  */
 286     union i386_op op[MAX_OPERANDS];
 287
 288     /* Flags for operands.  */
 289     unsigned int flags[MAX_OPERANDS];
 290 #define Operand_PCrel 1
 291 #define Operand_Mem   2
 292
 293     /* Relocation type for operand */
 294     enum bfd_reloc_code_real reloc[MAX_OPERANDS];
 295
 296     /* BASE_REG, INDEX_REG, and LOG2_SCALE_FACTOR are used to encode
 297        the base index byte below.  */
 298     const reg_entry *base_reg;
 299     const reg_entry *index_reg;
 300     unsigned int log2_scale_factor;
 301
 302     /* SEG gives the seg_entries of this insn.  They are zero unless
 303        explicit segment overrides are given.  */
 304     const reg_entry *seg[2];
 305
 306     /* Copied first memory operand string, for re-checking.  */
 307     char *memop1_string;
 308
 309     /* PREFIX holds all the given prefix opcodes (usually null).
 310        PREFIXES is the number of prefix opcodes.  */
 311     unsigned int prefixes;
 312     unsigned char prefix[MAX_PREFIXES];
 313
 314     /* Register is in low 3 bits of opcode.  */
 315     bool short_form;
 316
 317     /* The operand to a branch insn indicates an absolute branch.  */
 318     bool jumpabsolute;
 319
 320     /* Extended states.  */
 321     enum
 322       {
 323         /* Use MMX state.  */
 324         xstate_mmx = 1 << 0,
 325         /* Use XMM state.  */
 326         xstate_xmm = 1 << 1,
 327         /* Use YMM state.  */
 328         xstate_ymm = 1 << 2 | xstate_xmm,
 329         /* Use ZMM state.  */
 330         xstate_zmm = 1 << 3 | xstate_ymm,
 331         /* Use TMM state.  */
 332         xstate_tmm = 1 << 4,
 333         /* Use MASK state.  */
 334         xstate_mask = 1 << 5
 335       } xstate;
 336
 337     /* Has GOTPC or TLS relocation.  */
 338     bool has_gotpc_tls_reloc;
 339
 340     /* RM and SIB are the modrm byte and the sib byte where the
 341        addressing modes of this insn are encoded.  */
 342     modrm_byte rm;
 343     rex_byte rex;
 344     rex_byte vrex;
 345     sib_byte sib;
 346     vex_prefix vex;
 347
 348     /* Masking attributes.
 349
 350        The struct describes masking, applied to OPERAND in the instruction.
 351        REG is a pointer to the corresponding mask register.  ZEROING tells
 352        whether merging or zeroing mask is used.  */
 353     struct Mask_Operation
 354     {
 355       const reg_entry *reg;
 356       unsigned int zeroing;
 357       /* The operand where this operation is associated.  */
 358       unsigned int operand;
 359     } mask;
 360
 361     /* Rounding control and SAE attributes.  */
 362     struct RC_Operation
 363     {
 364       enum rc_type
 365         {
 366           rc_none = -1,
 367           rne,
 368           rd,
 369           ru,
 370           rz,
 371           saeonly
 372         } type;
 373
 374       unsigned int operand;
 375     } rounding;
 376
 377     /* Broadcasting attributes.
 378
 379        The struct describes broadcasting, applied to OPERAND.  TYPE is
 380        expresses the broadcast factor.  */
 381     struct Broadcast_Operation
 382     {
 383       /* Type of broadcast: {1to2}, {1to4}, {1to8}, or {1to16}.  */
 384       unsigned int type;
 385
 386       /* Index of broadcasted operand.  */
 387       unsigned int operand;
 388
 389       /* Number of bytes to broadcast.  */
 390       unsigned int bytes;
 391     } broadcast;
 392
 393     /* Compressed disp8*N attribute.  */
 394     unsigned int memshift;
 395
 396     /* Prefer load or store in encoding.  */
 397     enum
 398       {
 399         dir_encoding_default = 0,
 400         dir_encoding_load,
 401         dir_encoding_store,
 402         dir_encoding_swap
 403       } dir_encoding;
 404
 405     /* Prefer 8bit, 16bit, 32bit displacement in encoding.  */
 406     enum
 407       {
 408         disp_encoding_default = 0,
 409         disp_encoding_8bit,
 410         disp_encoding_16bit,
 411         disp_encoding_32bit
 412       } disp_encoding;
 413
 414     /* Prefer the REX byte in encoding.  */
 415     bool rex_encoding;
 416
 417     /* Disable instruction size optimization.  */
 418     bool no_optimize;
 419
 420     /* How to encode vector instructions.  */
 421     enum
 422       {
 423         vex_encoding_default = 0,
 424         vex_encoding_vex,
 425         vex_encoding_vex3,
 426         vex_encoding_evex,
 427         vex_encoding_error
 428       } vec_encoding;
 429
 430     /* REP prefix.  */
 431     const char *rep_prefix;
 432
 433     /* HLE prefix.  */
 434     const char *hle_prefix;
 435
 436     /* Have BND prefix.  */
 437     const char *bnd_prefix;
 438
 439     /* Have NOTRACK prefix.  */
 440     const char *notrack_prefix;
 441
 442     /* Error message.  */
 443     enum i386_error error;
 444   };
 445
 446 typedef struct _i386_insn i386_insn;
 447
 448 /* Link RC type with corresponding string, that'll be looked for in
 449    asm.  */
 450 struct RC_name
 451 {
 452   enum rc_type type;
 453   const char *name;
 454   unsigned int len;
 455 };
 456
 457 static const struct RC_name RC_NamesTable[] =
 458 {
 459   {  rne, STRING_COMMA_LEN ("rn-sae") },
 460   {  rd,  STRING_COMMA_LEN ("rd-sae") },
 461   {  ru,  STRING_COMMA_LEN ("ru-sae") },
 462   {  rz,  STRING_COMMA_LEN ("rz-sae") },
 463   {  saeonly,  STRING_COMMA_LEN ("sae") },
 464 };
 465
 466 /* List of chars besides those in app.c:symbol_chars that can start an
 467    operand.  Used to prevent the scrubber eating vital white-space.  */
 468 const char extra_symbol_chars[] = "*%-([{}"
 469 #ifdef LEX_AT
 470         "@"
 471 #endif
 472 #ifdef LEX_QM
 473         "?"
 474 #endif
 475         ;
 476
 477 #if ((defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF))     \
 478      && !defined (TE_GNU)                               \
 479      && !defined (TE_LINUX)                             \
 480      && !defined (TE_FreeBSD)                           \
 481      && !defined (TE_DragonFly)                         \
 482      && !defined (TE_NetBSD))
 483 /* This array holds the chars that always start a comment.  If the
 484    pre-processor is disabled, these aren't very useful.  The option
 485    --divide will remove '/' from this list.  */
 486 const char *i386_comment_chars = "#/";
 487 #define SVR4_COMMENT_CHARS 1
 488 #define PREFIX_SEPARATOR '\\'
 489
 490 #else
 491 const char *i386_comment_chars = "#";
 492 #define PREFIX_SEPARATOR '/'
 493 #endif
 494
 495 /* This array holds the chars that only start a comment at the beginning of
 496    a line.  If the line seems to have the form '# 123 filename'
 497    .line and .file directives will appear in the pre-processed output.
 498    Note that input_file.c hand checks for '#' at the beginning of the
 499    first line of the input file.  This is because the compiler outputs
 500    #NO_APP at the beginning of its output.
 501    Also note that comments started like this one will always work if
 502    '/' isn't otherwise defined.  */
 503 const char line_comment_chars[] = "#/";
 504
 505 const char line_separator_chars[] = ";";
 506
 507 /* Chars that can be used to separate mant from exp in floating point
 508    nums.  */
 509 const char EXP_CHARS[] = "eE";
 510
 511 /* Chars that mean this number is a floating point constant
 512    As in 0f12.456
 513    or    0d1.2345e12.  */
 514 const char FLT_CHARS[] = "fFdDxX";
 515
 516 /* Tables for lexical analysis.  */
 517 static char mnemonic_chars[256];
 518 static char register_chars[256];
 519 static char operand_chars[256];
 520 static char identifier_chars[256];
 521
 522 /* Lexical macros.  */
 523 #define is_mnemonic_char(x) (mnemonic_chars[(unsigned char) x])
 524 #define is_operand_char(x) (operand_chars[(unsigned char) x])
 525 #define is_register_char(x) (register_chars[(unsigned char) x])
 526 #define is_space_char(x) ((x) == ' ')
 527 #define is_identifier_char(x) (identifier_chars[(unsigned char) x])
 528
 529 /* All non-digit non-letter characters that may occur in an operand.  */
 530 static char operand_special_chars[] = "%$-+(,)*._~/<>|&^!:[@]";
 531
 532 /* md_assemble() always leaves the strings it's passed unaltered.  To
 533    effect this we maintain a stack of saved characters that we've smashed
 534    with '\0's (indicating end of strings for various sub-fields of the
 535    assembler instruction).  */
 536 static char save_stack[32];
 537 static char *save_stack_p;
 538 #define END_STRING_AND_SAVE(s) \
 539         do { *save_stack_p++ = *(s); *(s) = '\0'; } while (0)
 540 #define RESTORE_END_STRING(s) \
 541         do { *(s) = *--save_stack_p; } while (0)
 542
 543 /* The instruction we're assembling.  */
 544 static i386_insn i;
 545
 546 /* Possible templates for current insn.  */
 547 static const templates *current_templates;
 548
 549 /* Per instruction expressionS buffers: max displacements & immediates.  */
 550 static expressionS disp_expressions[MAX_MEMORY_OPERANDS];
 551 static expressionS im_expressions[MAX_IMMEDIATE_OPERANDS];
 552
 553 /* Current operand we are working on.  */
 554 static int this_operand = -1;
 555
 556 /* We support four different modes.  FLAG_CODE variable is used to distinguish
 557    these.  */
 558
 559 enum flag_code {
 560         CODE_32BIT,
 561         CODE_16BIT,
 562         CODE_64BIT };
 563
 564 static enum flag_code flag_code;
 565 static unsigned int object_64bit;
 566 static unsigned int disallow_64bit_reloc;
 567 static int use_rela_relocations = 0;
 568 /* __tls_get_addr/___tls_get_addr symbol for TLS.  */
 569 static const char *tls_get_addr;
 570
 571 #if ((defined (OBJ_MAYBE_COFF) && defined (OBJ_MAYBE_AOUT)) \
 572      || defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
 573      || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
 574
 575 /* The ELF ABI to use.  */
 576 enum x86_elf_abi
 577 {
 578   I386_ABI,
 579   X86_64_ABI,
 580   X86_64_X32_ABI
 581 };
 582
 583 static enum x86_elf_abi x86_elf_abi = I386_ABI;
 584 #endif
 585
 586 #if defined (TE_PE) || defined (TE_PEP)
 587 /* Use big object file format.  */
 588 static int use_big_obj = 0;
 589 #endif
 590
 591 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
 592 /* 1 if generating code for a shared library.  */
 593 static int shared = 0;
 594 #endif
 595
 596 /* 1 for intel syntax,
 597    0 if att syntax.  */
 598 static int intel_syntax = 0;
 599
 600 static enum x86_64_isa
 601 {
 602   amd64 = 1,    /* AMD64 ISA.  */
 603   intel64       /* Intel64 ISA.  */
 604 } isa64;
 605
 606 /* 1 for intel mnemonic,
 607    0 if att mnemonic.  */
 608 static int intel_mnemonic = !SYSV386_COMPAT;
 609
 610 /* 1 if pseudo registers are permitted.  */
 611 static int allow_pseudo_reg = 0;
 612
 613 /* 1 if register prefix % not required.  */
 614 static int allow_naked_reg = 0;
 615
 616 /* 1 if the assembler should add BND prefix for all control-transferring
 617    instructions supporting it, even if this prefix wasn't specified
 618    explicitly.  */
 619 static int add_bnd_prefix = 0;
 620
 621 /* 1 if pseudo index register, eiz/riz, is allowed .  */
 622 static int allow_index_reg = 0;
 623
 624 /* 1 if the assembler should ignore LOCK prefix, even if it was
 625    specified explicitly.  */
 626 static int omit_lock_prefix = 0;
 627
 628 /* 1 if the assembler should encode lfence, mfence, and sfence as
 629    "lock addl $0, (%{re}sp)".  */
 630 static int avoid_fence = 0;
 631
 632 /* 1 if lfence should be inserted after every load.  */
 633 static int lfence_after_load = 0;
 634
 635 /* Non-zero if lfence should be inserted before indirect branch.  */
 636 static enum lfence_before_indirect_branch_kind
 637   {
 638     lfence_branch_none = 0,
 639     lfence_branch_register,
 640     lfence_branch_memory,
 641     lfence_branch_all
 642   }
 643 lfence_before_indirect_branch;
 644
 645 /* Non-zero if lfence should be inserted before ret.  */
 646 static enum lfence_before_ret_kind
 647   {
 648     lfence_before_ret_none = 0,
 649     lfence_before_ret_not,
 650     lfence_before_ret_or,
 651     lfence_before_ret_shl
 652   }
 653 lfence_before_ret;
 654
 655 /* Types of previous instruction is .byte or prefix.  */
 656 static struct
 657   {
 658     segT seg;
 659     const char *file;
 660     const char *name;
 661     unsigned int line;
 662     enum last_insn_kind
 663       {
 664         last_insn_other = 0,
 665         last_insn_directive,
 666         last_insn_prefix
 667       } kind;
 668   } last_insn;
 669
 670 /* 1 if the assembler should generate relax relocations.  */
 671
 672 static int generate_relax_relocations
 673   = DEFAULT_GENERATE_X86_RELAX_RELOCATIONS;
 674
 675 static enum check_kind
 676   {
 677     check_none = 0,
 678     check_warning,
 679     check_error
 680   }
 681 sse_check, operand_check = check_warning;
 682
 683 /* Non-zero if branches should be aligned within power of 2 boundary.  */
 684 static int align_branch_power = 0;
 685
 686 /* Types of branches to align.  */
 687 enum align_branch_kind
 688   {
 689     align_branch_none = 0,
 690     align_branch_jcc = 1,
 691     align_branch_fused = 2,
 692     align_branch_jmp = 3,
 693     align_branch_call = 4,
 694     align_branch_indirect = 5,
 695     align_branch_ret = 6
 696   };
 697
 698 /* Type bits of branches to align.  */
 699 enum align_branch_bit
 700   {
 701     align_branch_jcc_bit = 1 << align_branch_jcc,
 702     align_branch_fused_bit = 1 << align_branch_fused,
 703     align_branch_jmp_bit = 1 << align_branch_jmp,
 704     align_branch_call_bit = 1 << align_branch_call,
 705     align_branch_indirect_bit = 1 << align_branch_indirect,
 706     align_branch_ret_bit = 1 << align_branch_ret
 707   };
 708
 709 static unsigned int align_branch = (align_branch_jcc_bit
 710                                     | align_branch_fused_bit
 711                                     | align_branch_jmp_bit);
 712
 713 /* Types of condition jump used by macro-fusion.  */
 714 enum mf_jcc_kind
 715   {
 716     mf_jcc_jo = 0,  /* base opcode 0x70  */
 717     mf_jcc_jc,      /* base opcode 0x72  */
 718     mf_jcc_je,      /* base opcode 0x74  */
 719     mf_jcc_jna,     /* base opcode 0x76  */
 720     mf_jcc_js,      /* base opcode 0x78  */
 721     mf_jcc_jp,      /* base opcode 0x7a  */
 722     mf_jcc_jl,      /* base opcode 0x7c  */
 723     mf_jcc_jle,     /* base opcode 0x7e  */
 724   };
 725
 726 /* Types of compare flag-modifying insntructions used by macro-fusion.  */
 727 enum mf_cmp_kind
 728   {
 729     mf_cmp_test_and,  /* test/cmp */
 730     mf_cmp_alu_cmp,  /* add/sub/cmp */
 731     mf_cmp_incdec  /* inc/dec */
 732   };
 733
 734 /* The maximum padding size for fused jcc.  CMP like instruction can
 735    be 9 bytes and jcc can be 6 bytes.  Leave room just in case for
 736    prefixes.   */
 737 #define MAX_FUSED_JCC_PADDING_SIZE 20
 738
 739 /* The maximum number of prefixes added for an instruction.  */
 740 static unsigned int align_branch_prefix_size = 5;
 741
 742 /* Optimization:
 743    1. Clear the REX_W bit with register operand if possible.
 744    2. Above plus use 128bit vector instruction to clear the full vector
 745       register.
 746  */
 747 static int optimize = 0;
 748
 749 /* Optimization:
 750    1. Clear the REX_W bit with register operand if possible.
 751    2. Above plus use 128bit vector instruction to clear the full vector
 752       register.
 753    3. Above plus optimize "test{q,l,w} $imm8,%r{64,32,16}" to
 754       "testb $imm7,%r8".
 755  */
 756 static int optimize_for_space = 0;
 757
 758 /* Register prefix used for error message.  */
 759 static const char *register_prefix = "%";
 760
 761 /* Used in 16 bit gcc mode to add an l suffix to call, ret, enter,
 762    leave, push, and pop instructions so that gcc has the same stack
 763    frame as in 32 bit mode.  */
 764 static char stackop_size = '\0';
 765
 766 /* Non-zero to optimize code alignment.  */
 767 int optimize_align_code = 1;
 768
 769 /* Non-zero to quieten some warnings.  */
 770 static int quiet_warnings = 0;
 771
 772 /* CPU name.  */
 773 static const char *cpu_arch_name = NULL;
 774 static char *cpu_sub_arch_name = NULL;
 775
 776 /* CPU feature flags.  */
 777 static i386_cpu_flags cpu_arch_flags = CPU_UNKNOWN_FLAGS;
 778
 779 /* If we have selected a cpu we are generating instructions for.  */
 780 static int cpu_arch_tune_set = 0;
 781
 782 /* Cpu we are generating instructions for.  */
 783 enum processor_type cpu_arch_tune = PROCESSOR_UNKNOWN;
 784
 785 /* CPU feature flags of cpu we are generating instructions for.  */
 786 static i386_cpu_flags cpu_arch_tune_flags;
 787
 788 /* CPU instruction set architecture used.  */
 789 enum processor_type cpu_arch_isa = PROCESSOR_UNKNOWN;
 790
 791 /* CPU feature flags of instruction set architecture used.  */
 792 i386_cpu_flags cpu_arch_isa_flags;
 793
 794 /* If set, conditional jumps are not automatically promoted to handle
 795    larger than a byte offset.  */
 796 static unsigned int no_cond_jump_promotion = 0;
 797
 798 /* Encode SSE instructions with VEX prefix.  */
 799 static unsigned int sse2avx;
 800
 801 /* Encode scalar AVX instructions with specific vector length.  */
 802 static enum
 803   {
 804     vex128 = 0,
 805     vex256
 806   } avxscalar;
 807
 808 /* Encode VEX WIG instructions with specific vex.w.  */
 809 static enum
 810   {
 811     vexw0 = 0,
 812     vexw1
 813   } vexwig;
 814
 815 /* Encode scalar EVEX LIG instructions with specific vector length.  */
 816 static enum
 817   {
 818     evexl128 = 0,
 819     evexl256,
 820     evexl512
 821   } evexlig;
 822
 823 /* Encode EVEX WIG instructions with specific evex.w.  */
 824 static enum
 825   {
 826     evexw0 = 0,
 827     evexw1
 828   } evexwig;
 829
 830 /* Value to encode in EVEX RC bits, for SAE-only instructions.  */
 831 static enum rc_type evexrcig = rne;
 832
 833 /* Pre-defined "_GLOBAL_OFFSET_TABLE_".  */
 834 static symbolS *GOT_symbol;
 835
 836 /* The dwarf2 return column, adjusted for 32 or 64 bit.  */
 837 unsigned int x86_dwarf2_return_column;
 838
 839 /* The dwarf2 data alignment, adjusted for 32 or 64 bit.  */
 840 int x86_cie_data_alignment;
 841
 842 /* Interface to relax_segment.
 843    There are 3 major relax states for 386 jump insns because the
 844    different types of jumps add different sizes to frags when we're
 845    figuring out what sort of jump to choose to reach a given label.
 846
 847    BRANCH_PADDING, BRANCH_PREFIX and FUSED_JCC_PADDING are used to align
 848    branches which are handled by md_estimate_size_before_relax() and
 849    i386_generic_table_relax_frag().  */
 850
 851 /* Types.  */
 852 #define UNCOND_JUMP 0
 853 #define COND_JUMP 1
 854 #define COND_JUMP86 2
 855 #define BRANCH_PADDING 3
 856 #define BRANCH_PREFIX 4
 857 #define FUSED_JCC_PADDING 5
 858
 859 /* Sizes.  */
 860 #define CODE16  1
 861 #define SMALL   0
 862 #define SMALL16 (SMALL | CODE16)
 863 #define BIG     2
 864 #define BIG16   (BIG | CODE16)
 865
 866 #ifndef INLINE
 867 #ifdef __GNUC__
 868 #define INLINE __inline__
 869 #else
 870 #define INLINE
 871 #endif
 872 #endif
 873
 874 #define ENCODE_RELAX_STATE(type, size) \
 875   ((relax_substateT) (((type) << 2) | (size)))
 876 #define TYPE_FROM_RELAX_STATE(s) \
 877   ((s) >> 2)
 878 #define DISP_SIZE_FROM_RELAX_STATE(s) \
 879     ((((s) & 3) == BIG ? 4 : (((s) & 3) == BIG16 ? 2 : 1)))
 880
 881 /* This table is used by relax_frag to promote short jumps to long
 882    ones where necessary.  SMALL (short) jumps may be promoted to BIG
 883    (32 bit long) ones, and SMALL16 jumps to BIG16 (16 bit long).  We
 884    don't allow a short jump in a 32 bit code segment to be promoted to
 885    a 16 bit offset jump because it's slower (requires data size
 886    prefix), and doesn't work, unless the destination is in the bottom
 887    64k of the code segment (The top 16 bits of eip are zeroed).  */
 888
 889 const relax_typeS md_relax_table[] =
 890 {
 891   /* The fields are:
 892      1) most positive reach of this state,
 893      2) most negative reach of this state,
 894      3) how many bytes this mode will have in the variable part of the frag
 895      4) which index into the table to try if we can't fit into this one.  */
 896
 897   /* UNCOND_JUMP states.  */
 898   {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (UNCOND_JUMP, BIG)},
 899   {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (UNCOND_JUMP, BIG16)},
 900   /* dword jmp adds 4 bytes to frag:
 901      0 extra opcode bytes, 4 displacement bytes.  */
 902   {0, 0, 4, 0},
 903   /* word jmp adds 2 byte2 to frag:
 904      0 extra opcode bytes, 2 displacement bytes.  */
 905   {0, 0, 2, 0},
 906
 907   /* COND_JUMP states.  */
 908   {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP, BIG)},
 909   {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP, BIG16)},
 910   /* dword conditionals adds 5 bytes to frag:
 911      1 extra opcode byte, 4 displacement bytes.  */
 912   {0, 0, 5, 0},
 913   /* word conditionals add 3 bytes to frag:
 914      1 extra opcode byte, 2 displacement bytes.  */
 915   {0, 0, 3, 0},
 916
 917   /* COND_JUMP86 states.  */
 918   {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP86, BIG)},
 919   {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP86, BIG16)},
 920   /* dword conditionals adds 5 bytes to frag:
 921      1 extra opcode byte, 4 displacement bytes.  */
 922   {0, 0, 5, 0},
 923   /* word conditionals add 4 bytes to frag:
 924      1 displacement byte and a 3 byte long branch insn.  */
 925   {0, 0, 4, 0}
 926 };
 927
 928 static const arch_entry cpu_arch[] =
 929 {
 930   /* Do not replace the first two entries - i386_target_format()
 931      relies on them being there in this order.  */
 932   { STRING_COMMA_LEN ("generic32"), PROCESSOR_GENERIC32,
 933     CPU_GENERIC32_FLAGS, 0 },
 934   { STRING_COMMA_LEN ("generic64"), PROCESSOR_GENERIC64,
 935     CPU_GENERIC64_FLAGS, 0 },
 936   { STRING_COMMA_LEN ("i8086"), PROCESSOR_UNKNOWN,
 937     CPU_NONE_FLAGS, 0 },
 938   { STRING_COMMA_LEN ("i186"), PROCESSOR_UNKNOWN,
 939     CPU_I186_FLAGS, 0 },
 940   { STRING_COMMA_LEN ("i286"), PROCESSOR_UNKNOWN,
 941     CPU_I286_FLAGS, 0 },
 942   { STRING_COMMA_LEN ("i386"), PROCESSOR_I386,
 943     CPU_I386_FLAGS, 0 },
 944   { STRING_COMMA_LEN ("i486"), PROCESSOR_I486,
 945     CPU_I486_FLAGS, 0 },
 946   { STRING_COMMA_LEN ("i586"), PROCESSOR_PENTIUM,
 947     CPU_I586_FLAGS, 0 },
 948   { STRING_COMMA_LEN ("i686"), PROCESSOR_PENTIUMPRO,
 949     CPU_I686_FLAGS, 0 },
 950   { STRING_COMMA_LEN ("pentium"), PROCESSOR_PENTIUM,
 951     CPU_I586_FLAGS, 0 },
 952   { STRING_COMMA_LEN ("pentiumpro"), PROCESSOR_PENTIUMPRO,
 953     CPU_PENTIUMPRO_FLAGS, 0 },
 954   { STRING_COMMA_LEN ("pentiumii"), PROCESSOR_PENTIUMPRO,
 955     CPU_P2_FLAGS, 0 },
 956   { STRING_COMMA_LEN ("pentiumiii"),PROCESSOR_PENTIUMPRO,
 957     CPU_P3_FLAGS, 0 },
 958   { STRING_COMMA_LEN ("pentium4"), PROCESSOR_PENTIUM4,
 959     CPU_P4_FLAGS, 0 },
 960   { STRING_COMMA_LEN ("prescott"), PROCESSOR_NOCONA,
 961     CPU_CORE_FLAGS, 0 },
 962   { STRING_COMMA_LEN ("nocona"), PROCESSOR_NOCONA,
 963     CPU_NOCONA_FLAGS, 0 },
 964   { STRING_COMMA_LEN ("yonah"), PROCESSOR_CORE,
 965     CPU_CORE_FLAGS, 1 },
 966   { STRING_COMMA_LEN ("core"), PROCESSOR_CORE,
 967     CPU_CORE_FLAGS, 0 },
 968   { STRING_COMMA_LEN ("merom"), PROCESSOR_CORE2,
 969     CPU_CORE2_FLAGS, 1 },
 970   { STRING_COMMA_LEN ("core2"), PROCESSOR_CORE2,
 971     CPU_CORE2_FLAGS, 0 },
 972   { STRING_COMMA_LEN ("corei7"), PROCESSOR_COREI7,
 973     CPU_COREI7_FLAGS, 0 },
 974   { STRING_COMMA_LEN ("l1om"), PROCESSOR_L1OM,
 975     CPU_L1OM_FLAGS, 0 },
 976   { STRING_COMMA_LEN ("k1om"), PROCESSOR_K1OM,
 977     CPU_K1OM_FLAGS, 0 },
 978   { STRING_COMMA_LEN ("iamcu"), PROCESSOR_IAMCU,
 979     CPU_IAMCU_FLAGS, 0 },
 980   { STRING_COMMA_LEN ("k6"), PROCESSOR_K6,
 981     CPU_K6_FLAGS, 0 },
 982   { STRING_COMMA_LEN ("k6_2"), PROCESSOR_K6,
 983     CPU_K6_2_FLAGS, 0 },
 984   { STRING_COMMA_LEN ("athlon"), PROCESSOR_ATHLON,
 985     CPU_ATHLON_FLAGS, 0 },
 986   { STRING_COMMA_LEN ("sledgehammer"), PROCESSOR_K8,
 987     CPU_K8_FLAGS, 1 },
 988   { STRING_COMMA_LEN ("opteron"), PROCESSOR_K8,
 989     CPU_K8_FLAGS, 0 },
 990   { STRING_COMMA_LEN ("k8"), PROCESSOR_K8,
 991     CPU_K8_FLAGS, 0 },
 992   { STRING_COMMA_LEN ("amdfam10"), PROCESSOR_AMDFAM10,
 993     CPU_AMDFAM10_FLAGS, 0 },
 994   { STRING_COMMA_LEN ("bdver1"), PROCESSOR_BD,
 995     CPU_BDVER1_FLAGS, 0 },
 996   { STRING_COMMA_LEN ("bdver2"), PROCESSOR_BD,
 997     CPU_BDVER2_FLAGS, 0 },
 998   { STRING_COMMA_LEN ("bdver3"), PROCESSOR_BD,
 999     CPU_BDVER3_FLAGS, 0 },
1000   { STRING_COMMA_LEN ("bdver4"), PROCESSOR_BD,
1001     CPU_BDVER4_FLAGS, 0 },
1002   { STRING_COMMA_LEN ("znver1"), PROCESSOR_ZNVER,
1003     CPU_ZNVER1_FLAGS, 0 },
1004   { STRING_COMMA_LEN ("znver2"), PROCESSOR_ZNVER,
1005     CPU_ZNVER2_FLAGS, 0 },
1006   { STRING_COMMA_LEN ("znver3"), PROCESSOR_ZNVER,
1007     CPU_ZNVER3_FLAGS, 0 },
1008   { STRING_COMMA_LEN ("btver1"), PROCESSOR_BT,
1009     CPU_BTVER1_FLAGS, 0 },
1010   { STRING_COMMA_LEN ("btver2"), PROCESSOR_BT,
1011     CPU_BTVER2_FLAGS, 0 },
1012   { STRING_COMMA_LEN (".8087"), PROCESSOR_UNKNOWN,
1013     CPU_8087_FLAGS, 0 },
1014   { STRING_COMMA_LEN (".287"), PROCESSOR_UNKNOWN,
1015     CPU_287_FLAGS, 0 },
1016   { STRING_COMMA_LEN (".387"), PROCESSOR_UNKNOWN,
1017     CPU_387_FLAGS, 0 },
1018   { STRING_COMMA_LEN (".687"), PROCESSOR_UNKNOWN,
1019     CPU_687_FLAGS, 0 },
1020   { STRING_COMMA_LEN (".cmov"), PROCESSOR_UNKNOWN,
1021     CPU_CMOV_FLAGS, 0 },
1022   { STRING_COMMA_LEN (".fxsr"), PROCESSOR_UNKNOWN,
1023     CPU_FXSR_FLAGS, 0 },
1024   { STRING_COMMA_LEN (".mmx"), PROCESSOR_UNKNOWN,
1025     CPU_MMX_FLAGS, 0 },
1026   { STRING_COMMA_LEN (".sse"), PROCESSOR_UNKNOWN,
1027     CPU_SSE_FLAGS, 0 },
1028   { STRING_COMMA_LEN (".sse2"), PROCESSOR_UNKNOWN,
1029     CPU_SSE2_FLAGS, 0 },
1030   { STRING_COMMA_LEN (".sse3"), PROCESSOR_UNKNOWN,
1031     CPU_SSE3_FLAGS, 0 },
1032   { STRING_COMMA_LEN (".sse4a"), PROCESSOR_UNKNOWN,
1033     CPU_SSE4A_FLAGS, 0 },
1034   { STRING_COMMA_LEN (".ssse3"), PROCESSOR_UNKNOWN,
1035     CPU_SSSE3_FLAGS, 0 },
1036   { STRING_COMMA_LEN (".sse4.1"), PROCESSOR_UNKNOWN,
1037     CPU_SSE4_1_FLAGS, 0 },
1038   { STRING_COMMA_LEN (".sse4.2"), PROCESSOR_UNKNOWN,
1039     CPU_SSE4_2_FLAGS, 0 },
1040   { STRING_COMMA_LEN (".sse4"), PROCESSOR_UNKNOWN,
1041     CPU_SSE4_2_FLAGS, 0 },
1042   { STRING_COMMA_LEN (".avx"), PROCESSOR_UNKNOWN,
1043     CPU_AVX_FLAGS, 0 },
1044   { STRING_COMMA_LEN (".avx2"), PROCESSOR_UNKNOWN,
1045     CPU_AVX2_FLAGS, 0 },
1046   { STRING_COMMA_LEN (".avx512f"), PROCESSOR_UNKNOWN,
1047     CPU_AVX512F_FLAGS, 0 },
1048   { STRING_COMMA_LEN (".avx512cd"), PROCESSOR_UNKNOWN,
1049     CPU_AVX512CD_FLAGS, 0 },
1050   { STRING_COMMA_LEN (".avx512er"), PROCESSOR_UNKNOWN,
1051     CPU_AVX512ER_FLAGS, 0 },
1052   { STRING_COMMA_LEN (".avx512pf"), PROCESSOR_UNKNOWN,
1053     CPU_AVX512PF_FLAGS, 0 },
1054   { STRING_COMMA_LEN (".avx512dq"), PROCESSOR_UNKNOWN,
1055     CPU_AVX512DQ_FLAGS, 0 },
1056   { STRING_COMMA_LEN (".avx512bw"), PROCESSOR_UNKNOWN,
1057     CPU_AVX512BW_FLAGS, 0 },
1058   { STRING_COMMA_LEN (".avx512vl"), PROCESSOR_UNKNOWN,
1059     CPU_AVX512VL_FLAGS, 0 },
1060   { STRING_COMMA_LEN (".vmx"), PROCESSOR_UNKNOWN,
1061     CPU_VMX_FLAGS, 0 },
1062   { STRING_COMMA_LEN (".vmfunc"), PROCESSOR_UNKNOWN,
1063     CPU_VMFUNC_FLAGS, 0 },
1064   { STRING_COMMA_LEN (".smx"), PROCESSOR_UNKNOWN,
1065     CPU_SMX_FLAGS, 0 },
1066   { STRING_COMMA_LEN (".xsave"), PROCESSOR_UNKNOWN,
1067     CPU_XSAVE_FLAGS, 0 },
1068   { STRING_COMMA_LEN (".xsaveopt"), PROCESSOR_UNKNOWN,
1069     CPU_XSAVEOPT_FLAGS, 0 },
1070   { STRING_COMMA_LEN (".xsavec"), PROCESSOR_UNKNOWN,
1071     CPU_XSAVEC_FLAGS, 0 },
1072   { STRING_COMMA_LEN (".xsaves"), PROCESSOR_UNKNOWN,
1073     CPU_XSAVES_FLAGS, 0 },
1074   { STRING_COMMA_LEN (".aes"), PROCESSOR_UNKNOWN,
1075     CPU_AES_FLAGS, 0 },
1076   { STRING_COMMA_LEN (".pclmul"), PROCESSOR_UNKNOWN,
1077     CPU_PCLMUL_FLAGS, 0 },
1078   { STRING_COMMA_LEN (".clmul"), PROCESSOR_UNKNOWN,
1079     CPU_PCLMUL_FLAGS, 1 },
1080   { STRING_COMMA_LEN (".fsgsbase"), PROCESSOR_UNKNOWN,
1081     CPU_FSGSBASE_FLAGS, 0 },
1082   { STRING_COMMA_LEN (".rdrnd"), PROCESSOR_UNKNOWN,
1083     CPU_RDRND_FLAGS, 0 },
1084   { STRING_COMMA_LEN (".f16c"), PROCESSOR_UNKNOWN,
1085     CPU_F16C_FLAGS, 0 },
1086   { STRING_COMMA_LEN (".bmi2"), PROCESSOR_UNKNOWN,
1087     CPU_BMI2_FLAGS, 0 },
1088   { STRING_COMMA_LEN (".fma"), PROCESSOR_UNKNOWN,
1089     CPU_FMA_FLAGS, 0 },
1090   { STRING_COMMA_LEN (".fma4"), PROCESSOR_UNKNOWN,
1091     CPU_FMA4_FLAGS, 0 },
1092   { STRING_COMMA_LEN (".xop"), PROCESSOR_UNKNOWN,
1093     CPU_XOP_FLAGS, 0 },
1094   { STRING_COMMA_LEN (".lwp"), PROCESSOR_UNKNOWN,
1095     CPU_LWP_FLAGS, 0 },
1096   { STRING_COMMA_LEN (".movbe"), PROCESSOR_UNKNOWN,
1097     CPU_MOVBE_FLAGS, 0 },
1098   { STRING_COMMA_LEN (".cx16"), PROCESSOR_UNKNOWN,
1099     CPU_CX16_FLAGS, 0 },
1100   { STRING_COMMA_LEN (".ept"), PROCESSOR_UNKNOWN,
1101     CPU_EPT_FLAGS, 0 },
1102   { STRING_COMMA_LEN (".lzcnt"), PROCESSOR_UNKNOWN,
1103     CPU_LZCNT_FLAGS, 0 },
1104   { STRING_COMMA_LEN (".popcnt"), PROCESSOR_UNKNOWN,
1105     CPU_POPCNT_FLAGS, 0 },
1106   { STRING_COMMA_LEN (".hle"), PROCESSOR_UNKNOWN,
1107     CPU_HLE_FLAGS, 0 },
1108   { STRING_COMMA_LEN (".rtm"), PROCESSOR_UNKNOWN,
1109     CPU_RTM_FLAGS, 0 },
1110   { STRING_COMMA_LEN (".invpcid"), PROCESSOR_UNKNOWN,
1111     CPU_INVPCID_FLAGS, 0 },
1112   { STRING_COMMA_LEN (".clflush"), PROCESSOR_UNKNOWN,
1113     CPU_CLFLUSH_FLAGS, 0 },
1114   { STRING_COMMA_LEN (".nop"), PROCESSOR_UNKNOWN,
1115     CPU_NOP_FLAGS, 0 },
1116   { STRING_COMMA_LEN (".syscall"), PROCESSOR_UNKNOWN,
1117     CPU_SYSCALL_FLAGS, 0 },
1118   { STRING_COMMA_LEN (".rdtscp"), PROCESSOR_UNKNOWN,
1119     CPU_RDTSCP_FLAGS, 0 },
1120   { STRING_COMMA_LEN (".3dnow"), PROCESSOR_UNKNOWN,
1121     CPU_3DNOW_FLAGS, 0 },
1122   { STRING_COMMA_LEN (".3dnowa"), PROCESSOR_UNKNOWN,
1123     CPU_3DNOWA_FLAGS, 0 },
1124   { STRING_COMMA_LEN (".padlock"), PROCESSOR_UNKNOWN,
1125     CPU_PADLOCK_FLAGS, 0 },
1126   { STRING_COMMA_LEN (".pacifica"), PROCESSOR_UNKNOWN,
1127     CPU_SVME_FLAGS, 1 },
1128   { STRING_COMMA_LEN (".svme"), PROCESSOR_UNKNOWN,
1129     CPU_SVME_FLAGS, 0 },
1130   { STRING_COMMA_LEN (".sse4a"), PROCESSOR_UNKNOWN,
1131     CPU_SSE4A_FLAGS, 0 },
1132   { STRING_COMMA_LEN (".abm"), PROCESSOR_UNKNOWN,
1133     CPU_ABM_FLAGS, 0 },
1134   { STRING_COMMA_LEN (".bmi"), PROCESSOR_UNKNOWN,
1135     CPU_BMI_FLAGS, 0 },
1136   { STRING_COMMA_LEN (".tbm"), PROCESSOR_UNKNOWN,
1137     CPU_TBM_FLAGS, 0 },
1138   { STRING_COMMA_LEN (".adx"), PROCESSOR_UNKNOWN,
1139     CPU_ADX_FLAGS, 0 },
1140   { STRING_COMMA_LEN (".rdseed"), PROCESSOR_UNKNOWN,
1141     CPU_RDSEED_FLAGS, 0 },
1142   { STRING_COMMA_LEN (".prfchw"), PROCESSOR_UNKNOWN,
1143     CPU_PRFCHW_FLAGS, 0 },
1144   { STRING_COMMA_LEN (".smap"), PROCESSOR_UNKNOWN,
1145     CPU_SMAP_FLAGS, 0 },
1146   { STRING_COMMA_LEN (".mpx"), PROCESSOR_UNKNOWN,
1147     CPU_MPX_FLAGS, 0 },
1148   { STRING_COMMA_LEN (".sha"), PROCESSOR_UNKNOWN,
1149     CPU_SHA_FLAGS, 0 },
1150   { STRING_COMMA_LEN (".clflushopt"), PROCESSOR_UNKNOWN,
1151     CPU_CLFLUSHOPT_FLAGS, 0 },
1152   { STRING_COMMA_LEN (".prefetchwt1"), PROCESSOR_UNKNOWN,
1153     CPU_PREFETCHWT1_FLAGS, 0 },
1154   { STRING_COMMA_LEN (".se1"), PROCESSOR_UNKNOWN,
1155     CPU_SE1_FLAGS, 0 },
1156   { STRING_COMMA_LEN (".clwb"), PROCESSOR_UNKNOWN,
1157     CPU_CLWB_FLAGS, 0 },
1158   { STRING_COMMA_LEN (".avx512ifma"), PROCESSOR_UNKNOWN,
1159     CPU_AVX512IFMA_FLAGS, 0 },
1160   { STRING_COMMA_LEN (".avx512vbmi"), PROCESSOR_UNKNOWN,
1161     CPU_AVX512VBMI_FLAGS, 0 },
1162   { STRING_COMMA_LEN (".avx512_4fmaps"), PROCESSOR_UNKNOWN,
1163     CPU_AVX512_4FMAPS_FLAGS, 0 },
1164   { STRING_COMMA_LEN (".avx512_4vnniw"), PROCESSOR_UNKNOWN,
1165     CPU_AVX512_4VNNIW_FLAGS, 0 },
1166   { STRING_COMMA_LEN (".avx512_vpopcntdq"), PROCESSOR_UNKNOWN,
1167     CPU_AVX512_VPOPCNTDQ_FLAGS, 0 },
1168   { STRING_COMMA_LEN (".avx512_vbmi2"), PROCESSOR_UNKNOWN,
1169     CPU_AVX512_VBMI2_FLAGS, 0 },
1170   { STRING_COMMA_LEN (".avx512_vnni"), PROCESSOR_UNKNOWN,
1171     CPU_AVX512_VNNI_FLAGS, 0 },
1172   { STRING_COMMA_LEN (".avx512_bitalg"), PROCESSOR_UNKNOWN,
1173     CPU_AVX512_BITALG_FLAGS, 0 },
1174   { STRING_COMMA_LEN (".avx_vnni"), PROCESSOR_UNKNOWN,
1175     CPU_AVX_VNNI_FLAGS, 0 },
1176   { STRING_COMMA_LEN (".clzero"), PROCESSOR_UNKNOWN,
1177     CPU_CLZERO_FLAGS, 0 },
1178   { STRING_COMMA_LEN (".mwaitx"), PROCESSOR_UNKNOWN,
1179     CPU_MWAITX_FLAGS, 0 },
1180   { STRING_COMMA_LEN (".ospke"), PROCESSOR_UNKNOWN,
1181     CPU_OSPKE_FLAGS, 0 },
1182   { STRING_COMMA_LEN (".rdpid"), PROCESSOR_UNKNOWN,
1183     CPU_RDPID_FLAGS, 0 },
1184   { STRING_COMMA_LEN (".ptwrite"), PROCESSOR_UNKNOWN,
1185     CPU_PTWRITE_FLAGS, 0 },
1186   { STRING_COMMA_LEN (".ibt"), PROCESSOR_UNKNOWN,
1187     CPU_IBT_FLAGS, 0 },
1188   { STRING_COMMA_LEN (".shstk"), PROCESSOR_UNKNOWN,
1189     CPU_SHSTK_FLAGS, 0 },
1190   { STRING_COMMA_LEN (".gfni"), PROCESSOR_UNKNOWN,
1191     CPU_GFNI_FLAGS, 0 },
1192   { STRING_COMMA_LEN (".vaes"), PROCESSOR_UNKNOWN,
1193     CPU_VAES_FLAGS, 0 },
1194   { STRING_COMMA_LEN (".vpclmulqdq"), PROCESSOR_UNKNOWN,
1195     CPU_VPCLMULQDQ_FLAGS, 0 },
1196   { STRING_COMMA_LEN (".wbnoinvd"), PROCESSOR_UNKNOWN,
1197     CPU_WBNOINVD_FLAGS, 0 },
1198   { STRING_COMMA_LEN (".pconfig"), PROCESSOR_UNKNOWN,
1199     CPU_PCONFIG_FLAGS, 0 },
1200   { STRING_COMMA_LEN (".waitpkg"), PROCESSOR_UNKNOWN,
1201     CPU_WAITPKG_FLAGS, 0 },
1202   { STRING_COMMA_LEN (".cldemote"), PROCESSOR_UNKNOWN,
1203     CPU_CLDEMOTE_FLAGS, 0 },
1204   { STRING_COMMA_LEN (".amx_int8"), PROCESSOR_UNKNOWN,
1205     CPU_AMX_INT8_FLAGS, 0 },
1206   { STRING_COMMA_LEN (".amx_bf16"), PROCESSOR_UNKNOWN,
1207     CPU_AMX_BF16_FLAGS, 0 },
1208   { STRING_COMMA_LEN (".amx_tile"), PROCESSOR_UNKNOWN,
1209     CPU_AMX_TILE_FLAGS, 0 },
1210   { STRING_COMMA_LEN (".movdiri"), PROCESSOR_UNKNOWN,
1211     CPU_MOVDIRI_FLAGS, 0 },
1212   { STRING_COMMA_LEN (".movdir64b"), PROCESSOR_UNKNOWN,
1213     CPU_MOVDIR64B_FLAGS, 0 },
1214   { STRING_COMMA_LEN (".avx512_bf16"), PROCESSOR_UNKNOWN,
1215     CPU_AVX512_BF16_FLAGS, 0 },
1216   { STRING_COMMA_LEN (".avx512_vp2intersect"), PROCESSOR_UNKNOWN,
1217     CPU_AVX512_VP2INTERSECT_FLAGS, 0 },
1218   { STRING_COMMA_LEN (".tdx"), PROCESSOR_UNKNOWN,
1219     CPU_TDX_FLAGS, 0 },
1220   { STRING_COMMA_LEN (".enqcmd"), PROCESSOR_UNKNOWN,
1221     CPU_ENQCMD_FLAGS, 0 },
1222   { STRING_COMMA_LEN (".serialize"), PROCESSOR_UNKNOWN,
1223     CPU_SERIALIZE_FLAGS, 0 },
1224   { STRING_COMMA_LEN (".rdpru"), PROCESSOR_UNKNOWN,
1225     CPU_RDPRU_FLAGS, 0 },
1226   { STRING_COMMA_LEN (".mcommit"), PROCESSOR_UNKNOWN,
1227     CPU_MCOMMIT_FLAGS, 0 },
1228   { STRING_COMMA_LEN (".sev_es"), PROCESSOR_UNKNOWN,
1229     CPU_SEV_ES_FLAGS, 0 },
1230   { STRING_COMMA_LEN (".tsxldtrk"), PROCESSOR_UNKNOWN,
1231     CPU_TSXLDTRK_FLAGS, 0 },
1232   { STRING_COMMA_LEN (".kl"), PROCESSOR_UNKNOWN,
1233     CPU_KL_FLAGS, 0 },
1234   { STRING_COMMA_LEN (".widekl"), PROCESSOR_UNKNOWN,
1235     CPU_WIDEKL_FLAGS, 0 },
1236   { STRING_COMMA_LEN (".uintr"), PROCESSOR_UNKNOWN,
1237     CPU_UINTR_FLAGS, 0 },
1238   { STRING_COMMA_LEN (".hreset"), PROCESSOR_UNKNOWN,
1239     CPU_HRESET_FLAGS, 0 },
1240 };
1241
1242 static const noarch_entry cpu_noarch[] =
1243 {
1244   { STRING_COMMA_LEN ("no87"),  CPU_ANY_X87_FLAGS },
1245   { STRING_COMMA_LEN ("no287"),  CPU_ANY_287_FLAGS },
1246   { STRING_COMMA_LEN ("no387"),  CPU_ANY_387_FLAGS },
1247   { STRING_COMMA_LEN ("no687"),  CPU_ANY_687_FLAGS },
1248   { STRING_COMMA_LEN ("nocmov"),  CPU_ANY_CMOV_FLAGS },
1249   { STRING_COMMA_LEN ("nofxsr"),  CPU_ANY_FXSR_FLAGS },
1250   { STRING_COMMA_LEN ("nommx"),  CPU_ANY_MMX_FLAGS },
1251   { STRING_COMMA_LEN ("nosse"),  CPU_ANY_SSE_FLAGS },
1252   { STRING_COMMA_LEN ("nosse2"),  CPU_ANY_SSE2_FLAGS },
1253   { STRING_COMMA_LEN ("nosse3"),  CPU_ANY_SSE3_FLAGS },
1254   { STRING_COMMA_LEN ("nosse4a"),  CPU_ANY_SSE4A_FLAGS },
1255   { STRING_COMMA_LEN ("nossse3"),  CPU_ANY_SSSE3_FLAGS },
1256   { STRING_COMMA_LEN ("nosse4.1"),  CPU_ANY_SSE4_1_FLAGS },
1257   { STRING_COMMA_LEN ("nosse4.2"),  CPU_ANY_SSE4_2_FLAGS },
1258   { STRING_COMMA_LEN ("nosse4"),  CPU_ANY_SSE4_1_FLAGS },
1259   { STRING_COMMA_LEN ("noavx"),  CPU_ANY_AVX_FLAGS },
1260   { STRING_COMMA_LEN ("noavx2"),  CPU_ANY_AVX2_FLAGS },
1261   { STRING_COMMA_LEN ("noavx512f"), CPU_ANY_AVX512F_FLAGS },
1262   { STRING_COMMA_LEN ("noavx512cd"), CPU_ANY_AVX512CD_FLAGS },
1263   { STRING_COMMA_LEN ("noavx512er"), CPU_ANY_AVX512ER_FLAGS },
1264   { STRING_COMMA_LEN ("noavx512pf"), CPU_ANY_AVX512PF_FLAGS },
1265   { STRING_COMMA_LEN ("noavx512dq"), CPU_ANY_AVX512DQ_FLAGS },
1266   { STRING_COMMA_LEN ("noavx512bw"), CPU_ANY_AVX512BW_FLAGS },
1267   { STRING_COMMA_LEN ("noavx512vl"), CPU_ANY_AVX512VL_FLAGS },
1268   { STRING_COMMA_LEN ("noavx512ifma"), CPU_ANY_AVX512IFMA_FLAGS },
1269   { STRING_COMMA_LEN ("noavx512vbmi"), CPU_ANY_AVX512VBMI_FLAGS },
1270   { STRING_COMMA_LEN ("noavx512_4fmaps"), CPU_ANY_AVX512_4FMAPS_FLAGS },
1271   { STRING_COMMA_LEN ("noavx512_4vnniw"), CPU_ANY_AVX512_4VNNIW_FLAGS },
1272   { STRING_COMMA_LEN ("noavx512_vpopcntdq"), CPU_ANY_AVX512_VPOPCNTDQ_FLAGS },
1273   { STRING_COMMA_LEN ("noavx512_vbmi2"), CPU_ANY_AVX512_VBMI2_FLAGS },
1274   { STRING_COMMA_LEN ("noavx512_vnni"), CPU_ANY_AVX512_VNNI_FLAGS },
1275   { STRING_COMMA_LEN ("noavx512_bitalg"), CPU_ANY_AVX512_BITALG_FLAGS },
1276   { STRING_COMMA_LEN ("noavx_vnni"), CPU_ANY_AVX_VNNI_FLAGS },
1277   { STRING_COMMA_LEN ("noibt"), CPU_ANY_IBT_FLAGS },
1278   { STRING_COMMA_LEN ("noshstk"), CPU_ANY_SHSTK_FLAGS },
1279   { STRING_COMMA_LEN ("noamx_int8"), CPU_ANY_AMX_INT8_FLAGS },
1280   { STRING_COMMA_LEN ("noamx_bf16"), CPU_ANY_AMX_BF16_FLAGS },
1281   { STRING_COMMA_LEN ("noamx_tile"), CPU_ANY_AMX_TILE_FLAGS },
1282   { STRING_COMMA_LEN ("nomovdiri"), CPU_ANY_MOVDIRI_FLAGS },
1283   { STRING_COMMA_LEN ("nomovdir64b"), CPU_ANY_MOVDIR64B_FLAGS },
1284   { STRING_COMMA_LEN ("noavx512_bf16"), CPU_ANY_AVX512_BF16_FLAGS },
1285   { STRING_COMMA_LEN ("noavx512_vp2intersect"),
1286     CPU_ANY_AVX512_VP2INTERSECT_FLAGS },
1287   { STRING_COMMA_LEN ("notdx"), CPU_ANY_TDX_FLAGS },
1288   { STRING_COMMA_LEN ("noenqcmd"), CPU_ANY_ENQCMD_FLAGS },
1289   { STRING_COMMA_LEN ("noserialize"), CPU_ANY_SERIALIZE_FLAGS },
1290   { STRING_COMMA_LEN ("notsxldtrk"), CPU_ANY_TSXLDTRK_FLAGS },
1291   { STRING_COMMA_LEN ("nokl"), CPU_ANY_KL_FLAGS },
1292   { STRING_COMMA_LEN ("nowidekl"), CPU_ANY_WIDEKL_FLAGS },
1293   { STRING_COMMA_LEN ("nouintr"), CPU_ANY_UINTR_FLAGS },
1294   { STRING_COMMA_LEN ("nohreset"), CPU_ANY_HRESET_FLAGS },
1295 };
1296
1297 #ifdef I386COFF
1298 /* Like s_lcomm_internal in gas/read.c but the alignment string
1299    is allowed to be optional.  */
1300
1301 static symbolS *
1302 pe_lcomm_internal (int needs_align, symbolS *symbolP, addressT size)
1303 {
1304   addressT align = 0;
1305
1306   SKIP_WHITESPACE ();
1307
1308   if (needs_align
1309       && *input_line_pointer == ',')
1310     {
1311       align = parse_align (needs_align - 1);
1312
1313       if (align == (addressT) -1)
1314         return NULL;
1315     }
1316   else
1317     {
1318       if (size >= 8)
1319         align = 3;
1320       else if (size >= 4)
1321         align = 2;
1322       else if (size >= 2)
1323         align = 1;
1324       else
1325         align = 0;
1326     }
1327
1328   bss_alloc (symbolP, size, align);
1329   return symbolP;
1330 }
1331
1332 static void
1333 pe_lcomm (int needs_align)
1334 {
1335   s_comm_internal (needs_align * 2, pe_lcomm_internal);
1336 }
1337 #endif
1338
1339 const pseudo_typeS md_pseudo_table[] =
1340 {
1341 #if !defined(OBJ_AOUT) && !defined(USE_ALIGN_PTWO)
1342   {"align", s_align_bytes, 0},
1343 #else
1344   {"align", s_align_ptwo, 0},
1345 #endif
1346   {"arch", set_cpu_arch, 0},
1347 #ifndef I386COFF
1348   {"bss", s_bss, 0},
1349 #else
1350   {"lcomm", pe_lcomm, 1},
1351 #endif
1352   {"ffloat", float_cons, 'f'},
1353   {"dfloat", float_cons, 'd'},
1354   {"tfloat", float_cons, 'x'},
1355   {"value", cons, 2},
1356   {"slong", signed_cons, 4},
1357   {"noopt", s_ignore, 0},
1358   {"optim", s_ignore, 0},
1359   {"code16gcc", set_16bit_gcc_code_flag, CODE_16BIT},
1360   {"code16", set_code_flag, CODE_16BIT},
1361   {"code32", set_code_flag, CODE_32BIT},
1362 #ifdef BFD64
1363   {"code64", set_code_flag, CODE_64BIT},
1364 #endif
1365   {"intel_syntax", set_intel_syntax, 1},
1366   {"att_syntax", set_intel_syntax, 0},
1367   {"intel_mnemonic", set_intel_mnemonic, 1},
1368   {"att_mnemonic", set_intel_mnemonic, 0},
1369   {"allow_index_reg", set_allow_index_reg, 1},
1370   {"disallow_index_reg", set_allow_index_reg, 0},
1371   {"sse_check", set_check, 0},
1372   {"operand_check", set_check, 1},
1373 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
1374   {"largecomm", handle_large_common, 0},
1375 #else
1376   {"file", dwarf2_directive_file, 0},
1377   {"loc", dwarf2_directive_loc, 0},
1378   {"loc_mark_labels", dwarf2_directive_loc_mark_labels, 0},
1379 #endif
1380 #ifdef TE_PE
1381   {"secrel32", pe_directive_secrel, 0},
1382 #endif
1383   {0, 0, 0}
1384 };
1385
1386 /* For interface with expression ().  */
1387 extern char *input_line_pointer;
1388
1389 /* Hash table for instruction mnemonic lookup.  */
1390 static htab_t op_hash;
1391
1392 /* Hash table for register lookup.  */
1393 static htab_t reg_hash;
1394 \f
1395   /* Various efficient no-op patterns for aligning code labels.
1396      Note: Don't try to assemble the instructions in the comments.
1397      0L and 0w are not legal.  */
1398 static const unsigned char f32_1[] =
1399   {0x90};                               /* nop                  */
1400 static const unsigned char f32_2[] =
1401   {0x66,0x90};                          /* xchg %ax,%ax         */
1402 static const unsigned char f32_3[] =
1403   {0x8d,0x76,0x00};                     /* leal 0(%esi),%esi    */
1404 static const unsigned char f32_4[] =
1405   {0x8d,0x74,0x26,0x00};                /* leal 0(%esi,1),%esi  */
1406 static const unsigned char f32_6[] =
1407   {0x8d,0xb6,0x00,0x00,0x00,0x00};      /* leal 0L(%esi),%esi   */
1408 static const unsigned char f32_7[] =
1409   {0x8d,0xb4,0x26,0x00,0x00,0x00,0x00}; /* leal 0L(%esi,1),%esi */
1410 static const unsigned char f16_3[] =
1411   {0x8d,0x74,0x00};                     /* lea 0(%si),%si       */
1412 static const unsigned char f16_4[] =
1413   {0x8d,0xb4,0x00,0x00};                /* lea 0W(%si),%si      */
1414 static const unsigned char jump_disp8[] =
1415   {0xeb};                               /* jmp disp8           */
1416 static const unsigned char jump32_disp32[] =
1417   {0xe9};                               /* jmp disp32          */
1418 static const unsigned char jump16_disp32[] =
1419   {0x66,0xe9};                          /* jmp disp32          */
1420 /* 32-bit NOPs patterns.  */
1421 static const unsigned char *const f32_patt[] = {
1422   f32_1, f32_2, f32_3, f32_4, NULL, f32_6, f32_7
1423 };
1424 /* 16-bit NOPs patterns.  */
1425 static const unsigned char *const f16_patt[] = {
1426   f32_1, f32_2, f16_3, f16_4
1427 };
1428 /* nopl (%[re]ax) */
1429 static const unsigned char alt_3[] =
1430   {0x0f,0x1f,0x00};
1431 /* nopl 0(%[re]ax) */
1432 static const unsigned char alt_4[] =
1433   {0x0f,0x1f,0x40,0x00};
1434 /* nopl 0(%[re]ax,%[re]ax,1) */
1435 static const unsigned char alt_5[] =
1436   {0x0f,0x1f,0x44,0x00,0x00};
1437 /* nopw 0(%[re]ax,%[re]ax,1) */
1438 static const unsigned char alt_6[] =
1439   {0x66,0x0f,0x1f,0x44,0x00,0x00};
1440 /* nopl 0L(%[re]ax) */
1441 static const unsigned char alt_7[] =
1442   {0x0f,0x1f,0x80,0x00,0x00,0x00,0x00};
1443 /* nopl 0L(%[re]ax,%[re]ax,1) */
1444 static const unsigned char alt_8[] =
1445   {0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1446 /* nopw 0L(%[re]ax,%[re]ax,1) */
1447 static const unsigned char alt_9[] =
1448   {0x66,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1449 /* nopw %cs:0L(%[re]ax,%[re]ax,1) */
1450 static const unsigned char alt_10[] =
1451   {0x66,0x2e,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1452 /* data16 nopw %cs:0L(%eax,%eax,1) */
1453 static const unsigned char alt_11[] =
1454   {0x66,0x66,0x2e,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1455 /* 32-bit and 64-bit NOPs patterns.  */
1456 static const unsigned char *const alt_patt[] = {
1457   f32_1, f32_2, alt_3, alt_4, alt_5, alt_6, alt_7, alt_8,
1458   alt_9, alt_10, alt_11
1459 };
1460
1461 /* Genenerate COUNT bytes of NOPs to WHERE from PATT with the maximum
1462    size of a single NOP instruction MAX_SINGLE_NOP_SIZE.  */
1463
1464 static void
1465 i386_output_nops (char *where, const unsigned char *const *patt,
1466                   int count, int max_single_nop_size)
1467
1468 {
1469   /* Place the longer NOP first.  */
1470   int last;
1471   int offset;
1472   const unsigned char *nops;
1473
1474   if (max_single_nop_size < 1)
1475     {
1476       as_fatal (_("i386_output_nops called to generate nops of at most %d bytes!"),
1477                 max_single_nop_size);
1478       return;
1479     }
1480
1481   nops = patt[max_single_nop_size - 1];
1482
1483   /* Use the smaller one if the requsted one isn't available.  */
1484   if (nops == NULL)
1485     {
1486       max_single_nop_size--;
1487       nops = patt[max_single_nop_size - 1];
1488     }
1489
1490   last = count % max_single_nop_size;
1491
1492   count -= last;
1493   for (offset = 0; offset < count; offset += max_single_nop_size)
1494     memcpy (where + offset, nops, max_single_nop_size);
1495
1496   if (last)
1497     {
1498       nops = patt[last - 1];
1499       if (nops == NULL)
1500         {
1501           /* Use the smaller one plus one-byte NOP if the needed one
1502              isn't available.  */
1503           last--;
1504           nops = patt[last - 1];
1505           memcpy (where + offset, nops, last);
1506           where[offset + last] = *patt[0];
1507         }
1508       else
1509         memcpy (where + offset, nops, last);
1510     }
1511 }
1512
1513 static INLINE int
1514 fits_in_imm7 (offsetT num)
1515 {
1516   return (num & 0x7f) == num;
1517 }
1518
1519 static INLINE int
1520 fits_in_imm31 (offsetT num)
1521 {
1522   return (num & 0x7fffffff) == num;
1523 }
1524
1525 /* Genenerate COUNT bytes of NOPs to WHERE with the maximum size of a
1526    single NOP instruction LIMIT.  */
1527
1528 void
1529 i386_generate_nops (fragS *fragP, char *where, offsetT count, int limit)
1530 {
1531   const unsigned char *const *patt = NULL;
1532   int max_single_nop_size;
1533   /* Maximum number of NOPs before switching to jump over NOPs.  */
1534   int max_number_of_nops;
1535
1536   switch (fragP->fr_type)
1537     {
1538     case rs_fill_nop:
1539     case rs_align_code:
1540       break;
1541     case rs_machine_dependent:
1542       /* Allow NOP padding for jumps and calls.  */
1543       if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PADDING
1544           || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == FUSED_JCC_PADDING)
1545         break;
1546       /* Fall through.  */
1547     default:
1548       return;
1549     }
1550
1551   /* We need to decide which NOP sequence to use for 32bit and
1552      64bit. When -mtune= is used:
1553
1554      1. For PROCESSOR_I386, PROCESSOR_I486, PROCESSOR_PENTIUM and
1555      PROCESSOR_GENERIC32, f32_patt will be used.
1556      2. For the rest, alt_patt will be used.
1557
1558      When -mtune= isn't used, alt_patt will be used if
1559      cpu_arch_isa_flags has CpuNop.  Otherwise, f32_patt will
1560      be used.
1561
1562      When -march= or .arch is used, we can't use anything beyond
1563      cpu_arch_isa_flags.   */
1564
1565   if (flag_code == CODE_16BIT)
1566     {
1567       patt = f16_patt;
1568       max_single_nop_size = sizeof (f16_patt) / sizeof (f16_patt[0]);
1569       /* Limit number of NOPs to 2 in 16-bit mode.  */
1570       max_number_of_nops = 2;
1571     }
1572   else
1573     {
1574       if (fragP->tc_frag_data.isa == PROCESSOR_UNKNOWN)
1575         {
1576           /* PROCESSOR_UNKNOWN means that all ISAs may be used.  */
1577           switch (cpu_arch_tune)
1578             {
1579             case PROCESSOR_UNKNOWN:
1580               /* We use cpu_arch_isa_flags to check if we SHOULD
1581                  optimize with nops.  */
1582               if (fragP->tc_frag_data.isa_flags.bitfield.cpunop)
1583                 patt = alt_patt;
1584               else
1585                 patt = f32_patt;
1586               break;
1587             case PROCESSOR_PENTIUM4:
1588             case PROCESSOR_NOCONA:
1589             case PROCESSOR_CORE:
1590             case PROCESSOR_CORE2:
1591             case PROCESSOR_COREI7:
1592             case PROCESSOR_L1OM:
1593             case PROCESSOR_K1OM:
1594             case PROCESSOR_GENERIC64:
1595             case PROCESSOR_K6:
1596             case PROCESSOR_ATHLON:
1597             case PROCESSOR_K8:
1598             case PROCESSOR_AMDFAM10:
1599             case PROCESSOR_BD:
1600             case PROCESSOR_ZNVER:
1601             case PROCESSOR_BT:
1602               patt = alt_patt;
1603               break;
1604             case PROCESSOR_I386:
1605             case PROCESSOR_I486:
1606             case PROCESSOR_PENTIUM:
1607             case PROCESSOR_PENTIUMPRO:
1608             case PROCESSOR_IAMCU:
1609             case PROCESSOR_GENERIC32:
1610               patt = f32_patt;
1611               break;
1612             }
1613         }
1614       else
1615         {
1616           switch (fragP->tc_frag_data.tune)
1617             {
1618             case PROCESSOR_UNKNOWN:
1619               /* When cpu_arch_isa is set, cpu_arch_tune shouldn't be
1620                  PROCESSOR_UNKNOWN.  */
1621               abort ();
1622               break;
1623
1624             case PROCESSOR_I386:
1625             case PROCESSOR_I486:
1626             case PROCESSOR_PENTIUM:
1627             case PROCESSOR_IAMCU:
1628             case PROCESSOR_K6:
1629             case PROCESSOR_ATHLON:
1630             case PROCESSOR_K8:
1631             case PROCESSOR_AMDFAM10:
1632             case PROCESSOR_BD:
1633             case PROCESSOR_ZNVER:
1634             case PROCESSOR_BT:
1635             case PROCESSOR_GENERIC32:
1636               /* We use cpu_arch_isa_flags to check if we CAN optimize
1637                  with nops.  */
1638               if (fragP->tc_frag_data.isa_flags.bitfield.cpunop)
1639                 patt = alt_patt;
1640               else
1641                 patt = f32_patt;
1642               break;
1643             case PROCESSOR_PENTIUMPRO:
1644             case PROCESSOR_PENTIUM4:
1645             case PROCESSOR_NOCONA:
1646             case PROCESSOR_CORE:
1647             case PROCESSOR_CORE2:
1648             case PROCESSOR_COREI7:
1649             case PROCESSOR_L1OM:
1650             case PROCESSOR_K1OM:
1651               if (fragP->tc_frag_data.isa_flags.bitfield.cpunop)
1652                 patt = alt_patt;
1653               else
1654                 patt = f32_patt;
1655               break;
1656             case PROCESSOR_GENERIC64:
1657               patt = alt_patt;
1658               break;
1659             }
1660         }
1661
1662       if (patt == f32_patt)
1663         {
1664           max_single_nop_size = sizeof (f32_patt) / sizeof (f32_patt[0]);
1665           /* Limit number of NOPs to 2 for older processors.  */
1666           max_number_of_nops = 2;
1667         }
1668       else
1669         {
1670           max_single_nop_size = sizeof (alt_patt) / sizeof (alt_patt[0]);
1671           /* Limit number of NOPs to 7 for newer processors.  */
1672           max_number_of_nops = 7;
1673         }
1674     }
1675
1676   if (limit == 0)
1677     limit = max_single_nop_size;
1678
1679   if (fragP->fr_type == rs_fill_nop)
1680     {
1681       /* Output NOPs for .nop directive.  */
1682       if (limit > max_single_nop_size)
1683         {
1684           as_bad_where (fragP->fr_file, fragP->fr_line,
1685                         _("invalid single nop size: %d "
1686                           "(expect within [0, %d])"),
1687                         limit, max_single_nop_size);
1688           return;
1689         }
1690     }
1691   else if (fragP->fr_type != rs_machine_dependent)
1692     fragP->fr_var = count;
1693
1694   if ((count / max_single_nop_size) > max_number_of_nops)
1695     {
1696       /* Generate jump over NOPs.  */
1697       offsetT disp = count - 2;
1698       if (fits_in_imm7 (disp))
1699         {
1700           /* Use "jmp disp8" if possible.  */
1701           count = disp;
1702           where[0] = jump_disp8[0];
1703           where[1] = count;
1704           where += 2;
1705         }
1706       else
1707         {
1708           unsigned int size_of_jump;
1709
1710           if (flag_code == CODE_16BIT)
1711             {
1712               where[0] = jump16_disp32[0];
1713               where[1] = jump16_disp32[1];
1714               size_of_jump = 2;
1715             }
1716           else
1717             {
1718               where[0] = jump32_disp32[0];
1719               size_of_jump = 1;
1720             }
1721
1722           count -= size_of_jump + 4;
1723           if (!fits_in_imm31 (count))
1724             {
1725               as_bad_where (fragP->fr_file, fragP->fr_line,
1726                             _("jump over nop padding out of range"));
1727               return;
1728             }
1729
1730           md_number_to_chars (where + size_of_jump, count, 4);
1731           where += size_of_jump + 4;
1732         }
1733     }
1734
1735   /* Generate multiple NOPs.  */
1736   i386_output_nops (where, patt, count, limit);
1737 }
1738
1739 static INLINE int
1740 operand_type_all_zero (const union i386_operand_type *x)
1741 {
1742   switch (ARRAY_SIZE(x->array))
1743     {
1744     case 3:
1745       if (x->array[2])
1746         return 0;
1747       /* Fall through.  */
1748     case 2:
1749       if (x->array[1])
1750         return 0;
1751       /* Fall through.  */
1752     case 1:
1753       return !x->array[0];
1754     default:
1755       abort ();
1756     }
1757 }
1758
1759 static INLINE void
1760 operand_type_set (union i386_operand_type *x, unsigned int v)
1761 {
1762   switch (ARRAY_SIZE(x->array))
1763     {
1764     case 3:
1765       x->array[2] = v;
1766       /* Fall through.  */
1767     case 2:
1768       x->array[1] = v;
1769       /* Fall through.  */
1770     case 1:
1771       x->array[0] = v;
1772       /* Fall through.  */
1773       break;
1774     default:
1775       abort ();
1776     }
1777
1778   x->bitfield.class = ClassNone;
1779   x->bitfield.instance = InstanceNone;
1780 }
1781
1782 static INLINE int
1783 operand_type_equal (const union i386_operand_type *x,
1784                     const union i386_operand_type *y)
1785 {
1786   switch (ARRAY_SIZE(x->array))
1787     {
1788     case 3:
1789       if (x->array[2] != y->array[2])
1790         return 0;
1791       /* Fall through.  */
1792     case 2:
1793       if (x->array[1] != y->array[1])
1794         return 0;
1795       /* Fall through.  */
1796     case 1:
1797       return x->array[0] == y->array[0];
1798       break;
1799     default:
1800       abort ();
1801     }
1802 }
1803
1804 static INLINE int
1805 cpu_flags_all_zero (const union i386_cpu_flags *x)
1806 {
1807   switch (ARRAY_SIZE(x->array))
1808     {
1809     case 4:
1810       if (x->array[3])
1811         return 0;
1812       /* Fall through.  */
1813     case 3:
1814       if (x->array[2])
1815         return 0;
1816       /* Fall through.  */
1817     case 2:
1818       if (x->array[1])
1819         return 0;
1820       /* Fall through.  */
1821     case 1:
1822       return !x->array[0];
1823     default:
1824       abort ();
1825     }
1826 }
1827
1828 static INLINE int
1829 cpu_flags_equal (const union i386_cpu_flags *x,
1830                  const union i386_cpu_flags *y)
1831 {
1832   switch (ARRAY_SIZE(x->array))
1833     {
1834     case 4:
1835       if (x->array[3] != y->array[3])
1836         return 0;
1837       /* Fall through.  */
1838     case 3:
1839       if (x->array[2] != y->array[2])
1840         return 0;
1841       /* Fall through.  */
1842     case 2:
1843       if (x->array[1] != y->array[1])
1844         return 0;
1845       /* Fall through.  */
1846     case 1:
1847       return x->array[0] == y->array[0];
1848       break;
1849     default:
1850       abort ();
1851     }
1852 }
1853
1854 static INLINE int
1855 cpu_flags_check_cpu64 (i386_cpu_flags f)
1856 {
1857   return !((flag_code == CODE_64BIT && f.bitfield.cpuno64)
1858            || (flag_code != CODE_64BIT && f.bitfield.cpu64));
1859 }
1860
1861 static INLINE i386_cpu_flags
1862 cpu_flags_and (i386_cpu_flags x, i386_cpu_flags y)
1863 {
1864   switch (ARRAY_SIZE (x.array))
1865     {
1866     case 4:
1867       x.array [3] &= y.array [3];
1868       /* Fall through.  */
1869     case 3:
1870       x.array [2] &= y.array [2];
1871       /* Fall through.  */
1872     case 2:
1873       x.array [1] &= y.array [1];
1874       /* Fall through.  */
1875     case 1:
1876       x.array [0] &= y.array [0];
1877       break;
1878     default:
1879       abort ();
1880     }
1881   return x;
1882 }
1883
1884 static INLINE i386_cpu_flags
1885 cpu_flags_or (i386_cpu_flags x, i386_cpu_flags y)
1886 {
1887   switch (ARRAY_SIZE (x.array))
1888     {
1889     case 4:
1890       x.array [3] |= y.array [3];
1891       /* Fall through.  */
1892     case 3:
1893       x.array [2] |= y.array [2];
1894       /* Fall through.  */
1895     case 2:
1896       x.array [1] |= y.array [1];
1897       /* Fall through.  */
1898     case 1:
1899       x.array [0] |= y.array [0];
1900       break;
1901     default:
1902       abort ();
1903     }
1904   return x;
1905 }
1906
1907 static INLINE i386_cpu_flags
1908 cpu_flags_and_not (i386_cpu_flags x, i386_cpu_flags y)
1909 {
1910   switch (ARRAY_SIZE (x.array))
1911     {
1912     case 4:
1913       x.array [3] &= ~y.array [3];
1914       /* Fall through.  */
1915     case 3:
1916       x.array [2] &= ~y.array [2];
1917       /* Fall through.  */
1918     case 2:
1919       x.array [1] &= ~y.array [1];
1920       /* Fall through.  */
1921     case 1:
1922       x.array [0] &= ~y.array [0];
1923       break;
1924     default:
1925       abort ();
1926     }
1927   return x;
1928 }
1929
1930 static const i386_cpu_flags avx512 = CPU_ANY_AVX512F_FLAGS;
1931
1932 #define CPU_FLAGS_ARCH_MATCH            0x1
1933 #define CPU_FLAGS_64BIT_MATCH           0x2
1934
1935 #define CPU_FLAGS_PERFECT_MATCH \
1936   (CPU_FLAGS_ARCH_MATCH | CPU_FLAGS_64BIT_MATCH)
1937
1938 /* Return CPU flags match bits. */
1939
1940 static int
1941 cpu_flags_match (const insn_template *t)
1942 {
1943   i386_cpu_flags x = t->cpu_flags;
1944   int match = cpu_flags_check_cpu64 (x) ? CPU_FLAGS_64BIT_MATCH : 0;
1945
1946   x.bitfield.cpu64 = 0;
1947   x.bitfield.cpuno64 = 0;
1948
1949   if (cpu_flags_all_zero (&x))
1950     {
1951       /* This instruction is available on all archs.  */
1952       match |= CPU_FLAGS_ARCH_MATCH;
1953     }
1954   else
1955     {
1956       /* This instruction is available only on some archs.  */
1957       i386_cpu_flags cpu = cpu_arch_flags;
1958
1959       /* AVX512VL is no standalone feature - match it and then strip it.  */
1960       if (x.bitfield.cpuavx512vl && !cpu.bitfield.cpuavx512vl)
1961         return match;
1962       x.bitfield.cpuavx512vl = 0;
1963
1964       cpu = cpu_flags_and (x, cpu);
1965       if (!cpu_flags_all_zero (&cpu))
1966         {
1967           if (x.bitfield.cpuavx)
1968             {
1969               /* We need to check a few extra flags with AVX.  */
1970               if (cpu.bitfield.cpuavx
1971                   && (!t->opcode_modifier.sse2avx
1972                       || (sse2avx && !i.prefix[DATA_PREFIX]))
1973                   && (!x.bitfield.cpuaes || cpu.bitfield.cpuaes)
1974                   && (!x.bitfield.cpugfni || cpu.bitfield.cpugfni)
1975                   && (!x.bitfield.cpupclmul || cpu.bitfield.cpupclmul))
1976                 match |= CPU_FLAGS_ARCH_MATCH;
1977             }
1978           else if (x.bitfield.cpuavx512f)
1979             {
1980               /* We need to check a few extra flags with AVX512F.  */
1981               if (cpu.bitfield.cpuavx512f
1982                   && (!x.bitfield.cpugfni || cpu.bitfield.cpugfni)
1983                   && (!x.bitfield.cpuvaes || cpu.bitfield.cpuvaes)
1984                   && (!x.bitfield.cpuvpclmulqdq || cpu.bitfield.cpuvpclmulqdq))
1985                 match |= CPU_FLAGS_ARCH_MATCH;
1986             }
1987           else
1988             match |= CPU_FLAGS_ARCH_MATCH;
1989         }
1990     }
1991   return match;
1992 }
1993
1994 static INLINE i386_operand_type
1995 operand_type_and (i386_operand_type x, i386_operand_type y)
1996 {
1997   if (x.bitfield.class != y.bitfield.class)
1998     x.bitfield.class = ClassNone;
1999   if (x.bitfield.instance != y.bitfield.instance)
2000     x.bitfield.instance = InstanceNone;
2001
2002   switch (ARRAY_SIZE (x.array))
2003     {
2004     case 3:
2005       x.array [2] &= y.array [2];
2006       /* Fall through.  */
2007     case 2:
2008       x.array [1] &= y.array [1];
2009       /* Fall through.  */
2010     case 1:
2011       x.array [0] &= y.array [0];
2012       break;
2013     default:
2014       abort ();
2015     }
2016   return x;
2017 }
2018
2019 static INLINE i386_operand_type
2020 operand_type_and_not (i386_operand_type x, i386_operand_type y)
2021 {
2022   gas_assert (y.bitfield.class == ClassNone);
2023   gas_assert (y.bitfield.instance == InstanceNone);
2024
2025   switch (ARRAY_SIZE (x.array))
2026     {
2027     case 3:
2028       x.array [2] &= ~y.array [2];
2029       /* Fall through.  */
2030     case 2:
2031       x.array [1] &= ~y.array [1];
2032       /* Fall through.  */
2033     case 1:
2034       x.array [0] &= ~y.array [0];
2035       break;
2036     default:
2037       abort ();
2038     }
2039   return x;
2040 }
2041
2042 static INLINE i386_operand_type
2043 operand_type_or (i386_operand_type x, i386_operand_type y)
2044 {
2045   gas_assert (x.bitfield.class == ClassNone ||
2046               y.bitfield.class == ClassNone ||
2047               x.bitfield.class == y.bitfield.class);
2048   gas_assert (x.bitfield.instance == InstanceNone ||
2049               y.bitfield.instance == InstanceNone ||
2050               x.bitfield.instance == y.bitfield.instance);
2051
2052   switch (ARRAY_SIZE (x.array))
2053     {
2054     case 3:
2055       x.array [2] |= y.array [2];
2056       /* Fall through.  */
2057     case 2:
2058       x.array [1] |= y.array [1];
2059       /* Fall through.  */
2060     case 1:
2061       x.array [0] |= y.array [0];
2062       break;
2063     default:
2064       abort ();
2065     }
2066   return x;
2067 }
2068
2069 static INLINE i386_operand_type
2070 operand_type_xor (i386_operand_type x, i386_operand_type y)
2071 {
2072   gas_assert (y.bitfield.class == ClassNone);
2073   gas_assert (y.bitfield.instance == InstanceNone);
2074
2075   switch (ARRAY_SIZE (x.array))
2076     {
2077     case 3:
2078       x.array [2] ^= y.array [2];
2079       /* Fall through.  */
2080     case 2:
2081       x.array [1] ^= y.array [1];
2082       /* Fall through.  */
2083     case 1:
2084       x.array [0] ^= y.array [0];
2085       break;
2086     default:
2087       abort ();
2088     }
2089   return x;
2090 }
2091
2092 static const i386_operand_type disp16 = OPERAND_TYPE_DISP16;
2093 static const i386_operand_type disp32 = OPERAND_TYPE_DISP32;
2094 static const i386_operand_type disp32s = OPERAND_TYPE_DISP32S;
2095 static const i386_operand_type disp16_32 = OPERAND_TYPE_DISP16_32;
2096 static const i386_operand_type anydisp = OPERAND_TYPE_ANYDISP;
2097 static const i386_operand_type anyimm = OPERAND_TYPE_ANYIMM;
2098 static const i386_operand_type regxmm = OPERAND_TYPE_REGXMM;
2099 static const i386_operand_type regmask = OPERAND_TYPE_REGMASK;
2100 static const i386_operand_type imm8 = OPERAND_TYPE_IMM8;
2101 static const i386_operand_type imm8s = OPERAND_TYPE_IMM8S;
2102 static const i386_operand_type imm16 = OPERAND_TYPE_IMM16;
2103 static const i386_operand_type imm32 = OPERAND_TYPE_IMM32;
2104 static const i386_operand_type imm32s = OPERAND_TYPE_IMM32S;
2105 static const i386_operand_type imm64 = OPERAND_TYPE_IMM64;
2106 static const i386_operand_type imm16_32 = OPERAND_TYPE_IMM16_32;
2107 static const i386_operand_type imm16_32s = OPERAND_TYPE_IMM16_32S;
2108 static const i386_operand_type imm16_32_32s = OPERAND_TYPE_IMM16_32_32S;
2109
2110 enum operand_type
2111 {
2112   reg,
2113   imm,
2114   disp,
2115   anymem
2116 };
2117
2118 static INLINE int
2119 operand_type_check (i386_operand_type t, enum operand_type c)
2120 {
2121   switch (c)
2122     {
2123     case reg:
2124       return t.bitfield.class == Reg;
2125
2126     case imm:
2127       return (t.bitfield.imm8
2128               || t.bitfield.imm8s
2129               || t.bitfield.imm16
2130               || t.bitfield.imm32
2131               || t.bitfield.imm32s
2132               || t.bitfield.imm64);
2133
2134     case disp:
2135       return (t.bitfield.disp8
2136               || t.bitfield.disp16
2137               || t.bitfield.disp32
2138               || t.bitfield.disp32s
2139               || t.bitfield.disp64);
2140
2141     case anymem:
2142       return (t.bitfield.disp8
2143               || t.bitfield.disp16
2144               || t.bitfield.disp32
2145               || t.bitfield.disp32s
2146               || t.bitfield.disp64
2147               || t.bitfield.baseindex);
2148
2149     default:
2150       abort ();
2151     }
2152
2153   return 0;
2154 }
2155
2156 /* Return 1 if there is no conflict in 8bit/16bit/32bit/64bit/80bit size
2157    between operand GIVEN and opeand WANTED for instruction template T.  */
2158
2159 static INLINE int
2160 match_operand_size (const insn_template *t, unsigned int wanted,
2161                     unsigned int given)
2162 {
2163   return !((i.types[given].bitfield.byte
2164             && !t->operand_types[wanted].bitfield.byte)
2165            || (i.types[given].bitfield.word
2166                && !t->operand_types[wanted].bitfield.word)
2167            || (i.types[given].bitfield.dword
2168                && !t->operand_types[wanted].bitfield.dword)
2169            || (i.types[given].bitfield.qword
2170                && !t->operand_types[wanted].bitfield.qword)
2171            || (i.types[given].bitfield.tbyte
2172                && !t->operand_types[wanted].bitfield.tbyte));
2173 }
2174
2175 /* Return 1 if there is no conflict in SIMD register between operand
2176    GIVEN and opeand WANTED for instruction template T.  */
2177
2178 static INLINE int
2179 match_simd_size (const insn_template *t, unsigned int wanted,
2180                  unsigned int given)
2181 {
2182   return !((i.types[given].bitfield.xmmword
2183             && !t->operand_types[wanted].bitfield.xmmword)
2184            || (i.types[given].bitfield.ymmword
2185                && !t->operand_types[wanted].bitfield.ymmword)
2186            || (i.types[given].bitfield.zmmword
2187                && !t->operand_types[wanted].bitfield.zmmword)
2188            || (i.types[given].bitfield.tmmword
2189                && !t->operand_types[wanted].bitfield.tmmword));
2190 }
2191
2192 /* Return 1 if there is no conflict in any size between operand GIVEN
2193    and opeand WANTED for instruction template T.  */
2194
2195 static INLINE int
2196 match_mem_size (const insn_template *t, unsigned int wanted,
2197                 unsigned int given)
2198 {
2199   return (match_operand_size (t, wanted, given)
2200           && !((i.types[given].bitfield.unspecified
2201                 && !i.broadcast.type
2202                 && !t->operand_types[wanted].bitfield.unspecified)
2203                || (i.types[given].bitfield.fword
2204                    && !t->operand_types[wanted].bitfield.fword)
2205                /* For scalar opcode templates to allow register and memory
2206                   operands at the same time, some special casing is needed
2207                   here.  Also for v{,p}broadcast*, {,v}pmov{s,z}*, and
2208                   down-conversion vpmov*.  */
2209                || ((t->operand_types[wanted].bitfield.class == RegSIMD
2210                     && t->operand_types[wanted].bitfield.byte
2211                        + t->operand_types[wanted].bitfield.word
2212                        + t->operand_types[wanted].bitfield.dword
2213                        + t->operand_types[wanted].bitfield.qword
2214                        > !!t->opcode_modifier.broadcast)
2215                    ? (i.types[given].bitfield.xmmword
2216                       || i.types[given].bitfield.ymmword
2217                       || i.types[given].bitfield.zmmword)
2218                    : !match_simd_size(t, wanted, given))));
2219 }
2220
2221 /* Return value has MATCH_STRAIGHT set if there is no size conflict on any
2222    operands for instruction template T, and it has MATCH_REVERSE set if there
2223    is no size conflict on any operands for the template with operands reversed
2224    (and the template allows for reversing in the first place).  */
2225
2226 #define MATCH_STRAIGHT 1
2227 #define MATCH_REVERSE  2
2228
2229 static INLINE unsigned int
2230 operand_size_match (const insn_template *t)
2231 {
2232   unsigned int j, match = MATCH_STRAIGHT;
2233
2234   /* Don't check non-absolute jump instructions.  */
2235   if (t->opcode_modifier.jump
2236       && t->opcode_modifier.jump != JUMP_ABSOLUTE)
2237     return match;
2238
2239   /* Check memory and accumulator operand size.  */
2240   for (j = 0; j < i.operands; j++)
2241     {
2242       if (i.types[j].bitfield.class != Reg
2243           && i.types[j].bitfield.class != RegSIMD
2244           && t->opcode_modifier.anysize)
2245         continue;
2246
2247       if (t->operand_types[j].bitfield.class == Reg
2248           && !match_operand_size (t, j, j))
2249         {
2250           match = 0;
2251           break;
2252         }
2253
2254       if (t->operand_types[j].bitfield.class == RegSIMD
2255           && !match_simd_size (t, j, j))
2256         {
2257           match = 0;
2258           break;
2259         }
2260
2261       if (t->operand_types[j].bitfield.instance == Accum
2262           && (!match_operand_size (t, j, j) || !match_simd_size (t, j, j)))
2263         {
2264           match = 0;
2265           break;
2266         }
2267
2268       if ((i.flags[j] & Operand_Mem) && !match_mem_size (t, j, j))
2269         {
2270           match = 0;
2271           break;
2272         }
2273     }
2274
2275   if (!t->opcode_modifier.d)
2276     {
2277     mismatch:
2278       if (!match)
2279         i.error = operand_size_mismatch;
2280       return match;
2281     }
2282
2283   /* Check reverse.  */
2284   gas_assert (i.operands >= 2 && i.operands <= 3);
2285
2286   for (j = 0; j < i.operands; j++)
2287     {
2288       unsigned int given = i.operands - j - 1;
2289
2290       if (t->operand_types[j].bitfield.class == Reg
2291           && !match_operand_size (t, j, given))
2292         goto mismatch;
2293
2294       if (t->operand_types[j].bitfield.class == RegSIMD
2295           && !match_simd_size (t, j, given))
2296         goto mismatch;
2297
2298       if (t->operand_types[j].bitfield.instance == Accum
2299           && (!match_operand_size (t, j, given)
2300               || !match_simd_size (t, j, given)))
2301         goto mismatch;
2302
2303       if ((i.flags[given] & Operand_Mem) && !match_mem_size (t, j, given))
2304         goto mismatch;
2305     }
2306
2307   return match | MATCH_REVERSE;
2308 }
2309
2310 static INLINE int
2311 operand_type_match (i386_operand_type overlap,
2312                     i386_operand_type given)
2313 {
2314   i386_operand_type temp = overlap;
2315
2316   temp.bitfield.unspecified = 0;
2317   temp.bitfield.byte = 0;
2318   temp.bitfield.word = 0;
2319   temp.bitfield.dword = 0;
2320   temp.bitfield.fword = 0;
2321   temp.bitfield.qword = 0;
2322   temp.bitfield.tbyte = 0;
2323   temp.bitfield.xmmword = 0;
2324   temp.bitfield.ymmword = 0;
2325   temp.bitfield.zmmword = 0;
2326   temp.bitfield.tmmword = 0;
2327   if (operand_type_all_zero (&temp))
2328     goto mismatch;
2329
2330   if (given.bitfield.baseindex == overlap.bitfield.baseindex)
2331     return 1;
2332
2333  mismatch:
2334   i.error = operand_type_mismatch;
2335   return 0;
2336 }
2337
2338 /* If given types g0 and g1 are registers they must be of the same type
2339    unless the expected operand type register overlap is null.
2340    Some Intel syntax memory operand size checking also happens here.  */
2341
2342 static INLINE int
2343 operand_type_register_match (i386_operand_type g0,
2344                              i386_operand_type t0,
2345                              i386_operand_type g1,
2346                              i386_operand_type t1)
2347 {
2348   if (g0.bitfield.class != Reg
2349       && g0.bitfield.class != RegSIMD
2350       && (!operand_type_check (g0, anymem)
2351           || g0.bitfield.unspecified
2352           || (t0.bitfield.class != Reg
2353               && t0.bitfield.class != RegSIMD)))
2354     return 1;
2355
2356   if (g1.bitfield.class != Reg
2357       && g1.bitfield.class != RegSIMD
2358       && (!operand_type_check (g1, anymem)
2359           || g1.bitfield.unspecified
2360           || (t1.bitfield.class != Reg
2361               && t1.bitfield.class != RegSIMD)))
2362     return 1;
2363
2364   if (g0.bitfield.byte == g1.bitfield.byte
2365       && g0.bitfield.word == g1.bitfield.word
2366       && g0.bitfield.dword == g1.bitfield.dword
2367       && g0.bitfield.qword == g1.bitfield.qword
2368       && g0.bitfield.xmmword == g1.bitfield.xmmword
2369       && g0.bitfield.ymmword == g1.bitfield.ymmword
2370       && g0.bitfield.zmmword == g1.bitfield.zmmword)
2371     return 1;
2372
2373   if (!(t0.bitfield.byte & t1.bitfield.byte)
2374       && !(t0.bitfield.word & t1.bitfield.word)
2375       && !(t0.bitfield.dword & t1.bitfield.dword)
2376       && !(t0.bitfield.qword & t1.bitfield.qword)
2377       && !(t0.bitfield.xmmword & t1.bitfield.xmmword)
2378       && !(t0.bitfield.ymmword & t1.bitfield.ymmword)
2379       && !(t0.bitfield.zmmword & t1.bitfield.zmmword))
2380     return 1;
2381
2382   i.error = register_type_mismatch;
2383
2384   return 0;
2385 }
2386
2387 static INLINE unsigned int
2388 register_number (const reg_entry *r)
2389 {
2390   unsigned int nr = r->reg_num;
2391
2392   if (r->reg_flags & RegRex)
2393     nr += 8;
2394
2395   if (r->reg_flags & RegVRex)
2396     nr += 16;
2397
2398   return nr;
2399 }
2400
2401 static INLINE unsigned int
2402 mode_from_disp_size (i386_operand_type t)
2403 {
2404   if (t.bitfield.disp8)
2405     return 1;
2406   else if (t.bitfield.disp16
2407            || t.bitfield.disp32
2408            || t.bitfield.disp32s)
2409     return 2;
2410   else
2411     return 0;
2412 }
2413
2414 static INLINE int
2415 fits_in_signed_byte (addressT num)
2416 {
2417   return num + 0x80 <= 0xff;
2418 }
2419
2420 static INLINE int
2421 fits_in_unsigned_byte (addressT num)
2422 {
2423   return num <= 0xff;
2424 }
2425
2426 static INLINE int
2427 fits_in_unsigned_word (addressT num)
2428 {
2429   return num <= 0xffff;
2430 }
2431
2432 static INLINE int
2433 fits_in_signed_word (addressT num)
2434 {
2435   return num + 0x8000 <= 0xffff;
2436 }
2437
2438 static INLINE int
2439 fits_in_signed_long (addressT num ATTRIBUTE_UNUSED)
2440 {
2441 #ifndef BFD64
2442   return 1;
2443 #else
2444   return num + 0x80000000 <= 0xffffffff;
2445 #endif
2446 }                               /* fits_in_signed_long() */
2447
2448 static INLINE int
2449 fits_in_unsigned_long (addressT num ATTRIBUTE_UNUSED)
2450 {
2451 #ifndef BFD64
2452   return 1;
2453 #else
2454   return num <= 0xffffffff;
2455 #endif
2456 }                               /* fits_in_unsigned_long() */
2457
2458 static INLINE valueT extend_to_32bit_address (addressT num)
2459 {
2460 #ifdef BFD64
2461   if (fits_in_unsigned_long(num))
2462     return (num ^ ((addressT) 1 << 31)) - ((addressT) 1 << 31);
2463
2464   if (!fits_in_signed_long (num))
2465     return num & 0xffffffff;
2466 #endif
2467
2468   return num;
2469 }
2470
2471 static INLINE int
2472 fits_in_disp8 (offsetT num)
2473 {
2474   int shift = i.memshift;
2475   unsigned int mask;
2476
2477   if (shift == -1)
2478     abort ();
2479
2480   mask = (1 << shift) - 1;
2481
2482   /* Return 0 if NUM isn't properly aligned.  */
2483   if ((num & mask))
2484     return 0;
2485
2486   /* Check if NUM will fit in 8bit after shift.  */
2487   return fits_in_signed_byte (num >> shift);
2488 }
2489
2490 static INLINE int
2491 fits_in_imm4 (offsetT num)
2492 {
2493   return (num & 0xf) == num;
2494 }
2495
2496 static i386_operand_type
2497 smallest_imm_type (offsetT num)
2498 {
2499   i386_operand_type t;
2500
2501   operand_type_set (&t, 0);
2502   t.bitfield.imm64 = 1;
2503
2504   if (cpu_arch_tune != PROCESSOR_I486 && num == 1)
2505     {
2506       /* This code is disabled on the 486 because all the Imm1 forms
2507          in the opcode table are slower on the i486.  They're the
2508          versions with the implicitly specified single-position
2509          displacement, which has another syntax if you really want to
2510          use that form.  */
2511       t.bitfield.imm1 = 1;
2512       t.bitfield.imm8 = 1;
2513       t.bitfield.imm8s = 1;
2514       t.bitfield.imm16 = 1;
2515       t.bitfield.imm32 = 1;
2516       t.bitfield.imm32s = 1;
2517     }
2518   else if (fits_in_signed_byte (num))
2519     {
2520       t.bitfield.imm8 = 1;
2521       t.bitfield.imm8s = 1;
2522       t.bitfield.imm16 = 1;
2523       t.bitfield.imm32 = 1;
2524       t.bitfield.imm32s = 1;
2525     }
2526   else if (fits_in_unsigned_byte (num))
2527     {
2528       t.bitfield.imm8 = 1;
2529       t.bitfield.imm16 = 1;
2530       t.bitfield.imm32 = 1;
2531       t.bitfield.imm32s = 1;
2532     }
2533   else if (fits_in_signed_word (num) || fits_in_unsigned_word (num))
2534     {
2535       t.bitfield.imm16 = 1;
2536       t.bitfield.imm32 = 1;
2537       t.bitfield.imm32s = 1;
2538     }
2539   else if (fits_in_signed_long (num))
2540     {
2541       t.bitfield.imm32 = 1;
2542       t.bitfield.imm32s = 1;
2543     }
2544   else if (fits_in_unsigned_long (num))
2545     t.bitfield.imm32 = 1;
2546
2547   return t;
2548 }
2549
2550 static offsetT
2551 offset_in_range (offsetT val, int size)
2552 {
2553   addressT mask;
2554
2555   switch (size)
2556     {
2557     case 1: mask = ((addressT) 1 <<  8) - 1; break;
2558     case 2: mask = ((addressT) 1 << 16) - 1; break;
2559     case 4: mask = ((addressT) 2 << 31) - 1; break;
2560 #ifdef BFD64
2561     case 8: mask = ((addressT) 2 << 63) - 1; break;
2562 #endif
2563     default: abort ();
2564     }
2565
2566   if ((val & ~mask) != 0 && (-val & ~mask) != 0)
2567     as_warn (_("%"BFD_VMA_FMT"x shortened to %"BFD_VMA_FMT"x"),
2568              val, val & mask);
2569
2570   return val & mask;
2571 }
2572
2573 enum PREFIX_GROUP
2574 {
2575   PREFIX_EXIST = 0,
2576   PREFIX_LOCK,
2577   PREFIX_REP,
2578   PREFIX_DS,
2579   PREFIX_OTHER
2580 };
2581
2582 /* Returns
2583    a. PREFIX_EXIST if attempting to add a prefix where one from the
2584    same class already exists.
2585    b. PREFIX_LOCK if lock prefix is added.
2586    c. PREFIX_REP if rep/repne prefix is added.
2587    d. PREFIX_DS if ds prefix is added.
2588    e. PREFIX_OTHER if other prefix is added.
2589  */
2590
2591 static enum PREFIX_GROUP
2592 add_prefix (unsigned int prefix)
2593 {
2594   enum PREFIX_GROUP ret = PREFIX_OTHER;
2595   unsigned int q;
2596
2597   if (prefix >= REX_OPCODE && prefix < REX_OPCODE + 16
2598       && flag_code == CODE_64BIT)
2599     {
2600       if ((i.prefix[REX_PREFIX] & prefix & REX_W)
2601           || (i.prefix[REX_PREFIX] & prefix & REX_R)
2602           || (i.prefix[REX_PREFIX] & prefix & REX_X)
2603           || (i.prefix[REX_PREFIX] & prefix & REX_B))
2604         ret = PREFIX_EXIST;
2605       q = REX_PREFIX;
2606     }
2607   else
2608     {
2609       switch (prefix)
2610         {
2611         default:
2612           abort ();
2613
2614         case DS_PREFIX_OPCODE:
2615           ret = PREFIX_DS;
2616           /* Fall through.  */
2617         case CS_PREFIX_OPCODE:
2618         case ES_PREFIX_OPCODE:
2619         case FS_PREFIX_OPCODE:
2620         case GS_PREFIX_OPCODE:
2621         case SS_PREFIX_OPCODE:
2622           q = SEG_PREFIX;
2623           break;
2624
2625         case REPNE_PREFIX_OPCODE:
2626         case REPE_PREFIX_OPCODE:
2627           q = REP_PREFIX;
2628           ret = PREFIX_REP;
2629           break;
2630
2631         case LOCK_PREFIX_OPCODE:
2632           q = LOCK_PREFIX;
2633           ret = PREFIX_LOCK;
2634           break;
2635
2636         case FWAIT_OPCODE:
2637           q = WAIT_PREFIX;
2638           break;
2639
2640         case ADDR_PREFIX_OPCODE:
2641           q = ADDR_PREFIX;
2642           break;
2643
2644         case DATA_PREFIX_OPCODE:
2645           q = DATA_PREFIX;
2646           break;
2647         }
2648       if (i.prefix[q] != 0)
2649         ret = PREFIX_EXIST;
2650     }
2651
2652   if (ret)
2653     {
2654       if (!i.prefix[q])
2655         ++i.prefixes;
2656       i.prefix[q] |= prefix;
2657     }
2658   else
2659     as_bad (_("same type of prefix used twice"));
2660
2661   return ret;
2662 }
2663
2664 static void
2665 update_code_flag (int value, int check)
2666 {
2667   PRINTF_LIKE ((*as_error));
2668
2669   flag_code = (enum flag_code) value;
2670   if (flag_code == CODE_64BIT)
2671     {
2672       cpu_arch_flags.bitfield.cpu64 = 1;
2673       cpu_arch_flags.bitfield.cpuno64 = 0;
2674     }
2675   else
2676     {
2677       cpu_arch_flags.bitfield.cpu64 = 0;
2678       cpu_arch_flags.bitfield.cpuno64 = 1;
2679     }
2680   if (value == CODE_64BIT && !cpu_arch_flags.bitfield.cpulm )
2681     {
2682       if (check)
2683         as_error = as_fatal;
2684       else
2685         as_error = as_bad;
2686       (*as_error) (_("64bit mode not supported on `%s'."),
2687                    cpu_arch_name ? cpu_arch_name : default_arch);
2688     }
2689   if (value == CODE_32BIT && !cpu_arch_flags.bitfield.cpui386)
2690     {
2691       if (check)
2692         as_error = as_fatal;
2693       else
2694         as_error = as_bad;
2695       (*as_error) (_("32bit mode not supported on `%s'."),
2696                    cpu_arch_name ? cpu_arch_name : default_arch);
2697     }
2698   stackop_size = '\0';
2699 }
2700
2701 static void
2702 set_code_flag (int value)
2703 {
2704   update_code_flag (value, 0);
2705 }
2706
2707 static void
2708 set_16bit_gcc_code_flag (int new_code_flag)
2709 {
2710   flag_code = (enum flag_code) new_code_flag;
2711   if (flag_code != CODE_16BIT)
2712     abort ();
2713   cpu_arch_flags.bitfield.cpu64 = 0;
2714   cpu_arch_flags.bitfield.cpuno64 = 1;
2715   stackop_size = LONG_MNEM_SUFFIX;
2716 }
2717
2718 static void
2719 set_intel_syntax (int syntax_flag)
2720 {
2721   /* Find out if register prefixing is specified.  */
2722   int ask_naked_reg = 0;
2723
2724   SKIP_WHITESPACE ();
2725   if (!is_end_of_line[(unsigned char) *input_line_pointer])
2726     {
2727       char *string;
2728       int e = get_symbol_name (&string);
2729
2730       if (strcmp (string, "prefix") == 0)
2731         ask_naked_reg = 1;
2732       else if (strcmp (string, "noprefix") == 0)
2733         ask_naked_reg = -1;
2734       else
2735         as_bad (_("bad argument to syntax directive."));
2736       (void) restore_line_pointer (e);
2737     }
2738   demand_empty_rest_of_line ();
2739
2740   intel_syntax = syntax_flag;
2741
2742   if (ask_naked_reg == 0)
2743     allow_naked_reg = (intel_syntax
2744                        && (bfd_get_symbol_leading_char (stdoutput) != '\0'));
2745   else
2746     allow_naked_reg = (ask_naked_reg < 0);
2747
2748   expr_set_rank (O_full_ptr, syntax_flag ? 10 : 0);
2749
2750   identifier_chars['%'] = intel_syntax && allow_naked_reg ? '%' : 0;
2751   identifier_chars['$'] = intel_syntax ? '$' : 0;
2752   register_prefix = allow_naked_reg ? "" : "%";
2753 }
2754
2755 static void
2756 set_intel_mnemonic (int mnemonic_flag)
2757 {
2758   intel_mnemonic = mnemonic_flag;
2759 }
2760
2761 static void
2762 set_allow_index_reg (int flag)
2763 {
2764   allow_index_reg = flag;
2765 }
2766
2767 static void
2768 set_check (int what)
2769 {
2770   enum check_kind *kind;
2771   const char *str;
2772
2773   if (what)
2774     {
2775       kind = &operand_check;
2776       str = "operand";
2777     }
2778   else
2779     {
2780       kind = &sse_check;
2781       str = "sse";
2782     }
2783
2784   SKIP_WHITESPACE ();
2785
2786   if (!is_end_of_line[(unsigned char) *input_line_pointer])
2787     {
2788       char *string;
2789       int e = get_symbol_name (&string);
2790
2791       if (strcmp (string, "none") == 0)
2792         *kind = check_none;
2793       else if (strcmp (string, "warning") == 0)
2794         *kind = check_warning;
2795       else if (strcmp (string, "error") == 0)
2796         *kind = check_error;
2797       else
2798         as_bad (_("bad argument to %s_check directive."), str);
2799       (void) restore_line_pointer (e);
2800     }
2801   else
2802     as_bad (_("missing argument for %s_check directive"), str);
2803
2804   demand_empty_rest_of_line ();
2805 }
2806
2807 static void
2808 check_cpu_arch_compatible (const char *name ATTRIBUTE_UNUSED,
2809                            i386_cpu_flags new_flag ATTRIBUTE_UNUSED)
2810 {
2811 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
2812   static const char *arch;
2813
2814   /* Intel LIOM is only supported on ELF.  */
2815   if (!IS_ELF)
2816     return;
2817
2818   if (!arch)
2819     {
2820       /* Use cpu_arch_name if it is set in md_parse_option.  Otherwise
2821          use default_arch.  */
2822       arch = cpu_arch_name;
2823       if (!arch)
2824         arch = default_arch;
2825     }
2826
2827   /* If we are targeting Intel MCU, we must enable it.  */
2828   if (get_elf_backend_data (stdoutput)->elf_machine_code != EM_IAMCU
2829       || new_flag.bitfield.cpuiamcu)
2830     return;
2831
2832   /* If we are targeting Intel L1OM, we must enable it.  */
2833   if (get_elf_backend_data (stdoutput)->elf_machine_code != EM_L1OM
2834       || new_flag.bitfield.cpul1om)
2835     return;
2836
2837   /* If we are targeting Intel K1OM, we must enable it.  */
2838   if (get_elf_backend_data (stdoutput)->elf_machine_code != EM_K1OM
2839       || new_flag.bitfield.cpuk1om)
2840     return;
2841
2842   as_bad (_("`%s' is not supported on `%s'"), name, arch);
2843 #endif
2844 }
2845
2846 static void
2847 set_cpu_arch (int dummy ATTRIBUTE_UNUSED)
2848 {
2849   SKIP_WHITESPACE ();
2850
2851   if (!is_end_of_line[(unsigned char) *input_line_pointer])
2852     {
2853       char *string;
2854       int e = get_symbol_name (&string);
2855       unsigned int j;
2856       i386_cpu_flags flags;
2857
2858       for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
2859         {
2860           if (strcmp (string, cpu_arch[j].name) == 0)
2861             {
2862               check_cpu_arch_compatible (string, cpu_arch[j].flags);
2863
2864               if (*string != '.')
2865                 {
2866                   cpu_arch_name = cpu_arch[j].name;
2867                   cpu_sub_arch_name = NULL;
2868                   cpu_arch_flags = cpu_arch[j].flags;
2869                   if (flag_code == CODE_64BIT)
2870                     {
2871                       cpu_arch_flags.bitfield.cpu64 = 1;
2872                       cpu_arch_flags.bitfield.cpuno64 = 0;
2873                     }
2874                   else
2875                     {
2876                       cpu_arch_flags.bitfield.cpu64 = 0;
2877                       cpu_arch_flags.bitfield.cpuno64 = 1;
2878                     }
2879                   cpu_arch_isa = cpu_arch[j].type;
2880                   cpu_arch_isa_flags = cpu_arch[j].flags;
2881                   if (!cpu_arch_tune_set)
2882                     {
2883                       cpu_arch_tune = cpu_arch_isa;
2884                       cpu_arch_tune_flags = cpu_arch_isa_flags;
2885                     }
2886                   break;
2887                 }
2888
2889               flags = cpu_flags_or (cpu_arch_flags,
2890                                     cpu_arch[j].flags);
2891
2892               if (!cpu_flags_equal (&flags, &cpu_arch_flags))
2893                 {
2894                   if (cpu_sub_arch_name)
2895                     {
2896                       char *name = cpu_sub_arch_name;
2897                       cpu_sub_arch_name = concat (name,
2898                                                   cpu_arch[j].name,
2899                                                   (const char *) NULL);
2900                       free (name);
2901                     }
2902                   else
2903                     cpu_sub_arch_name = xstrdup (cpu_arch[j].name);
2904                   cpu_arch_flags = flags;
2905                   cpu_arch_isa_flags = flags;
2906                 }
2907               else
2908                 cpu_arch_isa_flags
2909                   = cpu_flags_or (cpu_arch_isa_flags,
2910                                   cpu_arch[j].flags);
2911               (void) restore_line_pointer (e);
2912               demand_empty_rest_of_line ();
2913               return;
2914             }
2915         }
2916
2917       if (*string == '.' && j >= ARRAY_SIZE (cpu_arch))
2918         {
2919           /* Disable an ISA extension.  */
2920           for (j = 0; j < ARRAY_SIZE (cpu_noarch); j++)
2921             if (strcmp (string + 1, cpu_noarch [j].name) == 0)
2922               {
2923                 flags = cpu_flags_and_not (cpu_arch_flags,
2924                                            cpu_noarch[j].flags);
2925                 if (!cpu_flags_equal (&flags, &cpu_arch_flags))
2926                   {
2927                     if (cpu_sub_arch_name)
2928                       {
2929                         char *name = cpu_sub_arch_name;
2930                         cpu_sub_arch_name = concat (name, string,
2931                                                     (const char *) NULL);
2932                         free (name);
2933                       }
2934                     else
2935                       cpu_sub_arch_name = xstrdup (string);
2936                     cpu_arch_flags = flags;
2937                     cpu_arch_isa_flags = flags;
2938                   }
2939                 (void) restore_line_pointer (e);
2940                 demand_empty_rest_of_line ();
2941                 return;
2942               }
2943
2944           j = ARRAY_SIZE (cpu_arch);
2945         }
2946
2947       if (j >= ARRAY_SIZE (cpu_arch))
2948         as_bad (_("no such architecture: `%s'"), string);
2949
2950       *input_line_pointer = e;
2951     }
2952   else
2953     as_bad (_("missing cpu architecture"));
2954
2955   no_cond_jump_promotion = 0;
2956   if (*input_line_pointer == ','
2957       && !is_end_of_line[(unsigned char) input_line_pointer[1]])
2958     {
2959       char *string;
2960       char e;
2961
2962       ++input_line_pointer;
2963       e = get_symbol_name (&string);
2964
2965       if (strcmp (string, "nojumps") == 0)
2966         no_cond_jump_promotion = 1;
2967       else if (strcmp (string, "jumps") == 0)
2968         ;
2969       else
2970         as_bad (_("no such architecture modifier: `%s'"), string);
2971
2972       (void) restore_line_pointer (e);
2973     }
2974
2975   demand_empty_rest_of_line ();
2976 }
2977
2978 enum bfd_architecture
2979 i386_arch (void)
2980 {
2981   if (cpu_arch_isa == PROCESSOR_L1OM)
2982     {
2983       if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2984           || flag_code != CODE_64BIT)
2985         as_fatal (_("Intel L1OM is 64bit ELF only"));
2986       return bfd_arch_l1om;
2987     }
2988   else if (cpu_arch_isa == PROCESSOR_K1OM)
2989     {
2990       if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2991           || flag_code != CODE_64BIT)
2992         as_fatal (_("Intel K1OM is 64bit ELF only"));
2993       return bfd_arch_k1om;
2994     }
2995   else if (cpu_arch_isa == PROCESSOR_IAMCU)
2996     {
2997       if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2998           || flag_code == CODE_64BIT)
2999         as_fatal (_("Intel MCU is 32bit ELF only"));
3000       return bfd_arch_iamcu;
3001     }
3002   else
3003     return bfd_arch_i386;
3004 }
3005
3006 unsigned long
3007 i386_mach (void)
3008 {
3009   if (startswith (default_arch, "x86_64"))
3010     {
3011       if (cpu_arch_isa == PROCESSOR_L1OM)
3012         {
3013           if (OUTPUT_FLAVOR != bfd_target_elf_flavour
3014               || default_arch[6] != '\0')
3015             as_fatal (_("Intel L1OM is 64bit ELF only"));
3016           return bfd_mach_l1om;
3017         }
3018       else if (cpu_arch_isa == PROCESSOR_K1OM)
3019         {
3020           if (OUTPUT_FLAVOR != bfd_target_elf_flavour
3021               || default_arch[6] != '\0')
3022             as_fatal (_("Intel K1OM is 64bit ELF only"));
3023           return bfd_mach_k1om;
3024         }
3025       else if (default_arch[6] == '\0')
3026         return bfd_mach_x86_64;
3027       else
3028         return bfd_mach_x64_32;
3029     }
3030   else if (!strcmp (default_arch, "i386")
3031            || !strcmp (default_arch, "iamcu"))
3032     {
3033       if (cpu_arch_isa == PROCESSOR_IAMCU)
3034         {
3035           if (OUTPUT_FLAVOR != bfd_target_elf_flavour)
3036             as_fatal (_("Intel MCU is 32bit ELF only"));
3037           return bfd_mach_i386_iamcu;
3038         }
3039       else
3040         return bfd_mach_i386_i386;
3041     }
3042   else
3043     as_fatal (_("unknown architecture"));
3044 }
3045 \f
3046 void
3047 md_begin (void)
3048 {
3049   /* Support pseudo prefixes like {disp32}.  */
3050   lex_type ['{'] = LEX_BEGIN_NAME;
3051
3052   /* Initialize op_hash hash table.  */
3053   op_hash = str_htab_create ();
3054
3055   {
3056     const insn_template *optab;
3057     templates *core_optab;
3058
3059     /* Setup for loop.  */
3060     optab = i386_optab;
3061     core_optab = XNEW (templates);
3062     core_optab->start = optab;
3063
3064     while (1)
3065       {
3066         ++optab;
3067         if (optab->name == NULL
3068             || strcmp (optab->name, (optab - 1)->name) != 0)
3069           {
3070             /* different name --> ship out current template list;
3071                add to hash table; & begin anew.  */
3072             core_optab->end = optab;
3073             if (str_hash_insert (op_hash, (optab - 1)->name, core_optab, 0))
3074               as_fatal (_("duplicate %s"), (optab - 1)->name);
3075
3076             if (optab->name == NULL)
3077               break;
3078             core_optab = XNEW (templates);
3079             core_optab->start = optab;
3080           }
3081       }
3082   }
3083
3084   /* Initialize reg_hash hash table.  */
3085   reg_hash = str_htab_create ();
3086   {
3087     const reg_entry *regtab;
3088     unsigned int regtab_size = i386_regtab_size;
3089
3090     for (regtab = i386_regtab; regtab_size--; regtab++)
3091       {
3092         switch (regtab->reg_type.bitfield.class)
3093           {
3094           case Reg:
3095             if (regtab->reg_type.bitfield.dword)
3096               {
3097                 if (regtab->reg_type.bitfield.instance == Accum)
3098                   reg_eax = regtab;
3099               }
3100             else if (regtab->reg_type.bitfield.tbyte)
3101               {
3102                 /* There's no point inserting st(<N>) in the hash table, as
3103                    parentheses aren't included in register_chars[] anyway.  */
3104                 if (regtab->reg_type.bitfield.instance != Accum)
3105                   continue;
3106                 reg_st0 = regtab;
3107               }
3108             break;
3109
3110           case SReg:
3111             switch (regtab->reg_num)
3112               {
3113               case 0: reg_es = regtab; break;
3114               case 2: reg_ss = regtab; break;
3115               case 3: reg_ds = regtab; break;
3116               }
3117             break;
3118
3119           case RegMask:
3120             if (!regtab->reg_num)
3121               reg_k0 = regtab;
3122             break;
3123           }
3124
3125         if (str_hash_insert (reg_hash, regtab->reg_name, regtab, 0) != NULL)
3126           as_fatal (_("duplicate %s"), regtab->reg_name);
3127       }
3128   }
3129
3130   /* Fill in lexical tables:  mnemonic_chars, operand_chars.  */
3131   {
3132     int c;
3133     char *p;
3134
3135     for (c = 0; c < 256; c++)
3136       {
3137         if (ISDIGIT (c) || ISLOWER (c))
3138           {
3139             mnemonic_chars[c] = c;
3140             register_chars[c] = c;
3141             operand_chars[c] = c;
3142           }
3143         else if (ISUPPER (c))
3144           {
3145             mnemonic_chars[c] = TOLOWER (c);
3146             register_chars[c] = mnemonic_chars[c];
3147             operand_chars[c] = c;
3148           }
3149         else if (c == '{' || c == '}')
3150           {
3151             mnemonic_chars[c] = c;
3152             operand_chars[c] = c;
3153           }
3154 #ifdef SVR4_COMMENT_CHARS
3155         else if (c == '\\' && strchr (i386_comment_chars, '/'))
3156           operand_chars[c] = c;
3157 #endif
3158
3159         if (ISALPHA (c) || ISDIGIT (c))
3160           identifier_chars[c] = c;
3161         else if (c >= 128)
3162           {
3163             identifier_chars[c] = c;
3164             operand_chars[c] = c;
3165           }
3166       }
3167
3168 #ifdef LEX_AT
3169     identifier_chars['@'] = '@';
3170 #endif
3171 #ifdef LEX_QM
3172     identifier_chars['?'] = '?';
3173     operand_chars['?'] = '?';
3174 #endif
3175     mnemonic_chars['_'] = '_';
3176     mnemonic_chars['-'] = '-';
3177     mnemonic_chars['.'] = '.';
3178     identifier_chars['_'] = '_';
3179     identifier_chars['.'] = '.';
3180
3181     for (p = operand_special_chars; *p != '\0'; p++)
3182       operand_chars[(unsigned char) *p] = *p;
3183   }
3184
3185   if (flag_code == CODE_64BIT)
3186     {
3187 #if defined (OBJ_COFF) && defined (TE_PE)
3188       x86_dwarf2_return_column = (OUTPUT_FLAVOR == bfd_target_coff_flavour
3189                                   ? 32 : 16);
3190 #else
3191       x86_dwarf2_return_column = 16;
3192 #endif
3193       x86_cie_data_alignment = -8;
3194     }
3195   else
3196     {
3197       x86_dwarf2_return_column = 8;
3198       x86_cie_data_alignment = -4;
3199     }
3200
3201   /* NB: FUSED_JCC_PADDING frag must have sufficient room so that it
3202      can be turned into BRANCH_PREFIX frag.  */
3203   if (align_branch_prefix_size > MAX_FUSED_JCC_PADDING_SIZE)
3204     abort ();
3205 }
3206
3207 void
3208 i386_print_statistics (FILE *file)
3209 {
3210   htab_print_statistics (file, "i386 opcode", op_hash);
3211   htab_print_statistics (file, "i386 register", reg_hash);
3212 }
3213 \f
3214 #ifdef DEBUG386
3215
3216 /* Debugging routines for md_assemble.  */
3217 static void pte (insn_template *);
3218 static void pt (i386_operand_type);
3219 static void pe (expressionS *);
3220 static void ps (symbolS *);
3221
3222 static void
3223 pi (const char *line, i386_insn *x)
3224 {
3225   unsigned int j;
3226
3227   fprintf (stdout, "%s: template ", line);
3228   pte (&x->tm);
3229   fprintf (stdout, "  address: base %s  index %s  scale %x\n",
3230            x->base_reg ? x->base_reg->reg_name : "none",
3231            x->index_reg ? x->index_reg->reg_name : "none",
3232            x->log2_scale_factor);
3233   fprintf (stdout, "  modrm:  mode %x  reg %x  reg/mem %x\n",
3234            x->rm.mode, x->rm.reg, x->rm.regmem);
3235   fprintf (stdout, "  sib:  base %x  index %x  scale %x\n",
3236            x->sib.base, x->sib.index, x->sib.scale);
3237   fprintf (stdout, "  rex: 64bit %x  extX %x  extY %x  extZ %x\n",
3238            (x->rex & REX_W) != 0,
3239            (x->rex & REX_R) != 0,
3240            (x->rex & REX_X) != 0,
3241            (x->rex & REX_B) != 0);
3242   for (j = 0; j < x->operands; j++)
3243     {
3244       fprintf (stdout, "    #%d:  ", j + 1);
3245       pt (x->types[j]);
3246       fprintf (stdout, "\n");
3247       if (x->types[j].bitfield.class == Reg
3248           || x->types[j].bitfield.class == RegMMX
3249           || x->types[j].bitfield.class == RegSIMD
3250           || x->types[j].bitfield.class == RegMask
3251           || x->types[j].bitfield.class == SReg
3252           || x->types[j].bitfield.class == RegCR
3253           || x->types[j].bitfield.class == RegDR
3254           || x->types[j].bitfield.class == RegTR
3255           || x->types[j].bitfield.class == RegBND)
3256         fprintf (stdout, "%s\n", x->op[j].regs->reg_name);
3257       if (operand_type_check (x->types[j], imm))
3258         pe (x->op[j].imms);
3259       if (operand_type_check (x->types[j], disp))
3260         pe (x->op[j].disps);
3261     }
3262 }
3263
3264 static void
3265 pte (insn_template *t)
3266 {
3267   static const unsigned char opc_pfx[] = { 0, 0x66, 0xf3, 0xf2 };
3268   static const char *const opc_spc[] = {
3269     NULL, "0f", "0f38", "0f3a", NULL, NULL, NULL, NULL,
3270     "XOP08", "XOP09", "XOP0A",
3271   };
3272   unsigned int j;
3273
3274   fprintf (stdout, " %d operands ", t->operands);
3275   if (opc_pfx[t->opcode_modifier.opcodeprefix])
3276     fprintf (stdout, "pfx %x ", opc_pfx[t->opcode_modifier.opcodeprefix]);
3277   if (opc_spc[t->opcode_modifier.opcodespace])
3278     fprintf (stdout, "space %s ", opc_spc[t->opcode_modifier.opcodespace]);
3279   fprintf (stdout, "opcode %x ", t->base_opcode);
3280   if (t->extension_opcode != None)
3281     fprintf (stdout, "ext %x ", t->extension_opcode);
3282   if (t->opcode_modifier.d)
3283     fprintf (stdout, "D");
3284   if (t->opcode_modifier.w)
3285     fprintf (stdout, "W");
3286   fprintf (stdout, "\n");
3287   for (j = 0; j < t->operands; j++)
3288     {
3289       fprintf (stdout, "    #%d type ", j + 1);
3290       pt (t->operand_types[j]);
3291       fprintf (stdout, "\n");
3292     }
3293 }
3294
3295 static void
3296 pe (expressionS *e)
3297 {
3298   fprintf (stdout, "    operation     %d\n", e->X_op);
3299   fprintf (stdout, "    add_number    %" BFD_VMA_FMT "d (%" BFD_VMA_FMT "x)\n",
3300            e->X_add_number, e->X_add_number);
3301   if (e->X_add_symbol)
3302     {
3303       fprintf (stdout, "    add_symbol    ");
3304       ps (e->X_add_symbol);
3305       fprintf (stdout, "\n");
3306     }
3307   if (e->X_op_symbol)
3308     {
3309       fprintf (stdout, "    op_symbol    ");
3310       ps (e->X_op_symbol);
3311       fprintf (stdout, "\n");
3312     }
3313 }
3314
3315 static void
3316 ps (symbolS *s)
3317 {
3318   fprintf (stdout, "%s type %s%s",
3319            S_GET_NAME (s),
3320            S_IS_EXTERNAL (s) ? "EXTERNAL " : "",
3321            segment_name (S_GET_SEGMENT (s)));
3322 }
3323
3324 static struct type_name
3325   {
3326     i386_operand_type mask;
3327     const char *name;
3328   }
3329 const type_names[] =
3330 {
3331   { OPERAND_TYPE_REG8, "r8" },
3332   { OPERAND_TYPE_REG16, "r16" },
3333   { OPERAND_TYPE_REG32, "r32" },
3334   { OPERAND_TYPE_REG64, "r64" },
3335   { OPERAND_TYPE_ACC8, "acc8" },
3336   { OPERAND_TYPE_ACC16, "acc16" },
3337   { OPERAND_TYPE_ACC32, "acc32" },
3338   { OPERAND_TYPE_ACC64, "acc64" },
3339   { OPERAND_TYPE_IMM8, "i8" },
3340   { OPERAND_TYPE_IMM8, "i8s" },
3341   { OPERAND_TYPE_IMM16, "i16" },
3342   { OPERAND_TYPE_IMM32, "i32" },
3343   { OPERAND_TYPE_IMM32S, "i32s" },
3344   { OPERAND_TYPE_IMM64, "i64" },
3345   { OPERAND_TYPE_IMM1, "i1" },
3346   { OPERAND_TYPE_BASEINDEX, "BaseIndex" },
3347   { OPERAND_TYPE_DISP8, "d8" },
3348   { OPERAND_TYPE_DISP16, "d16" },
3349   { OPERAND_TYPE_DISP32, "d32" },
3350   { OPERAND_TYPE_DISP32S, "d32s" },
3351   { OPERAND_TYPE_DISP64, "d64" },
3352   { OPERAND_TYPE_INOUTPORTREG, "InOutPortReg" },
3353   { OPERAND_TYPE_SHIFTCOUNT, "ShiftCount" },
3354   { OPERAND_TYPE_CONTROL, "control reg" },
3355   { OPERAND_TYPE_TEST, "test reg" },
3356   { OPERAND_TYPE_DEBUG, "debug reg" },
3357   { OPERAND_TYPE_FLOATREG, "FReg" },
3358   { OPERAND_TYPE_FLOATACC, "FAcc" },
3359   { OPERAND_TYPE_SREG, "SReg" },
3360   { OPERAND_TYPE_REGMMX, "rMMX" },
3361   { OPERAND_TYPE_REGXMM, "rXMM" },
3362   { OPERAND_TYPE_REGYMM, "rYMM" },
3363   { OPERAND_TYPE_REGZMM, "rZMM" },
3364   { OPERAND_TYPE_REGTMM, "rTMM" },
3365   { OPERAND_TYPE_REGMASK, "Mask reg" },
3366 };
3367
3368 static void
3369 pt (i386_operand_type t)
3370 {
3371   unsigned int j;
3372   i386_operand_type a;
3373
3374   for (j = 0; j < ARRAY_SIZE (type_names); j++)
3375     {
3376       a = operand_type_and (t, type_names[j].mask);
3377       if (operand_type_equal (&a, &type_names[j].mask))
3378         fprintf (stdout, "%s, ",  type_names[j].name);
3379     }
3380   fflush (stdout);
3381 }
3382
3383 #endif /* DEBUG386 */
3384 \f
3385 static bfd_reloc_code_real_type
3386 reloc (unsigned int size,
3387        int pcrel,
3388        int sign,
3389        bfd_reloc_code_real_type other)
3390 {
3391   if (other != NO_RELOC)
3392     {
3393       reloc_howto_type *rel;
3394
3395       if (size == 8)
3396         switch (other)
3397           {
3398           case BFD_RELOC_X86_64_GOT32:
3399             return BFD_RELOC_X86_64_GOT64;
3400             break;
3401           case BFD_RELOC_X86_64_GOTPLT64:
3402             return BFD_RELOC_X86_64_GOTPLT64;
3403             break;
3404           case BFD_RELOC_X86_64_PLTOFF64:
3405             return BFD_RELOC_X86_64_PLTOFF64;
3406             break;
3407           case BFD_RELOC_X86_64_GOTPC32:
3408             other = BFD_RELOC_X86_64_GOTPC64;
3409             break;
3410           case BFD_RELOC_X86_64_GOTPCREL:
3411             other = BFD_RELOC_X86_64_GOTPCREL64;
3412             break;
3413           case BFD_RELOC_X86_64_TPOFF32:
3414             other = BFD_RELOC_X86_64_TPOFF64;
3415             break;
3416           case BFD_RELOC_X86_64_DTPOFF32:
3417             other = BFD_RELOC_X86_64_DTPOFF64;
3418             break;
3419           default:
3420             break;
3421           }
3422
3423 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
3424       if (other == BFD_RELOC_SIZE32)
3425         {
3426           if (size == 8)
3427             other = BFD_RELOC_SIZE64;
3428           if (pcrel)
3429             {
3430               as_bad (_("there are no pc-relative size relocations"));
3431               return NO_RELOC;
3432             }
3433         }
3434 #endif
3435
3436       /* Sign-checking 4-byte relocations in 16-/32-bit code is pointless.  */
3437       if (size == 4 && (flag_code != CODE_64BIT || disallow_64bit_reloc))
3438         sign = -1;
3439
3440       rel = bfd_reloc_type_lookup (stdoutput, other);
3441       if (!rel)
3442         as_bad (_("unknown relocation (%u)"), other);
3443       else if (size != bfd_get_reloc_size (rel))
3444         as_bad (_("%u-byte relocation cannot be applied to %u-byte field"),
3445                 bfd_get_reloc_size (rel),
3446                 size);
3447       else if (pcrel && !rel->pc_relative)
3448         as_bad (_("non-pc-relative relocation for pc-relative field"));
3449       else if ((rel->complain_on_overflow == complain_overflow_signed
3450                 && !sign)
3451                || (rel->complain_on_overflow == complain_overflow_unsigned
3452                    && sign > 0))
3453         as_bad (_("relocated field and relocation type differ in signedness"));
3454       else
3455         return other;
3456       return NO_RELOC;
3457     }
3458
3459   if (pcrel)
3460     {
3461       if (!sign)
3462         as_bad (_("there are no unsigned pc-relative relocations"));
3463       switch (size)
3464         {
3465         case 1: return BFD_RELOC_8_PCREL;
3466         case 2: return BFD_RELOC_16_PCREL;
3467         case 4: return BFD_RELOC_32_PCREL;
3468         case 8: return BFD_RELOC_64_PCREL;
3469         }
3470       as_bad (_("cannot do %u byte pc-relative relocation"), size);
3471     }
3472   else
3473     {
3474       if (sign > 0)
3475         switch (size)
3476           {
3477           case 4: return BFD_RELOC_X86_64_32S;
3478           }
3479       else
3480         switch (size)
3481           {
3482           case 1: return BFD_RELOC_8;
3483           case 2: return BFD_RELOC_16;
3484           case 4: return BFD_RELOC_32;
3485           case 8: return BFD_RELOC_64;
3486           }
3487       as_bad (_("cannot do %s %u byte relocation"),
3488               sign > 0 ? "signed" : "unsigned", size);
3489     }
3490
3491   return NO_RELOC;
3492 }
3493
3494 /* Here we decide which fixups can be adjusted to make them relative to
3495    the beginning of the section instead of the symbol.  Basically we need
3496    to make sure that the dynamic relocations are done correctly, so in
3497    some cases we force the original symbol to be used.  */
3498
3499 int
3500 tc_i386_fix_adjustable (fixS *fixP ATTRIBUTE_UNUSED)
3501 {
3502 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
3503   if (!IS_ELF)
3504     return 1;
3505
3506   /* Don't adjust pc-relative references to merge sections in 64-bit
3507      mode.  */
3508   if (use_rela_relocations
3509       && (S_GET_SEGMENT (fixP->fx_addsy)->flags & SEC_MERGE) != 0
3510       && fixP->fx_pcrel)
3511     return 0;
3512
3513   /* The x86_64 GOTPCREL are represented as 32bit PCrel relocations
3514      and changed later by validate_fix.  */
3515   if (GOT_symbol && fixP->fx_subsy == GOT_symbol
3516       && fixP->fx_r_type == BFD_RELOC_32_PCREL)
3517     return 0;
3518
3519   /* Adjust_reloc_syms doesn't know about the GOT.  Need to keep symbol
3520      for size relocations.  */
3521   if (fixP->fx_r_type == BFD_RELOC_SIZE32
3522       || fixP->fx_r_type == BFD_RELOC_SIZE64
3523       || fixP->fx_r_type == BFD_RELOC_386_GOTOFF
3524       || fixP->fx_r_type == BFD_RELOC_386_GOT32
3525       || fixP->fx_r_type == BFD_RELOC_386_GOT32X
3526       || fixP->fx_r_type == BFD_RELOC_386_TLS_GD
3527       || fixP->fx_r_type == BFD_RELOC_386_TLS_LDM
3528       || fixP->fx_r_type == BFD_RELOC_386_TLS_LDO_32
3529       || fixP->fx_r_type == BFD_RELOC_386_TLS_IE_32
3530       || fixP->fx_r_type == BFD_RELOC_386_TLS_IE
3531       || fixP->fx_r_type == BFD_RELOC_386_TLS_GOTIE
3532       || fixP->fx_r_type == BFD_RELOC_386_TLS_LE_32
3533       || fixP->fx_r_type == BFD_RELOC_386_TLS_LE
3534       || fixP->fx_r_type == BFD_RELOC_386_TLS_GOTDESC
3535       || fixP->fx_r_type == BFD_RELOC_386_TLS_DESC_CALL
3536       || fixP->fx_r_type == BFD_RELOC_X86_64_GOT32
3537       || fixP->fx_r_type == BFD_RELOC_X86_64_GOTPCREL
3538       || fixP->fx_r_type == BFD_RELOC_X86_64_GOTPCRELX
3539       || fixP->fx_r_type == BFD_RELOC_X86_64_REX_GOTPCRELX
3540       || fixP->fx_r_type == BFD_RELOC_X86_64_TLSGD
3541       || fixP->fx_r_type == BFD_RELOC_X86_64_TLSLD
3542       || fixP->fx_r_type == BFD_RELOC_X86_64_DTPOFF32
3543       || fixP->fx_r_type == BFD_RELOC_X86_64_DTPOFF64
3544       || fixP->fx_r_type == BFD_RELOC_X86_64_GOTTPOFF
3545       || fixP->fx_r_type == BFD_RELOC_X86_64_TPOFF32
3546       || fixP->fx_r_type == BFD_RELOC_X86_64_TPOFF64
3547       || fixP->fx_r_type == BFD_RELOC_X86_64_GOTOFF64
3548       || fixP->fx_r_type == BFD_RELOC_X86_64_GOTPC32_TLSDESC
3549       || fixP->fx_r_type == BFD_RELOC_X86_64_TLSDESC_CALL
3550       || fixP->fx_r_type == BFD_RELOC_VTABLE_INHERIT
3551       || fixP->fx_r_type == BFD_RELOC_VTABLE_ENTRY)
3552     return 0;
3553 #endif
3554   return 1;
3555 }
3556
3557 static INLINE bool
3558 want_disp32 (const insn_template *t)
3559 {
3560   return flag_code != CODE_64BIT
3561          || i.prefix[ADDR_PREFIX]
3562          || (t->base_opcode == 0x8d
3563              && t->opcode_modifier.opcodespace == SPACE_BASE
3564              && (!i.types[1].bitfield.qword
3565                 || t->opcode_modifier.size == SIZE32));
3566 }
3567
3568 static int
3569 intel_float_operand (const char *mnemonic)
3570 {
3571   /* Note that the value returned is meaningful only for opcodes with (memory)
3572      operands, hence the code here is free to improperly handle opcodes that
3573      have no operands (for better performance and smaller code). */
3574
3575   if (mnemonic[0] != 'f')
3576     return 0; /* non-math */
3577
3578   switch (mnemonic[1])
3579     {
3580     /* fclex, fdecstp, fdisi, femms, feni, fincstp, finit, fsetpm, and
3581        the fs segment override prefix not currently handled because no
3582        call path can make opcodes without operands get here */
3583     case 'i':
3584       return 2 /* integer op */;
3585     case 'l':
3586       if (mnemonic[2] == 'd' && (mnemonic[3] == 'c' || mnemonic[3] == 'e'))
3587         return 3; /* fldcw/fldenv */
3588       break;
3589     case 'n':
3590       if (mnemonic[2] != 'o' /* fnop */)
3591         return 3; /* non-waiting control op */
3592       break;
3593     case 'r':
3594       if (mnemonic[2] == 's')
3595         return 3; /* frstor/frstpm */
3596       break;
3597     case 's':
3598       if (mnemonic[2] == 'a')
3599         return 3; /* fsave */
3600       if (mnemonic[2] == 't')
3601         {
3602           switch (mnemonic[3])
3603             {
3604             case 'c': /* fstcw */
3605             case 'd': /* fstdw */
3606             case 'e': /* fstenv */
3607             case 's': /* fsts[gw] */
3608               return 3;
3609             }
3610         }
3611       break;
3612     case 'x':
3613       if (mnemonic[2] == 'r' || mnemonic[2] == 's')
3614         return 0; /* fxsave/fxrstor are not really math ops */
3615       break;
3616     }
3617
3618   return 1;
3619 }
3620
3621 static INLINE void
3622 install_template (const insn_template *t)
3623 {
3624   unsigned int l;
3625
3626   i.tm = *t;
3627
3628   /* Note that for pseudo prefixes this produces a length of 1. But for them
3629      the length isn't interesting at all.  */
3630   for (l = 1; l < 4; ++l)
3631     if (!(t->base_opcode >> (8 * l)))
3632       break;
3633
3634   i.opcode_length = l;
3635 }
3636
3637 /* Build the VEX prefix.  */
3638
3639 static void
3640 build_vex_prefix (const insn_template *t)
3641 {
3642   unsigned int register_specifier;
3643   unsigned int vector_length;
3644   unsigned int w;
3645
3646   /* Check register specifier.  */
3647   if (i.vex.register_specifier)
3648     {
3649       register_specifier =
3650         ~register_number (i.vex.register_specifier) & 0xf;
3651       gas_assert ((i.vex.register_specifier->reg_flags & RegVRex) == 0);
3652     }
3653   else
3654     register_specifier = 0xf;
3655
3656   /* Use 2-byte VEX prefix by swapping destination and source operand
3657      if there are more than 1 register operand.  */
3658   if (i.reg_operands > 1
3659       && i.vec_encoding != vex_encoding_vex3
3660       && i.dir_encoding == dir_encoding_default
3661       && i.operands == i.reg_operands
3662       && operand_type_equal (&i.types[0], &i.types[i.operands - 1])
3663       && i.tm.opcode_modifier.opcodespace == SPACE_0F
3664       && (i.tm.opcode_modifier.load || i.tm.opcode_modifier.d)
3665       && i.rex == REX_B)
3666     {
3667       unsigned int xchg = i.operands - 1;
3668       union i386_op temp_op;
3669       i386_operand_type temp_type;
3670
3671       temp_type = i.types[xchg];
3672       i.types[xchg] = i.types[0];
3673       i.types[0] = temp_type;
3674       temp_op = i.op[xchg];
3675       i.op[xchg] = i.op[0];
3676       i.op[0] = temp_op;
3677
3678       gas_assert (i.rm.mode == 3);
3679
3680       i.rex = REX_R;
3681       xchg = i.rm.regmem;
3682       i.rm.regmem = i.rm.reg;
3683       i.rm.reg = xchg;
3684
3685       if (i.tm.opcode_modifier.d)
3686         i.tm.base_opcode ^= (i.tm.base_opcode & 0xee) != 0x6e
3687                             ? Opcode_SIMD_FloatD : Opcode_SIMD_IntD;
3688       else /* Use the next insn.  */
3689         install_template (&t[1]);
3690     }
3691
3692   /* Use 2-byte VEX prefix by swapping commutative source operands if there
3693      are no memory operands and at least 3 register ones.  */
3694   if (i.reg_operands >= 3
3695       && i.vec_encoding != vex_encoding_vex3
3696       && i.reg_operands == i.operands - i.imm_operands
3697       && i.tm.opcode_modifier.vex
3698       && i.tm.opcode_modifier.commutative
3699       && (i.tm.opcode_modifier.sse2avx || optimize > 1)
3700       && i.rex == REX_B
3701       && i.vex.register_specifier
3702       && !(i.vex.register_specifier->reg_flags & RegRex))
3703     {
3704       unsigned int xchg = i.operands - i.reg_operands;
3705       union i386_op temp_op;
3706       i386_operand_type temp_type;
3707
3708       gas_assert (i.tm.opcode_modifier.opcodespace == SPACE_0F);
3709       gas_assert (!i.tm.opcode_modifier.sae);
3710       gas_assert (operand_type_equal (&i.types[i.operands - 2],
3711                                       &i.types[i.operands - 3]));
3712       gas_assert (i.rm.mode == 3);
3713
3714       temp_type = i.types[xchg];
3715       i.types[xchg] = i.types[xchg + 1];
3716       i.types[xchg + 1] = temp_type;
3717       temp_op = i.op[xchg];
3718       i.op[xchg] = i.op[xchg + 1];
3719       i.op[xchg + 1] = temp_op;
3720
3721       i.rex = 0;
3722       xchg = i.rm.regmem | 8;
3723       i.rm.regmem = ~register_specifier & 0xf;
3724       gas_assert (!(i.rm.regmem & 8));
3725       i.vex.register_specifier += xchg - i.rm.regmem;
3726       register_specifier = ~xchg & 0xf;
3727     }
3728
3729   if (i.tm.opcode_modifier.vex == VEXScalar)
3730     vector_length = avxscalar;
3731   else if (i.tm.opcode_modifier.vex == VEX256)
3732     vector_length = 1;
3733   else
3734     {
3735       unsigned int op;
3736
3737       /* Determine vector length from the last multi-length vector
3738          operand.  */
3739       vector_length = 0;
3740       for (op = t->operands; op--;)
3741         if (t->operand_types[op].bitfield.xmmword
3742             && t->operand_types[op].bitfield.ymmword
3743             && i.types[op].bitfield.ymmword)
3744           {
3745             vector_length = 1;
3746             break;
3747           }
3748     }
3749
3750   /* Check the REX.W bit and VEXW.  */
3751   if (i.tm.opcode_modifier.vexw == VEXWIG)
3752     w = (vexwig == vexw1 || (i.rex & REX_W)) ? 1 : 0;
3753   else if (i.tm.opcode_modifier.vexw)
3754     w = i.tm.opcode_modifier.vexw == VEXW1 ? 1 : 0;
3755   else
3756     w = (flag_code == CODE_64BIT ? i.rex & REX_W : vexwig == vexw1) ? 1 : 0;
3757
3758   /* Use 2-byte VEX prefix if possible.  */
3759   if (w == 0
3760       && i.vec_encoding != vex_encoding_vex3
3761       && i.tm.opcode_modifier.opcodespace == SPACE_0F
3762       && (i.rex & (REX_W | REX_X | REX_B)) == 0)
3763     {
3764       /* 2-byte VEX prefix.  */
3765       unsigned int r;
3766
3767       i.vex.length = 2;
3768       i.vex.bytes[0] = 0xc5;
3769
3770       /* Check the REX.R bit.  */
3771       r = (i.rex & REX_R) ? 0 : 1;
3772       i.vex.bytes[1] = (r << 7
3773                         | register_specifier << 3
3774                         | vector_length << 2
3775                         | i.tm.opcode_modifier.opcodeprefix);
3776     }
3777   else
3778     {
3779       /* 3-byte VEX prefix.  */
3780       i.vex.length = 3;
3781
3782       switch (i.tm.opcode_modifier.opcodespace)
3783         {
3784         case SPACE_0F:
3785         case SPACE_0F38:
3786         case SPACE_0F3A:
3787           i.vex.bytes[0] = 0xc4;
3788           break;
3789         case SPACE_XOP08:
3790         case SPACE_XOP09:
3791         case SPACE_XOP0A:
3792           i.vex.bytes[0] = 0x8f;
3793           break;
3794         default:
3795           abort ();
3796         }
3797
3798       /* The high 3 bits of the second VEX byte are 1's compliment
3799          of RXB bits from REX.  */
3800       i.vex.bytes[1] = (~i.rex & 0x7) << 5 | i.tm.opcode_modifier.opcodespace;
3801
3802       i.vex.bytes[2] = (w << 7
3803                         | register_specifier << 3
3804                         | vector_length << 2
3805                         | i.tm.opcode_modifier.opcodeprefix);
3806     }
3807 }
3808
3809 static INLINE bool
3810 is_evex_encoding (const insn_template *t)
3811 {
3812   return t->opcode_modifier.evex || t->opcode_modifier.disp8memshift
3813          || t->opcode_modifier.broadcast || t->opcode_modifier.masking
3814          || t->opcode_modifier.sae;
3815 }
3816
3817 static INLINE bool
3818 is_any_vex_encoding (const insn_template *t)
3819 {
3820   return t->opcode_modifier.vex || is_evex_encoding (t);
3821 }
3822
3823 /* Build the EVEX prefix.  */
3824
3825 static void
3826 build_evex_prefix (void)
3827 {
3828   unsigned int register_specifier, w;
3829   rex_byte vrex_used = 0;
3830
3831   /* Check register specifier.  */
3832   if (i.vex.register_specifier)
3833     {
3834       gas_assert ((i.vrex & REX_X) == 0);
3835
3836       register_specifier = i.vex.register_specifier->reg_num;
3837       if ((i.vex.register_specifier->reg_flags & RegRex))
3838         register_specifier += 8;
3839       /* The upper 16 registers are encoded in the fourth byte of the
3840          EVEX prefix.  */
3841       if (!(i.vex.register_specifier->reg_flags & RegVRex))
3842         i.vex.bytes[3] = 0x8;
3843       register_specifier = ~register_specifier & 0xf;
3844     }
3845   else
3846     {
3847       register_specifier = 0xf;
3848
3849       /* Encode upper 16 vector index register in the fourth byte of
3850          the EVEX prefix.  */
3851       if (!(i.vrex & REX_X))
3852         i.vex.bytes[3] = 0x8;
3853       else
3854         vrex_used |= REX_X;
3855     }
3856
3857   /* 4 byte EVEX prefix.  */
3858   i.vex.length = 4;
3859   i.vex.bytes[0] = 0x62;
3860
3861   /* The high 3 bits of the second EVEX byte are 1's compliment of RXB
3862      bits from REX.  */
3863   gas_assert (i.tm.opcode_modifier.opcodespace >= SPACE_0F);
3864   gas_assert (i.tm.opcode_modifier.opcodespace <= SPACE_0F3A);
3865   i.vex.bytes[1] = (~i.rex & 0x7) << 5 | i.tm.opcode_modifier.opcodespace;
3866
3867   /* The fifth bit of the second EVEX byte is 1's compliment of the
3868      REX_R bit in VREX.  */
3869   if (!(i.vrex & REX_R))
3870     i.vex.bytes[1] |= 0x10;
3871   else
3872     vrex_used |= REX_R;
3873
3874   if ((i.reg_operands + i.imm_operands) == i.operands)
3875     {
3876       /* When all operands are registers, the REX_X bit in REX is not
3877          used.  We reuse it to encode the upper 16 registers, which is
3878          indicated by the REX_B bit in VREX.  The REX_X bit is encoded
3879          as 1's compliment.  */
3880       if ((i.vrex & REX_B))
3881         {
3882           vrex_used |= REX_B;
3883           i.vex.bytes[1] &= ~0x40;
3884         }
3885     }
3886
3887   /* EVEX instructions shouldn't need the REX prefix.  */
3888   i.vrex &= ~vrex_used;
3889   gas_assert (i.vrex == 0);
3890
3891   /* Check the REX.W bit and VEXW.  */
3892   if (i.tm.opcode_modifier.vexw == VEXWIG)
3893     w = (evexwig == evexw1 || (i.rex & REX_W)) ? 1 : 0;
3894   else if (i.tm.opcode_modifier.vexw)
3895     w = i.tm.opcode_modifier.vexw == VEXW1 ? 1 : 0;
3896   else
3897     w = (flag_code == CODE_64BIT ? i.rex & REX_W : evexwig == evexw1) ? 1 : 0;
3898
3899   /* The third byte of the EVEX prefix.  */
3900   i.vex.bytes[2] = ((w << 7)
3901                     | (register_specifier << 3)
3902                     | 4 /* Encode the U bit.  */
3903                     | i.tm.opcode_modifier.opcodeprefix);
3904
3905   /* The fourth byte of the EVEX prefix.  */
3906   /* The zeroing-masking bit.  */
3907   if (i.mask.reg && i.mask.zeroing)
3908     i.vex.bytes[3] |= 0x80;
3909
3910   /* Don't always set the broadcast bit if there is no RC.  */
3911   if (i.rounding.type == rc_none)
3912     {
3913       /* Encode the vector length.  */
3914       unsigned int vec_length;
3915
3916       if (!i.tm.opcode_modifier.evex
3917           || i.tm.opcode_modifier.evex == EVEXDYN)
3918         {
3919           unsigned int op;
3920
3921           /* Determine vector length from the last multi-length vector
3922              operand.  */
3923           for (op = i.operands; op--;)
3924             if (i.tm.operand_types[op].bitfield.xmmword
3925                 + i.tm.operand_types[op].bitfield.ymmword
3926                 + i.tm.operand_types[op].bitfield.zmmword > 1)
3927               {
3928                 if (i.types[op].bitfield.zmmword)
3929                   {
3930                     i.tm.opcode_modifier.evex = EVEX512;
3931                     break;
3932                   }
3933                 else if (i.types[op].bitfield.ymmword)
3934                   {
3935                     i.tm.opcode_modifier.evex = EVEX256;
3936                     break;
3937                   }
3938                 else if (i.types[op].bitfield.xmmword)
3939                   {
3940                     i.tm.opcode_modifier.evex = EVEX128;
3941                     break;
3942                   }
3943                 else if (i.broadcast.type && op == i.broadcast.operand)
3944                   {
3945                     switch (i.broadcast.bytes)
3946                       {
3947                         case 64:
3948                           i.tm.opcode_modifier.evex = EVEX512;
3949                           break;
3950                         case 32:
3951                           i.tm.opcode_modifier.evex = EVEX256;
3952                           break;
3953                         case 16:
3954                           i.tm.opcode_modifier.evex = EVEX128;
3955                           break;
3956                         default:
3957                           abort ();
3958                       }
3959                     break;
3960                   }
3961               }
3962
3963           if (op >= MAX_OPERANDS)
3964             abort ();
3965         }
3966
3967       switch (i.tm.opcode_modifier.evex)
3968         {
3969         case EVEXLIG: /* LL' is ignored */
3970           vec_length = evexlig << 5;
3971           break;
3972         case EVEX128:
3973           vec_length = 0 << 5;
3974           break;
3975         case EVEX256:
3976           vec_length = 1 << 5;
3977           break;
3978         case EVEX512:
3979           vec_length = 2 << 5;
3980           break;
3981         default:
3982           abort ();
3983           break;
3984         }
3985       i.vex.bytes[3] |= vec_length;
3986       /* Encode the broadcast bit.  */
3987       if (i.broadcast.type)
3988         i.vex.bytes[3] |= 0x10;
3989     }
3990   else if (i.rounding.type != saeonly)
3991     i.vex.bytes[3] |= 0x10 | (i.rounding.type << 5);
3992   else
3993     i.vex.bytes[3] |= 0x10 | (evexrcig << 5);
3994
3995   if (i.mask.reg)
3996     i.vex.bytes[3] |= i.mask.reg->reg_num;
3997 }
3998
3999 static void
4000 process_immext (void)
4001 {
4002   expressionS *exp;
4003
4004   /* These AMD 3DNow! and SSE2 instructions have an opcode suffix
4005      which is coded in the same place as an 8-bit immediate field
4006      would be.  Here we fake an 8-bit immediate operand from the
4007      opcode suffix stored in tm.extension_opcode.
4008
4009      AVX instructions also use this encoding, for some of
4010      3 argument instructions.  */
4011
4012   gas_assert (i.imm_operands <= 1
4013               && (i.operands <= 2
4014                   || (is_any_vex_encoding (&i.tm)
4015                       && i.operands <= 4)));
4016
4017   exp = &im_expressions[i.imm_operands++];
4018   i.op[i.operands].imms = exp;
4019   i.types[i.operands] = imm8;
4020   i.operands++;
4021   exp->X_op = O_constant;
4022   exp->X_add_number = i.tm.extension_opcode;
4023   i.tm.extension_opcode = None;
4024 }
4025
4026
4027 static int
4028 check_hle (void)
4029 {
4030   switch (i.tm.opcode_modifier.prefixok)
4031     {
4032     default:
4033       abort ();
4034     case PrefixLock:
4035     case PrefixNone:
4036     case PrefixNoTrack:
4037     case PrefixRep:
4038       as_bad (_("invalid instruction `%s' after `%s'"),
4039               i.tm.name, i.hle_prefix);
4040       return 0;
4041     case PrefixHLELock:
4042       if (i.prefix[LOCK_PREFIX])
4043         return 1;
4044       as_bad (_("missing `lock' with `%s'"), i.hle_prefix);
4045       return 0;
4046     case PrefixHLEAny:
4047       return 1;
4048     case PrefixHLERelease:
4049       if (i.prefix[HLE_PREFIX] != XRELEASE_PREFIX_OPCODE)
4050         {
4051           as_bad (_("instruction `%s' after `xacquire' not allowed"),
4052                   i.tm.name);
4053           return 0;
4054         }
4055       if (i.mem_operands == 0 || !(i.flags[i.operands - 1] & Operand_Mem))
4056         {
4057           as_bad (_("memory destination needed for instruction `%s'"
4058                     " after `xrelease'"), i.tm.name);
4059           return 0;
4060         }
4061       return 1;
4062     }
4063 }
4064
4065 /* Try the shortest encoding by shortening operand size.  */
4066
4067 static void
4068 optimize_encoding (void)
4069 {
4070   unsigned int j;
4071
4072   if (i.tm.opcode_modifier.opcodespace == SPACE_BASE
4073       && i.tm.base_opcode == 0x8d)
4074     {
4075       /* Optimize: -O:
4076            lea symbol, %rN    -> mov $symbol, %rN
4077            lea (%rM), %rN     -> mov %rM, %rN
4078            lea (,%rM,1), %rN  -> mov %rM, %rN
4079
4080            and in 32-bit mode for 16-bit addressing
4081
4082            lea (%rM), %rN     -> movzx %rM, %rN
4083
4084            and in 64-bit mode zap 32-bit addressing in favor of using a
4085            32-bit (or less) destination.
4086        */
4087       if (flag_code == CODE_64BIT && i.prefix[ADDR_PREFIX])
4088         {
4089           if (!i.op[1].regs->reg_type.bitfield.word)
4090             i.tm.opcode_modifier.size = SIZE32;
4091           i.prefix[ADDR_PREFIX] = 0;
4092         }
4093
4094       if (!i.index_reg && !i.base_reg)
4095         {
4096           /* Handle:
4097                lea symbol, %rN    -> mov $symbol, %rN
4098            */
4099           if (flag_code == CODE_64BIT)
4100             {
4101               /* Don't transform a relocation to a 16-bit one.  */
4102               if (i.op[0].disps
4103                   && i.op[0].disps->X_op != O_constant
4104                   && i.op[1].regs->reg_type.bitfield.word)
4105                 return;
4106
4107               if (!i.op[1].regs->reg_type.bitfield.qword
4108                   || i.tm.opcode_modifier.size == SIZE32)
4109                 {
4110                   i.tm.base_opcode = 0xb8;
4111                   i.tm.opcode_modifier.modrm = 0;
4112                   if (!i.op[1].regs->reg_type.bitfield.word)
4113                     i.types[0].bitfield.imm32 = 1;
4114                   else
4115                     {
4116                       i.tm.opcode_modifier.size = SIZE16;
4117                       i.types[0].bitfield.imm16 = 1;
4118                     }
4119                 }
4120               else
4121                 {
4122                   /* Subject to further optimization below.  */
4123                   i.tm.base_opcode = 0xc7;
4124                   i.tm.extension_opcode = 0;
4125                   i.types[0].bitfield.imm32s = 1;
4126                   i.types[0].bitfield.baseindex = 0;
4127                 }
4128             }
4129           /* Outside of 64-bit mode address and operand sizes have to match if
4130              a relocation is involved, as otherwise we wouldn't (currently) or
4131              even couldn't express the relocation correctly.  */
4132           else if (i.op[0].disps
4133                    && i.op[0].disps->X_op != O_constant
4134                    && ((!i.prefix[ADDR_PREFIX])
4135                        != (flag_code == CODE_32BIT
4136                            ? i.op[1].regs->reg_type.bitfield.dword
4137                            : i.op[1].regs->reg_type.bitfield.word)))
4138             return;
4139           /* In 16-bit mode converting LEA with 16-bit addressing and a 32-bit
4140              destination is going to grow encoding size.  */
4141           else if (flag_code == CODE_16BIT
4142                    && (optimize <= 1 || optimize_for_space)
4143                    && !i.prefix[ADDR_PREFIX]
4144                    && i.op[1].regs->reg_type.bitfield.dword)
4145             return;
4146           else
4147             {
4148               i.tm.base_opcode = 0xb8;
4149               i.tm.opcode_modifier.modrm = 0;
4150               if (i.op[1].regs->reg_type.bitfield.dword)
4151                 i.types[0].bitfield.imm32 = 1;
4152               else
4153                 i.types[0].bitfield.imm16 = 1;
4154
4155               if (i.op[0].disps
4156                   && i.op[0].disps->X_op == O_constant
4157                   && i.op[1].regs->reg_type.bitfield.dword
4158                   /* NB: Add () to !i.prefix[ADDR_PREFIX] to silence
4159                      GCC 5. */
4160                   && (!i.prefix[ADDR_PREFIX]) != (flag_code == CODE_32BIT))
4161                 i.op[0].disps->X_add_number &= 0xffff;
4162             }
4163
4164           i.tm.operand_types[0] = i.types[0];
4165           i.imm_operands = 1;
4166           if (!i.op[0].imms)
4167             {
4168               i.op[0].imms = &im_expressions[0];
4169               i.op[0].imms->X_op = O_absent;
4170             }
4171         }
4172       else if (i.op[0].disps
4173                   && (i.op[0].disps->X_op != O_constant
4174                       || i.op[0].disps->X_add_number))
4175         return;
4176       else
4177         {
4178           /* Handle:
4179                lea (%rM), %rN     -> mov %rM, %rN
4180                lea (,%rM,1), %rN  -> mov %rM, %rN
4181                lea (%rM), %rN     -> movzx %rM, %rN
4182            */
4183           const reg_entry *addr_reg;
4184
4185           if (!i.index_reg && i.base_reg->reg_num != RegIP)
4186             addr_reg = i.base_reg;
4187           else if (!i.base_reg
4188                    && i.index_reg->reg_num != RegIZ
4189                    && !i.log2_scale_factor)
4190             addr_reg = i.index_reg;
4191           else
4192             return;
4193
4194           if (addr_reg->reg_type.bitfield.word
4195               && i.op[1].regs->reg_type.bitfield.dword)
4196             {
4197               if (flag_code != CODE_32BIT)
4198                 return;
4199               i.tm.opcode_modifier.opcodespace = SPACE_0F;
4200               i.tm.base_opcode = 0xb7;
4201             }
4202           else
4203             i.tm.base_opcode = 0x8b;
4204
4205           if (addr_reg->reg_type.bitfield.dword
4206               && i.op[1].regs->reg_type.bitfield.qword)
4207             i.tm.opcode_modifier.size = SIZE32;
4208
4209           i.op[0].regs = addr_reg;
4210           i.reg_operands = 2;
4211         }
4212
4213       i.mem_operands = 0;
4214       i.disp_operands = 0;
4215       i.prefix[ADDR_PREFIX] = 0;
4216       i.prefix[SEG_PREFIX] = 0;
4217       i.seg[0] = NULL;
4218     }
4219
4220   if (optimize_for_space
4221       && i.tm.opcode_modifier.opcodespace == SPACE_BASE
4222       && i.reg_operands == 1
4223       && i.imm_operands == 1
4224       && !i.types[1].bitfield.byte
4225       && i.op[0].imms->X_op == O_constant
4226       && fits_in_imm7 (i.op[0].imms->X_add_number)
4227       && (i.tm.base_opcode == 0xa8
4228           || (i.tm.base_opcode == 0xf6
4229               && i.tm.extension_opcode == 0x0)))
4230     {
4231       /* Optimize: -Os:
4232            test $imm7, %r64/%r32/%r16  -> test $imm7, %r8
4233        */
4234       unsigned int base_regnum = i.op[1].regs->reg_num;
4235       if (flag_code == CODE_64BIT || base_regnum < 4)
4236         {
4237           i.types[1].bitfield.byte = 1;
4238           /* Ignore the suffix.  */
4239           i.suffix = 0;
4240           /* Convert to byte registers.  */
4241           if (i.types[1].bitfield.word)
4242             j = 16;
4243           else if (i.types[1].bitfield.dword)
4244             j = 32;
4245           else
4246             j = 48;
4247           if (!(i.op[1].regs->reg_flags & RegRex) && base_regnum < 4)
4248             j += 8;
4249           i.op[1].regs -= j;
4250         }
4251     }
4252   else if (flag_code == CODE_64BIT
4253            && i.tm.opcode_modifier.opcodespace == SPACE_BASE
4254            && ((i.types[1].bitfield.qword
4255                 && i.reg_operands == 1
4256                 && i.imm_operands == 1
4257                 && i.op[0].imms->X_op == O_constant
4258                 && ((i.tm.base_opcode == 0xb8
4259                      && i.tm.extension_opcode == None
4260                      && fits_in_unsigned_long (i.op[0].imms->X_add_number))
4261                     || (fits_in_imm31 (i.op[0].imms->X_add_number)
4262                         && ((i.tm.base_opcode == 0x24
4263                              || i.tm.base_opcode == 0xa8)
4264                             || (i.tm.base_opcode == 0x80
4265                                 && i.tm.extension_opcode == 0x4)
4266                             || ((i.tm.base_opcode == 0xf6
4267                                  || (i.tm.base_opcode | 1) == 0xc7)
4268                                 && i.tm.extension_opcode == 0x0)))
4269                     || (fits_in_imm7 (i.op[0].imms->X_add_number)
4270                         && i.tm.base_opcode == 0x83
4271                         && i.tm.extension_opcode == 0x4)))
4272                || (i.types[0].bitfield.qword
4273                    && ((i.reg_operands == 2
4274                         && i.op[0].regs == i.op[1].regs
4275                         && (i.tm.base_opcode == 0x30
4276                             || i.tm.base_opcode == 0x28))
4277                        || (i.reg_operands == 1
4278                            && i.operands == 1
4279                            && i.tm.base_opcode == 0x30)))))
4280     {
4281       /* Optimize: -O:
4282            andq $imm31, %r64   -> andl $imm31, %r32
4283            andq $imm7, %r64    -> andl $imm7, %r32
4284            testq $imm31, %r64  -> testl $imm31, %r32
4285            xorq %r64, %r64     -> xorl %r32, %r32
4286            subq %r64, %r64     -> subl %r32, %r32
4287            movq $imm31, %r64   -> movl $imm31, %r32
4288            movq $imm32, %r64   -> movl $imm32, %r32
4289         */
4290       i.tm.opcode_modifier.norex64 = 1;
4291       if (i.tm.base_opcode == 0xb8 || (i.tm.base_opcode | 1) == 0xc7)
4292         {
4293           /* Handle
4294                movq $imm31, %r64   -> movl $imm31, %r32
4295                movq $imm32, %r64   -> movl $imm32, %r32
4296            */
4297           i.tm.operand_types[0].bitfield.imm32 = 1;
4298           i.tm.operand_types[0].bitfield.imm32s = 0;
4299           i.tm.operand_types[0].bitfield.imm64 = 0;
4300           i.types[0].bitfield.imm32 = 1;
4301           i.types[0].bitfield.imm32s = 0;
4302           i.types[0].bitfield.imm64 = 0;
4303           i.types[1].bitfield.dword = 1;
4304           i.types[1].bitfield.qword = 0;
4305           if ((i.tm.base_opcode | 1) == 0xc7)
4306             {
4307               /* Handle
4308                    movq $imm31, %r64   -> movl $imm31, %r32
4309                */
4310               i.tm.base_opcode = 0xb8;
4311               i.tm.extension_opcode = None;
4312               i.tm.opcode_modifier.w = 0;
4313               i.tm.opcode_modifier.modrm = 0;
4314             }
4315         }
4316     }
4317   else if (optimize > 1
4318            && !optimize_for_space
4319            && i.tm.opcode_modifier.opcodespace == SPACE_BASE
4320            && i.reg_operands == 2
4321            && i.op[0].regs == i.op[1].regs
4322            && ((i.tm.base_opcode & ~(Opcode_D | 1)) == 0x8
4323                || (i.tm.base_opcode & ~(Opcode_D | 1)) == 0x20)
4324            && (flag_code != CODE_64BIT || !i.types[0].bitfield.dword))
4325     {
4326       /* Optimize: -O2:
4327            andb %rN, %rN  -> testb %rN, %rN
4328            andw %rN, %rN  -> testw %rN, %rN
4329            andq %rN, %rN  -> testq %rN, %rN
4330            orb %rN, %rN   -> testb %rN, %rN
4331            orw %rN, %rN   -> testw %rN, %rN
4332            orq %rN, %rN   -> testq %rN, %rN
4333
4334            and outside of 64-bit mode
4335
4336            andl %rN, %rN  -> testl %rN, %rN
4337            orl %rN, %rN   -> testl %rN, %rN
4338        */
4339       i.tm.base_opcode = 0x84 | (i.tm.base_opcode & 1);
4340     }
4341   else if (i.reg_operands == 3
4342            && i.op[0].regs == i.op[1].regs
4343            && !i.types[2].bitfield.xmmword
4344            && (i.tm.opcode_modifier.vex
4345                || ((!i.mask.reg || i.mask.zeroing)
4346                    && i.rounding.type == rc_none
4347                    && is_evex_encoding (&i.tm)
4348                    && (i.vec_encoding != vex_encoding_evex
4349                        || cpu_arch_isa_flags.bitfield.cpuavx512vl
4350                        || i.tm.cpu_flags.bitfield.cpuavx512vl
4351                        || (i.tm.operand_types[2].bitfield.zmmword
4352                            && i.types[2].bitfield.ymmword))))
4353            && ((i.tm.base_opcode == 0x55
4354                 || i.tm.base_opcode == 0x57
4355                 || i.tm.base_opcode == 0xdf
4356                 || i.tm.base_opcode == 0xef
4357                 || i.tm.base_opcode == 0xf8
4358                 || i.tm.base_opcode == 0xf9
4359                 || i.tm.base_opcode == 0xfa
4360                 || i.tm.base_opcode == 0xfb
4361                 || i.tm.base_opcode == 0x42
4362                 || i.tm.base_opcode == 0x47)
4363                && i.tm.extension_opcode == None))
4364     {
4365       /* Optimize: -O1:
4366            VOP, one of vandnps, vandnpd, vxorps, vxorpd, vpsubb, vpsubd,
4367            vpsubq and vpsubw:
4368              EVEX VOP %zmmM, %zmmM, %zmmN
4369                -> VEX VOP %xmmM, %xmmM, %xmmN (M and N < 16)
4370                -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4371              EVEX VOP %ymmM, %ymmM, %ymmN
4372                -> VEX VOP %xmmM, %xmmM, %xmmN (M and N < 16)
4373                -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4374              VEX VOP %ymmM, %ymmM, %ymmN
4375                -> VEX VOP %xmmM, %xmmM, %xmmN
4376            VOP, one of vpandn and vpxor:
4377              VEX VOP %ymmM, %ymmM, %ymmN
4378                -> VEX VOP %xmmM, %xmmM, %xmmN
4379            VOP, one of vpandnd and vpandnq:
4380              EVEX VOP %zmmM, %zmmM, %zmmN
4381                -> VEX vpandn %xmmM, %xmmM, %xmmN (M and N < 16)
4382                -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4383              EVEX VOP %ymmM, %ymmM, %ymmN
4384                -> VEX vpandn %xmmM, %xmmM, %xmmN (M and N < 16)
4385                -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4386            VOP, one of vpxord and vpxorq:
4387              EVEX VOP %zmmM, %zmmM, %zmmN
4388                -> VEX vpxor %xmmM, %xmmM, %xmmN (M and N < 16)
4389                -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4390              EVEX VOP %ymmM, %ymmM, %ymmN
4391                -> VEX vpxor %xmmM, %xmmM, %xmmN (M and N < 16)
4392                -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4393            VOP, one of kxord and kxorq:
4394              VEX VOP %kM, %kM, %kN
4395                -> VEX kxorw %kM, %kM, %kN
4396            VOP, one of kandnd and kandnq:
4397              VEX VOP %kM, %kM, %kN
4398                -> VEX kandnw %kM, %kM, %kN
4399        */
4400       if (is_evex_encoding (&i.tm))
4401         {
4402           if (i.vec_encoding != vex_encoding_evex)
4403             {
4404               i.tm.opcode_modifier.vex = VEX128;
4405               i.tm.opcode_modifier.vexw = VEXW0;
4406               i.tm.opcode_modifier.evex = 0;
4407             }
4408           else if (optimize > 1)
4409             i.tm.opcode_modifier.evex = EVEX128;
4410           else
4411             return;
4412         }
4413       else if (i.tm.operand_types[0].bitfield.class == RegMask)
4414         {
4415           i.tm.opcode_modifier.opcodeprefix = PREFIX_NONE;
4416           i.tm.opcode_modifier.vexw = VEXW0;
4417         }
4418       else
4419         i.tm.opcode_modifier.vex = VEX128;
4420
4421       if (i.tm.opcode_modifier.vex)
4422         for (j = 0; j < 3; j++)
4423           {
4424             i.types[j].bitfield.xmmword = 1;
4425             i.types[j].bitfield.ymmword = 0;
4426           }
4427     }
4428   else if (i.vec_encoding != vex_encoding_evex
4429            && !i.types[0].bitfield.zmmword
4430            && !i.types[1].bitfield.zmmword
4431            && !i.mask.reg
4432            && !i.broadcast.type
4433            && is_evex_encoding (&i.tm)
4434            && ((i.tm.base_opcode & ~Opcode_SIMD_IntD) == 0x6f
4435                || (i.tm.base_opcode & ~4) == 0xdb
4436                || (i.tm.base_opcode & ~4) == 0xeb)
4437            && i.tm.extension_opcode == None)
4438     {
4439       /* Optimize: -O1:
4440            VOP, one of vmovdqa32, vmovdqa64, vmovdqu8, vmovdqu16,
4441            vmovdqu32 and vmovdqu64:
4442              EVEX VOP %xmmM, %xmmN
4443                -> VEX vmovdqa|vmovdqu %xmmM, %xmmN (M and N < 16)
4444              EVEX VOP %ymmM, %ymmN
4445                -> VEX vmovdqa|vmovdqu %ymmM, %ymmN (M and N < 16)
4446              EVEX VOP %xmmM, mem
4447                -> VEX vmovdqa|vmovdqu %xmmM, mem (M < 16)
4448              EVEX VOP %ymmM, mem
4449                -> VEX vmovdqa|vmovdqu %ymmM, mem (M < 16)
4450              EVEX VOP mem, %xmmN
4451                -> VEX mvmovdqa|vmovdquem, %xmmN (N < 16)
4452              EVEX VOP mem, %ymmN
4453                -> VEX vmovdqa|vmovdqu mem, %ymmN (N < 16)
4454            VOP, one of vpand, vpandn, vpor, vpxor:
4455              EVEX VOP{d,q} %xmmL, %xmmM, %xmmN
4456                -> VEX VOP %xmmL, %xmmM, %xmmN (L, M, and N < 16)
4457              EVEX VOP{d,q} %ymmL, %ymmM, %ymmN
4458                -> VEX VOP %ymmL, %ymmM, %ymmN (L, M, and N < 16)
4459              EVEX VOP{d,q} mem, %xmmM, %xmmN
4460                -> VEX VOP mem, %xmmM, %xmmN (M and N < 16)
4461              EVEX VOP{d,q} mem, %ymmM, %ymmN
4462                -> VEX VOP mem, %ymmM, %ymmN (M and N < 16)
4463        */
4464       for (j = 0; j < i.operands; j++)
4465         if (operand_type_check (i.types[j], disp)
4466             && i.op[j].disps->X_op == O_constant)
4467           {
4468             /* Since the VEX prefix has 2 or 3 bytes, the EVEX prefix
4469                has 4 bytes, EVEX Disp8 has 1 byte and VEX Disp32 has 4
4470                bytes, we choose EVEX Disp8 over VEX Disp32.  */
4471             int evex_disp8, vex_disp8;
4472             unsigned int memshift = i.memshift;
4473             offsetT n = i.op[j].disps->X_add_number;
4474
4475             evex_disp8 = fits_in_disp8 (n);
4476             i.memshift = 0;
4477             vex_disp8 = fits_in_disp8 (n);
4478             if (evex_disp8 != vex_disp8)
4479               {
4480                 i.memshift = memshift;
4481                 return;
4482               }
4483
4484             i.types[j].bitfield.disp8 = vex_disp8;
4485             break;
4486           }
4487       if ((i.tm.base_opcode & ~Opcode_SIMD_IntD) == 0x6f
4488           && i.tm.opcode_modifier.opcodeprefix == PREFIX_0XF2)
4489         i.tm.opcode_modifier.opcodeprefix = PREFIX_0XF3;
4490       i.tm.opcode_modifier.vex
4491         = i.types[0].bitfield.ymmword ? VEX256 : VEX128;
4492       i.tm.opcode_modifier.vexw = VEXW0;
4493       /* VPAND, VPOR, and VPXOR are commutative.  */
4494       if (i.reg_operands == 3 && i.tm.base_opcode != 0xdf)
4495         i.tm.opcode_modifier.commutative = 1;
4496       i.tm.opcode_modifier.evex = 0;
4497       i.tm.opcode_modifier.masking = 0;
4498       i.tm.opcode_modifier.broadcast = 0;
4499       i.tm.opcode_modifier.disp8memshift = 0;
4500       i.memshift = 0;
4501       if (j < i.operands)
4502         i.types[j].bitfield.disp8
4503           = fits_in_disp8 (i.op[j].disps->X_add_number);
4504     }
4505 }
4506
4507 /* Return non-zero for load instruction.  */
4508
4509 static int
4510 load_insn_p (void)
4511 {
4512   unsigned int dest;
4513   int any_vex_p = is_any_vex_encoding (&i.tm);
4514   unsigned int base_opcode = i.tm.base_opcode | 1;
4515
4516   if (!any_vex_p)
4517     {
4518       /* Anysize insns: lea, invlpg, clflush, prefetchnta, prefetcht0,
4519          prefetcht1, prefetcht2, prefetchtw, bndmk, bndcl, bndcu, bndcn,
4520          bndstx, bndldx, prefetchwt1, clflushopt, clwb, cldemote.  */
4521       if (i.tm.opcode_modifier.anysize)
4522         return 0;
4523
4524       /* pop.   */
4525       if (strcmp (i.tm.name, "pop") == 0)
4526         return 1;
4527     }
4528
4529   if (i.tm.opcode_modifier.opcodespace == SPACE_BASE)
4530     {
4531       /* popf, popa.   */
4532       if (i.tm.base_opcode == 0x9d
4533           || i.tm.base_opcode == 0x61)
4534         return 1;
4535
4536       /* movs, cmps, lods, scas.  */
4537       if ((i.tm.base_opcode | 0xb) == 0xaf)
4538         return 1;
4539
4540       /* outs, xlatb.  */
4541       if (base_opcode == 0x6f
4542           || i.tm.base_opcode == 0xd7)
4543         return 1;
4544       /* NB: For AMD-specific insns with implicit memory operands,
4545          they're intentionally not covered.  */
4546     }
4547
4548   /* No memory operand.  */
4549   if (!i.mem_operands)
4550     return 0;
4551
4552   if (any_vex_p)
4553     {
4554       /* vldmxcsr.  */
4555       if (i.tm.base_opcode == 0xae
4556           && i.tm.opcode_modifier.vex
4557           && i.tm.opcode_modifier.opcodespace == SPACE_0F
4558           && i.tm.opcode_modifier.opcodeprefix == PREFIX_NONE
4559           && i.tm.extension_opcode == 2)
4560         return 1;
4561     }
4562   else if (i.tm.opcode_modifier.opcodespace == SPACE_BASE)
4563     {
4564       /* test, not, neg, mul, imul, div, idiv.  */
4565       if ((i.tm.base_opcode == 0xf6 || i.tm.base_opcode == 0xf7)
4566           && i.tm.extension_opcode != 1)
4567         return 1;
4568
4569       /* inc, dec.  */
4570       if (base_opcode == 0xff && i.tm.extension_opcode <= 1)
4571         return 1;
4572
4573       /* add, or, adc, sbb, and, sub, xor, cmp.  */
4574       if (i.tm.base_opcode >= 0x80 && i.tm.base_opcode <= 0x83)
4575         return 1;
4576
4577       /* rol, ror, rcl, rcr, shl/sal, shr, sar. */
4578       if ((base_opcode == 0xc1
4579            || (i.tm.base_opcode >= 0xd0 && i.tm.base_opcode <= 0xd3))
4580           && i.tm.extension_opcode != 6)
4581         return 1;
4582
4583       /* Check for x87 instructions.  */
4584       if (base_opcode >= 0xd8 && base_opcode <= 0xdf)
4585         {
4586           /* Skip fst, fstp, fstenv, fstcw.  */
4587           if (i.tm.base_opcode == 0xd9
4588               && (i.tm.extension_opcode == 2
4589                   || i.tm.extension_opcode == 3
4590                   || i.tm.extension_opcode == 6
4591                   || i.tm.extension_opcode == 7))
4592             return 0;
4593
4594           /* Skip fisttp, fist, fistp, fstp.  */
4595           if (i.tm.base_opcode == 0xdb
4596               && (i.tm.extension_opcode == 1
4597                   || i.tm.extension_opcode == 2
4598                   || i.tm.extension_opcode == 3
4599                   || i.tm.extension_opcode == 7))
4600             return 0;
4601
4602           /* Skip fisttp, fst, fstp, fsave, fstsw.  */
4603           if (i.tm.base_opcode == 0xdd
4604               && (i.tm.extension_opcode == 1
4605                   || i.tm.extension_opcode == 2
4606                   || i.tm.extension_opcode == 3
4607                   || i.tm.extension_opcode == 6
4608                   || i.tm.extension_opcode == 7))
4609             return 0;
4610
4611           /* Skip fisttp, fist, fistp, fbstp, fistp.  */
4612           if (i.tm.base_opcode == 0xdf
4613               && (i.tm.extension_opcode == 1
4614                   || i.tm.extension_opcode == 2
4615                   || i.tm.extension_opcode == 3
4616                   || i.tm.extension_opcode == 6
4617                   || i.tm.extension_opcode == 7))
4618             return 0;
4619
4620           return 1;
4621         }
4622     }
4623   else if (i.tm.opcode_modifier.opcodespace == SPACE_0F)
4624     {
4625       /* bt, bts, btr, btc.  */
4626       if (i.tm.base_opcode == 0xba
4627           && (i.tm.extension_opcode >= 4 && i.tm.extension_opcode <= 7))
4628         return 1;
4629
4630       /* cmpxchg8b, cmpxchg16b, xrstors, vmptrld.  */
4631       if (i.tm.base_opcode == 0xc7
4632           && i.tm.opcode_modifier.opcodeprefix == PREFIX_NONE
4633           && (i.tm.extension_opcode == 1 || i.tm.extension_opcode == 3
4634               || i.tm.extension_opcode == 6))
4635         return 1;
4636
4637       /* fxrstor, ldmxcsr, xrstor.  */
4638       if (i.tm.base_opcode == 0xae
4639           && (i.tm.extension_opcode == 1
4640               || i.tm.extension_opcode == 2
4641               || i.tm.extension_opcode == 5))
4642         return 1;
4643
4644       /* lgdt, lidt, lmsw.  */
4645       if (i.tm.base_opcode == 0x01
4646           && (i.tm.extension_opcode == 2
4647               || i.tm.extension_opcode == 3
4648               || i.tm.extension_opcode == 6))
4649         return 1;
4650     }
4651
4652   dest = i.operands - 1;
4653
4654   /* Check fake imm8 operand and 3 source operands.  */
4655   if ((i.tm.opcode_modifier.immext
4656        || i.tm.opcode_modifier.vexsources == VEX3SOURCES)
4657       && i.types[dest].bitfield.imm8)
4658     dest--;
4659
4660   /* add, or, adc, sbb, and, sub, xor, cmp, test, xchg.  */
4661   if (i.tm.opcode_modifier.opcodespace == SPACE_BASE
4662       && (base_opcode == 0x1
4663           || base_opcode == 0x9
4664           || base_opcode == 0x11
4665           || base_opcode == 0x19
4666           || base_opcode == 0x21
4667           || base_opcode == 0x29
4668           || base_opcode == 0x31
4669           || base_opcode == 0x39
4670           || (base_opcode | 2) == 0x87))
4671     return 1;
4672
4673   /* xadd.  */
4674   if (i.tm.opcode_modifier.opcodespace == SPACE_0F
4675       && base_opcode == 0xc1)
4676     return 1;
4677
4678   /* Check for load instruction.  */
4679   return (i.types[dest].bitfield.class != ClassNone
4680           || i.types[dest].bitfield.instance == Accum);
4681 }
4682
4683 /* Output lfence, 0xfaee8, after instruction.  */
4684
4685 static void
4686 insert_lfence_after (void)
4687 {
4688   if (lfence_after_load && load_insn_p ())
4689     {
4690       /* There are also two REP string instructions that require
4691          special treatment. Specifically, the compare string (CMPS)
4692          and scan string (SCAS) instructions set EFLAGS in a manner
4693          that depends on the data being compared/scanned. When used
4694          with a REP prefix, the number of iterations may therefore
4695          vary depending on this data. If the data is a program secret
4696          chosen by the adversary using an LVI method,
4697          then this data-dependent behavior may leak some aspect
4698          of the secret.  */
4699       if (((i.tm.base_opcode | 0x1) == 0xa7
4700            || (i.tm.base_opcode | 0x1) == 0xaf)
4701           && i.prefix[REP_PREFIX])
4702         {
4703             as_warn (_("`%s` changes flags which would affect control flow behavior"),
4704                      i.tm.name);
4705         }
4706       char *p = frag_more (3);
4707       *p++ = 0xf;
4708       *p++ = 0xae;
4709       *p = 0xe8;
4710     }
4711 }
4712
4713 /* Output lfence, 0xfaee8, before instruction.  */
4714
4715 static void
4716 insert_lfence_before (void)
4717 {
4718   char *p;
4719
4720   if (i.tm.opcode_modifier.opcodespace != SPACE_BASE)
4721     return;
4722
4723   if (i.tm.base_opcode == 0xff
4724       && (i.tm.extension_opcode == 2 || i.tm.extension_opcode == 4))
4725     {
4726       /* Insert lfence before indirect branch if needed.  */
4727
4728       if (lfence_before_indirect_branch == lfence_branch_none)
4729         return;
4730
4731       if (i.operands != 1)
4732         abort ();
4733
4734       if (i.reg_operands == 1)
4735         {
4736           /* Indirect branch via register.  Don't insert lfence with
4737              -mlfence-after-load=yes.  */
4738           if (lfence_after_load
4739               || lfence_before_indirect_branch == lfence_branch_memory)
4740             return;
4741         }
4742       else if (i.mem_operands == 1
4743                && lfence_before_indirect_branch != lfence_branch_register)
4744         {
4745           as_warn (_("indirect `%s` with memory operand should be avoided"),
4746                    i.tm.name);
4747           return;
4748         }
4749       else
4750         return;
4751
4752       if (last_insn.kind != last_insn_other
4753           && last_insn.seg == now_seg)
4754         {
4755           as_warn_where (last_insn.file, last_insn.line,
4756                          _("`%s` skips -mlfence-before-indirect-branch on `%s`"),
4757                          last_insn.name, i.tm.name);
4758           return;
4759         }
4760
4761       p = frag_more (3);
4762       *p++ = 0xf;
4763       *p++ = 0xae;
4764       *p = 0xe8;
4765       return;
4766     }
4767
4768   /* Output or/not/shl and lfence before near ret.  */
4769   if (lfence_before_ret != lfence_before_ret_none
4770       && (i.tm.base_opcode == 0xc2
4771           || i.tm.base_opcode == 0xc3))
4772     {
4773       if (last_insn.kind != last_insn_other
4774           && last_insn.seg == now_seg)
4775         {
4776           as_warn_where (last_insn.file, last_insn.line,
4777                          _("`%s` skips -mlfence-before-ret on `%s`"),
4778                          last_insn.name, i.tm.name);
4779           return;
4780         }
4781
4782       /* Near ret ingore operand size override under CPU64.  */
4783       char prefix = flag_code == CODE_64BIT
4784                     ? 0x48
4785                     : i.prefix[DATA_PREFIX] ? 0x66 : 0x0;
4786
4787       if (lfence_before_ret == lfence_before_ret_not)
4788         {
4789           /* not: 0xf71424, may add prefix
4790              for operand size override or 64-bit code.  */
4791           p = frag_more ((prefix ? 2 : 0) + 6 + 3);
4792           if (prefix)
4793             *p++ = prefix;
4794           *p++ = 0xf7;
4795           *p++ = 0x14;
4796           *p++ = 0x24;
4797           if (prefix)
4798             *p++ = prefix;
4799           *p++ = 0xf7;
4800           *p++ = 0x14;
4801           *p++ = 0x24;
4802         }
4803       else
4804         {
4805           p = frag_more ((prefix ? 1 : 0) + 4 + 3);
4806           if (prefix)
4807             *p++ = prefix;
4808           if (lfence_before_ret == lfence_before_ret_or)
4809             {
4810               /* or: 0x830c2400, may add prefix
4811                  for operand size override or 64-bit code.  */
4812               *p++ = 0x83;
4813               *p++ = 0x0c;
4814             }
4815           else
4816             {
4817               /* shl: 0xc1242400, may add prefix
4818                  for operand size override or 64-bit code.  */
4819               *p++ = 0xc1;
4820               *p++ = 0x24;
4821             }
4822
4823           *p++ = 0x24;
4824           *p++ = 0x0;
4825         }
4826
4827       *p++ = 0xf;
4828       *p++ = 0xae;
4829       *p = 0xe8;
4830     }
4831 }
4832
4833 /* This is the guts of the machine-dependent assembler.  LINE points to a
4834    machine dependent instruction.  This function is supposed to emit
4835    the frags/bytes it assembles to.  */
4836
4837 void
4838 md_assemble (char *line)
4839 {
4840   unsigned int j;
4841   char mnemonic[MAX_MNEM_SIZE], mnem_suffix;
4842   const insn_template *t;
4843
4844   /* Initialize globals.  */
4845   memset (&i, '\0', sizeof (i));
4846   i.rounding.type = rc_none;
4847   for (j = 0; j < MAX_OPERANDS; j++)
4848     i.reloc[j] = NO_RELOC;
4849   memset (disp_expressions, '\0', sizeof (disp_expressions));
4850   memset (im_expressions, '\0', sizeof (im_expressions));
4851   save_stack_p = save_stack;
4852
4853   /* First parse an instruction mnemonic & call i386_operand for the operands.
4854      We assume that the scrubber has arranged it so that line[0] is the valid
4855      start of a (possibly prefixed) mnemonic.  */
4856
4857   line = parse_insn (line, mnemonic);
4858   if (line == NULL)
4859     return;
4860   mnem_suffix = i.suffix;
4861
4862   line = parse_operands (line, mnemonic);
4863   this_operand = -1;
4864   xfree (i.memop1_string);
4865   i.memop1_string = NULL;
4866   if (line == NULL)
4867     return;
4868
4869   /* Now we've parsed the mnemonic into a set of templates, and have the
4870      operands at hand.  */
4871
4872   /* All Intel opcodes have reversed operands except for "bound", "enter",
4873      "invlpg*", "monitor*", "mwait*", "tpause", "umwait", "pvalidate",
4874      "rmpadjust", and "rmpupdate".  We also don't reverse intersegment "jmp"
4875      and "call" instructions with 2 immediate operands so that the immediate
4876      segment precedes the offset consistently in Intel and AT&T modes.  */
4877   if (intel_syntax
4878       && i.operands > 1
4879       && (strcmp (mnemonic, "bound") != 0)
4880       && (strncmp (mnemonic, "invlpg", 6) != 0)
4881       && !startswith (mnemonic, "monitor")
4882       && !startswith (mnemonic, "mwait")
4883       && (strcmp (mnemonic, "pvalidate") != 0)
4884       && !startswith (mnemonic, "rmp")
4885       && (strcmp (mnemonic, "tpause") != 0)
4886       && (strcmp (mnemonic, "umwait") != 0)
4887       && !(operand_type_check (i.types[0], imm)
4888            && operand_type_check (i.types[1], imm)))
4889     swap_operands ();
4890
4891   /* The order of the immediates should be reversed
4892      for 2 immediates extrq and insertq instructions */
4893   if (i.imm_operands == 2
4894       && (strcmp (mnemonic, "extrq") == 0
4895           || strcmp (mnemonic, "insertq") == 0))
4896       swap_2_operands (0, 1);
4897
4898   if (i.imm_operands)
4899     optimize_imm ();
4900
4901   if (i.disp_operands && !want_disp32 (current_templates->start))
4902     {
4903       for (j = 0; j < i.operands; ++j)
4904         {
4905           const expressionS *exp = i.op[j].disps;
4906
4907           if (!operand_type_check (i.types[j], disp))
4908             continue;
4909
4910           if (exp->X_op != O_constant)
4911             continue;
4912
4913           /* Since displacement is signed extended to 64bit, don't allow
4914              disp32 and turn off disp32s if they are out of range.  */
4915           i.types[j].bitfield.disp32 = 0;
4916           if (fits_in_signed_long (exp->X_add_number))
4917             continue;
4918
4919           i.types[j].bitfield.disp32s = 0;
4920           if (i.types[j].bitfield.baseindex)
4921             {
4922               as_bad (_("0x%" BFD_VMA_FMT "x out of range of signed 32bit displacement"),
4923                       exp->X_add_number);
4924               return;
4925             }
4926         }
4927     }
4928
4929   /* Don't optimize displacement for movabs since it only takes 64bit
4930      displacement.  */
4931   if (i.disp_operands
4932       && i.disp_encoding != disp_encoding_32bit
4933       && (flag_code != CODE_64BIT
4934           || strcmp (mnemonic, "movabs") != 0))
4935     optimize_disp ();
4936
4937   /* Next, we find a template that matches the given insn,
4938      making sure the overlap of the given operands types is consistent
4939      with the template operand types.  */
4940
4941   if (!(t = match_template (mnem_suffix)))
4942     return;
4943
4944   if (sse_check != check_none
4945       && !i.tm.opcode_modifier.noavx
4946       && !i.tm.cpu_flags.bitfield.cpuavx
4947       && !i.tm.cpu_flags.bitfield.cpuavx512f
4948       && (i.tm.cpu_flags.bitfield.cpusse
4949           || i.tm.cpu_flags.bitfield.cpusse2
4950           || i.tm.cpu_flags.bitfield.cpusse3
4951           || i.tm.cpu_flags.bitfield.cpussse3
4952           || i.tm.cpu_flags.bitfield.cpusse4_1
4953           || i.tm.cpu_flags.bitfield.cpusse4_2
4954           || i.tm.cpu_flags.bitfield.cpupclmul
4955           || i.tm.cpu_flags.bitfield.cpuaes
4956           || i.tm.cpu_flags.bitfield.cpusha
4957           || i.tm.cpu_flags.bitfield.cpugfni))
4958     {
4959       (sse_check == check_warning
4960        ? as_warn
4961        : as_bad) (_("SSE instruction `%s' is used"), i.tm.name);
4962     }
4963
4964   if (i.tm.opcode_modifier.fwait)
4965     if (!add_prefix (FWAIT_OPCODE))
4966       return;
4967
4968   /* Check if REP prefix is OK.  */
4969   if (i.rep_prefix && i.tm.opcode_modifier.prefixok != PrefixRep)
4970     {
4971       as_bad (_("invalid instruction `%s' after `%s'"),
4972                 i.tm.name, i.rep_prefix);
4973       return;
4974     }
4975
4976   /* Check for lock without a lockable instruction.  Destination operand
4977      must be memory unless it is xchg (0x86).  */
4978   if (i.prefix[LOCK_PREFIX]
4979       && (i.tm.opcode_modifier.prefixok < PrefixLock
4980           || i.mem_operands == 0
4981           || (i.tm.base_opcode != 0x86
4982               && !(i.flags[i.operands - 1] & Operand_Mem))))
4983     {
4984       as_bad (_("expecting lockable instruction after `lock'"));
4985       return;
4986     }
4987
4988   /* Check for data size prefix on VEX/XOP/EVEX encoded and SIMD insns.  */
4989   if (i.prefix[DATA_PREFIX]
4990       && (is_any_vex_encoding (&i.tm)
4991           || i.tm.operand_types[i.imm_operands].bitfield.class >= RegMMX
4992           || i.tm.operand_types[i.imm_operands + 1].bitfield.class >= RegMMX))
4993     {
4994       as_bad (_("data size prefix invalid with `%s'"), i.tm.name);
4995       return;
4996     }
4997
4998   /* Check if HLE prefix is OK.  */
4999   if (i.hle_prefix && !check_hle ())
5000     return;
5001
5002   /* Check BND prefix.  */
5003   if (i.bnd_prefix && !i.tm.opcode_modifier.bndprefixok)
5004     as_bad (_("expecting valid branch instruction after `bnd'"));
5005
5006   /* Check NOTRACK prefix.  */
5007   if (i.notrack_prefix && i.tm.opcode_modifier.prefixok != PrefixNoTrack)
5008     as_bad (_("expecting indirect branch instruction after `notrack'"));
5009
5010   if (i.tm.cpu_flags.bitfield.cpumpx)
5011     {
5012       if (flag_code == CODE_64BIT && i.prefix[ADDR_PREFIX])
5013         as_bad (_("32-bit address isn't allowed in 64-bit MPX instructions."));
5014       else if (flag_code != CODE_16BIT
5015                ? i.prefix[ADDR_PREFIX]
5016                : i.mem_operands && !i.prefix[ADDR_PREFIX])
5017         as_bad (_("16-bit address isn't allowed in MPX instructions"));
5018     }
5019
5020   /* Insert BND prefix.  */
5021   if (add_bnd_prefix && i.tm.opcode_modifier.bndprefixok)
5022     {
5023       if (!i.prefix[BND_PREFIX])
5024         add_prefix (BND_PREFIX_OPCODE);
5025       else if (i.prefix[BND_PREFIX] != BND_PREFIX_OPCODE)
5026         {
5027           as_warn (_("replacing `rep'/`repe' prefix by `bnd'"));
5028           i.prefix[BND_PREFIX] = BND_PREFIX_OPCODE;
5029         }
5030     }
5031
5032   /* Check string instruction segment overrides.  */
5033   if (i.tm.opcode_modifier.isstring >= IS_STRING_ES_OP0)
5034     {
5035       gas_assert (i.mem_operands);
5036       if (!check_string ())
5037         return;
5038       i.disp_operands = 0;
5039     }
5040
5041   if (optimize && !i.no_optimize && i.tm.opcode_modifier.optimize)
5042     optimize_encoding ();
5043
5044   if (!process_suffix ())
5045     return;
5046
5047   /* Update operand types and check extended states.  */
5048   for (j = 0; j < i.operands; j++)
5049     {
5050       i.types[j] = operand_type_and (i.types[j], i.tm.operand_types[j]);
5051       switch (i.tm.operand_types[j].bitfield.class)
5052         {
5053         default:
5054           break;
5055         case RegMMX:
5056           i.xstate |= xstate_mmx;
5057           break;
5058         case RegMask:
5059           i.xstate |= xstate_mask;
5060           break;
5061         case RegSIMD:
5062           if (i.tm.operand_types[j].bitfield.tmmword)
5063             i.xstate |= xstate_tmm;
5064           else if (i.tm.operand_types[j].bitfield.zmmword)
5065             i.xstate |= xstate_zmm;
5066           else if (i.tm.operand_types[j].bitfield.ymmword)
5067             i.xstate |= xstate_ymm;
5068           else if (i.tm.operand_types[j].bitfield.xmmword)
5069             i.xstate |= xstate_xmm;
5070           break;
5071         }
5072     }
5073
5074   /* Make still unresolved immediate matches conform to size of immediate
5075      given in i.suffix.  */
5076   if (!finalize_imm ())
5077     return;
5078
5079   if (i.types[0].bitfield.imm1)
5080     i.imm_operands = 0; /* kludge for shift insns.  */
5081
5082   /* We only need to check those implicit registers for instructions
5083      with 3 operands or less.  */
5084   if (i.operands <= 3)
5085     for (j = 0; j < i.operands; j++)
5086       if (i.types[j].bitfield.instance != InstanceNone
5087           && !i.types[j].bitfield.xmmword)
5088         i.reg_operands--;
5089
5090   /* For insns with operands there are more diddles to do to the opcode.  */
5091   if (i.operands)
5092     {
5093       if (!process_operands ())
5094         return;
5095     }
5096   else if (!quiet_warnings && i.tm.opcode_modifier.ugh)
5097     {
5098       /* UnixWare fsub no args is alias for fsubp, fadd -> faddp, etc.  */
5099       as_warn (_("translating to `%sp'"), i.tm.name);
5100     }
5101
5102   if (is_any_vex_encoding (&i.tm))
5103     {
5104       if (!cpu_arch_flags.bitfield.cpui286)
5105         {
5106           as_bad (_("instruction `%s' isn't supported outside of protected mode."),
5107                   i.tm.name);
5108           return;
5109         }
5110
5111       /* Check for explicit REX prefix.  */
5112       if (i.prefix[REX_PREFIX] || i.rex_encoding)
5113         {
5114           as_bad (_("REX prefix invalid with `%s'"), i.tm.name);
5115           return;
5116         }
5117
5118       if (i.tm.opcode_modifier.vex)
5119         build_vex_prefix (t);
5120       else
5121         build_evex_prefix ();
5122
5123       /* The individual REX.RXBW bits got consumed.  */
5124       i.rex &= REX_OPCODE;
5125     }
5126
5127   /* Handle conversion of 'int $3' --> special int3 insn.  XOP or FMA4
5128      instructions may define INT_OPCODE as well, so avoid this corner
5129      case for those instructions that use MODRM.  */
5130   if (i.tm.opcode_modifier.opcodespace == SPACE_BASE
5131       && i.tm.base_opcode == INT_OPCODE
5132       && !i.tm.opcode_modifier.modrm
5133       && i.op[0].imms->X_add_number == 3)
5134     {
5135       i.tm.base_opcode = INT3_OPCODE;
5136       i.imm_operands = 0;
5137     }
5138
5139   if ((i.tm.opcode_modifier.jump == JUMP
5140        || i.tm.opcode_modifier.jump == JUMP_BYTE
5141        || i.tm.opcode_modifier.jump == JUMP_DWORD)
5142       && i.op[0].disps->X_op == O_constant)
5143     {
5144       /* Convert "jmp constant" (and "call constant") to a jump (call) to
5145          the absolute address given by the constant.  Since ix86 jumps and
5146          calls are pc relative, we need to generate a reloc.  */
5147       i.op[0].disps->X_add_symbol = &abs_symbol;
5148       i.op[0].disps->X_op = O_symbol;
5149     }
5150
5151   /* For 8 bit registers we need an empty rex prefix.  Also if the
5152      instruction already has a prefix, we need to convert old
5153      registers to new ones.  */
5154
5155   if ((i.types[0].bitfield.class == Reg && i.types[0].bitfield.byte
5156        && (i.op[0].regs->reg_flags & RegRex64) != 0)
5157       || (i.types[1].bitfield.class == Reg && i.types[1].bitfield.byte
5158           && (i.op[1].regs->reg_flags & RegRex64) != 0)
5159       || (((i.types[0].bitfield.class == Reg && i.types[0].bitfield.byte)
5160            || (i.types[1].bitfield.class == Reg && i.types[1].bitfield.byte))
5161           && i.rex != 0))
5162     {
5163       int x;
5164
5165       i.rex |= REX_OPCODE;
5166       for (x = 0; x < 2; x++)
5167         {
5168           /* Look for 8 bit operand that uses old registers.  */
5169           if (i.types[x].bitfield.class == Reg && i.types[x].bitfield.byte
5170               && (i.op[x].regs->reg_flags & RegRex64) == 0)
5171             {
5172               gas_assert (!(i.op[x].regs->reg_flags & RegRex));
5173               /* In case it is "hi" register, give up.  */
5174               if (i.op[x].regs->reg_num > 3)
5175                 as_bad (_("can't encode register '%s%s' in an "
5176                           "instruction requiring REX prefix."),
5177                         register_prefix, i.op[x].regs->reg_name);
5178
5179               /* Otherwise it is equivalent to the extended register.
5180                  Since the encoding doesn't change this is merely
5181                  cosmetic cleanup for debug output.  */
5182
5183               i.op[x].regs = i.op[x].regs + 8;
5184             }
5185         }
5186     }
5187
5188   if (i.rex == 0 && i.rex_encoding)
5189     {
5190       /* Check if we can add a REX_OPCODE byte.  Look for 8 bit operand
5191          that uses legacy register.  If it is "hi" register, don't add
5192          the REX_OPCODE byte.  */
5193       int x;
5194       for (x = 0; x < 2; x++)
5195         if (i.types[x].bitfield.class == Reg
5196             && i.types[x].bitfield.byte
5197             && (i.op[x].regs->reg_flags & RegRex64) == 0
5198             && i.op[x].regs->reg_num > 3)
5199           {
5200             gas_assert (!(i.op[x].regs->reg_flags & RegRex));
5201             i.rex_encoding = false;
5202             break;
5203           }
5204
5205       if (i.rex_encoding)
5206         i.rex = REX_OPCODE;
5207     }
5208
5209   if (i.rex != 0)
5210     add_prefix (REX_OPCODE | i.rex);
5211
5212   insert_lfence_before ();
5213
5214   /* We are ready to output the insn.  */
5215   output_insn ();
5216
5217   insert_lfence_after ();
5218
5219   last_insn.seg = now_seg;
5220
5221   if (i.tm.opcode_modifier.isprefix)
5222     {
5223       last_insn.kind = last_insn_prefix;
5224       last_insn.name = i.tm.name;
5225       last_insn.file = as_where (&last_insn.line);
5226     }
5227   else
5228     last_insn.kind = last_insn_other;
5229 }
5230
5231 static char *
5232 parse_insn (char *line, char *mnemonic)
5233 {
5234   char *l = line;
5235   char *token_start = l;
5236   char *mnem_p;
5237   int supported;
5238   const insn_template *t;
5239   char *dot_p = NULL;
5240
5241   while (1)
5242     {
5243       mnem_p = mnemonic;
5244       while ((*mnem_p = mnemonic_chars[(unsigned char) *l]) != 0)
5245         {
5246           if (*mnem_p == '.')
5247             dot_p = mnem_p;
5248           mnem_p++;
5249           if (mnem_p >= mnemonic + MAX_MNEM_SIZE)
5250             {
5251               as_bad (_("no such instruction: `%s'"), token_start);
5252               return NULL;
5253             }
5254           l++;
5255         }
5256       if (!is_space_char (*l)
5257           && *l != END_OF_INSN
5258           && (intel_syntax
5259               || (*l != PREFIX_SEPARATOR
5260                   && *l != ',')))
5261         {
5262           as_bad (_("invalid character %s in mnemonic"),
5263                   output_invalid (*l));
5264           return NULL;
5265         }
5266       if (token_start == l)
5267         {
5268           if (!intel_syntax && *l == PREFIX_SEPARATOR)
5269             as_bad (_("expecting prefix; got nothing"));
5270           else
5271             as_bad (_("expecting mnemonic; got nothing"));
5272           return NULL;
5273         }
5274
5275       /* Look up instruction (or prefix) via hash table.  */
5276       current_templates = (const templates *) str_hash_find (op_hash, mnemonic);
5277
5278       if (*l != END_OF_INSN
5279           && (!is_space_char (*l) || l[1] != END_OF_INSN)
5280           && current_templates
5281           && current_templates->start->opcode_modifier.isprefix)
5282         {
5283           if (!cpu_flags_check_cpu64 (current_templates->start->cpu_flags))
5284             {
5285               as_bad ((flag_code != CODE_64BIT
5286                        ? _("`%s' is only supported in 64-bit mode")
5287                        : _("`%s' is not supported in 64-bit mode")),
5288                       current_templates->start->name);
5289               return NULL;
5290             }
5291           /* If we are in 16-bit mode, do not allow addr16 or data16.
5292              Similarly, in 32-bit mode, do not allow addr32 or data32.  */
5293           if ((current_templates->start->opcode_modifier.size == SIZE16
5294                || current_templates->start->opcode_modifier.size == SIZE32)
5295               && flag_code != CODE_64BIT
5296               && ((current_templates->start->opcode_modifier.size == SIZE32)
5297                   ^ (flag_code == CODE_16BIT)))
5298             {
5299               as_bad (_("redundant %s prefix"),
5300                       current_templates->start->name);
5301               return NULL;
5302             }
5303
5304           if (current_templates->start->base_opcode == PSEUDO_PREFIX)
5305             {
5306               /* Handle pseudo prefixes.  */
5307               switch (current_templates->start->extension_opcode)
5308                 {
5309                 case Prefix_Disp8:
5310                   /* {disp8} */
5311                   i.disp_encoding = disp_encoding_8bit;
5312                   break;
5313                 case Prefix_Disp16:
5314                   /* {disp16} */
5315                   i.disp_encoding = disp_encoding_16bit;
5316                   break;
5317                 case Prefix_Disp32:
5318                   /* {disp32} */
5319                   i.disp_encoding = disp_encoding_32bit;
5320                   break;
5321                 case Prefix_Load:
5322                   /* {load} */
5323                   i.dir_encoding = dir_encoding_load;
5324                   break;
5325                 case Prefix_Store:
5326                   /* {store} */
5327                   i.dir_encoding = dir_encoding_store;
5328                   break;
5329                 case Prefix_VEX:
5330                   /* {vex} */
5331                   i.vec_encoding = vex_encoding_vex;
5332                   break;
5333                 case Prefix_VEX3:
5334                   /* {vex3} */
5335                   i.vec_encoding = vex_encoding_vex3;
5336                   break;
5337                 case Prefix_EVEX:
5338                   /* {evex} */
5339                   i.vec_encoding = vex_encoding_evex;
5340                   break;
5341                 case Prefix_REX:
5342                   /* {rex} */
5343                   i.rex_encoding = true;
5344                   break;
5345                 case Prefix_NoOptimize:
5346                   /* {nooptimize} */
5347                   i.no_optimize = true;
5348                   break;
5349                 default:
5350                   abort ();
5351                 }
5352             }
5353           else
5354             {
5355               /* Add prefix, checking for repeated prefixes.  */
5356               switch (add_prefix (current_templates->start->base_opcode))
5357                 {
5358                 case PREFIX_EXIST:
5359                   return NULL;
5360                 case PREFIX_DS:
5361                   if (current_templates->start->cpu_flags.bitfield.cpuibt)
5362                     i.notrack_prefix = current_templates->start->name;
5363                   break;
5364                 case PREFIX_REP:
5365                   if (current_templates->start->cpu_flags.bitfield.cpuhle)
5366                     i.hle_prefix = current_templates->start->name;
5367                   else if (current_templates->start->cpu_flags.bitfield.cpumpx)
5368                     i.bnd_prefix = current_templates->start->name;
5369                   else
5370                     i.rep_prefix = current_templates->start->name;
5371                   break;
5372                 default:
5373                   break;
5374                 }
5375             }
5376           /* Skip past PREFIX_SEPARATOR and reset token_start.  */
5377           token_start = ++l;
5378         }
5379       else
5380         break;
5381     }
5382
5383   if (!current_templates)
5384     {
5385       /* Deprecated functionality (new code should use pseudo-prefixes instead):
5386          Check if we should swap operand or force 32bit displacement in
5387          encoding.  */
5388       if (mnem_p - 2 == dot_p && dot_p[1] == 's')
5389         i.dir_encoding = dir_encoding_swap;
5390       else if (mnem_p - 3 == dot_p
5391                && dot_p[1] == 'd'
5392                && dot_p[2] == '8')
5393         i.disp_encoding = disp_encoding_8bit;
5394       else if (mnem_p - 4 == dot_p
5395                && dot_p[1] == 'd'
5396                && dot_p[2] == '3'
5397                && dot_p[3] == '2')
5398         i.disp_encoding = disp_encoding_32bit;
5399       else
5400         goto check_suffix;
5401       mnem_p = dot_p;
5402       *dot_p = '\0';
5403       current_templates = (const templates *) str_hash_find (op_hash, mnemonic);
5404     }
5405
5406   if (!current_templates)
5407     {
5408     check_suffix:
5409       if (mnem_p > mnemonic)
5410         {
5411           /* See if we can get a match by trimming off a suffix.  */
5412           switch (mnem_p[-1])
5413             {
5414             case WORD_MNEM_SUFFIX:
5415               if (intel_syntax && (intel_float_operand (mnemonic) & 2))
5416                 i.suffix = SHORT_MNEM_SUFFIX;
5417               else
5418                 /* Fall through.  */
5419               case BYTE_MNEM_SUFFIX:
5420               case QWORD_MNEM_SUFFIX:
5421                 i.suffix = mnem_p[-1];
5422               mnem_p[-1] = '\0';
5423               current_templates
5424                 = (const templates *) str_hash_find (op_hash, mnemonic);
5425               break;
5426             case SHORT_MNEM_SUFFIX:
5427             case LONG_MNEM_SUFFIX:
5428               if (!intel_syntax)
5429                 {
5430                   i.suffix = mnem_p[-1];
5431                   mnem_p[-1] = '\0';
5432                   current_templates
5433                     = (const templates *) str_hash_find (op_hash, mnemonic);
5434                 }
5435               break;
5436
5437               /* Intel Syntax.  */
5438             case 'd':
5439               if (intel_syntax)
5440                 {
5441                   if (intel_float_operand (mnemonic) == 1)
5442                     i.suffix = SHORT_MNEM_SUFFIX;
5443                   else
5444                     i.suffix = LONG_MNEM_SUFFIX;
5445                   mnem_p[-1] = '\0';
5446                   current_templates
5447                     = (const templates *) str_hash_find (op_hash, mnemonic);
5448                 }
5449               break;
5450             }
5451         }
5452
5453       if (!current_templates)
5454         {
5455           as_bad (_("no such instruction: `%s'"), token_start);
5456           return NULL;
5457         }
5458     }
5459
5460   if (current_templates->start->opcode_modifier.jump == JUMP
5461       || current_templates->start->opcode_modifier.jump == JUMP_BYTE)
5462     {
5463       /* Check for a branch hint.  We allow ",pt" and ",pn" for
5464          predict taken and predict not taken respectively.
5465          I'm not sure that branch hints actually do anything on loop
5466          and jcxz insns (JumpByte) for current Pentium4 chips.  They
5467          may work in the future and it doesn't hurt to accept them
5468          now.  */
5469       if (l[0] == ',' && l[1] == 'p')
5470         {
5471           if (l[2] == 't')
5472             {
5473               if (!add_prefix (DS_PREFIX_OPCODE))
5474                 return NULL;
5475               l += 3;
5476             }
5477           else if (l[2] == 'n')
5478             {
5479               if (!add_prefix (CS_PREFIX_OPCODE))
5480                 return NULL;
5481               l += 3;
5482             }
5483         }
5484     }
5485   /* Any other comma loses.  */
5486   if (*l == ',')
5487     {
5488       as_bad (_("invalid character %s in mnemonic"),
5489               output_invalid (*l));
5490       return NULL;
5491     }
5492
5493   /* Check if instruction is supported on specified architecture.  */
5494   supported = 0;
5495   for (t = current_templates->start; t < current_templates->end; ++t)
5496     {
5497       supported |= cpu_flags_match (t);
5498       if (supported == CPU_FLAGS_PERFECT_MATCH)
5499         {
5500           if (!cpu_arch_flags.bitfield.cpui386 && (flag_code != CODE_16BIT))
5501             as_warn (_("use .code16 to ensure correct addressing mode"));
5502
5503           return l;
5504         }
5505     }
5506
5507   if (!(supported & CPU_FLAGS_64BIT_MATCH))
5508     as_bad (flag_code == CODE_64BIT
5509             ? _("`%s' is not supported in 64-bit mode")
5510             : _("`%s' is only supported in 64-bit mode"),
5511             current_templates->start->name);
5512   else
5513     as_bad (_("`%s' is not supported on `%s%s'"),
5514             current_templates->start->name,
5515             cpu_arch_name ? cpu_arch_name : default_arch,
5516             cpu_sub_arch_name ? cpu_sub_arch_name : "");
5517
5518   return NULL;
5519 }
5520
5521 static char *
5522 parse_operands (char *l, const char *mnemonic)
5523 {
5524   char *token_start;
5525
5526   /* 1 if operand is pending after ','.  */
5527   unsigned int expecting_operand = 0;
5528
5529   while (*l != END_OF_INSN)
5530     {
5531       /* Non-zero if operand parens not balanced.  */
5532       unsigned int paren_not_balanced = 0;
5533       /* True if inside double quotes.  */
5534       bool in_quotes = false;
5535
5536       /* Skip optional white space before operand.  */
5537       if (is_space_char (*l))
5538         ++l;
5539       if (!is_operand_char (*l) && *l != END_OF_INSN && *l != '"')
5540         {
5541           as_bad (_("invalid character %s before operand %d"),
5542                   output_invalid (*l),
5543                   i.operands + 1);
5544           return NULL;
5545         }
5546       token_start = l;  /* After white space.  */
5547       while (in_quotes || paren_not_balanced || *l != ',')
5548         {
5549           if (*l == END_OF_INSN)
5550             {
5551               if (in_quotes)
5552                 {
5553                   as_bad (_("unbalanced double quotes in operand %d."),
5554                           i.operands + 1);
5555                   return NULL;
5556                 }
5557               if (paren_not_balanced)
5558                 {
5559                   know (!intel_syntax);
5560                   as_bad (_("unbalanced parenthesis in operand %d."),
5561                           i.operands + 1);
5562                   return NULL;
5563                 }
5564               else
5565                 break;  /* we are done */
5566             }
5567           else if (*l == '\\' && l[1] == '"')
5568             ++l;
5569           else if (*l == '"')
5570             in_quotes = !in_quotes;
5571           else if (!in_quotes && !is_operand_char (*l) && !is_space_char (*l))
5572             {
5573               as_bad (_("invalid character %s in operand %d"),
5574                       output_invalid (*l),
5575                       i.operands + 1);
5576               return NULL;
5577             }
5578           if (!intel_syntax && !in_quotes)
5579             {
5580               if (*l == '(')
5581                 ++paren_not_balanced;
5582               if (*l == ')')
5583                 --paren_not_balanced;
5584             }
5585           l++;
5586         }
5587       if (l != token_start)
5588         {                       /* Yes, we've read in another operand.  */
5589           unsigned int operand_ok;
5590           this_operand = i.operands++;
5591           if (i.operands > MAX_OPERANDS)
5592             {
5593               as_bad (_("spurious operands; (%d operands/instruction max)"),
5594                       MAX_OPERANDS);
5595               return NULL;
5596             }
5597           i.types[this_operand].bitfield.unspecified = 1;
5598           /* Now parse operand adding info to 'i' as we go along.  */
5599           END_STRING_AND_SAVE (l);
5600
5601           if (i.mem_operands > 1)
5602             {
5603               as_bad (_("too many memory references for `%s'"),
5604                       mnemonic);
5605               return 0;
5606             }
5607
5608           if (intel_syntax)
5609             operand_ok =
5610               i386_intel_operand (token_start,
5611                                   intel_float_operand (mnemonic));
5612           else
5613             operand_ok = i386_att_operand (token_start);
5614
5615           RESTORE_END_STRING (l);
5616           if (!operand_ok)
5617             return NULL;
5618         }
5619       else
5620         {
5621           if (expecting_operand)
5622             {
5623             expecting_operand_after_comma:
5624               as_bad (_("expecting operand after ','; got nothing"));
5625               return NULL;
5626             }
5627           if (*l == ',')
5628             {
5629               as_bad (_("expecting operand before ','; got nothing"));
5630               return NULL;
5631             }
5632         }
5633
5634       /* Now *l must be either ',' or END_OF_INSN.  */
5635       if (*l == ',')
5636         {
5637           if (*++l == END_OF_INSN)
5638             {
5639               /* Just skip it, if it's \n complain.  */
5640               goto expecting_operand_after_comma;
5641             }
5642           expecting_operand = 1;
5643         }
5644     }
5645   return l;
5646 }
5647
5648 static void
5649 swap_2_operands (unsigned int xchg1, unsigned int xchg2)
5650 {
5651   union i386_op temp_op;
5652   i386_operand_type temp_type;
5653   unsigned int temp_flags;
5654   enum bfd_reloc_code_real temp_reloc;
5655
5656   temp_type = i.types[xchg2];
5657   i.types[xchg2] = i.types[xchg1];
5658   i.types[xchg1] = temp_type;
5659
5660   temp_flags = i.flags[xchg2];
5661   i.flags[xchg2] = i.flags[xchg1];
5662   i.flags[xchg1] = temp_flags;
5663
5664   temp_op = i.op[xchg2];
5665   i.op[xchg2] = i.op[xchg1];
5666   i.op[xchg1] = temp_op;
5667
5668   temp_reloc = i.reloc[xchg2];
5669   i.reloc[xchg2] = i.reloc[xchg1];
5670   i.reloc[xchg1] = temp_reloc;
5671
5672   if (i.mask.reg)
5673     {
5674       if (i.mask.operand == xchg1)
5675         i.mask.operand = xchg2;
5676       else if (i.mask.operand == xchg2)
5677         i.mask.operand = xchg1;
5678     }
5679   if (i.broadcast.type)
5680     {
5681       if (i.broadcast.operand == xchg1)
5682         i.broadcast.operand = xchg2;
5683       else if (i.broadcast.operand == xchg2)
5684         i.broadcast.operand = xchg1;
5685     }
5686   if (i.rounding.type != rc_none)
5687     {
5688       if (i.rounding.operand == xchg1)
5689         i.rounding.operand = xchg2;
5690       else if (i.rounding.operand == xchg2)
5691         i.rounding.operand = xchg1;
5692     }
5693 }
5694
5695 static void
5696 swap_operands (void)
5697 {
5698   switch (i.operands)
5699     {
5700     case 5:
5701     case 4:
5702       swap_2_operands (1, i.operands - 2);
5703       /* Fall through.  */
5704     case 3:
5705     case 2:
5706       swap_2_operands (0, i.operands - 1);
5707       break;
5708     default:
5709       abort ();
5710     }
5711
5712   if (i.mem_operands == 2)
5713     {
5714       const reg_entry *temp_seg;
5715       temp_seg = i.seg[0];
5716       i.seg[0] = i.seg[1];
5717       i.seg[1] = temp_seg;
5718     }
5719 }
5720
5721 /* Try to ensure constant immediates are represented in the smallest
5722    opcode possible.  */
5723 static void
5724 optimize_imm (void)
5725 {
5726   char guess_suffix = 0;
5727   int op;
5728
5729   if (i.suffix)
5730     guess_suffix = i.suffix;
5731   else if (i.reg_operands)
5732     {
5733       /* Figure out a suffix from the last register operand specified.
5734          We can't do this properly yet, i.e. excluding special register
5735          instances, but the following works for instructions with
5736          immediates.  In any case, we can't set i.suffix yet.  */
5737       for (op = i.operands; --op >= 0;)
5738         if (i.types[op].bitfield.class != Reg)
5739           continue;
5740         else if (i.types[op].bitfield.byte)
5741           {
5742             guess_suffix = BYTE_MNEM_SUFFIX;
5743             break;
5744           }
5745         else if (i.types[op].bitfield.word)
5746           {
5747             guess_suffix = WORD_MNEM_SUFFIX;
5748             break;
5749           }
5750         else if (i.types[op].bitfield.dword)
5751           {
5752             guess_suffix = LONG_MNEM_SUFFIX;
5753             break;
5754           }
5755         else if (i.types[op].bitfield.qword)
5756           {
5757             guess_suffix = QWORD_MNEM_SUFFIX;
5758             break;
5759           }
5760     }
5761   else if ((flag_code == CODE_16BIT) ^ (i.prefix[DATA_PREFIX] != 0))
5762     guess_suffix = WORD_MNEM_SUFFIX;
5763
5764   for (op = i.operands; --op >= 0;)
5765     if (operand_type_check (i.types[op], imm))
5766       {
5767         switch (i.op[op].imms->X_op)
5768           {
5769           case O_constant:
5770             /* If a suffix is given, this operand may be shortened.  */
5771             switch (guess_suffix)
5772               {
5773               case LONG_MNEM_SUFFIX:
5774                 i.types[op].bitfield.imm32 = 1;
5775                 i.types[op].bitfield.imm64 = 1;
5776                 break;
5777               case WORD_MNEM_SUFFIX:
5778                 i.types[op].bitfield.imm16 = 1;
5779                 i.types[op].bitfield.imm32 = 1;
5780                 i.types[op].bitfield.imm32s = 1;
5781                 i.types[op].bitfield.imm64 = 1;
5782                 break;
5783               case BYTE_MNEM_SUFFIX:
5784                 i.types[op].bitfield.imm8 = 1;
5785                 i.types[op].bitfield.imm8s = 1;
5786                 i.types[op].bitfield.imm16 = 1;
5787                 i.types[op].bitfield.imm32 = 1;
5788                 i.types[op].bitfield.imm32s = 1;
5789                 i.types[op].bitfield.imm64 = 1;
5790                 break;
5791               }
5792
5793             /* If this operand is at most 16 bits, convert it
5794                to a signed 16 bit number before trying to see
5795                whether it will fit in an even smaller size.
5796                This allows a 16-bit operand such as $0xffe0 to
5797                be recognised as within Imm8S range.  */
5798             if ((i.types[op].bitfield.imm16)
5799                 && fits_in_unsigned_word (i.op[op].imms->X_add_number))
5800               {
5801                 i.op[op].imms->X_add_number = ((i.op[op].imms->X_add_number
5802                                                 ^ 0x8000) - 0x8000);
5803               }
5804 #ifdef BFD64
5805             /* Store 32-bit immediate in 64-bit for 64-bit BFD.  */
5806             if ((i.types[op].bitfield.imm32)
5807                 && fits_in_unsigned_long (i.op[op].imms->X_add_number))
5808               {
5809                 i.op[op].imms->X_add_number = ((i.op[op].imms->X_add_number
5810                                                 ^ ((offsetT) 1 << 31))
5811                                                - ((offsetT) 1 << 31));
5812               }
5813 #endif
5814             i.types[op]
5815               = operand_type_or (i.types[op],
5816                                  smallest_imm_type (i.op[op].imms->X_add_number));
5817
5818             /* We must avoid matching of Imm32 templates when 64bit
5819                only immediate is available.  */
5820             if (guess_suffix == QWORD_MNEM_SUFFIX)
5821               i.types[op].bitfield.imm32 = 0;
5822             break;
5823
5824           case O_absent:
5825           case O_register:
5826             abort ();
5827
5828             /* Symbols and expressions.  */
5829           default:
5830             /* Convert symbolic operand to proper sizes for matching, but don't
5831                prevent matching a set of insns that only supports sizes other
5832                than those matching the insn suffix.  */
5833             {
5834               i386_operand_type mask, allowed;
5835               const insn_template *t = current_templates->start;
5836
5837               operand_type_set (&mask, 0);
5838               allowed = t->operand_types[op];
5839
5840               while (++t < current_templates->end)
5841                 {
5842                   allowed = operand_type_and (allowed, anyimm);
5843                   allowed = operand_type_or (allowed, t->operand_types[op]);
5844                 }
5845               switch (guess_suffix)
5846                 {
5847                 case QWORD_MNEM_SUFFIX:
5848                   mask.bitfield.imm64 = 1;
5849                   mask.bitfield.imm32s = 1;
5850                   break;
5851                 case LONG_MNEM_SUFFIX:
5852                   mask.bitfield.imm32 = 1;
5853                   break;
5854                 case WORD_MNEM_SUFFIX:
5855                   mask.bitfield.imm16 = 1;
5856                   break;
5857                 case BYTE_MNEM_SUFFIX:
5858                   mask.bitfield.imm8 = 1;
5859                   break;
5860                 default:
5861                   break;
5862                 }
5863               allowed = operand_type_and (mask, allowed);
5864               if (!operand_type_all_zero (&allowed))
5865                 i.types[op] = operand_type_and (i.types[op], mask);
5866             }
5867             break;
5868           }
5869       }
5870 }
5871
5872 /* Try to use the smallest displacement type too.  */
5873 static void
5874 optimize_disp (void)
5875 {
5876   int op;
5877
5878   for (op = i.operands; --op >= 0;)
5879     if (operand_type_check (i.types[op], disp))
5880       {
5881         if (i.op[op].disps->X_op == O_constant)
5882           {
5883             offsetT op_disp = i.op[op].disps->X_add_number;
5884
5885             if (!op_disp && i.types[op].bitfield.baseindex)
5886               {
5887                 i.types[op].bitfield.disp8 = 0;
5888                 i.types[op].bitfield.disp16 = 0;
5889                 i.types[op].bitfield.disp32 = 0;
5890                 i.types[op].bitfield.disp32s = 0;
5891                 i.types[op].bitfield.disp64 = 0;
5892                 i.op[op].disps = 0;
5893                 i.disp_operands--;
5894                 continue;
5895               }
5896
5897             if (i.types[op].bitfield.disp16
5898                 && fits_in_unsigned_word (op_disp))
5899               {
5900                 /* If this operand is at most 16 bits, convert
5901                    to a signed 16 bit number and don't use 64bit
5902                    displacement.  */
5903                 op_disp = ((op_disp ^ 0x8000) - 0x8000);
5904                 i.types[op].bitfield.disp64 = 0;
5905               }
5906
5907 #ifdef BFD64
5908             /* Optimize 64-bit displacement to 32-bit for 64-bit BFD.  */
5909             if ((i.types[op].bitfield.disp32
5910                  || (flag_code == CODE_64BIT
5911                      && want_disp32 (current_templates->start)))
5912                 && fits_in_unsigned_long (op_disp))
5913               {
5914                 /* If this operand is at most 32 bits, convert
5915                    to a signed 32 bit number and don't use 64bit
5916                    displacement.  */
5917                 op_disp = (op_disp ^ ((offsetT) 1 << 31)) - ((addressT) 1 << 31);
5918                 i.types[op].bitfield.disp64 = 0;
5919                 i.types[op].bitfield.disp32 = 1;
5920               }
5921
5922             if (flag_code == CODE_64BIT && fits_in_signed_long (op_disp))
5923               {
5924                 i.types[op].bitfield.disp64 = 0;
5925                 i.types[op].bitfield.disp32s = 1;
5926               }
5927 #endif
5928             if ((i.types[op].bitfield.disp32
5929                  || i.types[op].bitfield.disp32s
5930                  || i.types[op].bitfield.disp16)
5931                 && fits_in_disp8 (op_disp))
5932               i.types[op].bitfield.disp8 = 1;
5933
5934             i.op[op].disps->X_add_number = op_disp;
5935           }
5936         else if (i.reloc[op] == BFD_RELOC_386_TLS_DESC_CALL
5937                  || i.reloc[op] == BFD_RELOC_X86_64_TLSDESC_CALL)
5938           {
5939             fix_new_exp (frag_now, frag_more (0) - frag_now->fr_literal, 0,
5940                          i.op[op].disps, 0, i.reloc[op]);
5941             i.types[op].bitfield.disp8 = 0;
5942             i.types[op].bitfield.disp16 = 0;
5943             i.types[op].bitfield.disp32 = 0;
5944             i.types[op].bitfield.disp32s = 0;
5945             i.types[op].bitfield.disp64 = 0;
5946           }
5947         else
5948           /* We only support 64bit displacement on constants.  */
5949           i.types[op].bitfield.disp64 = 0;
5950       }
5951 }
5952
5953 /* Return 1 if there is a match in broadcast bytes between operand
5954    GIVEN and instruction template T.   */
5955
5956 static INLINE int
5957 match_broadcast_size (const insn_template *t, unsigned int given)
5958 {
5959   return ((t->opcode_modifier.broadcast == BYTE_BROADCAST
5960            && i.types[given].bitfield.byte)
5961           || (t->opcode_modifier.broadcast == WORD_BROADCAST
5962               && i.types[given].bitfield.word)
5963           || (t->opcode_modifier.broadcast == DWORD_BROADCAST
5964               && i.types[given].bitfield.dword)
5965           || (t->opcode_modifier.broadcast == QWORD_BROADCAST
5966               && i.types[given].bitfield.qword));
5967 }
5968
5969 /* Check if operands are valid for the instruction.  */
5970
5971 static int
5972 check_VecOperands (const insn_template *t)
5973 {
5974   unsigned int op;
5975   i386_cpu_flags cpu;
5976
5977   /* Templates allowing for ZMMword as well as YMMword and/or XMMword for
5978      any one operand are implicity requiring AVX512VL support if the actual
5979      operand size is YMMword or XMMword.  Since this function runs after
5980      template matching, there's no need to check for YMMword/XMMword in
5981      the template.  */
5982   cpu = cpu_flags_and (t->cpu_flags, avx512);
5983   if (!cpu_flags_all_zero (&cpu)
5984       && !t->cpu_flags.bitfield.cpuavx512vl
5985       && !cpu_arch_flags.bitfield.cpuavx512vl)
5986     {
5987       for (op = 0; op < t->operands; ++op)
5988         {
5989           if (t->operand_types[op].bitfield.zmmword
5990               && (i.types[op].bitfield.ymmword
5991                   || i.types[op].bitfield.xmmword))
5992             {
5993               i.error = unsupported;
5994               return 1;
5995             }
5996         }
5997     }
5998
5999   /* Without VSIB byte, we can't have a vector register for index.  */
6000   if (!t->opcode_modifier.sib
6001       && i.index_reg
6002       && (i.index_reg->reg_type.bitfield.xmmword
6003           || i.index_reg->reg_type.bitfield.ymmword
6004           || i.index_reg->reg_type.bitfield.zmmword))
6005     {
6006       i.error = unsupported_vector_index_register;
6007       return 1;
6008     }
6009
6010   /* Check if default mask is allowed.  */
6011   if (t->opcode_modifier.nodefmask
6012       && (!i.mask.reg || i.mask.reg->reg_num == 0))
6013     {
6014       i.error = no_default_mask;
6015       return 1;
6016     }
6017
6018   /* For VSIB byte, we need a vector register for index, and all vector
6019      registers must be distinct.  */
6020   if (t->opcode_modifier.sib && t->opcode_modifier.sib != SIBMEM)
6021     {
6022       if (!i.index_reg
6023           || !((t->opcode_modifier.sib == VECSIB128
6024                 && i.index_reg->reg_type.bitfield.xmmword)
6025                || (t->opcode_modifier.sib == VECSIB256
6026                    && i.index_reg->reg_type.bitfield.ymmword)
6027                || (t->opcode_modifier.sib == VECSIB512
6028                    && i.index_reg->reg_type.bitfield.zmmword)))
6029       {
6030         i.error = invalid_vsib_address;
6031         return 1;
6032       }
6033
6034       gas_assert (i.reg_operands == 2 || i.mask.reg);
6035       if (i.reg_operands == 2 && !i.mask.reg)
6036         {
6037           gas_assert (i.types[0].bitfield.class == RegSIMD);
6038           gas_assert (i.types[0].bitfield.xmmword
6039                       || i.types[0].bitfield.ymmword);
6040           gas_assert (i.types[2].bitfield.class == RegSIMD);
6041           gas_assert (i.types[2].bitfield.xmmword
6042                       || i.types[2].bitfield.ymmword);
6043           if (operand_check == check_none)
6044             return 0;
6045           if (register_number (i.op[0].regs)
6046               != register_number (i.index_reg)
6047               && register_number (i.op[2].regs)
6048                  != register_number (i.index_reg)
6049               && register_number (i.op[0].regs)
6050                  != register_number (i.op[2].regs))
6051             return 0;
6052           if (operand_check == check_error)
6053             {
6054               i.error = invalid_vector_register_set;
6055               return 1;
6056             }
6057           as_warn (_("mask, index, and destination registers should be distinct"));
6058         }
6059       else if (i.reg_operands == 1 && i.mask.reg)
6060         {
6061           if (i.types[1].bitfield.class == RegSIMD
6062               && (i.types[1].bitfield.xmmword
6063                   || i.types[1].bitfield.ymmword
6064                   || i.types[1].bitfield.zmmword)
6065               && (register_number (i.op[1].regs)
6066                   == register_number (i.index_reg)))
6067             {
6068               if (operand_check == check_error)
6069                 {
6070                   i.error = invalid_vector_register_set;
6071                   return 1;
6072                 }
6073               if (operand_check != check_none)
6074                 as_warn (_("index and destination registers should be distinct"));
6075             }
6076         }
6077     }
6078
6079   /* For AMX instructions with three tmmword operands, all tmmword operand must be
6080      distinct */
6081   if (t->operand_types[0].bitfield.tmmword
6082       && i.reg_operands == 3)
6083     {
6084       if (register_number (i.op[0].regs)
6085           == register_number (i.op[1].regs)
6086           || register_number (i.op[0].regs)
6087              == register_number (i.op[2].regs)
6088           || register_number (i.op[1].regs)
6089              == register_number (i.op[2].regs))
6090         {
6091           i.error = invalid_tmm_register_set;
6092           return 1;
6093         }
6094     }
6095
6096   /* Check if broadcast is supported by the instruction and is applied
6097      to the memory operand.  */
6098   if (i.broadcast.type)
6099     {
6100       i386_operand_type type, overlap;
6101
6102       /* Check if specified broadcast is supported in this instruction,
6103          and its broadcast bytes match the memory operand.  */
6104       op = i.broadcast.operand;
6105       if (!t->opcode_modifier.broadcast
6106           || !(i.flags[op] & Operand_Mem)
6107           || (!i.types[op].bitfield.unspecified
6108               && !match_broadcast_size (t, op)))
6109         {
6110         bad_broadcast:
6111           i.error = unsupported_broadcast;
6112           return 1;
6113         }
6114
6115       i.broadcast.bytes = ((1 << (t->opcode_modifier.broadcast - 1))
6116                            * i.broadcast.type);
6117       operand_type_set (&type, 0);
6118       switch (i.broadcast.bytes)
6119         {
6120         case 2:
6121           type.bitfield.word = 1;
6122           break;
6123         case 4:
6124           type.bitfield.dword = 1;
6125           break;
6126         case 8:
6127           type.bitfield.qword = 1;
6128           break;
6129         case 16:
6130           type.bitfield.xmmword = 1;
6131           break;
6132         case 32:
6133           type.bitfield.ymmword = 1;
6134           break;
6135         case 64:
6136           type.bitfield.zmmword = 1;
6137           break;
6138         default:
6139           goto bad_broadcast;
6140         }
6141
6142       overlap = operand_type_and (type, t->operand_types[op]);
6143       if (t->operand_types[op].bitfield.class == RegSIMD
6144           && t->operand_types[op].bitfield.byte
6145              + t->operand_types[op].bitfield.word
6146              + t->operand_types[op].bitfield.dword
6147              + t->operand_types[op].bitfield.qword > 1)
6148         {
6149           overlap.bitfield.xmmword = 0;
6150           overlap.bitfield.ymmword = 0;
6151           overlap.bitfield.zmmword = 0;
6152         }
6153       if (operand_type_all_zero (&overlap))
6154           goto bad_broadcast;
6155
6156       if (t->opcode_modifier.checkregsize)
6157         {
6158           unsigned int j;
6159
6160           type.bitfield.baseindex = 1;
6161           for (j = 0; j < i.operands; ++j)
6162             {
6163               if (j != op
6164                   && !operand_type_register_match(i.types[j],
6165                                                   t->operand_types[j],
6166                                                   type,
6167                                                   t->operand_types[op]))
6168                 goto bad_broadcast;
6169             }
6170         }
6171     }
6172   /* If broadcast is supported in this instruction, we need to check if
6173      operand of one-element size isn't specified without broadcast.  */
6174   else if (t->opcode_modifier.broadcast && i.mem_operands)
6175     {
6176       /* Find memory operand.  */
6177       for (op = 0; op < i.operands; op++)
6178         if (i.flags[op] & Operand_Mem)
6179           break;
6180       gas_assert (op < i.operands);
6181       /* Check size of the memory operand.  */
6182       if (match_broadcast_size (t, op))
6183         {
6184           i.error = broadcast_needed;
6185           return 1;
6186         }
6187     }
6188   else
6189     op = MAX_OPERANDS - 1; /* Avoid uninitialized variable warning.  */
6190
6191   /* Check if requested masking is supported.  */
6192   if (i.mask.reg)
6193     {
6194       switch (t->opcode_modifier.masking)
6195         {
6196         case BOTH_MASKING:
6197           break;
6198         case MERGING_MASKING:
6199           if (i.mask.zeroing)
6200             {
6201         case 0:
6202               i.error = unsupported_masking;
6203               return 1;
6204             }
6205           break;
6206         case DYNAMIC_MASKING:
6207           /* Memory destinations allow only merging masking.  */
6208           if (i.mask.zeroing && i.mem_operands)
6209             {
6210               /* Find memory operand.  */
6211               for (op = 0; op < i.operands; op++)
6212                 if (i.flags[op] & Operand_Mem)
6213                   break;
6214               gas_assert (op < i.operands);
6215               if (op == i.operands - 1)
6216                 {
6217                   i.error = unsupported_masking;
6218                   return 1;
6219                 }
6220             }
6221           break;
6222         default:
6223           abort ();
6224         }
6225     }
6226
6227   /* Check if masking is applied to dest operand.  */
6228   if (i.mask.reg && (i.mask.operand != i.operands - 1))
6229     {
6230       i.error = mask_not_on_destination;
6231       return 1;
6232     }
6233
6234   /* Check RC/SAE.  */
6235   if (i.rounding.type != rc_none)
6236     {
6237       if (!t->opcode_modifier.sae
6238           || (i.rounding.type != saeonly && !t->opcode_modifier.staticrounding))
6239         {
6240           i.error = unsupported_rc_sae;
6241           return 1;
6242         }
6243       /* If the instruction has several immediate operands and one of
6244          them is rounding, the rounding operand should be the last
6245          immediate operand.  */
6246       if (i.imm_operands > 1
6247           && i.rounding.operand != i.imm_operands - 1)
6248         {
6249           i.error = rc_sae_operand_not_last_imm;
6250           return 1;
6251         }
6252     }
6253
6254   /* Check the special Imm4 cases; must be the first operand.  */
6255   if (t->cpu_flags.bitfield.cpuxop && t->operands == 5)
6256     {
6257       if (i.op[0].imms->X_op != O_constant
6258           || !fits_in_imm4 (i.op[0].imms->X_add_number))
6259         {
6260           i.error = bad_imm4;
6261           return 1;
6262         }
6263
6264       /* Turn off Imm<N> so that update_imm won't complain.  */
6265       operand_type_set (&i.types[0], 0);
6266     }
6267
6268   /* Check vector Disp8 operand.  */
6269   if (t->opcode_modifier.disp8memshift
6270       && i.disp_encoding != disp_encoding_32bit)
6271     {
6272       if (i.broadcast.type)
6273         i.memshift = t->opcode_modifier.broadcast - 1;
6274       else if (t->opcode_modifier.disp8memshift != DISP8_SHIFT_VL)
6275         i.memshift = t->opcode_modifier.disp8memshift;
6276       else
6277         {
6278           const i386_operand_type *type = NULL;
6279
6280           i.memshift = 0;
6281           for (op = 0; op < i.operands; op++)
6282             if (i.flags[op] & Operand_Mem)
6283               {
6284                 if (t->opcode_modifier.evex == EVEXLIG)
6285                   i.memshift = 2 + (i.suffix == QWORD_MNEM_SUFFIX);
6286                 else if (t->operand_types[op].bitfield.xmmword
6287                          + t->operand_types[op].bitfield.ymmword
6288                          + t->operand_types[op].bitfield.zmmword <= 1)
6289                   type = &t->operand_types[op];
6290                 else if (!i.types[op].bitfield.unspecified)
6291                   type = &i.types[op];
6292               }
6293             else if (i.types[op].bitfield.class == RegSIMD
6294                      && t->opcode_modifier.evex != EVEXLIG)
6295               {
6296                 if (i.types[op].bitfield.zmmword)
6297                   i.memshift = 6;
6298                 else if (i.types[op].bitfield.ymmword && i.memshift < 5)
6299                   i.memshift = 5;
6300                 else if (i.types[op].bitfield.xmmword && i.memshift < 4)
6301                   i.memshift = 4;
6302               }
6303
6304           if (type)
6305             {
6306               if (type->bitfield.zmmword)
6307                 i.memshift = 6;
6308               else if (type->bitfield.ymmword)
6309                 i.memshift = 5;
6310               else if (type->bitfield.xmmword)
6311                 i.memshift = 4;
6312             }
6313
6314           /* For the check in fits_in_disp8().  */
6315           if (i.memshift == 0)
6316             i.memshift = -1;
6317         }
6318
6319       for (op = 0; op < i.operands; op++)
6320         if (operand_type_check (i.types[op], disp)
6321             && i.op[op].disps->X_op == O_constant)
6322           {
6323             if (fits_in_disp8 (i.op[op].disps->X_add_number))
6324               {
6325                 i.types[op].bitfield.disp8 = 1;
6326                 return 0;
6327               }
6328             i.types[op].bitfield.disp8 = 0;
6329           }
6330     }
6331
6332   i.memshift = 0;
6333
6334   return 0;
6335 }
6336
6337 /* Check if encoding requirements are met by the instruction.  */
6338
6339 static int
6340 VEX_check_encoding (const insn_template *t)
6341 {
6342   if (i.vec_encoding == vex_encoding_error)
6343     {
6344       i.error = unsupported;
6345       return 1;
6346     }
6347
6348   if (i.vec_encoding == vex_encoding_evex)
6349     {
6350       /* This instruction must be encoded with EVEX prefix.  */
6351       if (!is_evex_encoding (t))
6352         {
6353           i.error = unsupported;
6354           return 1;
6355         }
6356       return 0;
6357     }
6358
6359   if (!t->opcode_modifier.vex)
6360     {
6361       /* This instruction template doesn't have VEX prefix.  */
6362       if (i.vec_encoding != vex_encoding_default)
6363         {
6364           i.error = unsupported;
6365           return 1;
6366         }
6367       return 0;
6368     }
6369
6370   return 0;
6371 }
6372
6373 static const insn_template *
6374 match_template (char mnem_suffix)
6375 {
6376   /* Points to template once we've found it.  */
6377   const insn_template *t;
6378   i386_operand_type overlap0, overlap1, overlap2, overlap3;
6379   i386_operand_type overlap4;
6380   unsigned int found_reverse_match;
6381   i386_opcode_modifier suffix_check;
6382   i386_operand_type operand_types [MAX_OPERANDS];
6383   int addr_prefix_disp;
6384   unsigned int j, size_match, check_register;
6385   enum i386_error specific_error = 0;
6386
6387 #if MAX_OPERANDS != 5
6388 # error "MAX_OPERANDS must be 5."
6389 #endif
6390
6391   found_reverse_match = 0;
6392   addr_prefix_disp = -1;
6393
6394   /* Prepare for mnemonic suffix check.  */
6395   memset (&suffix_check, 0, sizeof (suffix_check));
6396   switch (mnem_suffix)
6397     {
6398     case BYTE_MNEM_SUFFIX:
6399       suffix_check.no_bsuf = 1;
6400       break;
6401     case WORD_MNEM_SUFFIX:
6402       suffix_check.no_wsuf = 1;
6403       break;
6404     case SHORT_MNEM_SUFFIX:
6405       suffix_check.no_ssuf = 1;
6406       break;
6407     case LONG_MNEM_SUFFIX:
6408       suffix_check.no_lsuf = 1;
6409       break;
6410     case QWORD_MNEM_SUFFIX:
6411       suffix_check.no_qsuf = 1;
6412       break;
6413     default:
6414       /* NB: In Intel syntax, normally we can check for memory operand
6415          size when there is no mnemonic suffix.  But jmp and call have
6416          2 different encodings with Dword memory operand size, one with
6417          No_ldSuf and the other without.  i.suffix is set to
6418          LONG_DOUBLE_MNEM_SUFFIX to skip the one with No_ldSuf.  */
6419       if (i.suffix == LONG_DOUBLE_MNEM_SUFFIX)
6420         suffix_check.no_ldsuf = 1;
6421     }
6422
6423   /* Must have right number of operands.  */
6424   i.error = number_of_operands_mismatch;
6425
6426   for (t = current_templates->start; t < current_templates->end; t++)
6427     {
6428       addr_prefix_disp = -1;
6429       found_reverse_match = 0;
6430
6431       if (i.operands != t->operands)
6432         continue;
6433
6434       /* Check processor support.  */
6435       i.error = unsupported;
6436       if (cpu_flags_match (t) != CPU_FLAGS_PERFECT_MATCH)
6437         continue;
6438
6439       /* Check Pseudo Prefix.  */
6440       i.error = unsupported;
6441       if (t->opcode_modifier.pseudovexprefix
6442           && !(i.vec_encoding == vex_encoding_vex
6443               || i.vec_encoding == vex_encoding_vex3))
6444         continue;
6445
6446       /* Check AT&T mnemonic.   */
6447       i.error = unsupported_with_intel_mnemonic;
6448       if (intel_mnemonic && t->opcode_modifier.attmnemonic)
6449         continue;
6450
6451       /* Check AT&T/Intel syntax.  */
6452       i.error = unsupported_syntax;
6453       if ((intel_syntax && t->opcode_modifier.attsyntax)
6454           || (!intel_syntax && t->opcode_modifier.intelsyntax))
6455         continue;
6456
6457       /* Check Intel64/AMD64 ISA.   */
6458       switch (isa64)
6459         {
6460         default:
6461           /* Default: Don't accept Intel64.  */
6462           if (t->opcode_modifier.isa64 == INTEL64)
6463             continue;
6464           break;
6465         case amd64:
6466           /* -mamd64: Don't accept Intel64 and Intel64 only.  */
6467           if (t->opcode_modifier.isa64 >= INTEL64)
6468             continue;
6469           break;
6470         case intel64:
6471           /* -mintel64: Don't accept AMD64.  */
6472           if (t->opcode_modifier.isa64 == AMD64 && flag_code == CODE_64BIT)
6473             continue;
6474           break;
6475         }
6476
6477       /* Check the suffix.  */
6478       i.error = invalid_instruction_suffix;
6479       if ((t->opcode_modifier.no_bsuf && suffix_check.no_bsuf)
6480           || (t->opcode_modifier.no_wsuf && suffix_check.no_wsuf)
6481           || (t->opcode_modifier.no_lsuf && suffix_check.no_lsuf)
6482           || (t->opcode_modifier.no_ssuf && suffix_check.no_ssuf)
6483           || (t->opcode_modifier.no_qsuf && suffix_check.no_qsuf)
6484           || (t->opcode_modifier.no_ldsuf && suffix_check.no_ldsuf))
6485         continue;
6486
6487       size_match = operand_size_match (t);
6488       if (!size_match)
6489         continue;
6490
6491       /* This is intentionally not
6492
6493          if (i.jumpabsolute != (t->opcode_modifier.jump == JUMP_ABSOLUTE))
6494
6495          as the case of a missing * on the operand is accepted (perhaps with
6496          a warning, issued further down).  */
6497       if (i.jumpabsolute && t->opcode_modifier.jump != JUMP_ABSOLUTE)
6498         {
6499           i.error = operand_type_mismatch;
6500           continue;
6501         }
6502
6503       for (j = 0; j < MAX_OPERANDS; j++)
6504         operand_types[j] = t->operand_types[j];
6505
6506       /* In general, don't allow
6507          - 64-bit operands outside of 64-bit mode,
6508          - 32-bit operands on pre-386.  */
6509       j = i.imm_operands + (t->operands > i.imm_operands + 1);
6510       if (((i.suffix == QWORD_MNEM_SUFFIX
6511             && flag_code != CODE_64BIT
6512             && !(t->opcode_modifier.opcodespace == SPACE_0F
6513                  && t->base_opcode == 0xc7
6514                  && t->opcode_modifier.opcodeprefix == PREFIX_NONE
6515                  && t->extension_opcode == 1) /* cmpxchg8b */)
6516            || (i.suffix == LONG_MNEM_SUFFIX
6517                && !cpu_arch_flags.bitfield.cpui386))
6518           && (intel_syntax
6519               ? (t->opcode_modifier.mnemonicsize != IGNORESIZE
6520                  && !intel_float_operand (t->name))
6521               : intel_float_operand (t->name) != 2)
6522           && (t->operands == i.imm_operands
6523               || (operand_types[i.imm_operands].bitfield.class != RegMMX
6524                && operand_types[i.imm_operands].bitfield.class != RegSIMD
6525                && operand_types[i.imm_operands].bitfield.class != RegMask)
6526               || (operand_types[j].bitfield.class != RegMMX
6527                   && operand_types[j].bitfield.class != RegSIMD
6528                   && operand_types[j].bitfield.class != RegMask))
6529           && !t->opcode_modifier.sib)
6530         continue;
6531
6532       /* Do not verify operands when there are none.  */
6533       if (!t->operands)
6534         {
6535           if (VEX_check_encoding (t))
6536             {
6537               specific_error = i.error;
6538               continue;
6539             }
6540
6541           /* We've found a match; break out of loop.  */
6542           break;
6543         }
6544
6545       if (!t->opcode_modifier.jump
6546           || t->opcode_modifier.jump == JUMP_ABSOLUTE)
6547         {
6548           /* There should be only one Disp operand.  */
6549           for (j = 0; j < MAX_OPERANDS; j++)
6550             if (operand_type_check (operand_types[j], disp))
6551               break;
6552           if (j < MAX_OPERANDS)
6553             {
6554               bool override = (i.prefix[ADDR_PREFIX] != 0);
6555
6556               addr_prefix_disp = j;
6557
6558               /* Address size prefix will turn Disp64/Disp32S/Disp32/Disp16
6559                  operand into Disp32/Disp32/Disp16/Disp32 operand.  */
6560               switch (flag_code)
6561                 {
6562                 case CODE_16BIT:
6563                   override = !override;
6564                   /* Fall through.  */
6565                 case CODE_32BIT:
6566                   if (operand_types[j].bitfield.disp32
6567                       && operand_types[j].bitfield.disp16)
6568                     {
6569                       operand_types[j].bitfield.disp16 = override;
6570                       operand_types[j].bitfield.disp32 = !override;
6571                     }
6572                   operand_types[j].bitfield.disp32s = 0;
6573                   operand_types[j].bitfield.disp64 = 0;
6574                   break;
6575
6576                 case CODE_64BIT:
6577                   if (operand_types[j].bitfield.disp32s
6578                       || operand_types[j].bitfield.disp64)
6579                     {
6580                       operand_types[j].bitfield.disp64 &= !override;
6581                       operand_types[j].bitfield.disp32s &= !override;
6582                       operand_types[j].bitfield.disp32 = override;
6583                     }
6584                   operand_types[j].bitfield.disp16 = 0;
6585                   break;
6586                 }
6587             }
6588         }
6589
6590       /* Force 0x8b encoding for "mov foo@GOT, %eax".  */
6591       if (i.reloc[0] == BFD_RELOC_386_GOT32
6592           && t->base_opcode == 0xa0
6593           && t->opcode_modifier.opcodespace == SPACE_BASE)
6594         continue;
6595
6596       /* We check register size if needed.  */
6597       if (t->opcode_modifier.checkregsize)
6598         {
6599           check_register = (1 << t->operands) - 1;
6600           if (i.broadcast.type)
6601             check_register &= ~(1 << i.broadcast.operand);
6602         }
6603       else
6604         check_register = 0;
6605
6606       overlap0 = operand_type_and (i.types[0], operand_types[0]);
6607       switch (t->operands)
6608         {
6609         case 1:
6610           if (!operand_type_match (overlap0, i.types[0]))
6611             continue;
6612           break;
6613         case 2:
6614           /* xchg %eax, %eax is a special case. It is an alias for nop
6615              only in 32bit mode and we can use opcode 0x90.  In 64bit
6616              mode, we can't use 0x90 for xchg %eax, %eax since it should
6617              zero-extend %eax to %rax.  */
6618           if (flag_code == CODE_64BIT
6619               && t->base_opcode == 0x90
6620               && t->opcode_modifier.opcodespace == SPACE_BASE
6621               && i.types[0].bitfield.instance == Accum
6622               && i.types[0].bitfield.dword
6623               && i.types[1].bitfield.instance == Accum
6624               && i.types[1].bitfield.dword)
6625             continue;
6626           /* xrelease mov %eax, <disp> is another special case. It must not
6627              match the accumulator-only encoding of mov.  */
6628           if (flag_code != CODE_64BIT
6629               && i.hle_prefix
6630               && t->base_opcode == 0xa0
6631               && t->opcode_modifier.opcodespace == SPACE_BASE
6632               && i.types[0].bitfield.instance == Accum
6633               && (i.flags[1] & Operand_Mem))
6634             continue;
6635           /* Fall through.  */
6636
6637         case 3:
6638           if (!(size_match & MATCH_STRAIGHT))
6639             goto check_reverse;
6640           /* Reverse direction of operands if swapping is possible in the first
6641              place (operands need to be symmetric) and
6642              - the load form is requested, and the template is a store form,
6643              - the store form is requested, and the template is a load form,
6644              - the non-default (swapped) form is requested.  */
6645           overlap1 = operand_type_and (operand_types[0], operand_types[1]);
6646           if (t->opcode_modifier.d && i.reg_operands == i.operands
6647               && !operand_type_all_zero (&overlap1))
6648             switch (i.dir_encoding)
6649               {
6650               case dir_encoding_load:
6651                 if (operand_type_check (operand_types[i.operands - 1], anymem)
6652                     || t->opcode_modifier.regmem)
6653                   goto check_reverse;
6654                 break;
6655
6656               case dir_encoding_store:
6657                 if (!operand_type_check (operand_types[i.operands - 1], anymem)
6658                     && !t->opcode_modifier.regmem)
6659                   goto check_reverse;
6660                 break;
6661
6662               case dir_encoding_swap:
6663                 goto check_reverse;
6664
6665               case dir_encoding_default:
6666                 break;
6667               }
6668           /* If we want store form, we skip the current load.  */
6669           if ((i.dir_encoding == dir_encoding_store
6670                || i.dir_encoding == dir_encoding_swap)
6671               && i.mem_operands == 0
6672               && t->opcode_modifier.load)
6673             continue;
6674           /* Fall through.  */
6675         case 4:
6676         case 5:
6677           overlap1 = operand_type_and (i.types[1], operand_types[1]);
6678           if (!operand_type_match (overlap0, i.types[0])
6679               || !operand_type_match (overlap1, i.types[1])
6680               || ((check_register & 3) == 3
6681                   && !operand_type_register_match (i.types[0],
6682                                                    operand_types[0],
6683                                                    i.types[1],
6684                                                    operand_types[1])))
6685             {
6686               /* Check if other direction is valid ...  */
6687               if (!t->opcode_modifier.d)
6688                 continue;
6689
6690             check_reverse:
6691               if (!(size_match & MATCH_REVERSE))
6692                 continue;
6693               /* Try reversing direction of operands.  */
6694               overlap0 = operand_type_and (i.types[0], operand_types[i.operands - 1]);
6695               overlap1 = operand_type_and (i.types[i.operands - 1], operand_types[0]);
6696               if (!operand_type_match (overlap0, i.types[0])
6697                   || !operand_type_match (overlap1, i.types[i.operands - 1])
6698                   || (check_register
6699                       && !operand_type_register_match (i.types[0],
6700                                                        operand_types[i.operands - 1],
6701                                                        i.types[i.operands - 1],
6702                                                        operand_types[0])))
6703                 {
6704                   /* Does not match either direction.  */
6705                   continue;
6706                 }
6707               /* found_reverse_match holds which of D or FloatR
6708                  we've found.  */
6709               if (!t->opcode_modifier.d)
6710                 found_reverse_match = 0;
6711               else if (operand_types[0].bitfield.tbyte)
6712                 found_reverse_match = Opcode_FloatD;
6713               else if (operand_types[0].bitfield.xmmword
6714                        || operand_types[i.operands - 1].bitfield.xmmword
6715                        || operand_types[0].bitfield.class == RegMMX
6716                        || operand_types[i.operands - 1].bitfield.class == RegMMX
6717                        || is_any_vex_encoding(t))
6718                 found_reverse_match = (t->base_opcode & 0xee) != 0x6e
6719                                       ? Opcode_SIMD_FloatD : Opcode_SIMD_IntD;
6720               else
6721                 found_reverse_match = Opcode_D;
6722               if (t->opcode_modifier.floatr)
6723                 found_reverse_match |= Opcode_FloatR;
6724             }
6725           else
6726             {
6727               /* Found a forward 2 operand match here.  */
6728               switch (t->operands)
6729                 {
6730                 case 5:
6731                   overlap4 = operand_type_and (i.types[4],
6732                                                operand_types[4]);
6733                   /* Fall through.  */
6734                 case 4:
6735                   overlap3 = operand_type_and (i.types[3],
6736                                                operand_types[3]);
6737                   /* Fall through.  */
6738                 case 3:
6739                   overlap2 = operand_type_and (i.types[2],
6740                                                operand_types[2]);
6741                   break;
6742                 }
6743
6744               switch (t->operands)
6745                 {
6746                 case 5:
6747                   if (!operand_type_match (overlap4, i.types[4])
6748                       || !operand_type_register_match (i.types[3],
6749                                                        operand_types[3],
6750                                                        i.types[4],
6751                                                        operand_types[4]))
6752                     continue;
6753                   /* Fall through.  */
6754                 case 4:
6755                   if (!operand_type_match (overlap3, i.types[3])
6756                       || ((check_register & 0xa) == 0xa
6757                           && !operand_type_register_match (i.types[1],
6758                                                             operand_types[1],
6759                                                             i.types[3],
6760                                                             operand_types[3]))
6761                       || ((check_register & 0xc) == 0xc
6762                           && !operand_type_register_match (i.types[2],
6763                                                             operand_types[2],
6764                                                             i.types[3],
6765                                                             operand_types[3])))
6766                     continue;
6767                   /* Fall through.  */
6768                 case 3:
6769                   /* Here we make use of the fact that there are no
6770                      reverse match 3 operand instructions.  */
6771                   if (!operand_type_match (overlap2, i.types[2])
6772                       || ((check_register & 5) == 5
6773                           && !operand_type_register_match (i.types[0],
6774                                                             operand_types[0],
6775                                                             i.types[2],
6776                                                             operand_types[2]))
6777                       || ((check_register & 6) == 6
6778                           && !operand_type_register_match (i.types[1],
6779                                                             operand_types[1],
6780                                                             i.types[2],
6781                                                             operand_types[2])))
6782                     continue;
6783                   break;
6784                 }
6785             }
6786           /* Found either forward/reverse 2, 3 or 4 operand match here:
6787              slip through to break.  */
6788         }
6789
6790       /* Check if vector operands are valid.  */
6791       if (check_VecOperands (t))
6792         {
6793           specific_error = i.error;
6794           continue;
6795         }
6796
6797       /* Check if VEX/EVEX encoding requirements can be satisfied.  */
6798       if (VEX_check_encoding (t))
6799         {
6800           specific_error = i.error;
6801           continue;
6802         }
6803
6804       /* We've found a match; break out of loop.  */
6805       break;
6806     }
6807
6808   if (t == current_templates->end)
6809     {
6810       /* We found no match.  */
6811       const char *err_msg;
6812       switch (specific_error ? specific_error : i.error)
6813         {
6814         default:
6815           abort ();
6816         case operand_size_mismatch:
6817           err_msg = _("operand size mismatch");
6818           break;
6819         case operand_type_mismatch:
6820           err_msg = _("operand type mismatch");
6821           break;
6822         case register_type_mismatch:
6823           err_msg = _("register type mismatch");
6824           break;
6825         case number_of_operands_mismatch:
6826           err_msg = _("number of operands mismatch");
6827           break;
6828         case invalid_instruction_suffix:
6829           err_msg = _("invalid instruction suffix");
6830           break;
6831         case bad_imm4:
6832           err_msg = _("constant doesn't fit in 4 bits");
6833           break;
6834         case unsupported_with_intel_mnemonic:
6835           err_msg = _("unsupported with Intel mnemonic");
6836           break;
6837         case unsupported_syntax:
6838           err_msg = _("unsupported syntax");
6839           break;
6840         case unsupported:
6841           as_bad (_("unsupported instruction `%s'"),
6842                   current_templates->start->name);
6843           return NULL;
6844         case invalid_sib_address:
6845           err_msg = _("invalid SIB address");
6846           break;
6847         case invalid_vsib_address:
6848           err_msg = _("invalid VSIB address");
6849           break;
6850         case invalid_vector_register_set:
6851           err_msg = _("mask, index, and destination registers must be distinct");
6852           break;
6853         case invalid_tmm_register_set:
6854           err_msg = _("all tmm registers must be distinct");
6855           break;
6856         case unsupported_vector_index_register:
6857           err_msg = _("unsupported vector index register");
6858           break;
6859         case unsupported_broadcast:
6860           err_msg = _("unsupported broadcast");
6861           break;
6862         case broadcast_needed:
6863           err_msg = _("broadcast is needed for operand of such type");
6864           break;
6865         case unsupported_masking:
6866           err_msg = _("unsupported masking");
6867           break;
6868         case mask_not_on_destination:
6869           err_msg = _("mask not on destination operand");
6870           break;
6871         case no_default_mask:
6872           err_msg = _("default mask isn't allowed");
6873           break;
6874         case unsupported_rc_sae:
6875           err_msg = _("unsupported static rounding/sae");
6876           break;
6877         case rc_sae_operand_not_last_imm:
6878           if (intel_syntax)
6879             err_msg = _("RC/SAE operand must precede immediate operands");
6880           else
6881             err_msg = _("RC/SAE operand must follow immediate operands");
6882           break;
6883         case invalid_register_operand:
6884           err_msg = _("invalid register operand");
6885           break;
6886         }
6887       as_bad (_("%s for `%s'"), err_msg,
6888               current_templates->start->name);
6889       return NULL;
6890     }
6891
6892   if (!quiet_warnings)
6893     {
6894       if (!intel_syntax
6895           && (i.jumpabsolute != (t->opcode_modifier.jump == JUMP_ABSOLUTE)))
6896         as_warn (_("indirect %s without `*'"), t->name);
6897
6898       if (t->opcode_modifier.isprefix
6899           && t->opcode_modifier.mnemonicsize == IGNORESIZE)
6900         {
6901           /* Warn them that a data or address size prefix doesn't
6902              affect assembly of the next line of code.  */
6903           as_warn (_("stand-alone `%s' prefix"), t->name);
6904         }
6905     }
6906
6907   /* Copy the template we found.  */
6908   install_template (t);
6909
6910   if (addr_prefix_disp != -1)
6911     i.tm.operand_types[addr_prefix_disp]
6912       = operand_types[addr_prefix_disp];
6913
6914   if (found_reverse_match)
6915     {
6916       /* If we found a reverse match we must alter the opcode direction
6917          bit and clear/flip the regmem modifier one.  found_reverse_match
6918          holds bits to change (different for int & float insns).  */
6919
6920       i.tm.base_opcode ^= found_reverse_match;
6921
6922       i.tm.operand_types[0] = operand_types[i.operands - 1];
6923       i.tm.operand_types[i.operands - 1] = operand_types[0];
6924
6925       /* Certain SIMD insns have their load forms specified in the opcode
6926          table, and hence we need to _set_ RegMem instead of clearing it.
6927          We need to avoid setting the bit though on insns like KMOVW.  */
6928       i.tm.opcode_modifier.regmem
6929         = i.tm.opcode_modifier.modrm && i.tm.opcode_modifier.d
6930           && i.tm.operands > 2U - i.tm.opcode_modifier.sse2avx
6931           && !i.tm.opcode_modifier.regmem;
6932     }
6933
6934   return t;
6935 }
6936
6937 static int
6938 check_string (void)
6939 {
6940   unsigned int es_op = i.tm.opcode_modifier.isstring - IS_STRING_ES_OP0;
6941   unsigned int op = i.tm.operand_types[0].bitfield.baseindex ? es_op : 0;
6942
6943   if (i.seg[op] != NULL && i.seg[op] != reg_es)
6944     {
6945       as_bad (_("`%s' operand %u must use `%ses' segment"),
6946               i.tm.name,
6947               intel_syntax ? i.tm.operands - es_op : es_op + 1,
6948               register_prefix);
6949       return 0;
6950     }
6951
6952   /* There's only ever one segment override allowed per instruction.
6953      This instruction possibly has a legal segment override on the
6954      second operand, so copy the segment to where non-string
6955      instructions store it, allowing common code.  */
6956   i.seg[op] = i.seg[1];
6957
6958   return 1;
6959 }
6960
6961 static int
6962 process_suffix (void)
6963 {
6964   bool is_crc32 = false, is_movx = false;
6965
6966   /* If matched instruction specifies an explicit instruction mnemonic
6967      suffix, use it.  */
6968   if (i.tm.opcode_modifier.size == SIZE16)
6969     i.suffix = WORD_MNEM_SUFFIX;
6970   else if (i.tm.opcode_modifier.size == SIZE32)
6971     i.suffix = LONG_MNEM_SUFFIX;
6972   else if (i.tm.opcode_modifier.size == SIZE64)
6973     i.suffix = QWORD_MNEM_SUFFIX;
6974   else if (i.reg_operands
6975            && (i.operands > 1 || i.types[0].bitfield.class == Reg)
6976            && !i.tm.opcode_modifier.addrprefixopreg)
6977     {
6978       unsigned int numop = i.operands;
6979
6980       /* MOVSX/MOVZX */
6981       is_movx = (i.tm.opcode_modifier.opcodespace == SPACE_0F
6982                  && (i.tm.base_opcode | 8) == 0xbe)
6983                 || (i.tm.opcode_modifier.opcodespace == SPACE_BASE
6984                     && i.tm.base_opcode == 0x63
6985                     && i.tm.cpu_flags.bitfield.cpu64);
6986
6987       /* CRC32 */
6988       is_crc32 = (i.tm.base_opcode == 0xf0
6989                   && i.tm.opcode_modifier.opcodespace == SPACE_0F38
6990                   && i.tm.opcode_modifier.opcodeprefix == PREFIX_0XF2);
6991
6992       /* movsx/movzx want only their source operand considered here, for the
6993          ambiguity checking below.  The suffix will be replaced afterwards
6994          to represent the destination (register).  */
6995       if (is_movx && (i.tm.opcode_modifier.w || i.tm.base_opcode == 0x63))
6996         --i.operands;
6997
6998       /* crc32 needs REX.W set regardless of suffix / source operand size.  */
6999       if (is_crc32 && i.tm.operand_types[1].bitfield.qword)
7000         i.rex |= REX_W;
7001
7002       /* If there's no instruction mnemonic suffix we try to invent one
7003          based on GPR operands.  */
7004       if (!i.suffix)
7005         {
7006           /* We take i.suffix from the last register operand specified,
7007              Destination register type is more significant than source
7008              register type.  crc32 in SSE4.2 prefers source register
7009              type. */
7010           unsigned int op = is_crc32 ? 1 : i.operands;
7011
7012           while (op--)
7013             if (i.tm.operand_types[op].bitfield.instance == InstanceNone
7014                 || i.tm.operand_types[op].bitfield.instance == Accum)
7015               {
7016                 if (i.types[op].bitfield.class != Reg)
7017                   continue;
7018                 if (i.types[op].bitfield.byte)
7019                   i.suffix = BYTE_MNEM_SUFFIX;
7020                 else if (i.types[op].bitfield.word)
7021                   i.suffix = WORD_MNEM_SUFFIX;
7022                 else if (i.types[op].bitfield.dword)
7023                   i.suffix = LONG_MNEM_SUFFIX;
7024                 else if (i.types[op].bitfield.qword)
7025                   i.suffix = QWORD_MNEM_SUFFIX;
7026                 else
7027                   continue;
7028                 break;
7029               }
7030
7031           /* As an exception, movsx/movzx silently default to a byte source
7032              in AT&T mode.  */
7033           if (is_movx && i.tm.opcode_modifier.w && !i.suffix && !intel_syntax)
7034             i.suffix = BYTE_MNEM_SUFFIX;
7035         }
7036       else if (i.suffix == BYTE_MNEM_SUFFIX)
7037         {
7038           if (intel_syntax
7039               && i.tm.opcode_modifier.mnemonicsize == IGNORESIZE
7040               && i.tm.opcode_modifier.no_bsuf)
7041             i.suffix = 0;
7042           else if (!check_byte_reg ())
7043             return 0;
7044         }
7045       else if (i.suffix == LONG_MNEM_SUFFIX)
7046         {
7047           if (intel_syntax
7048               && i.tm.opcode_modifier.mnemonicsize == IGNORESIZE
7049               && i.tm.opcode_modifier.no_lsuf
7050               && !i.tm.opcode_modifier.todword
7051               && !i.tm.opcode_modifier.toqword)
7052             i.suffix = 0;
7053           else if (!check_long_reg ())
7054             return 0;
7055         }
7056       else if (i.suffix == QWORD_MNEM_SUFFIX)
7057         {
7058           if (intel_syntax
7059               && i.tm.opcode_modifier.mnemonicsize == IGNORESIZE
7060               && i.tm.opcode_modifier.no_qsuf
7061               && !i.tm.opcode_modifier.todword
7062               && !i.tm.opcode_modifier.toqword)
7063             i.suffix = 0;
7064           else if (!check_qword_reg ())
7065             return 0;
7066         }
7067       else if (i.suffix == WORD_MNEM_SUFFIX)
7068         {
7069           if (intel_syntax
7070               && i.tm.opcode_modifier.mnemonicsize == IGNORESIZE
7071               && i.tm.opcode_modifier.no_wsuf)
7072             i.suffix = 0;
7073           else if (!check_word_reg ())
7074             return 0;
7075         }
7076       else if (intel_syntax
7077                && i.tm.opcode_modifier.mnemonicsize == IGNORESIZE)
7078         /* Do nothing if the instruction is going to ignore the prefix.  */
7079         ;
7080       else
7081         abort ();
7082
7083       /* Undo the movsx/movzx change done above.  */
7084       i.operands = numop;
7085     }
7086   else if (i.tm.opcode_modifier.mnemonicsize == DEFAULTSIZE
7087            && !i.suffix)
7088     {
7089       i.suffix = stackop_size;
7090       if (stackop_size == LONG_MNEM_SUFFIX)
7091         {
7092           /* stackop_size is set to LONG_MNEM_SUFFIX for the
7093              .code16gcc directive to support 16-bit mode with
7094              32-bit address.  For IRET without a suffix, generate
7095              16-bit IRET (opcode 0xcf) to return from an interrupt
7096              handler.  */
7097           if (i.tm.base_opcode == 0xcf)
7098             {
7099               i.suffix = WORD_MNEM_SUFFIX;
7100               as_warn (_("generating 16-bit `iret' for .code16gcc directive"));
7101             }
7102           /* Warn about changed behavior for segment register push/pop.  */
7103           else if ((i.tm.base_opcode | 1) == 0x07)
7104             as_warn (_("generating 32-bit `%s', unlike earlier gas versions"),
7105                      i.tm.name);
7106         }
7107     }
7108   else if (!i.suffix
7109            && (i.tm.opcode_modifier.jump == JUMP_ABSOLUTE
7110                || i.tm.opcode_modifier.jump == JUMP_BYTE
7111                || i.tm.opcode_modifier.jump == JUMP_INTERSEGMENT
7112                || (i.tm.opcode_modifier.opcodespace == SPACE_0F
7113                    && i.tm.base_opcode == 0x01 /* [ls][gi]dt */
7114                    && i.tm.extension_opcode <= 3)))
7115     {
7116       switch (flag_code)
7117         {
7118         case CODE_64BIT:
7119           if (!i.tm.opcode_modifier.no_qsuf)
7120             {
7121               if (i.tm.opcode_modifier.jump == JUMP_BYTE
7122                   || i.tm.opcode_modifier.no_lsuf)
7123                 i.suffix = QWORD_MNEM_SUFFIX;
7124               break;
7125             }
7126           /* Fall through.  */
7127         case CODE_32BIT:
7128           if (!i.tm.opcode_modifier.no_lsuf)
7129             i.suffix = LONG_MNEM_SUFFIX;
7130           break;
7131         case CODE_16BIT:
7132           if (!i.tm.opcode_modifier.no_wsuf)
7133             i.suffix = WORD_MNEM_SUFFIX;
7134           break;
7135         }
7136     }
7137
7138   if (!i.suffix
7139       && (i.tm.opcode_modifier.mnemonicsize != DEFAULTSIZE
7140           /* Also cover lret/retf/iret in 64-bit mode.  */
7141           || (flag_code == CODE_64BIT
7142               && !i.tm.opcode_modifier.no_lsuf
7143               && !i.tm.opcode_modifier.no_qsuf))
7144       && i.tm.opcode_modifier.mnemonicsize != IGNORESIZE
7145       /* Explicit sizing prefixes are assumed to disambiguate insns.  */
7146       && !i.prefix[DATA_PREFIX] && !(i.prefix[REX_PREFIX] & REX_W)
7147       /* Accept FLDENV et al without suffix.  */
7148       && (i.tm.opcode_modifier.no_ssuf || i.tm.opcode_modifier.floatmf))
7149     {
7150       unsigned int suffixes, evex = 0;
7151
7152       suffixes = !i.tm.opcode_modifier.no_bsuf;
7153       if (!i.tm.opcode_modifier.no_wsuf)
7154         suffixes |= 1 << 1;
7155       if (!i.tm.opcode_modifier.no_lsuf)
7156         suffixes |= 1 << 2;
7157       if (!i.tm.opcode_modifier.no_ldsuf)
7158         suffixes |= 1 << 3;
7159       if (!i.tm.opcode_modifier.no_ssuf)
7160         suffixes |= 1 << 4;
7161       if (flag_code == CODE_64BIT && !i.tm.opcode_modifier.no_qsuf)
7162         suffixes |= 1 << 5;
7163
7164       /* For [XYZ]MMWORD operands inspect operand sizes.  While generally
7165          also suitable for AT&T syntax mode, it was requested that this be
7166          restricted to just Intel syntax.  */
7167       if (intel_syntax && is_any_vex_encoding (&i.tm) && !i.broadcast.type)
7168         {
7169           unsigned int op;
7170
7171           for (op = 0; op < i.tm.operands; ++op)
7172             {
7173               if (is_evex_encoding (&i.tm)
7174                   && !cpu_arch_flags.bitfield.cpuavx512vl)
7175                 {
7176                   if (i.tm.operand_types[op].bitfield.ymmword)
7177                     i.tm.operand_types[op].bitfield.xmmword = 0;
7178                   if (i.tm.operand_types[op].bitfield.zmmword)
7179                     i.tm.operand_types[op].bitfield.ymmword = 0;
7180                   if (!i.tm.opcode_modifier.evex
7181                       || i.tm.opcode_modifier.evex == EVEXDYN)
7182                     i.tm.opcode_modifier.evex = EVEX512;
7183                 }
7184
7185               if (i.tm.operand_types[op].bitfield.xmmword
7186                   + i.tm.operand_types[op].bitfield.ymmword
7187                   + i.tm.operand_types[op].bitfield.zmmword < 2)
7188                 continue;
7189
7190               /* Any properly sized operand disambiguates the insn.  */
7191               if (i.types[op].bitfield.xmmword
7192                   || i.types[op].bitfield.ymmword
7193                   || i.types[op].bitfield.zmmword)
7194                 {
7195                   suffixes &= ~(7 << 6);
7196                   evex = 0;
7197                   break;
7198                 }
7199
7200               if ((i.flags[op] & Operand_Mem)
7201                   && i.tm.operand_types[op].bitfield.unspecified)
7202                 {
7203                   if (i.tm.operand_types[op].bitfield.xmmword)
7204                     suffixes |= 1 << 6;
7205                   if (i.tm.operand_types[op].bitfield.ymmword)
7206                     suffixes |= 1 << 7;
7207                   if (i.tm.operand_types[op].bitfield.zmmword)
7208                     suffixes |= 1 << 8;
7209                   if (is_evex_encoding (&i.tm))
7210                     evex = EVEX512;
7211                 }
7212             }
7213         }
7214
7215       /* Are multiple suffixes / operand sizes allowed?  */
7216       if (suffixes & (suffixes - 1))
7217         {
7218           if (intel_syntax
7219               && (i.tm.opcode_modifier.mnemonicsize != DEFAULTSIZE
7220                   || operand_check == check_error))
7221             {
7222               as_bad (_("ambiguous operand size for `%s'"), i.tm.name);
7223               return 0;
7224             }
7225           if (operand_check == check_error)
7226             {
7227               as_bad (_("no instruction mnemonic suffix given and "
7228                         "no register operands; can't size `%s'"), i.tm.name);
7229               return 0;
7230             }
7231           if (operand_check == check_warning)
7232             as_warn (_("%s; using default for `%s'"),
7233                        intel_syntax
7234                        ? _("ambiguous operand size")
7235                        : _("no instruction mnemonic suffix given and "
7236                            "no register operands"),
7237                        i.tm.name);
7238
7239           if (i.tm.opcode_modifier.floatmf)
7240             i.suffix = SHORT_MNEM_SUFFIX;
7241           else if (is_movx)
7242             /* handled below */;
7243           else if (evex)
7244             i.tm.opcode_modifier.evex = evex;
7245           else if (flag_code == CODE_16BIT)
7246             i.suffix = WORD_MNEM_SUFFIX;
7247           else if (!i.tm.opcode_modifier.no_lsuf)
7248             i.suffix = LONG_MNEM_SUFFIX;
7249           else
7250             i.suffix = QWORD_MNEM_SUFFIX;
7251         }
7252     }
7253
7254   if (is_movx)
7255     {
7256       /* In Intel syntax, movsx/movzx must have a "suffix" (checked above).
7257          In AT&T syntax, if there is no suffix (warned about above), the default
7258          will be byte extension.  */
7259       if (i.tm.opcode_modifier.w && i.suffix && i.suffix != BYTE_MNEM_SUFFIX)
7260         i.tm.base_opcode |= 1;
7261
7262       /* For further processing, the suffix should represent the destination
7263          (register).  This is already the case when one was used with
7264          mov[sz][bw]*, but we need to replace it for mov[sz]x, or if there was
7265          no suffix to begin with.  */
7266       if (i.tm.opcode_modifier.w || i.tm.base_opcode == 0x63 || !i.suffix)
7267         {
7268           if (i.types[1].bitfield.word)
7269             i.suffix = WORD_MNEM_SUFFIX;
7270           else if (i.types[1].bitfield.qword)
7271             i.suffix = QWORD_MNEM_SUFFIX;
7272           else
7273             i.suffix = LONG_MNEM_SUFFIX;
7274
7275           i.tm.opcode_modifier.w = 0;
7276         }
7277     }
7278
7279   if (!i.tm.opcode_modifier.modrm && i.reg_operands && i.tm.operands < 3)
7280     i.short_form = (i.tm.operand_types[0].bitfield.class == Reg)
7281                    != (i.tm.operand_types[1].bitfield.class == Reg);
7282
7283   /* Change the opcode based on the operand size given by i.suffix.  */
7284   switch (i.suffix)
7285     {
7286     /* Size floating point instruction.  */
7287     case LONG_MNEM_SUFFIX:
7288       if (i.tm.opcode_modifier.floatmf)
7289         {
7290           i.tm.base_opcode ^= 4;
7291           break;
7292         }
7293     /* fall through */
7294     case WORD_MNEM_SUFFIX:
7295     case QWORD_MNEM_SUFFIX:
7296       /* It's not a byte, select word/dword operation.  */
7297       if (i.tm.opcode_modifier.w)
7298         {
7299           if (i.short_form)
7300             i.tm.base_opcode |= 8;
7301           else
7302             i.tm.base_opcode |= 1;
7303         }
7304     /* fall through */
7305     case SHORT_MNEM_SUFFIX:
7306       /* Now select between word & dword operations via the operand
7307          size prefix, except for instructions that will ignore this
7308          prefix anyway.  */
7309       if (i.suffix != QWORD_MNEM_SUFFIX
7310           && i.tm.opcode_modifier.mnemonicsize != IGNORESIZE
7311           && !i.tm.opcode_modifier.floatmf
7312           && !is_any_vex_encoding (&i.tm)
7313           && ((i.suffix == LONG_MNEM_SUFFIX) == (flag_code == CODE_16BIT)
7314               || (flag_code == CODE_64BIT
7315                   && i.tm.opcode_modifier.jump == JUMP_BYTE)))
7316         {
7317           unsigned int prefix = DATA_PREFIX_OPCODE;
7318
7319           if (i.tm.opcode_modifier.jump == JUMP_BYTE) /* jcxz, loop */
7320             prefix = ADDR_PREFIX_OPCODE;
7321
7322           if (!add_prefix (prefix))
7323             return 0;
7324         }
7325
7326       /* Set mode64 for an operand.  */
7327       if (i.suffix == QWORD_MNEM_SUFFIX
7328           && flag_code == CODE_64BIT
7329           && !i.tm.opcode_modifier.norex64
7330           && !i.tm.opcode_modifier.vexw
7331           /* Special case for xchg %rax,%rax.  It is NOP and doesn't
7332              need rex64. */
7333           && ! (i.operands == 2
7334                 && i.tm.base_opcode == 0x90
7335                 && i.tm.extension_opcode == None
7336                 && i.types[0].bitfield.instance == Accum
7337                 && i.types[0].bitfield.qword
7338                 && i.types[1].bitfield.instance == Accum
7339                 && i.types[1].bitfield.qword))
7340         i.rex |= REX_W;
7341
7342       break;
7343
7344     case 0:
7345       /* Select word/dword/qword operation with explicit data sizing prefix
7346          when there are no suitable register operands.  */
7347       if (i.tm.opcode_modifier.w
7348           && (i.prefix[DATA_PREFIX] || (i.prefix[REX_PREFIX] & REX_W))
7349           && (!i.reg_operands
7350               || (i.reg_operands == 1
7351                       /* ShiftCount */
7352                   && (i.tm.operand_types[0].bitfield.instance == RegC
7353                       /* InOutPortReg */
7354                       || i.tm.operand_types[0].bitfield.instance == RegD
7355                       || i.tm.operand_types[1].bitfield.instance == RegD
7356                       /* CRC32 */
7357                       || is_crc32))))
7358         i.tm.base_opcode |= 1;
7359       break;
7360     }
7361
7362   if (i.tm.opcode_modifier.addrprefixopreg)
7363     {
7364       gas_assert (!i.suffix);
7365       gas_assert (i.reg_operands);
7366
7367       if (i.tm.operand_types[0].bitfield.instance == Accum
7368           || i.operands == 1)
7369         {
7370           /* The address size override prefix changes the size of the
7371              first operand.  */
7372           if (flag_code == CODE_64BIT
7373               && i.op[0].regs->reg_type.bitfield.word)
7374             {
7375               as_bad (_("16-bit addressing unavailable for `%s'"),
7376                       i.tm.name);
7377               return 0;
7378             }
7379
7380           if ((flag_code == CODE_32BIT
7381                ? i.op[0].regs->reg_type.bitfield.word
7382                : i.op[0].regs->reg_type.bitfield.dword)
7383               && !add_prefix (ADDR_PREFIX_OPCODE))
7384             return 0;
7385         }
7386       else
7387         {
7388           /* Check invalid register operand when the address size override
7389              prefix changes the size of register operands.  */
7390           unsigned int op;
7391           enum { need_word, need_dword, need_qword } need;
7392
7393           /* Check the register operand for the address size prefix if
7394              the memory operand has no real registers, like symbol, DISP
7395              or bogus (x32-only) symbol(%rip) when symbol(%eip) is meant.  */
7396           if (i.mem_operands == 1
7397               && i.reg_operands == 1
7398               && i.operands == 2
7399               && i.types[1].bitfield.class == Reg
7400               && (flag_code == CODE_32BIT
7401                   ? i.op[1].regs->reg_type.bitfield.word
7402                   : i.op[1].regs->reg_type.bitfield.dword)
7403               && ((i.base_reg == NULL && i.index_reg == NULL)
7404 #if defined (OBJ_MAYBE_ELF) || defined (OBJ_ELF)
7405                   || (x86_elf_abi == X86_64_X32_ABI
7406                       && i.base_reg
7407                       && i.base_reg->reg_num == RegIP
7408                       && i.base_reg->reg_type.bitfield.qword))
7409 #else
7410                   || 0)
7411 #endif
7412               && !add_prefix (ADDR_PREFIX_OPCODE))
7413             return 0;
7414
7415           if (flag_code == CODE_32BIT)
7416             need = i.prefix[ADDR_PREFIX] ? need_word : need_dword;
7417           else if (i.prefix[ADDR_PREFIX])
7418             need = need_dword;
7419           else
7420             need = flag_code == CODE_64BIT ? need_qword : need_word;
7421
7422           for (op = 0; op < i.operands; op++)
7423             {
7424               if (i.types[op].bitfield.class != Reg)
7425                 continue;
7426
7427               switch (need)
7428                 {
7429                 case need_word:
7430                   if (i.op[op].regs->reg_type.bitfield.word)
7431                     continue;
7432                   break;
7433                 case need_dword:
7434                   if (i.op[op].regs->reg_type.bitfield.dword)
7435                     continue;
7436                   break;
7437                 case need_qword:
7438                   if (i.op[op].regs->reg_type.bitfield.qword)
7439                     continue;
7440                   break;
7441                 }
7442
7443               as_bad (_("invalid register operand size for `%s'"),
7444                       i.tm.name);
7445               return 0;
7446             }
7447         }
7448     }
7449
7450   return 1;
7451 }
7452
7453 static int
7454 check_byte_reg (void)
7455 {
7456   int op;
7457
7458   for (op = i.operands; --op >= 0;)
7459     {
7460       /* Skip non-register operands. */
7461       if (i.types[op].bitfield.class != Reg)
7462         continue;
7463
7464       /* If this is an eight bit register, it's OK.  If it's the 16 or
7465          32 bit version of an eight bit register, we will just use the
7466          low portion, and that's OK too.  */
7467       if (i.types[op].bitfield.byte)
7468         continue;
7469
7470       /* I/O port address operands are OK too.  */
7471       if (i.tm.operand_types[op].bitfield.instance == RegD
7472           && i.tm.operand_types[op].bitfield.word)
7473         continue;
7474
7475       /* crc32 only wants its source operand checked here.  */
7476       if (i.tm.base_opcode == 0xf0
7477           && i.tm.opcode_modifier.opcodespace == SPACE_0F38
7478           && i.tm.opcode_modifier.opcodeprefix == PREFIX_0XF2
7479           && op != 0)
7480         continue;
7481
7482       /* Any other register is bad.  */
7483       as_bad (_("`%s%s' not allowed with `%s%c'"),
7484               register_prefix, i.op[op].regs->reg_name,
7485               i.tm.name, i.suffix);
7486       return 0;
7487     }
7488   return 1;
7489 }
7490
7491 static int
7492 check_long_reg (void)
7493 {
7494   int op;
7495
7496   for (op = i.operands; --op >= 0;)
7497     /* Skip non-register operands. */
7498     if (i.types[op].bitfield.class != Reg)
7499       continue;
7500     /* Reject eight bit registers, except where the template requires
7501        them. (eg. movzb)  */
7502     else if (i.types[op].bitfield.byte
7503              && (i.tm.operand_types[op].bitfield.class == Reg
7504                  || i.tm.operand_types[op].bitfield.instance == Accum)
7505              && (i.tm.operand_types[op].bitfield.word
7506                  || i.tm.operand_types[op].bitfield.dword))
7507       {
7508         as_bad (_("`%s%s' not allowed with `%s%c'"),
7509                 register_prefix,
7510                 i.op[op].regs->reg_name,
7511                 i.tm.name,
7512                 i.suffix);
7513         return 0;
7514       }
7515     /* Error if the e prefix on a general reg is missing.  */
7516     else if (i.types[op].bitfield.word
7517              && (i.tm.operand_types[op].bitfield.class == Reg
7518                  || i.tm.operand_types[op].bitfield.instance == Accum)
7519              && i.tm.operand_types[op].bitfield.dword)
7520       {
7521         as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
7522                 register_prefix, i.op[op].regs->reg_name,
7523                 i.suffix);
7524         return 0;
7525       }
7526     /* Warn if the r prefix on a general reg is present.  */
7527     else if (i.types[op].bitfield.qword
7528              && (i.tm.operand_types[op].bitfield.class == Reg
7529                  || i.tm.operand_types[op].bitfield.instance == Accum)
7530              && i.tm.operand_types[op].bitfield.dword)
7531       {
7532         if (intel_syntax
7533             && i.tm.opcode_modifier.toqword
7534             && i.types[0].bitfield.class != RegSIMD)
7535           {
7536             /* Convert to QWORD.  We want REX byte. */
7537             i.suffix = QWORD_MNEM_SUFFIX;
7538           }
7539         else
7540           {
7541             as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
7542                     register_prefix, i.op[op].regs->reg_name,
7543                     i.suffix);
7544             return 0;
7545           }
7546       }
7547   return 1;
7548 }
7549
7550 static int
7551 check_qword_reg (void)
7552 {
7553   int op;
7554
7555   for (op = i.operands; --op >= 0; )
7556     /* Skip non-register operands. */
7557     if (i.types[op].bitfield.class != Reg)
7558       continue;
7559     /* Reject eight bit registers, except where the template requires
7560        them. (eg. movzb)  */
7561     else if (i.types[op].bitfield.byte
7562              && (i.tm.operand_types[op].bitfield.class == Reg
7563                  || i.tm.operand_types[op].bitfield.instance == Accum)
7564              && (i.tm.operand_types[op].bitfield.word
7565                  || i.tm.operand_types[op].bitfield.dword))
7566       {
7567         as_bad (_("`%s%s' not allowed with `%s%c'"),
7568                 register_prefix,
7569                 i.op[op].regs->reg_name,
7570                 i.tm.name,
7571                 i.suffix);
7572         return 0;
7573       }
7574     /* Warn if the r prefix on a general reg is missing.  */
7575     else if ((i.types[op].bitfield.word
7576               || i.types[op].bitfield.dword)
7577              && (i.tm.operand_types[op].bitfield.class == Reg
7578                  || i.tm.operand_types[op].bitfield.instance == Accum)
7579              && i.tm.operand_types[op].bitfield.qword)
7580       {
7581         /* Prohibit these changes in the 64bit mode, since the
7582            lowering is more complicated.  */
7583         if (intel_syntax
7584             && i.tm.opcode_modifier.todword
7585             && i.types[0].bitfield.class != RegSIMD)
7586           {
7587             /* Convert to DWORD.  We don't want REX byte. */
7588             i.suffix = LONG_MNEM_SUFFIX;
7589           }
7590         else
7591           {
7592             as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
7593                     register_prefix, i.op[op].regs->reg_name,
7594                     i.suffix);
7595             return 0;
7596           }
7597       }
7598   return 1;
7599 }
7600
7601 static int
7602 check_word_reg (void)
7603 {
7604   int op;
7605   for (op = i.operands; --op >= 0;)
7606     /* Skip non-register operands. */
7607     if (i.types[op].bitfield.class != Reg)
7608       continue;
7609     /* Reject eight bit registers, except where the template requires
7610        them. (eg. movzb)  */
7611     else if (i.types[op].bitfield.byte
7612              && (i.tm.operand_types[op].bitfield.class == Reg
7613                  || i.tm.operand_types[op].bitfield.instance == Accum)
7614              && (i.tm.operand_types[op].bitfield.word
7615                  || i.tm.operand_types[op].bitfield.dword))
7616       {
7617         as_bad (_("`%s%s' not allowed with `%s%c'"),
7618                 register_prefix,
7619                 i.op[op].regs->reg_name,
7620                 i.tm.name,
7621                 i.suffix);
7622         return 0;
7623       }
7624     /* Error if the e or r prefix on a general reg is present.  */
7625     else if ((i.types[op].bitfield.dword
7626                  || i.types[op].bitfield.qword)
7627              && (i.tm.operand_types[op].bitfield.class == Reg
7628                  || i.tm.operand_types[op].bitfield.instance == Accum)
7629              && i.tm.operand_types[op].bitfield.word)
7630       {
7631         as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
7632                 register_prefix, i.op[op].regs->reg_name,
7633                 i.suffix);
7634         return 0;
7635       }
7636   return 1;
7637 }
7638
7639 static int
7640 update_imm (unsigned int j)
7641 {
7642   i386_operand_type overlap = i.types[j];
7643   if ((overlap.bitfield.imm8
7644        || overlap.bitfield.imm8s
7645        || overlap.bitfield.imm16
7646        || overlap.bitfield.imm32
7647        || overlap.bitfield.imm32s
7648        || overlap.bitfield.imm64)
7649       && !operand_type_equal (&overlap, &imm8)
7650       && !operand_type_equal (&overlap, &imm8s)
7651       && !operand_type_equal (&overlap, &imm16)
7652       && !operand_type_equal (&overlap, &imm32)
7653       && !operand_type_equal (&overlap, &imm32s)
7654       && !operand_type_equal (&overlap, &imm64))
7655     {
7656       if (i.suffix)
7657         {
7658           i386_operand_type temp;
7659
7660           operand_type_set (&temp, 0);
7661           if (i.suffix == BYTE_MNEM_SUFFIX)
7662             {
7663               temp.bitfield.imm8 = overlap.bitfield.imm8;
7664               temp.bitfield.imm8s = overlap.bitfield.imm8s;
7665             }
7666           else if (i.suffix == WORD_MNEM_SUFFIX)
7667             temp.bitfield.imm16 = overlap.bitfield.imm16;
7668           else if (i.suffix == QWORD_MNEM_SUFFIX)
7669             {
7670               temp.bitfield.imm64 = overlap.bitfield.imm64;
7671               temp.bitfield.imm32s = overlap.bitfield.imm32s;
7672             }
7673           else
7674             temp.bitfield.imm32 = overlap.bitfield.imm32;
7675           overlap = temp;
7676         }
7677       else if (operand_type_equal (&overlap, &imm16_32_32s)
7678                || operand_type_equal (&overlap, &imm16_32)
7679                || operand_type_equal (&overlap, &imm16_32s))
7680         {
7681           if ((flag_code == CODE_16BIT) ^ (i.prefix[DATA_PREFIX] != 0))
7682             overlap = imm16;
7683           else
7684             overlap = imm32s;
7685         }
7686       else if (i.prefix[REX_PREFIX] & REX_W)
7687         overlap = operand_type_and (overlap, imm32s);
7688       else if (i.prefix[DATA_PREFIX])
7689         overlap = operand_type_and (overlap,
7690                                     flag_code != CODE_16BIT ? imm16 : imm32);
7691       if (!operand_type_equal (&overlap, &imm8)
7692           && !operand_type_equal (&overlap, &imm8s)
7693           && !operand_type_equal (&overlap, &imm16)
7694           && !operand_type_equal (&overlap, &imm32)
7695           && !operand_type_equal (&overlap, &imm32s)
7696           && !operand_type_equal (&overlap, &imm64))
7697         {
7698           as_bad (_("no instruction mnemonic suffix given; "
7699                     "can't determine immediate size"));
7700           return 0;
7701         }
7702     }
7703   i.types[j] = overlap;
7704
7705   return 1;
7706 }
7707
7708 static int
7709 finalize_imm (void)
7710 {
7711   unsigned int j, n;
7712
7713   /* Update the first 2 immediate operands.  */
7714   n = i.operands > 2 ? 2 : i.operands;
7715   if (n)
7716     {
7717       for (j = 0; j < n; j++)
7718         if (update_imm (j) == 0)
7719           return 0;
7720
7721       /* The 3rd operand can't be immediate operand.  */
7722       gas_assert (operand_type_check (i.types[2], imm) == 0);
7723     }
7724
7725   return 1;
7726 }
7727
7728 static int
7729 process_operands (void)
7730 {
7731   /* Default segment register this instruction will use for memory
7732      accesses.  0 means unknown.  This is only for optimizing out
7733      unnecessary segment overrides.  */
7734   const reg_entry *default_seg = NULL;
7735
7736   if (i.tm.opcode_modifier.sse2avx)
7737     {
7738       /* Legacy encoded insns allow explicit REX prefixes, so these prefixes
7739          need converting.  */
7740       i.rex |= i.prefix[REX_PREFIX] & (REX_W | REX_R | REX_X | REX_B);
7741       i.prefix[REX_PREFIX] = 0;
7742       i.rex_encoding = 0;
7743     }
7744   /* ImmExt should be processed after SSE2AVX.  */
7745   else if (i.tm.opcode_modifier.immext)
7746     process_immext ();
7747
7748   if (i.tm.opcode_modifier.sse2avx && i.tm.opcode_modifier.vexvvvv)
7749     {
7750       unsigned int dupl = i.operands;
7751       unsigned int dest = dupl - 1;
7752       unsigned int j;
7753
7754       /* The destination must be an xmm register.  */
7755       gas_assert (i.reg_operands
7756                   && MAX_OPERANDS > dupl
7757                   && operand_type_equal (&i.types[dest], &regxmm));
7758
7759       if (i.tm.operand_types[0].bitfield.instance == Accum
7760           && i.tm.operand_types[0].bitfield.xmmword)
7761         {
7762           if (i.tm.opcode_modifier.vexsources == VEX3SOURCES)
7763             {
7764               /* Keep xmm0 for instructions with VEX prefix and 3
7765                  sources.  */
7766               i.tm.operand_types[0].bitfield.instance = InstanceNone;
7767               i.tm.operand_types[0].bitfield.class = RegSIMD;
7768               goto duplicate;
7769             }
7770           else
7771             {
7772               /* We remove the first xmm0 and keep the number of
7773                  operands unchanged, which in fact duplicates the
7774                  destination.  */
7775               for (j = 1; j < i.operands; j++)
7776                 {
7777                   i.op[j - 1] = i.op[j];
7778                   i.types[j - 1] = i.types[j];
7779                   i.tm.operand_types[j - 1] = i.tm.operand_types[j];
7780                   i.flags[j - 1] = i.flags[j];
7781                 }
7782             }
7783         }
7784       else if (i.tm.opcode_modifier.implicit1stxmm0)
7785         {
7786           gas_assert ((MAX_OPERANDS - 1) > dupl
7787                       && (i.tm.opcode_modifier.vexsources
7788                           == VEX3SOURCES));
7789
7790           /* Add the implicit xmm0 for instructions with VEX prefix
7791              and 3 sources.  */
7792           for (j = i.operands; j > 0; j--)
7793             {
7794               i.op[j] = i.op[j - 1];
7795               i.types[j] = i.types[j - 1];
7796               i.tm.operand_types[j] = i.tm.operand_types[j - 1];
7797               i.flags[j] = i.flags[j - 1];
7798             }
7799           i.op[0].regs
7800             = (const reg_entry *) str_hash_find (reg_hash, "xmm0");
7801           i.types[0] = regxmm;
7802           i.tm.operand_types[0] = regxmm;
7803
7804           i.operands += 2;
7805           i.reg_operands += 2;
7806           i.tm.operands += 2;
7807
7808           dupl++;
7809           dest++;
7810           i.op[dupl] = i.op[dest];
7811           i.types[dupl] = i.types[dest];
7812           i.tm.operand_types[dupl] = i.tm.operand_types[dest];
7813           i.flags[dupl] = i.flags[dest];
7814         }
7815       else
7816         {
7817         duplicate:
7818           i.operands++;
7819           i.reg_operands++;
7820           i.tm.operands++;
7821
7822           i.op[dupl] = i.op[dest];
7823           i.types[dupl] = i.types[dest];
7824           i.tm.operand_types[dupl] = i.tm.operand_types[dest];
7825           i.flags[dupl] = i.flags[dest];
7826         }
7827
7828        if (i.tm.opcode_modifier.immext)
7829          process_immext ();
7830     }
7831   else if (i.tm.operand_types[0].bitfield.instance == Accum
7832            && i.tm.operand_types[0].bitfield.xmmword)
7833     {
7834       unsigned int j;
7835
7836       for (j = 1; j < i.operands; j++)
7837         {
7838           i.op[j - 1] = i.op[j];
7839           i.types[j - 1] = i.types[j];
7840
7841           /* We need to adjust fields in i.tm since they are used by
7842              build_modrm_byte.  */
7843           i.tm.operand_types [j - 1] = i.tm.operand_types [j];
7844
7845           i.flags[j - 1] = i.flags[j];
7846         }
7847
7848       i.operands--;
7849       i.reg_operands--;
7850       i.tm.operands--;
7851     }
7852   else if (i.tm.opcode_modifier.implicitquadgroup)
7853     {
7854       unsigned int regnum, first_reg_in_group, last_reg_in_group;
7855
7856       /* The second operand must be {x,y,z}mmN, where N is a multiple of 4. */
7857       gas_assert (i.operands >= 2 && i.types[1].bitfield.class == RegSIMD);
7858       regnum = register_number (i.op[1].regs);
7859       first_reg_in_group = regnum & ~3;
7860       last_reg_in_group = first_reg_in_group + 3;
7861       if (regnum != first_reg_in_group)
7862         as_warn (_("source register `%s%s' implicitly denotes"
7863                    " `%s%.3s%u' to `%s%.3s%u' source group in `%s'"),
7864                  register_prefix, i.op[1].regs->reg_name,
7865                  register_prefix, i.op[1].regs->reg_name, first_reg_in_group,
7866                  register_prefix, i.op[1].regs->reg_name, last_reg_in_group,
7867                  i.tm.name);
7868     }
7869   else if (i.tm.opcode_modifier.regkludge)
7870     {
7871       /* The imul $imm, %reg instruction is converted into
7872          imul $imm, %reg, %reg, and the clr %reg instruction
7873          is converted into xor %reg, %reg.  */
7874
7875       unsigned int first_reg_op;
7876
7877       if (operand_type_check (i.types[0], reg))
7878         first_reg_op = 0;
7879       else
7880         first_reg_op = 1;
7881       /* Pretend we saw the extra register operand.  */
7882       gas_assert (i.reg_operands == 1
7883                   && i.op[first_reg_op + 1].regs == 0);
7884       i.op[first_reg_op + 1].regs = i.op[first_reg_op].regs;
7885       i.types[first_reg_op + 1] = i.types[first_reg_op];
7886       i.operands++;
7887       i.reg_operands++;
7888     }
7889
7890   if (i.tm.opcode_modifier.modrm)
7891     {
7892       /* The opcode is completed (modulo i.tm.extension_opcode which
7893          must be put into the modrm byte).  Now, we make the modrm and
7894          index base bytes based on all the info we've collected.  */
7895
7896       default_seg = build_modrm_byte ();
7897     }
7898   else if (i.types[0].bitfield.class == SReg)
7899     {
7900       if (flag_code != CODE_64BIT
7901           ? i.tm.base_opcode == POP_SEG_SHORT
7902             && i.op[0].regs->reg_num == 1
7903           : (i.tm.base_opcode | 1) == (POP_SEG386_SHORT & 0xff)
7904             && i.op[0].regs->reg_num < 4)
7905         {
7906           as_bad (_("you can't `%s %s%s'"),
7907                   i.tm.name, register_prefix, i.op[0].regs->reg_name);
7908           return 0;
7909         }
7910       if (i.op[0].regs->reg_num > 3
7911           && i.tm.opcode_modifier.opcodespace == SPACE_BASE )
7912         {
7913           i.tm.base_opcode ^= (POP_SEG_SHORT ^ POP_SEG386_SHORT) & 0xff;
7914           i.tm.opcode_modifier.opcodespace = SPACE_0F;
7915         }
7916       i.tm.base_opcode |= (i.op[0].regs->reg_num << 3);
7917     }
7918   else if (i.tm.opcode_modifier.opcodespace == SPACE_BASE
7919            && (i.tm.base_opcode & ~3) == MOV_AX_DISP32)
7920     {
7921       default_seg = reg_ds;
7922     }
7923   else if (i.tm.opcode_modifier.isstring)
7924     {
7925       /* For the string instructions that allow a segment override
7926          on one of their operands, the default segment is ds.  */
7927       default_seg = reg_ds;
7928     }
7929   else if (i.short_form)
7930     {
7931       /* The register or float register operand is in operand
7932          0 or 1.  */
7933       unsigned int op = i.tm.operand_types[0].bitfield.class != Reg;
7934
7935       /* Register goes in low 3 bits of opcode.  */
7936       i.tm.base_opcode |= i.op[op].regs->reg_num;
7937       if ((i.op[op].regs->reg_flags & RegRex) != 0)
7938         i.rex |= REX_B;
7939       if (!quiet_warnings && i.tm.opcode_modifier.ugh)
7940         {
7941           /* Warn about some common errors, but press on regardless.
7942              The first case can be generated by gcc (<= 2.8.1).  */
7943           if (i.operands == 2)
7944             {
7945               /* Reversed arguments on faddp, fsubp, etc.  */
7946               as_warn (_("translating to `%s %s%s,%s%s'"), i.tm.name,
7947                        register_prefix, i.op[!intel_syntax].regs->reg_name,
7948                        register_prefix, i.op[intel_syntax].regs->reg_name);
7949             }
7950           else
7951             {
7952               /* Extraneous `l' suffix on fp insn.  */
7953               as_warn (_("translating to `%s %s%s'"), i.tm.name,
7954                        register_prefix, i.op[0].regs->reg_name);
7955             }
7956         }
7957     }
7958
7959   if ((i.seg[0] || i.prefix[SEG_PREFIX])
7960       && i.tm.base_opcode == 0x8d /* lea */
7961       && i.tm.opcode_modifier.opcodespace == SPACE_BASE
7962       && !is_any_vex_encoding(&i.tm))
7963     {
7964       if (!quiet_warnings)
7965         as_warn (_("segment override on `%s' is ineffectual"), i.tm.name);
7966       if (optimize)
7967         {
7968           i.seg[0] = NULL;
7969           i.prefix[SEG_PREFIX] = 0;
7970         }
7971     }
7972
7973   /* If a segment was explicitly specified, and the specified segment
7974      is neither the default nor the one already recorded from a prefix,
7975      use an opcode prefix to select it.  If we never figured out what
7976      the default segment is, then default_seg will be zero at this
7977      point, and the specified segment prefix will always be used.  */
7978   if (i.seg[0]
7979       && i.seg[0] != default_seg
7980       && i386_seg_prefixes[i.seg[0]->reg_num] != i.prefix[SEG_PREFIX])
7981     {
7982       if (!add_prefix (i386_seg_prefixes[i.seg[0]->reg_num]))
7983         return 0;
7984     }
7985   return 1;
7986 }
7987
7988 static INLINE void set_rex_vrex (const reg_entry *r, unsigned int rex_bit,
7989                                  bool do_sse2avx)
7990 {
7991   if (r->reg_flags & RegRex)
7992     {
7993       if (i.rex & rex_bit)
7994         as_bad (_("same type of prefix used twice"));
7995       i.rex |= rex_bit;
7996     }
7997   else if (do_sse2avx && (i.rex & rex_bit) && i.vex.register_specifier)
7998     {
7999       gas_assert (i.vex.register_specifier == r);
8000       i.vex.register_specifier += 8;
8001     }
8002
8003   if (r->reg_flags & RegVRex)
8004     i.vrex |= rex_bit;
8005 }
8006
8007 static const reg_entry *
8008 build_modrm_byte (void)
8009 {
8010   const reg_entry *default_seg = NULL;
8011   unsigned int source, dest;
8012   int vex_3_sources;
8013
8014   vex_3_sources = i.tm.opcode_modifier.vexsources == VEX3SOURCES;
8015   if (vex_3_sources)
8016     {
8017       unsigned int nds, reg_slot;
8018       expressionS *exp;
8019
8020       dest = i.operands - 1;
8021       nds = dest - 1;
8022
8023       /* There are 2 kinds of instructions:
8024          1. 5 operands: 4 register operands or 3 register operands
8025          plus 1 memory operand plus one Imm4 operand, VexXDS, and
8026          VexW0 or VexW1.  The destination must be either XMM, YMM or
8027          ZMM register.
8028          2. 4 operands: 4 register operands or 3 register operands
8029          plus 1 memory operand, with VexXDS.  */
8030       gas_assert ((i.reg_operands == 4
8031                    || (i.reg_operands == 3 && i.mem_operands == 1))
8032                   && i.tm.opcode_modifier.vexvvvv == VEXXDS
8033                   && i.tm.opcode_modifier.vexw
8034                   && i.tm.operand_types[dest].bitfield.class == RegSIMD);
8035
8036       /* If VexW1 is set, the first non-immediate operand is the source and
8037          the second non-immediate one is encoded in the immediate operand.  */
8038       if (i.tm.opcode_modifier.vexw == VEXW1)
8039         {
8040           source = i.imm_operands;
8041           reg_slot = i.imm_operands + 1;
8042         }
8043       else
8044         {
8045           source = i.imm_operands + 1;
8046           reg_slot = i.imm_operands;
8047         }
8048
8049       if (i.imm_operands == 0)
8050         {
8051           /* When there is no immediate operand, generate an 8bit
8052              immediate operand to encode the first operand.  */
8053           exp = &im_expressions[i.imm_operands++];
8054           i.op[i.operands].imms = exp;
8055           i.types[i.operands] = imm8;
8056           i.operands++;
8057
8058           gas_assert (i.tm.operand_types[reg_slot].bitfield.class == RegSIMD);
8059           exp->X_op = O_constant;
8060           exp->X_add_number = register_number (i.op[reg_slot].regs) << 4;
8061           gas_assert ((i.op[reg_slot].regs->reg_flags & RegVRex) == 0);
8062         }
8063       else
8064         {
8065           gas_assert (i.imm_operands == 1);
8066           gas_assert (fits_in_imm4 (i.op[0].imms->X_add_number));
8067           gas_assert (!i.tm.opcode_modifier.immext);
8068
8069           /* Turn on Imm8 again so that output_imm will generate it.  */
8070           i.types[0].bitfield.imm8 = 1;
8071
8072           gas_assert (i.tm.operand_types[reg_slot].bitfield.class == RegSIMD);
8073           i.op[0].imms->X_add_number
8074               |= register_number (i.op[reg_slot].regs) << 4;
8075           gas_assert ((i.op[reg_slot].regs->reg_flags & RegVRex) == 0);
8076         }
8077
8078       gas_assert (i.tm.operand_types[nds].bitfield.class == RegSIMD);
8079       i.vex.register_specifier = i.op[nds].regs;
8080     }
8081   else
8082     source = dest = 0;
8083
8084   /* i.reg_operands MUST be the number of real register operands;
8085      implicit registers do not count.  If there are 3 register
8086      operands, it must be a instruction with VexNDS.  For a
8087      instruction with VexNDD, the destination register is encoded
8088      in VEX prefix.  If there are 4 register operands, it must be
8089      a instruction with VEX prefix and 3 sources.  */
8090   if (i.mem_operands == 0
8091       && ((i.reg_operands == 2
8092            && i.tm.opcode_modifier.vexvvvv <= VEXXDS)
8093           || (i.reg_operands == 3
8094               && i.tm.opcode_modifier.vexvvvv == VEXXDS)
8095           || (i.reg_operands == 4 && vex_3_sources)))
8096     {
8097       switch (i.operands)
8098         {
8099         case 2:
8100           source = 0;
8101           break;
8102         case 3:
8103           /* When there are 3 operands, one of them may be immediate,
8104              which may be the first or the last operand.  Otherwise,
8105              the first operand must be shift count register (cl) or it
8106              is an instruction with VexNDS. */
8107           gas_assert (i.imm_operands == 1
8108                       || (i.imm_operands == 0
8109                           && (i.tm.opcode_modifier.vexvvvv == VEXXDS
8110                               || (i.types[0].bitfield.instance == RegC
8111                                   && i.types[0].bitfield.byte))));
8112           if (operand_type_check (i.types[0], imm)
8113               || (i.types[0].bitfield.instance == RegC
8114                   && i.types[0].bitfield.byte))
8115             source = 1;
8116           else
8117             source = 0;
8118           break;
8119         case 4:
8120           /* When there are 4 operands, the first two must be 8bit
8121              immediate operands. The source operand will be the 3rd
8122              one.
8123
8124              For instructions with VexNDS, if the first operand
8125              an imm8, the source operand is the 2nd one.  If the last
8126              operand is imm8, the source operand is the first one.  */
8127           gas_assert ((i.imm_operands == 2
8128                        && i.types[0].bitfield.imm8
8129                        && i.types[1].bitfield.imm8)
8130                       || (i.tm.opcode_modifier.vexvvvv == VEXXDS
8131                           && i.imm_operands == 1
8132                           && (i.types[0].bitfield.imm8
8133                               || i.types[i.operands - 1].bitfield.imm8
8134                               || i.rounding.type != rc_none)));
8135           if (i.imm_operands == 2)
8136             source = 2;
8137           else
8138             {
8139               if (i.types[0].bitfield.imm8)
8140                 source = 1;
8141               else
8142                 source = 0;
8143             }
8144           break;
8145         case 5:
8146           if (is_evex_encoding (&i.tm))
8147             {
8148               /* For EVEX instructions, when there are 5 operands, the
8149                  first one must be immediate operand.  If the second one
8150                  is immediate operand, the source operand is the 3th
8151                  one.  If the last one is immediate operand, the source
8152                  operand is the 2nd one.  */
8153               gas_assert (i.imm_operands == 2
8154                           && i.tm.opcode_modifier.sae
8155                           && operand_type_check (i.types[0], imm));
8156               if (operand_type_check (i.types[1], imm))
8157                 source = 2;
8158               else if (operand_type_check (i.types[4], imm))
8159                 source = 1;
8160               else
8161                 abort ();
8162             }
8163           break;
8164         default:
8165           abort ();
8166         }
8167
8168       if (!vex_3_sources)
8169         {
8170           dest = source + 1;
8171
8172           /* RC/SAE operand could be between DEST and SRC.  That happens
8173              when one operand is GPR and the other one is XMM/YMM/ZMM
8174              register.  */
8175           if (i.rounding.type != rc_none && i.rounding.operand == dest)
8176             dest++;
8177
8178           if (i.tm.opcode_modifier.vexvvvv == VEXXDS)
8179             {
8180               /* For instructions with VexNDS, the register-only source
8181                  operand must be a 32/64bit integer, XMM, YMM, ZMM, or mask
8182                  register.  It is encoded in VEX prefix.  */
8183
8184               i386_operand_type op;
8185               unsigned int vvvv;
8186
8187               /* Swap two source operands if needed.  */
8188               if (i.tm.opcode_modifier.swapsources)
8189                 {
8190                   vvvv = source;
8191                   source = dest;
8192                 }
8193               else
8194                 vvvv = dest;
8195
8196               op = i.tm.operand_types[vvvv];
8197               if ((dest + 1) >= i.operands
8198                   || ((op.bitfield.class != Reg
8199                        || (!op.bitfield.dword && !op.bitfield.qword))
8200                       && op.bitfield.class != RegSIMD
8201                       && !operand_type_equal (&op, &regmask)))
8202                 abort ();
8203               i.vex.register_specifier = i.op[vvvv].regs;
8204               dest++;
8205             }
8206         }
8207
8208       i.rm.mode = 3;
8209       /* One of the register operands will be encoded in the i.rm.reg
8210          field, the other in the combined i.rm.mode and i.rm.regmem
8211          fields.  If no form of this instruction supports a memory
8212          destination operand, then we assume the source operand may
8213          sometimes be a memory operand and so we need to store the
8214          destination in the i.rm.reg field.  */
8215       if (!i.tm.opcode_modifier.regmem
8216           && operand_type_check (i.tm.operand_types[dest], anymem) == 0)
8217         {
8218           i.rm.reg = i.op[dest].regs->reg_num;
8219           i.rm.regmem = i.op[source].regs->reg_num;
8220           set_rex_vrex (i.op[dest].regs, REX_R, i.tm.opcode_modifier.sse2avx);
8221           set_rex_vrex (i.op[source].regs, REX_B, false);
8222         }
8223       else
8224         {
8225           i.rm.reg = i.op[source].regs->reg_num;
8226           i.rm.regmem = i.op[dest].regs->reg_num;
8227           set_rex_vrex (i.op[dest].regs, REX_B, i.tm.opcode_modifier.sse2avx);
8228           set_rex_vrex (i.op[source].regs, REX_R, false);
8229         }
8230       if (flag_code != CODE_64BIT && (i.rex & REX_R))
8231         {
8232           if (i.types[!i.tm.opcode_modifier.regmem].bitfield.class != RegCR)
8233             abort ();
8234           i.rex &= ~REX_R;
8235           add_prefix (LOCK_PREFIX_OPCODE);
8236         }
8237     }
8238   else
8239     {                   /* If it's not 2 reg operands...  */
8240       unsigned int mem;
8241
8242       if (i.mem_operands)
8243         {
8244           unsigned int fake_zero_displacement = 0;
8245           unsigned int op;
8246
8247           for (op = 0; op < i.operands; op++)
8248             if (i.flags[op] & Operand_Mem)
8249               break;
8250           gas_assert (op < i.operands);
8251
8252           if (i.tm.opcode_modifier.sib)
8253             {
8254               /* The index register of VSIB shouldn't be RegIZ.  */
8255               if (i.tm.opcode_modifier.sib != SIBMEM
8256                   && i.index_reg->reg_num == RegIZ)
8257                 abort ();
8258
8259               i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
8260               if (!i.base_reg)
8261                 {
8262                   i.sib.base = NO_BASE_REGISTER;
8263                   i.sib.scale = i.log2_scale_factor;
8264                   i.types[op].bitfield.disp8 = 0;
8265                   i.types[op].bitfield.disp16 = 0;
8266                   i.types[op].bitfield.disp64 = 0;
8267                   if (want_disp32 (&i.tm))
8268                     {
8269                       /* Must be 32 bit */
8270                       i.types[op].bitfield.disp32 = 1;
8271                       i.types[op].bitfield.disp32s = 0;
8272                     }
8273                   else
8274                     {
8275                       i.types[op].bitfield.disp32 = 0;
8276                       i.types[op].bitfield.disp32s = 1;
8277                     }
8278                 }
8279
8280               /* Since the mandatory SIB always has index register, so
8281                  the code logic remains unchanged. The non-mandatory SIB
8282                  without index register is allowed and will be handled
8283                  later.  */
8284               if (i.index_reg)
8285                 {
8286                   if (i.index_reg->reg_num == RegIZ)
8287                     i.sib.index = NO_INDEX_REGISTER;
8288                   else
8289                     i.sib.index = i.index_reg->reg_num;
8290                   set_rex_vrex (i.index_reg, REX_X, false);
8291                 }
8292             }
8293
8294           default_seg = reg_ds;
8295
8296           if (i.base_reg == 0)
8297             {
8298               i.rm.mode = 0;
8299               if (!i.disp_operands)
8300                 fake_zero_displacement = 1;
8301               if (i.index_reg == 0)
8302                 {
8303                   i386_operand_type newdisp;
8304
8305                   /* Both check for VSIB and mandatory non-vector SIB. */
8306                   gas_assert (!i.tm.opcode_modifier.sib
8307                               || i.tm.opcode_modifier.sib == SIBMEM);
8308                   /* Operand is just <disp>  */
8309                   if (flag_code == CODE_64BIT)
8310                     {
8311                       /* 64bit mode overwrites the 32bit absolute
8312                          addressing by RIP relative addressing and
8313                          absolute addressing is encoded by one of the
8314                          redundant SIB forms.  */
8315                       i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
8316                       i.sib.base = NO_BASE_REGISTER;
8317                       i.sib.index = NO_INDEX_REGISTER;
8318                       newdisp = (want_disp32(&i.tm) ? disp32 : disp32s);
8319                     }
8320                   else if ((flag_code == CODE_16BIT)
8321                            ^ (i.prefix[ADDR_PREFIX] != 0))
8322                     {
8323                       i.rm.regmem = NO_BASE_REGISTER_16;
8324                       newdisp = disp16;
8325                     }
8326                   else
8327                     {
8328                       i.rm.regmem = NO_BASE_REGISTER;
8329                       newdisp = disp32;
8330                     }
8331                   i.types[op] = operand_type_and_not (i.types[op], anydisp);
8332                   i.types[op] = operand_type_or (i.types[op], newdisp);
8333                 }
8334               else if (!i.tm.opcode_modifier.sib)
8335                 {
8336                   /* !i.base_reg && i.index_reg  */
8337                   if (i.index_reg->reg_num == RegIZ)
8338                     i.sib.index = NO_INDEX_REGISTER;
8339                   else
8340                     i.sib.index = i.index_reg->reg_num;
8341                   i.sib.base = NO_BASE_REGISTER;
8342                   i.sib.scale = i.log2_scale_factor;
8343                   i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
8344                   i.types[op].bitfield.disp8 = 0;
8345                   i.types[op].bitfield.disp16 = 0;
8346                   i.types[op].bitfield.disp64 = 0;
8347                   if (want_disp32 (&i.tm))
8348                     {
8349                       /* Must be 32 bit */
8350                       i.types[op].bitfield.disp32 = 1;
8351                       i.types[op].bitfield.disp32s = 0;
8352                     }
8353                   else
8354                     {
8355                       i.types[op].bitfield.disp32 = 0;
8356                       i.types[op].bitfield.disp32s = 1;
8357                     }
8358                   if ((i.index_reg->reg_flags & RegRex) != 0)
8359                     i.rex |= REX_X;
8360                 }
8361             }
8362           /* RIP addressing for 64bit mode.  */
8363           else if (i.base_reg->reg_num == RegIP)
8364             {
8365               gas_assert (!i.tm.opcode_modifier.sib);
8366               i.rm.regmem = NO_BASE_REGISTER;
8367               i.types[op].bitfield.disp8 = 0;
8368               i.types[op].bitfield.disp16 = 0;
8369               i.types[op].bitfield.disp32 = 0;
8370               i.types[op].bitfield.disp32s = 1;
8371               i.types[op].bitfield.disp64 = 0;
8372               i.flags[op] |= Operand_PCrel;
8373               if (! i.disp_operands)
8374                 fake_zero_displacement = 1;
8375             }
8376           else if (i.base_reg->reg_type.bitfield.word)
8377             {
8378               gas_assert (!i.tm.opcode_modifier.sib);
8379               switch (i.base_reg->reg_num)
8380                 {
8381                 case 3: /* (%bx)  */
8382                   if (i.index_reg == 0)
8383                     i.rm.regmem = 7;
8384                   else /* (%bx,%si) -> 0, or (%bx,%di) -> 1  */
8385                     i.rm.regmem = i.index_reg->reg_num - 6;
8386                   break;
8387                 case 5: /* (%bp)  */
8388                   default_seg = reg_ss;
8389                   if (i.index_reg == 0)
8390                     {
8391                       i.rm.regmem = 6;
8392                       if (operand_type_check (i.types[op], disp) == 0)
8393                         {
8394                           /* fake (%bp) into 0(%bp)  */
8395                           if (i.disp_encoding == disp_encoding_16bit)
8396                             i.types[op].bitfield.disp16 = 1;
8397                           else
8398                             i.types[op].bitfield.disp8 = 1;
8399                           fake_zero_displacement = 1;
8400                         }
8401                     }
8402                   else /* (%bp,%si) -> 2, or (%bp,%di) -> 3  */
8403                     i.rm.regmem = i.index_reg->reg_num - 6 + 2;
8404                   break;
8405                 default: /* (%si) -> 4 or (%di) -> 5  */
8406                   i.rm.regmem = i.base_reg->reg_num - 6 + 4;
8407                 }
8408               if (!fake_zero_displacement
8409                   && !i.disp_operands
8410                   && i.disp_encoding)
8411                 {
8412                   fake_zero_displacement = 1;
8413                   if (i.disp_encoding == disp_encoding_8bit)
8414                     i.types[op].bitfield.disp8 = 1;
8415                   else
8416                     i.types[op].bitfield.disp16 = 1;
8417                 }
8418               i.rm.mode = mode_from_disp_size (i.types[op]);
8419             }
8420           else /* i.base_reg and 32/64 bit mode  */
8421             {
8422               if (operand_type_check (i.types[op], disp))
8423                 {
8424                   i.types[op].bitfield.disp16 = 0;
8425                   i.types[op].bitfield.disp64 = 0;
8426                   if (!want_disp32 (&i.tm))
8427                     {
8428                       i.types[op].bitfield.disp32 = 0;
8429                       i.types[op].bitfield.disp32s = 1;
8430                     }
8431                   else
8432                     {
8433                       i.types[op].bitfield.disp32 = 1;
8434                       i.types[op].bitfield.disp32s = 0;
8435                     }
8436                 }
8437
8438               if (!i.tm.opcode_modifier.sib)
8439                 i.rm.regmem = i.base_reg->reg_num;
8440               if ((i.base_reg->reg_flags & RegRex) != 0)
8441                 i.rex |= REX_B;
8442               i.sib.base = i.base_reg->reg_num;
8443               /* x86-64 ignores REX prefix bit here to avoid decoder
8444                  complications.  */
8445               if (!(i.base_reg->reg_flags & RegRex)
8446                   && (i.base_reg->reg_num == EBP_REG_NUM
8447                    || i.base_reg->reg_num == ESP_REG_NUM))
8448                   default_seg = reg_ss;
8449               if (i.base_reg->reg_num == 5 && i.disp_operands == 0)
8450                 {
8451                   fake_zero_displacement = 1;
8452                   if (i.disp_encoding == disp_encoding_32bit)
8453                     i.types[op].bitfield.disp32 = 1;
8454                   else
8455                     i.types[op].bitfield.disp8 = 1;
8456                 }
8457               i.sib.scale = i.log2_scale_factor;
8458               if (i.index_reg == 0)
8459                 {
8460                   /* Only check for VSIB. */
8461                   gas_assert (i.tm.opcode_modifier.sib != VECSIB128
8462                               && i.tm.opcode_modifier.sib != VECSIB256
8463                               && i.tm.opcode_modifier.sib != VECSIB512);
8464
8465                   /* <disp>(%esp) becomes two byte modrm with no index
8466                      register.  We've already stored the code for esp
8467                      in i.rm.regmem ie. ESCAPE_TO_TWO_BYTE_ADDRESSING.
8468                      Any base register besides %esp will not use the
8469                      extra modrm byte.  */
8470                   i.sib.index = NO_INDEX_REGISTER;
8471                 }
8472               else if (!i.tm.opcode_modifier.sib)
8473                 {
8474                   if (i.index_reg->reg_num == RegIZ)
8475                     i.sib.index = NO_INDEX_REGISTER;
8476                   else
8477                     i.sib.index = i.index_reg->reg_num;
8478                   i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
8479                   if ((i.index_reg->reg_flags & RegRex) != 0)
8480                     i.rex |= REX_X;
8481                 }
8482
8483               if (i.disp_operands
8484                   && (i.reloc[op] == BFD_RELOC_386_TLS_DESC_CALL
8485                       || i.reloc[op] == BFD_RELOC_X86_64_TLSDESC_CALL))
8486                 i.rm.mode = 0;
8487               else
8488                 {
8489                   if (!fake_zero_displacement
8490                       && !i.disp_operands
8491                       && i.disp_encoding)
8492                     {
8493                       fake_zero_displacement = 1;
8494                       if (i.disp_encoding == disp_encoding_8bit)
8495                         i.types[op].bitfield.disp8 = 1;
8496                       else
8497                         i.types[op].bitfield.disp32 = 1;
8498                     }
8499                   i.rm.mode = mode_from_disp_size (i.types[op]);
8500                 }
8501             }
8502
8503           if (fake_zero_displacement)
8504             {
8505               /* Fakes a zero displacement assuming that i.types[op]
8506                  holds the correct displacement size.  */
8507               expressionS *exp;
8508
8509               gas_assert (i.op[op].disps == 0);
8510               exp = &disp_expressions[i.disp_operands++];
8511               i.op[op].disps = exp;
8512               exp->X_op = O_constant;
8513               exp->X_add_number = 0;
8514               exp->X_add_symbol = (symbolS *) 0;
8515               exp->X_op_symbol = (symbolS *) 0;
8516             }
8517
8518           mem = op;
8519         }
8520       else
8521         mem = ~0;
8522
8523       if (i.tm.opcode_modifier.vexsources == XOP2SOURCES)
8524         {
8525           if (operand_type_check (i.types[0], imm))
8526             i.vex.register_specifier = NULL;
8527           else
8528             {
8529               /* VEX.vvvv encodes one of the sources when the first
8530                  operand is not an immediate.  */
8531               if (i.tm.opcode_modifier.vexw == VEXW0)
8532                 i.vex.register_specifier = i.op[0].regs;
8533               else
8534                 i.vex.register_specifier = i.op[1].regs;
8535             }
8536
8537           /* Destination is a XMM register encoded in the ModRM.reg
8538              and VEX.R bit.  */
8539           i.rm.reg = i.op[2].regs->reg_num;
8540           if ((i.op[2].regs->reg_flags & RegRex) != 0)
8541             i.rex |= REX_R;
8542
8543           /* ModRM.rm and VEX.B encodes the other source.  */
8544           if (!i.mem_operands)
8545             {
8546               i.rm.mode = 3;
8547
8548               if (i.tm.opcode_modifier.vexw == VEXW0)
8549                 i.rm.regmem = i.op[1].regs->reg_num;
8550               else
8551                 i.rm.regmem = i.op[0].regs->reg_num;
8552
8553               if ((i.op[1].regs->reg_flags & RegRex) != 0)
8554                 i.rex |= REX_B;
8555             }
8556         }
8557       else if (i.tm.opcode_modifier.vexvvvv == VEXLWP)
8558         {
8559           i.vex.register_specifier = i.op[2].regs;
8560           if (!i.mem_operands)
8561             {
8562               i.rm.mode = 3;
8563               i.rm.regmem = i.op[1].regs->reg_num;
8564               if ((i.op[1].regs->reg_flags & RegRex) != 0)
8565                 i.rex |= REX_B;
8566             }
8567         }
8568       /* Fill in i.rm.reg or i.rm.regmem field with register operand
8569          (if any) based on i.tm.extension_opcode.  Again, we must be
8570          careful to make sure that segment/control/debug/test/MMX
8571          registers are coded into the i.rm.reg field.  */
8572       else if (i.reg_operands)
8573         {
8574           unsigned int op;
8575           unsigned int vex_reg = ~0;
8576
8577           for (op = 0; op < i.operands; op++)
8578             if (i.types[op].bitfield.class == Reg
8579                 || i.types[op].bitfield.class == RegBND
8580                 || i.types[op].bitfield.class == RegMask
8581                 || i.types[op].bitfield.class == SReg
8582                 || i.types[op].bitfield.class == RegCR
8583                 || i.types[op].bitfield.class == RegDR
8584                 || i.types[op].bitfield.class == RegTR
8585                 || i.types[op].bitfield.class == RegSIMD
8586                 || i.types[op].bitfield.class == RegMMX)
8587               break;
8588
8589           if (vex_3_sources)
8590             op = dest;
8591           else if (i.tm.opcode_modifier.vexvvvv == VEXXDS)
8592             {
8593               /* For instructions with VexNDS, the register-only
8594                  source operand is encoded in VEX prefix. */
8595               gas_assert (mem != (unsigned int) ~0);
8596
8597               if (op > mem)
8598                 {
8599                   vex_reg = op++;
8600                   gas_assert (op < i.operands);
8601                 }
8602               else
8603                 {
8604                   /* Check register-only source operand when two source
8605                      operands are swapped.  */
8606                   if (!i.tm.operand_types[op].bitfield.baseindex
8607                       && i.tm.operand_types[op + 1].bitfield.baseindex)
8608                     {
8609                       vex_reg = op;
8610                       op += 2;
8611                       gas_assert (mem == (vex_reg + 1)
8612                                   && op < i.operands);
8613                     }
8614                   else
8615                     {
8616                       vex_reg = op + 1;
8617                       gas_assert (vex_reg < i.operands);
8618                     }
8619                 }
8620             }
8621           else if (i.tm.opcode_modifier.vexvvvv == VEXNDD)
8622             {
8623               /* For instructions with VexNDD, the register destination
8624                  is encoded in VEX prefix.  */
8625               if (i.mem_operands == 0)
8626                 {
8627                   /* There is no memory operand.  */
8628                   gas_assert ((op + 2) == i.operands);
8629                   vex_reg = op + 1;
8630                 }
8631               else
8632                 {
8633                   /* There are only 2 non-immediate operands.  */
8634                   gas_assert (op < i.imm_operands + 2
8635                               && i.operands == i.imm_operands + 2);
8636                   vex_reg = i.imm_operands + 1;
8637                 }
8638             }
8639           else
8640             gas_assert (op < i.operands);
8641
8642           if (vex_reg != (unsigned int) ~0)
8643             {
8644               i386_operand_type *type = &i.tm.operand_types[vex_reg];
8645
8646               if ((type->bitfield.class != Reg
8647                    || (!type->bitfield.dword && !type->bitfield.qword))
8648                   && type->bitfield.class != RegSIMD
8649                   && !operand_type_equal (type, &regmask))
8650                 abort ();
8651
8652               i.vex.register_specifier = i.op[vex_reg].regs;
8653             }
8654
8655           /* Don't set OP operand twice.  */
8656           if (vex_reg != op)
8657             {
8658               /* If there is an extension opcode to put here, the
8659                  register number must be put into the regmem field.  */
8660               if (i.tm.extension_opcode != None)
8661                 {
8662                   i.rm.regmem = i.op[op].regs->reg_num;
8663                   set_rex_vrex (i.op[op].regs, REX_B,
8664                                 i.tm.opcode_modifier.sse2avx);
8665                 }
8666               else
8667                 {
8668                   i.rm.reg = i.op[op].regs->reg_num;
8669                   set_rex_vrex (i.op[op].regs, REX_R,
8670                                 i.tm.opcode_modifier.sse2avx);
8671                 }
8672             }
8673
8674           /* Now, if no memory operand has set i.rm.mode = 0, 1, 2 we
8675              must set it to 3 to indicate this is a register operand
8676              in the regmem field.  */
8677           if (!i.mem_operands)
8678             i.rm.mode = 3;
8679         }
8680
8681       /* Fill in i.rm.reg field with extension opcode (if any).  */
8682       if (i.tm.extension_opcode != None)
8683         i.rm.reg = i.tm.extension_opcode;
8684     }
8685   return default_seg;
8686 }
8687
8688 static INLINE void
8689 frag_opcode_byte (unsigned char byte)
8690 {
8691   if (now_seg != absolute_section)
8692     FRAG_APPEND_1_CHAR (byte);
8693   else
8694     ++abs_section_offset;
8695 }
8696
8697 static unsigned int
8698 flip_code16 (unsigned int code16)
8699 {
8700   gas_assert (i.tm.operands == 1);
8701
8702   return !(i.prefix[REX_PREFIX] & REX_W)
8703          && (code16 ? i.tm.operand_types[0].bitfield.disp32
8704                       || i.tm.operand_types[0].bitfield.disp32s
8705                     : i.tm.operand_types[0].bitfield.disp16)
8706          ? CODE16 : 0;
8707 }
8708
8709 static void
8710 output_branch (void)
8711 {
8712   char *p;
8713   int size;
8714   int code16;
8715   int prefix;
8716   relax_substateT subtype;
8717   symbolS *sym;
8718   offsetT off;
8719
8720   if (now_seg == absolute_section)
8721     {
8722       as_bad (_("relaxable branches not supported in absolute section"));
8723       return;
8724     }
8725
8726   code16 = flag_code == CODE_16BIT ? CODE16 : 0;
8727   size = i.disp_encoding == disp_encoding_32bit ? BIG : SMALL;
8728
8729   prefix = 0;
8730   if (i.prefix[DATA_PREFIX] != 0)
8731     {
8732       prefix = 1;
8733       i.prefixes -= 1;
8734       code16 ^= flip_code16(code16);
8735     }
8736   /* Pentium4 branch hints.  */
8737   if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE /* not taken */
8738       || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE /* taken */)
8739     {
8740       prefix++;
8741       i.prefixes--;
8742     }
8743   if (i.prefix[REX_PREFIX] != 0)
8744     {
8745       prefix++;
8746       i.prefixes--;
8747     }
8748
8749   /* BND prefixed jump.  */
8750   if (i.prefix[BND_PREFIX] != 0)
8751     {
8752       prefix++;
8753       i.prefixes--;
8754     }
8755
8756   if (i.prefixes != 0)
8757     as_warn (_("skipping prefixes on `%s'"), i.tm.name);
8758
8759   /* It's always a symbol;  End frag & setup for relax.
8760      Make sure there is enough room in this frag for the largest
8761      instruction we may generate in md_convert_frag.  This is 2
8762      bytes for the opcode and room for the prefix and largest
8763      displacement.  */
8764   frag_grow (prefix + 2 + 4);
8765   /* Prefix and 1 opcode byte go in fr_fix.  */
8766   p = frag_more (prefix + 1);
8767   if (i.prefix[DATA_PREFIX] != 0)
8768     *p++ = DATA_PREFIX_OPCODE;
8769   if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE
8770       || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE)
8771     *p++ = i.prefix[SEG_PREFIX];
8772   if (i.prefix[BND_PREFIX] != 0)
8773     *p++ = BND_PREFIX_OPCODE;
8774   if (i.prefix[REX_PREFIX] != 0)
8775     *p++ = i.prefix[REX_PREFIX];
8776   *p = i.tm.base_opcode;
8777
8778   if ((unsigned char) *p == JUMP_PC_RELATIVE)
8779     subtype = ENCODE_RELAX_STATE (UNCOND_JUMP, size);
8780   else if (cpu_arch_flags.bitfield.cpui386)
8781     subtype = ENCODE_RELAX_STATE (COND_JUMP, size);
8782   else
8783     subtype = ENCODE_RELAX_STATE (COND_JUMP86, size);
8784   subtype |= code16;
8785
8786   sym = i.op[0].disps->X_add_symbol;
8787   off = i.op[0].disps->X_add_number;
8788
8789   if (i.op[0].disps->X_op != O_constant
8790       && i.op[0].disps->X_op != O_symbol)
8791     {
8792       /* Handle complex expressions.  */
8793       sym = make_expr_symbol (i.op[0].disps);
8794       off = 0;
8795     }
8796
8797   /* 1 possible extra opcode + 4 byte displacement go in var part.
8798      Pass reloc in fr_var.  */
8799   frag_var (rs_machine_dependent, 5, i.reloc[0], subtype, sym, off, p);
8800 }
8801
8802 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
8803 /* Return TRUE iff PLT32 relocation should be used for branching to
8804    symbol S.  */
8805
8806 static bool
8807 need_plt32_p (symbolS *s)
8808 {
8809   /* PLT32 relocation is ELF only.  */
8810   if (!IS_ELF)
8811     return false;
8812
8813 #ifdef TE_SOLARIS
8814   /* Don't emit PLT32 relocation on Solaris: neither native linker nor
8815      krtld support it.  */
8816   return false;
8817 #endif
8818
8819   /* Since there is no need to prepare for PLT branch on x86-64, we
8820      can generate R_X86_64_PLT32, instead of R_X86_64_PC32, which can
8821      be used as a marker for 32-bit PC-relative branches.  */
8822   if (!object_64bit)
8823     return false;
8824
8825   if (s == NULL)
8826     return false;
8827
8828   /* Weak or undefined symbol need PLT32 relocation.  */
8829   if (S_IS_WEAK (s) || !S_IS_DEFINED (s))
8830     return true;
8831
8832   /* Non-global symbol doesn't need PLT32 relocation.  */
8833   if (! S_IS_EXTERNAL (s))
8834     return false;
8835
8836   /* Other global symbols need PLT32 relocation.  NB: Symbol with
8837      non-default visibilities are treated as normal global symbol
8838      so that PLT32 relocation can be used as a marker for 32-bit
8839      PC-relative branches.  It is useful for linker relaxation.  */
8840   return true;
8841 }
8842 #endif
8843
8844 static void
8845 output_jump (void)
8846 {
8847   char *p;
8848   int size;
8849   fixS *fixP;
8850   bfd_reloc_code_real_type jump_reloc = i.reloc[0];
8851
8852   if (i.tm.opcode_modifier.jump == JUMP_BYTE)
8853     {
8854       /* This is a loop or jecxz type instruction.  */
8855       size = 1;
8856       if (i.prefix[ADDR_PREFIX] != 0)
8857         {
8858           frag_opcode_byte (ADDR_PREFIX_OPCODE);
8859           i.prefixes -= 1;
8860         }
8861       /* Pentium4 branch hints.  */
8862       if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE /* not taken */
8863           || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE /* taken */)
8864         {
8865           frag_opcode_byte (i.prefix[SEG_PREFIX]);
8866           i.prefixes--;
8867         }
8868     }
8869   else
8870     {
8871       int code16;
8872
8873       code16 = 0;
8874       if (flag_code == CODE_16BIT)
8875         code16 = CODE16;
8876
8877       if (i.prefix[DATA_PREFIX] != 0)
8878         {
8879           frag_opcode_byte (DATA_PREFIX_OPCODE);
8880           i.prefixes -= 1;
8881           code16 ^= flip_code16(code16);
8882         }
8883
8884       size = 4;
8885       if (code16)
8886         size = 2;
8887     }
8888
8889   /* BND prefixed jump.  */
8890   if (i.prefix[BND_PREFIX] != 0)
8891     {
8892       frag_opcode_byte (i.prefix[BND_PREFIX]);
8893       i.prefixes -= 1;
8894     }
8895
8896   if (i.prefix[REX_PREFIX] != 0)
8897     {
8898       frag_opcode_byte (i.prefix[REX_PREFIX]);
8899       i.prefixes -= 1;
8900     }
8901
8902   if (i.prefixes != 0)
8903     as_warn (_("skipping prefixes on `%s'"), i.tm.name);
8904
8905   if (now_seg == absolute_section)
8906     {
8907       abs_section_offset += i.opcode_length + size;
8908       return;
8909     }
8910
8911   p = frag_more (i.opcode_length + size);
8912   switch (i.opcode_length)
8913     {
8914     case 2:
8915       *p++ = i.tm.base_opcode >> 8;
8916       /* Fall through.  */
8917     case 1:
8918       *p++ = i.tm.base_opcode;
8919       break;
8920     default:
8921       abort ();
8922     }
8923
8924 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
8925   if (size == 4
8926       && jump_reloc == NO_RELOC
8927       && need_plt32_p (i.op[0].disps->X_add_symbol))
8928     jump_reloc = BFD_RELOC_X86_64_PLT32;
8929 #endif
8930
8931   jump_reloc = reloc (size, 1, 1, jump_reloc);
8932
8933   fixP = fix_new_exp (frag_now, p - frag_now->fr_literal, size,
8934                       i.op[0].disps, 1, jump_reloc);
8935
8936   /* All jumps handled here are signed, but don't unconditionally use a
8937      signed limit check for 32 and 16 bit jumps as we want to allow wrap
8938      around at 4G (outside of 64-bit mode) and 64k (except for XBEGIN)
8939      respectively.  */
8940   switch (size)
8941     {
8942     case 1:
8943       fixP->fx_signed = 1;
8944       break;
8945
8946     case 2:
8947       if (i.tm.base_opcode == 0xc7f8)
8948         fixP->fx_signed = 1;
8949       break;
8950
8951     case 4:
8952       if (flag_code == CODE_64BIT)
8953         fixP->fx_signed = 1;
8954       break;
8955     }
8956 }
8957
8958 static void
8959 output_interseg_jump (void)
8960 {
8961   char *p;
8962   int size;
8963   int prefix;
8964   int code16;
8965
8966   code16 = 0;
8967   if (flag_code == CODE_16BIT)
8968     code16 = CODE16;
8969
8970   prefix = 0;
8971   if (i.prefix[DATA_PREFIX] != 0)
8972     {
8973       prefix = 1;
8974       i.prefixes -= 1;
8975       code16 ^= CODE16;
8976     }
8977
8978   gas_assert (!i.prefix[REX_PREFIX]);
8979
8980   size = 4;
8981   if (code16)
8982     size = 2;
8983
8984   if (i.prefixes != 0)
8985     as_warn (_("skipping prefixes on `%s'"), i.tm.name);
8986
8987   if (now_seg == absolute_section)
8988     {
8989       abs_section_offset += prefix + 1 + 2 + size;
8990       return;
8991     }
8992
8993   /* 1 opcode; 2 segment; offset  */
8994   p = frag_more (prefix + 1 + 2 + size);
8995
8996   if (i.prefix[DATA_PREFIX] != 0)
8997     *p++ = DATA_PREFIX_OPCODE;
8998
8999   if (i.prefix[REX_PREFIX] != 0)
9000     *p++ = i.prefix[REX_PREFIX];
9001
9002   *p++ = i.tm.base_opcode;
9003   if (i.op[1].imms->X_op == O_constant)
9004     {
9005       offsetT n = i.op[1].imms->X_add_number;
9006
9007       if (size == 2
9008           && !fits_in_unsigned_word (n)
9009           && !fits_in_signed_word (n))
9010         {
9011           as_bad (_("16-bit jump out of range"));
9012           return;
9013         }
9014       md_number_to_chars (p, n, size);
9015     }
9016   else
9017     fix_new_exp (frag_now, p - frag_now->fr_literal, size,
9018                  i.op[1].imms, 0, reloc (size, 0, 0, i.reloc[1]));
9019
9020   p += size;
9021   if (i.op[0].imms->X_op == O_constant)
9022     md_number_to_chars (p, (valueT) i.op[0].imms->X_add_number, 2);
9023   else
9024     fix_new_exp (frag_now, p - frag_now->fr_literal, 2,
9025                  i.op[0].imms, 0, reloc (2, 0, 0, i.reloc[0]));
9026 }
9027
9028 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
9029 void
9030 x86_cleanup (void)
9031 {
9032   char *p;
9033   asection *seg = now_seg;
9034   subsegT subseg = now_subseg;
9035   asection *sec;
9036   unsigned int alignment, align_size_1;
9037   unsigned int isa_1_descsz, feature_2_descsz, descsz;
9038   unsigned int isa_1_descsz_raw, feature_2_descsz_raw;
9039   unsigned int padding;
9040
9041   if (!IS_ELF || !x86_used_note)
9042     return;
9043
9044   x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_X86;
9045
9046   /* The .note.gnu.property section layout:
9047
9048      Field      Length          Contents
9049      ----       ----            ----
9050      n_namsz    4               4
9051      n_descsz   4               The note descriptor size
9052      n_type     4               NT_GNU_PROPERTY_TYPE_0
9053      n_name     4               "GNU"
9054      n_desc     n_descsz        The program property array
9055      ....       ....            ....
9056    */
9057
9058   /* Create the .note.gnu.property section.  */
9059   sec = subseg_new (NOTE_GNU_PROPERTY_SECTION_NAME, 0);
9060   bfd_set_section_flags (sec,
9061                          (SEC_ALLOC
9062                           | SEC_LOAD
9063                           | SEC_DATA
9064                           | SEC_HAS_CONTENTS
9065                           | SEC_READONLY));
9066
9067   if (get_elf_backend_data (stdoutput)->s->elfclass == ELFCLASS64)
9068     {
9069       align_size_1 = 7;
9070       alignment = 3;
9071     }
9072   else
9073     {
9074       align_size_1 = 3;
9075       alignment = 2;
9076     }
9077
9078   bfd_set_section_alignment (sec, alignment);
9079   elf_section_type (sec) = SHT_NOTE;
9080
9081   /* GNU_PROPERTY_X86_ISA_1_USED: 4-byte type + 4-byte data size
9082                                   + 4-byte data  */
9083   isa_1_descsz_raw = 4 + 4 + 4;
9084   /* Align GNU_PROPERTY_X86_ISA_1_USED.  */
9085   isa_1_descsz = (isa_1_descsz_raw + align_size_1) & ~align_size_1;
9086
9087   feature_2_descsz_raw = isa_1_descsz;
9088   /* GNU_PROPERTY_X86_FEATURE_2_USED: 4-byte type + 4-byte data size
9089                                       + 4-byte data  */
9090   feature_2_descsz_raw += 4 + 4 + 4;
9091   /* Align GNU_PROPERTY_X86_FEATURE_2_USED.  */
9092   feature_2_descsz = ((feature_2_descsz_raw + align_size_1)
9093                       & ~align_size_1);
9094
9095   descsz = feature_2_descsz;
9096   /* Section size: n_namsz + n_descsz + n_type + n_name + n_descsz.  */
9097   p = frag_more (4 + 4 + 4 + 4 + descsz);
9098
9099   /* Write n_namsz.  */
9100   md_number_to_chars (p, (valueT) 4, 4);
9101
9102   /* Write n_descsz.  */
9103   md_number_to_chars (p + 4, (valueT) descsz, 4);
9104
9105   /* Write n_type.  */
9106   md_number_to_chars (p + 4 * 2, (valueT) NT_GNU_PROPERTY_TYPE_0, 4);
9107
9108   /* Write n_name.  */
9109   memcpy (p + 4 * 3, "GNU", 4);
9110
9111   /* Write 4-byte type.  */
9112   md_number_to_chars (p + 4 * 4,
9113                       (valueT) GNU_PROPERTY_X86_ISA_1_USED, 4);
9114
9115   /* Write 4-byte data size.  */
9116   md_number_to_chars (p + 4 * 5, (valueT) 4, 4);
9117
9118   /* Write 4-byte data.  */
9119   md_number_to_chars (p + 4 * 6, (valueT) x86_isa_1_used, 4);
9120
9121   /* Zero out paddings.  */
9122   padding = isa_1_descsz - isa_1_descsz_raw;
9123   if (padding)
9124     memset (p + 4 * 7, 0, padding);
9125
9126   /* Write 4-byte type.  */
9127   md_number_to_chars (p + isa_1_descsz + 4 * 4,
9128                       (valueT) GNU_PROPERTY_X86_FEATURE_2_USED, 4);
9129
9130   /* Write 4-byte data size.  */
9131   md_number_to_chars (p + isa_1_descsz + 4 * 5, (valueT) 4, 4);
9132
9133   /* Write 4-byte data.  */
9134   md_number_to_chars (p + isa_1_descsz + 4 * 6,
9135                       (valueT) x86_feature_2_used, 4);
9136
9137   /* Zero out paddings.  */
9138   padding = feature_2_descsz - feature_2_descsz_raw;
9139   if (padding)
9140     memset (p + isa_1_descsz + 4 * 7, 0, padding);
9141
9142   /* We probably can't restore the current segment, for there likely
9143      isn't one yet...  */
9144   if (seg && subseg)
9145     subseg_set (seg, subseg);
9146 }
9147 #endif
9148
9149 static unsigned int
9150 encoding_length (const fragS *start_frag, offsetT start_off,
9151                  const char *frag_now_ptr)
9152 {
9153   unsigned int len = 0;
9154
9155   if (start_frag != frag_now)
9156     {
9157       const fragS *fr = start_frag;
9158
9159       do {
9160         len += fr->fr_fix;
9161         fr = fr->fr_next;
9162       } while (fr && fr != frag_now);
9163     }
9164
9165   return len - start_off + (frag_now_ptr - frag_now->fr_literal);
9166 }
9167
9168 /* Return 1 for test, and, cmp, add, sub, inc and dec which may
9169    be macro-fused with conditional jumps.
9170    NB: If TEST/AND/CMP/ADD/SUB/INC/DEC is of RIP relative address,
9171    or is one of the following format:
9172
9173     cmp m, imm
9174     add m, imm
9175     sub m, imm
9176    test m, imm
9177     and m, imm
9178     inc m
9179     dec m
9180
9181    it is unfusible.  */
9182
9183 static int
9184 maybe_fused_with_jcc_p (enum mf_cmp_kind* mf_cmp_p)
9185 {
9186   /* No RIP address.  */
9187   if (i.base_reg && i.base_reg->reg_num == RegIP)
9188     return 0;
9189
9190   /* No opcodes outside of base encoding space.  */
9191   if (i.tm.opcode_modifier.opcodespace != SPACE_BASE)
9192     return 0;
9193
9194   /* add, sub without add/sub m, imm.  */
9195   if (i.tm.base_opcode <= 5
9196       || (i.tm.base_opcode >= 0x28 && i.tm.base_opcode <= 0x2d)
9197       || ((i.tm.base_opcode | 3) == 0x83
9198           && (i.tm.extension_opcode == 0x5
9199               || i.tm.extension_opcode == 0x0)))
9200     {
9201       *mf_cmp_p = mf_cmp_alu_cmp;
9202       return !(i.mem_operands && i.imm_operands);
9203     }
9204
9205   /* and without and m, imm.  */
9206   if ((i.tm.base_opcode >= 0x20 && i.tm.base_opcode <= 0x25)
9207       || ((i.tm.base_opcode | 3) == 0x83
9208           && i.tm.extension_opcode == 0x4))
9209     {
9210       *mf_cmp_p = mf_cmp_test_and;
9211       return !(i.mem_operands && i.imm_operands);
9212     }
9213
9214   /* test without test m imm.  */
9215   if ((i.tm.base_opcode | 1) == 0x85
9216       || (i.tm.base_opcode | 1) == 0xa9
9217       || ((i.tm.base_opcode | 1) == 0xf7
9218           && i.tm.extension_opcode == 0))
9219     {
9220       *mf_cmp_p = mf_cmp_test_and;
9221       return !(i.mem_operands && i.imm_operands);
9222     }
9223
9224   /* cmp without cmp m, imm.  */
9225   if ((i.tm.base_opcode >= 0x38 && i.tm.base_opcode <= 0x3d)
9226       || ((i.tm.base_opcode | 3) == 0x83
9227           && (i.tm.extension_opcode == 0x7)))
9228     {
9229       *mf_cmp_p = mf_cmp_alu_cmp;
9230       return !(i.mem_operands && i.imm_operands);
9231     }
9232
9233   /* inc, dec without inc/dec m.   */
9234   if ((i.tm.cpu_flags.bitfield.cpuno64
9235        && (i.tm.base_opcode | 0xf) == 0x4f)
9236       || ((i.tm.base_opcode | 1) == 0xff
9237           && i.tm.extension_opcode <= 0x1))
9238     {
9239       *mf_cmp_p = mf_cmp_incdec;
9240       return !i.mem_operands;
9241     }
9242
9243   return 0;
9244 }
9245
9246 /* Return 1 if a FUSED_JCC_PADDING frag should be generated.  */
9247
9248 static int
9249 add_fused_jcc_padding_frag_p (enum mf_cmp_kind* mf_cmp_p)
9250 {
9251   /* NB: Don't work with COND_JUMP86 without i386.  */
9252   if (!align_branch_power
9253       || now_seg == absolute_section
9254       || !cpu_arch_flags.bitfield.cpui386
9255       || !(align_branch & align_branch_fused_bit))
9256     return 0;
9257
9258   if (maybe_fused_with_jcc_p (mf_cmp_p))
9259     {
9260       if (last_insn.kind == last_insn_other
9261           || last_insn.seg != now_seg)
9262         return 1;
9263       if (flag_debug)
9264         as_warn_where (last_insn.file, last_insn.line,
9265                        _("`%s` skips -malign-branch-boundary on `%s`"),
9266                        last_insn.name, i.tm.name);
9267     }
9268
9269   return 0;
9270 }
9271
9272 /* Return 1 if a BRANCH_PREFIX frag should be generated.  */
9273
9274 static int
9275 add_branch_prefix_frag_p (void)
9276 {
9277   /* NB: Don't work with COND_JUMP86 without i386.  Don't add prefix
9278      to PadLock instructions since they include prefixes in opcode.  */
9279   if (!align_branch_power
9280       || !align_branch_prefix_size
9281       || now_seg == absolute_section
9282       || i.tm.cpu_flags.bitfield.cpupadlock
9283       || !cpu_arch_flags.bitfield.cpui386)
9284     return 0;
9285
9286   /* Don't add prefix if it is a prefix or there is no operand in case
9287      that segment prefix is special.  */
9288   if (!i.operands || i.tm.opcode_modifier.isprefix)
9289     return 0;
9290
9291   if (last_insn.kind == last_insn_other
9292       || last_insn.seg != now_seg)
9293     return 1;
9294
9295   if (flag_debug)
9296     as_warn_where (last_insn.file, last_insn.line,
9297                    _("`%s` skips -malign-branch-boundary on `%s`"),
9298                    last_insn.name, i.tm.name);
9299
9300   return 0;
9301 }
9302
9303 /* Return 1 if a BRANCH_PADDING frag should be generated.  */
9304
9305 static int
9306 add_branch_padding_frag_p (enum align_branch_kind *branch_p,
9307                            enum mf_jcc_kind *mf_jcc_p)
9308 {
9309   int add_padding;
9310
9311   /* NB: Don't work with COND_JUMP86 without i386.  */
9312   if (!align_branch_power
9313       || now_seg == absolute_section
9314       || !cpu_arch_flags.bitfield.cpui386
9315       || i.tm.opcode_modifier.opcodespace != SPACE_BASE)
9316     return 0;
9317
9318   add_padding = 0;
9319
9320   /* Check for jcc and direct jmp.  */
9321   if (i.tm.opcode_modifier.jump == JUMP)
9322     {
9323       if (i.tm.base_opcode == JUMP_PC_RELATIVE)
9324         {
9325           *branch_p = align_branch_jmp;
9326           add_padding = align_branch & align_branch_jmp_bit;
9327         }
9328       else
9329         {
9330           /* Because J<cc> and JN<cc> share same group in macro-fusible table,
9331              igore the lowest bit.  */
9332           *mf_jcc_p = (i.tm.base_opcode & 0x0e) >> 1;
9333           *branch_p = align_branch_jcc;
9334           if ((align_branch & align_branch_jcc_bit))
9335             add_padding = 1;
9336         }
9337     }
9338   else if ((i.tm.base_opcode | 1) == 0xc3)
9339     {
9340       /* Near ret.  */
9341       *branch_p = align_branch_ret;
9342       if ((align_branch & align_branch_ret_bit))
9343         add_padding = 1;
9344     }
9345   else
9346     {
9347       /* Check for indirect jmp, direct and indirect calls.  */
9348       if (i.tm.base_opcode == 0xe8)
9349         {
9350           /* Direct call.  */
9351           *branch_p = align_branch_call;
9352           if ((align_branch & align_branch_call_bit))
9353             add_padding = 1;
9354         }
9355       else if (i.tm.base_opcode == 0xff
9356                && (i.tm.extension_opcode == 2
9357                    || i.tm.extension_opcode == 4))
9358         {
9359           /* Indirect call and jmp.  */
9360           *branch_p = align_branch_indirect;
9361           if ((align_branch & align_branch_indirect_bit))
9362             add_padding = 1;
9363         }
9364
9365       if (add_padding
9366           && i.disp_operands
9367           && tls_get_addr
9368           && (i.op[0].disps->X_op == O_symbol
9369               || (i.op[0].disps->X_op == O_subtract
9370                   && i.op[0].disps->X_op_symbol == GOT_symbol)))
9371         {
9372           symbolS *s = i.op[0].disps->X_add_symbol;
9373           /* No padding to call to global or undefined tls_get_addr.  */
9374           if ((S_IS_EXTERNAL (s) || !S_IS_DEFINED (s))
9375               && strcmp (S_GET_NAME (s), tls_get_addr) == 0)
9376             return 0;
9377         }
9378     }
9379
9380   if (add_padding
9381       && last_insn.kind != last_insn_other
9382       && last_insn.seg == now_seg)
9383     {
9384       if (flag_debug)
9385         as_warn_where (last_insn.file, last_insn.line,
9386                        _("`%s` skips -malign-branch-boundary on `%s`"),
9387                        last_insn.name, i.tm.name);
9388       return 0;
9389     }
9390
9391   return add_padding;
9392 }
9393
9394 static void
9395 output_insn (void)
9396 {
9397   fragS *insn_start_frag;
9398   offsetT insn_start_off;
9399   fragS *fragP = NULL;
9400   enum align_branch_kind branch = align_branch_none;
9401   /* The initializer is arbitrary just to avoid uninitialized error.
9402      it's actually either assigned in add_branch_padding_frag_p
9403      or never be used.  */
9404   enum mf_jcc_kind mf_jcc = mf_jcc_jo;
9405
9406 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
9407   if (IS_ELF && x86_used_note && now_seg != absolute_section)
9408     {
9409       if ((i.xstate & xstate_tmm) == xstate_tmm
9410           || i.tm.cpu_flags.bitfield.cpuamx_tile)
9411         x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_TMM;
9412
9413       if (i.tm.cpu_flags.bitfield.cpu8087
9414           || i.tm.cpu_flags.bitfield.cpu287
9415           || i.tm.cpu_flags.bitfield.cpu387
9416           || i.tm.cpu_flags.bitfield.cpu687
9417           || i.tm.cpu_flags.bitfield.cpufisttp)
9418         x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_X87;
9419
9420       if ((i.xstate & xstate_mmx)
9421           || (i.tm.opcode_modifier.opcodespace == SPACE_0F
9422               && !is_any_vex_encoding (&i.tm)
9423               && (i.tm.base_opcode == 0x77 /* emms */
9424                   || i.tm.base_opcode == 0x0e /* femms */)))
9425         x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_MMX;
9426
9427       if (i.index_reg)
9428         {
9429           if (i.index_reg->reg_type.bitfield.zmmword)
9430             i.xstate |= xstate_zmm;
9431           else if (i.index_reg->reg_type.bitfield.ymmword)
9432             i.xstate |= xstate_ymm;
9433           else if (i.index_reg->reg_type.bitfield.xmmword)
9434             i.xstate |= xstate_xmm;
9435         }
9436
9437       /* vzeroall / vzeroupper */
9438       if (i.tm.base_opcode == 0x77 && i.tm.cpu_flags.bitfield.cpuavx)
9439         i.xstate |= xstate_ymm;
9440
9441       if ((i.xstate & xstate_xmm)
9442           /* ldmxcsr / stmxcsr / vldmxcsr / vstmxcsr */
9443           || (i.tm.base_opcode == 0xae
9444               && (i.tm.cpu_flags.bitfield.cpusse
9445                   || i.tm.cpu_flags.bitfield.cpuavx))
9446           || i.tm.cpu_flags.bitfield.cpuwidekl
9447           || i.tm.cpu_flags.bitfield.cpukl)
9448         x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XMM;
9449
9450       if ((i.xstate & xstate_ymm) == xstate_ymm)
9451         x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_YMM;
9452       if ((i.xstate & xstate_zmm) == xstate_zmm)
9453         x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_ZMM;
9454       if (i.mask.reg || (i.xstate & xstate_mask) == xstate_mask)
9455         x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_MASK;
9456       if (i.tm.cpu_flags.bitfield.cpufxsr)
9457         x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_FXSR;
9458       if (i.tm.cpu_flags.bitfield.cpuxsave)
9459         x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XSAVE;
9460       if (i.tm.cpu_flags.bitfield.cpuxsaveopt)
9461         x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XSAVEOPT;
9462       if (i.tm.cpu_flags.bitfield.cpuxsavec)
9463         x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XSAVEC;
9464
9465       if (x86_feature_2_used
9466           || i.tm.cpu_flags.bitfield.cpucmov
9467           || i.tm.cpu_flags.bitfield.cpusyscall
9468           || (i.tm.opcode_modifier.opcodespace == SPACE_0F
9469               && i.tm.base_opcode == 0xc7
9470               && i.tm.opcode_modifier.opcodeprefix == PREFIX_NONE
9471               && i.tm.extension_opcode == 1) /* cmpxchg8b */)
9472         x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_BASELINE;
9473       if (i.tm.cpu_flags.bitfield.cpusse3
9474           || i.tm.cpu_flags.bitfield.cpussse3
9475           || i.tm.cpu_flags.bitfield.cpusse4_1
9476           || i.tm.cpu_flags.bitfield.cpusse4_2
9477           || i.tm.cpu_flags.bitfield.cpucx16
9478           || i.tm.cpu_flags.bitfield.cpupopcnt
9479           /* LAHF-SAHF insns in 64-bit mode.  */
9480           || (flag_code == CODE_64BIT
9481               && (i.tm.base_opcode | 1) == 0x9f
9482               && i.tm.opcode_modifier.opcodespace == SPACE_BASE))
9483         x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_V2;
9484       if (i.tm.cpu_flags.bitfield.cpuavx
9485           || i.tm.cpu_flags.bitfield.cpuavx2
9486           /* Any VEX encoded insns execpt for CpuAVX512F, CpuAVX512BW,
9487              CpuAVX512DQ, LPW, TBM and AMX.  */
9488           || (i.tm.opcode_modifier.vex
9489               && !i.tm.cpu_flags.bitfield.cpuavx512f
9490               && !i.tm.cpu_flags.bitfield.cpuavx512bw
9491               && !i.tm.cpu_flags.bitfield.cpuavx512dq
9492               && !i.tm.cpu_flags.bitfield.cpulwp
9493               && !i.tm.cpu_flags.bitfield.cputbm
9494               && !(x86_feature_2_used & GNU_PROPERTY_X86_FEATURE_2_TMM))
9495           || i.tm.cpu_flags.bitfield.cpuf16c
9496           || i.tm.cpu_flags.bitfield.cpufma
9497           || i.tm.cpu_flags.bitfield.cpulzcnt
9498           || i.tm.cpu_flags.bitfield.cpumovbe
9499           || i.tm.cpu_flags.bitfield.cpuxsaves
9500           || (x86_feature_2_used
9501               & (GNU_PROPERTY_X86_FEATURE_2_XSAVE
9502                  | GNU_PROPERTY_X86_FEATURE_2_XSAVEOPT
9503                  | GNU_PROPERTY_X86_FEATURE_2_XSAVEC)) != 0)
9504         x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_V3;
9505       if (i.tm.cpu_flags.bitfield.cpuavx512f
9506           || i.tm.cpu_flags.bitfield.cpuavx512bw
9507           || i.tm.cpu_flags.bitfield.cpuavx512dq
9508           || i.tm.cpu_flags.bitfield.cpuavx512vl
9509           /* Any EVEX encoded insns except for AVX512ER, AVX512PF and
9510              VNNIW.  */
9511           || (i.tm.opcode_modifier.evex
9512               && !i.tm.cpu_flags.bitfield.cpuavx512er
9513               && !i.tm.cpu_flags.bitfield.cpuavx512pf
9514               && !i.tm.cpu_flags.bitfield.cpuavx512_4vnniw))
9515         x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_V4;
9516     }
9517 #endif
9518
9519   /* Tie dwarf2 debug info to the address at the start of the insn.
9520      We can't do this after the insn has been output as the current
9521      frag may have been closed off.  eg. by frag_var.  */
9522   dwarf2_emit_insn (0);
9523
9524   insn_start_frag = frag_now;
9525   insn_start_off = frag_now_fix ();
9526
9527   if (add_branch_padding_frag_p (&branch, &mf_jcc))
9528     {
9529       char *p;
9530       /* Branch can be 8 bytes.  Leave some room for prefixes.  */
9531       unsigned int max_branch_padding_size = 14;
9532
9533       /* Align section to boundary.  */
9534       record_alignment (now_seg, align_branch_power);
9535
9536       /* Make room for padding.  */
9537       frag_grow (max_branch_padding_size);
9538
9539       /* Start of the padding.  */
9540       p = frag_more (0);
9541
9542       fragP = frag_now;
9543
9544       frag_var (rs_machine_dependent, max_branch_padding_size, 0,
9545                 ENCODE_RELAX_STATE (BRANCH_PADDING, 0),
9546                 NULL, 0, p);
9547
9548       fragP->tc_frag_data.mf_type = mf_jcc;
9549       fragP->tc_frag_data.branch_type = branch;
9550       fragP->tc_frag_data.max_bytes = max_branch_padding_size;
9551     }
9552
9553   /* Output jumps.  */
9554   if (i.tm.opcode_modifier.jump == JUMP)
9555     output_branch ();
9556   else if (i.tm.opcode_modifier.jump == JUMP_BYTE
9557            || i.tm.opcode_modifier.jump == JUMP_DWORD)
9558     output_jump ();
9559   else if (i.tm.opcode_modifier.jump == JUMP_INTERSEGMENT)
9560     output_interseg_jump ();
9561   else
9562     {
9563       /* Output normal instructions here.  */
9564       char *p;
9565       unsigned char *q;
9566       unsigned int j;
9567       enum mf_cmp_kind mf_cmp;
9568
9569       if (avoid_fence
9570           && (i.tm.base_opcode == 0xaee8
9571               || i.tm.base_opcode == 0xaef0
9572               || i.tm.base_opcode == 0xaef8))
9573         {
9574           /* Encode lfence, mfence, and sfence as
9575              f0 83 04 24 00   lock addl $0x0, (%{re}sp).  */
9576           if (now_seg != absolute_section)
9577             {
9578               offsetT val = 0x240483f0ULL;
9579
9580               p = frag_more (5);
9581               md_number_to_chars (p, val, 5);
9582             }
9583           else
9584             abs_section_offset += 5;
9585           return;
9586         }
9587
9588       /* Some processors fail on LOCK prefix. This options makes
9589          assembler ignore LOCK prefix and serves as a workaround.  */
9590       if (omit_lock_prefix)
9591         {
9592           if (i.tm.base_opcode == LOCK_PREFIX_OPCODE
9593               && i.tm.opcode_modifier.isprefix)
9594             return;
9595           i.prefix[LOCK_PREFIX] = 0;
9596         }
9597
9598       if (branch)
9599         /* Skip if this is a branch.  */
9600         ;
9601       else if (add_fused_jcc_padding_frag_p (&mf_cmp))
9602         {
9603           /* Make room for padding.  */
9604           frag_grow (MAX_FUSED_JCC_PADDING_SIZE);
9605           p = frag_more (0);
9606
9607           fragP = frag_now;
9608
9609           frag_var (rs_machine_dependent, MAX_FUSED_JCC_PADDING_SIZE, 0,
9610                     ENCODE_RELAX_STATE (FUSED_JCC_PADDING, 0),
9611                     NULL, 0, p);
9612
9613           fragP->tc_frag_data.mf_type = mf_cmp;
9614           fragP->tc_frag_data.branch_type = align_branch_fused;
9615           fragP->tc_frag_data.max_bytes = MAX_FUSED_JCC_PADDING_SIZE;
9616         }
9617       else if (add_branch_prefix_frag_p ())
9618         {
9619           unsigned int max_prefix_size = align_branch_prefix_size;
9620
9621           /* Make room for padding.  */
9622           frag_grow (max_prefix_size);
9623           p = frag_more (0);
9624
9625           fragP = frag_now;
9626
9627           frag_var (rs_machine_dependent, max_prefix_size, 0,
9628                     ENCODE_RELAX_STATE (BRANCH_PREFIX, 0),
9629                     NULL, 0, p);
9630
9631           fragP->tc_frag_data.max_bytes = max_prefix_size;
9632         }
9633
9634       /* Since the VEX/EVEX prefix contains the implicit prefix, we
9635          don't need the explicit prefix.  */
9636       if (!i.tm.opcode_modifier.vex && !i.tm.opcode_modifier.evex)
9637         {
9638           switch (i.tm.opcode_modifier.opcodeprefix)
9639             {
9640             case PREFIX_0X66:
9641               add_prefix (0x66);
9642               break;
9643             case PREFIX_0XF2:
9644               add_prefix (0xf2);
9645               break;
9646             case PREFIX_0XF3:
9647               if (!i.tm.cpu_flags.bitfield.cpupadlock
9648                   || (i.prefix[REP_PREFIX] != 0xf3))
9649                 add_prefix (0xf3);
9650               break;
9651             case PREFIX_NONE:
9652               switch (i.opcode_length)
9653                 {
9654                 case 2:
9655                   break;
9656                 case 1:
9657                   /* Check for pseudo prefixes.  */
9658                   if (!i.tm.opcode_modifier.isprefix || i.tm.base_opcode)
9659                     break;
9660                   as_bad_where (insn_start_frag->fr_file,
9661                                 insn_start_frag->fr_line,
9662                                 _("pseudo prefix without instruction"));
9663                   return;
9664                 default:
9665                   abort ();
9666                 }
9667               break;
9668             default:
9669               abort ();
9670             }
9671
9672 #if defined (OBJ_MAYBE_ELF) || defined (OBJ_ELF)
9673           /* For x32, add a dummy REX_OPCODE prefix for mov/add with
9674              R_X86_64_GOTTPOFF relocation so that linker can safely
9675              perform IE->LE optimization.  A dummy REX_OPCODE prefix
9676              is also needed for lea with R_X86_64_GOTPC32_TLSDESC
9677              relocation for GDesc -> IE/LE optimization.  */
9678           if (x86_elf_abi == X86_64_X32_ABI
9679               && i.operands == 2
9680               && (i.reloc[0] == BFD_RELOC_X86_64_GOTTPOFF
9681                   || i.reloc[0] == BFD_RELOC_X86_64_GOTPC32_TLSDESC)
9682               && i.prefix[REX_PREFIX] == 0)
9683             add_prefix (REX_OPCODE);
9684 #endif
9685
9686           /* The prefix bytes.  */
9687           for (j = ARRAY_SIZE (i.prefix), q = i.prefix; j > 0; j--, q++)
9688             if (*q)
9689               frag_opcode_byte (*q);
9690         }
9691       else
9692         {
9693           for (j = 0, q = i.prefix; j < ARRAY_SIZE (i.prefix); j++, q++)
9694             if (*q)
9695               switch (j)
9696                 {
9697                 case SEG_PREFIX:
9698                 case ADDR_PREFIX:
9699                   frag_opcode_byte (*q);
9700                   break;
9701                 default:
9702                   /* There should be no other prefixes for instructions
9703                      with VEX prefix.  */
9704                   abort ();
9705                 }
9706
9707           /* For EVEX instructions i.vrex should become 0 after
9708              build_evex_prefix.  For VEX instructions upper 16 registers
9709              aren't available, so VREX should be 0.  */
9710           if (i.vrex)
9711             abort ();
9712           /* Now the VEX prefix.  */
9713           if (now_seg != absolute_section)
9714             {
9715               p = frag_more (i.vex.length);
9716               for (j = 0; j < i.vex.length; j++)
9717                 p[j] = i.vex.bytes[j];
9718             }
9719           else
9720             abs_section_offset += i.vex.length;
9721         }
9722
9723       /* Now the opcode; be careful about word order here!  */
9724       j = i.opcode_length;
9725       if (!i.vex.length)
9726         switch (i.tm.opcode_modifier.opcodespace)
9727           {
9728           case SPACE_BASE:
9729             break;
9730           case SPACE_0F:
9731             ++j;
9732             break;
9733           case SPACE_0F38:
9734           case SPACE_0F3A:
9735             j += 2;
9736             break;
9737           default:
9738             abort ();
9739           }
9740
9741       if (now_seg == absolute_section)
9742         abs_section_offset += j;
9743       else if (j == 1)
9744         {
9745           FRAG_APPEND_1_CHAR (i.tm.base_opcode);
9746         }
9747       else
9748         {
9749           p = frag_more (j);
9750           if (!i.vex.length
9751               && i.tm.opcode_modifier.opcodespace != SPACE_BASE)
9752             {
9753               *p++ = 0x0f;
9754               if (i.tm.opcode_modifier.opcodespace != SPACE_0F)
9755                 *p++ = i.tm.opcode_modifier.opcodespace == SPACE_0F38
9756                        ? 0x38 : 0x3a;
9757             }
9758
9759           switch (i.opcode_length)
9760             {
9761             case 2:
9762               /* Put out high byte first: can't use md_number_to_chars!  */
9763               *p++ = (i.tm.base_opcode >> 8) & 0xff;
9764               /* Fall through.  */
9765             case 1:
9766               *p = i.tm.base_opcode & 0xff;
9767               break;
9768             default:
9769               abort ();
9770               break;
9771             }
9772
9773         }
9774
9775       /* Now the modrm byte and sib byte (if present).  */
9776       if (i.tm.opcode_modifier.modrm)
9777         {
9778           frag_opcode_byte ((i.rm.regmem << 0)
9779                              | (i.rm.reg << 3)
9780                              | (i.rm.mode << 6));
9781           /* If i.rm.regmem == ESP (4)
9782              && i.rm.mode != (Register mode)
9783              && not 16 bit
9784              ==> need second modrm byte.  */
9785           if (i.rm.regmem == ESCAPE_TO_TWO_BYTE_ADDRESSING
9786               && i.rm.mode != 3
9787               && !(i.base_reg && i.base_reg->reg_type.bitfield.word))
9788             frag_opcode_byte ((i.sib.base << 0)
9789                               | (i.sib.index << 3)
9790                               | (i.sib.scale << 6));
9791         }
9792
9793       if (i.disp_operands)
9794         output_disp (insn_start_frag, insn_start_off);
9795
9796       if (i.imm_operands)
9797         output_imm (insn_start_frag, insn_start_off);
9798
9799       /*
9800        * frag_now_fix () returning plain abs_section_offset when we're in the
9801        * absolute section, and abs_section_offset not getting updated as data
9802        * gets added to the frag breaks the logic below.
9803        */
9804       if (now_seg != absolute_section)
9805         {
9806           j = encoding_length (insn_start_frag, insn_start_off, frag_more (0));
9807           if (j > 15)
9808             as_warn (_("instruction length of %u bytes exceeds the limit of 15"),
9809                      j);
9810           else if (fragP)
9811             {
9812               /* NB: Don't add prefix with GOTPC relocation since
9813                  output_disp() above depends on the fixed encoding
9814                  length.  Can't add prefix with TLS relocation since
9815                  it breaks TLS linker optimization.  */
9816               unsigned int max = i.has_gotpc_tls_reloc ? 0 : 15 - j;
9817               /* Prefix count on the current instruction.  */
9818               unsigned int count = i.vex.length;
9819               unsigned int k;
9820               for (k = 0; k < ARRAY_SIZE (i.prefix); k++)
9821                 /* REX byte is encoded in VEX/EVEX prefix.  */
9822                 if (i.prefix[k] && (k != REX_PREFIX || !i.vex.length))
9823                   count++;
9824
9825               /* Count prefixes for extended opcode maps.  */
9826               if (!i.vex.length)
9827                 switch (i.tm.opcode_modifier.opcodespace)
9828                   {
9829                   case SPACE_BASE:
9830                     break;
9831                   case SPACE_0F:
9832                     count++;
9833                     break;
9834                   case SPACE_0F38:
9835                   case SPACE_0F3A:
9836                     count += 2;
9837                     break;
9838                   default:
9839                     abort ();
9840                   }
9841
9842               if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype)
9843                   == BRANCH_PREFIX)
9844                 {
9845                   /* Set the maximum prefix size in BRANCH_PREFIX
9846                      frag.  */
9847                   if (fragP->tc_frag_data.max_bytes > max)
9848                     fragP->tc_frag_data.max_bytes = max;
9849                   if (fragP->tc_frag_data.max_bytes > count)
9850                     fragP->tc_frag_data.max_bytes -= count;
9851                   else
9852                     fragP->tc_frag_data.max_bytes = 0;
9853                 }
9854               else
9855                 {
9856                   /* Remember the maximum prefix size in FUSED_JCC_PADDING
9857                      frag.  */
9858                   unsigned int max_prefix_size;
9859                   if (align_branch_prefix_size > max)
9860                     max_prefix_size = max;
9861                   else
9862                     max_prefix_size = align_branch_prefix_size;
9863                   if (max_prefix_size > count)
9864                     fragP->tc_frag_data.max_prefix_length
9865                       = max_prefix_size - count;
9866                 }
9867
9868               /* Use existing segment prefix if possible.  Use CS
9869                  segment prefix in 64-bit mode.  In 32-bit mode, use SS
9870                  segment prefix with ESP/EBP base register and use DS
9871                  segment prefix without ESP/EBP base register.  */
9872               if (i.prefix[SEG_PREFIX])
9873                 fragP->tc_frag_data.default_prefix = i.prefix[SEG_PREFIX];
9874               else if (flag_code == CODE_64BIT)
9875                 fragP->tc_frag_data.default_prefix = CS_PREFIX_OPCODE;
9876               else if (i.base_reg
9877                        && (i.base_reg->reg_num == 4
9878                            || i.base_reg->reg_num == 5))
9879                 fragP->tc_frag_data.default_prefix = SS_PREFIX_OPCODE;
9880               else
9881                 fragP->tc_frag_data.default_prefix = DS_PREFIX_OPCODE;
9882             }
9883         }
9884     }
9885
9886   /* NB: Don't work with COND_JUMP86 without i386.  */
9887   if (align_branch_power
9888       && now_seg != absolute_section
9889       && cpu_arch_flags.bitfield.cpui386)
9890     {
9891       /* Terminate each frag so that we can add prefix and check for
9892          fused jcc.  */
9893       frag_wane (frag_now);
9894       frag_new (0);
9895     }
9896
9897 #ifdef DEBUG386
9898   if (flag_debug)
9899     {
9900       pi ("" /*line*/, &i);
9901     }
9902 #endif /* DEBUG386  */
9903 }
9904
9905 /* Return the size of the displacement operand N.  */
9906
9907 static int
9908 disp_size (unsigned int n)
9909 {
9910   int size = 4;
9911
9912   if (i.types[n].bitfield.disp64)
9913     size = 8;
9914   else if (i.types[n].bitfield.disp8)
9915     size = 1;
9916   else if (i.types[n].bitfield.disp16)
9917     size = 2;
9918   return size;
9919 }
9920
9921 /* Return the size of the immediate operand N.  */
9922
9923 static int
9924 imm_size (unsigned int n)
9925 {
9926   int size = 4;
9927   if (i.types[n].bitfield.imm64)
9928     size = 8;
9929   else if (i.types[n].bitfield.imm8 || i.types[n].bitfield.imm8s)
9930     size = 1;
9931   else if (i.types[n].bitfield.imm16)
9932     size = 2;
9933   return size;
9934 }
9935
9936 static void
9937 output_disp (fragS *insn_start_frag, offsetT insn_start_off)
9938 {
9939   char *p;
9940   unsigned int n;
9941
9942   for (n = 0; n < i.operands; n++)
9943     {
9944       if (operand_type_check (i.types[n], disp))
9945         {
9946           int size = disp_size (n);
9947
9948           if (now_seg == absolute_section)
9949             abs_section_offset += size;
9950           else if (i.op[n].disps->X_op == O_constant)
9951             {
9952               offsetT val = i.op[n].disps->X_add_number;
9953
9954               val = offset_in_range (val >> (size == 1 ? i.memshift : 0),
9955                                      size);
9956               p = frag_more (size);
9957               md_number_to_chars (p, val, size);
9958             }
9959           else
9960             {
9961               enum bfd_reloc_code_real reloc_type;
9962               int sign = i.types[n].bitfield.disp32s;
9963               int pcrel = (i.flags[n] & Operand_PCrel) != 0;
9964               fixS *fixP;
9965
9966               /* We can't have 8 bit displacement here.  */
9967               gas_assert (!i.types[n].bitfield.disp8);
9968
9969               /* The PC relative address is computed relative
9970                  to the instruction boundary, so in case immediate
9971                  fields follows, we need to adjust the value.  */
9972               if (pcrel && i.imm_operands)
9973                 {
9974                   unsigned int n1;
9975                   int sz = 0;
9976
9977                   for (n1 = 0; n1 < i.operands; n1++)
9978                     if (operand_type_check (i.types[n1], imm))
9979                       {
9980                         /* Only one immediate is allowed for PC
9981                            relative address.  */
9982                         gas_assert (sz == 0);
9983                         sz = imm_size (n1);
9984                         i.op[n].disps->X_add_number -= sz;
9985                       }
9986                   /* We should find the immediate.  */
9987                   gas_assert (sz != 0);
9988                 }
9989
9990               p = frag_more (size);
9991               reloc_type = reloc (size, pcrel, sign, i.reloc[n]);
9992               if (GOT_symbol
9993                   && GOT_symbol == i.op[n].disps->X_add_symbol
9994                   && (((reloc_type == BFD_RELOC_32
9995                         || reloc_type == BFD_RELOC_X86_64_32S
9996                         || (reloc_type == BFD_RELOC_64
9997                             && object_64bit))
9998                        && (i.op[n].disps->X_op == O_symbol
9999                            || (i.op[n].disps->X_op == O_add
10000                                && ((symbol_get_value_expression
10001                                     (i.op[n].disps->X_op_symbol)->X_op)
10002                                    == O_subtract))))
10003                       || reloc_type == BFD_RELOC_32_PCREL))
10004                 {
10005                   if (!object_64bit)
10006                     {
10007                       reloc_type = BFD_RELOC_386_GOTPC;
10008                       i.has_gotpc_tls_reloc = true;
10009                       i.op[n].disps->X_add_number +=
10010                         encoding_length (insn_start_frag, insn_start_off, p);
10011                     }
10012                   else if (reloc_type == BFD_RELOC_64)
10013                     reloc_type = BFD_RELOC_X86_64_GOTPC64;
10014                   else
10015                     /* Don't do the adjustment for x86-64, as there
10016                        the pcrel addressing is relative to the _next_
10017                        insn, and that is taken care of in other code.  */
10018                     reloc_type = BFD_RELOC_X86_64_GOTPC32;
10019                 }
10020               else if (align_branch_power)
10021                 {
10022                   switch (reloc_type)
10023                     {
10024                     case BFD_RELOC_386_TLS_GD:
10025                     case BFD_RELOC_386_TLS_LDM:
10026                     case BFD_RELOC_386_TLS_IE:
10027                     case BFD_RELOC_386_TLS_IE_32:
10028                     case BFD_RELOC_386_TLS_GOTIE:
10029                     case BFD_RELOC_386_TLS_GOTDESC:
10030                     case BFD_RELOC_386_TLS_DESC_CALL:
10031                     case BFD_RELOC_X86_64_TLSGD:
10032                     case BFD_RELOC_X86_64_TLSLD:
10033                     case BFD_RELOC_X86_64_GOTTPOFF:
10034                     case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
10035                     case BFD_RELOC_X86_64_TLSDESC_CALL:
10036                       i.has_gotpc_tls_reloc = true;
10037                     default:
10038                       break;
10039                     }
10040                 }
10041               fixP = fix_new_exp (frag_now, p - frag_now->fr_literal,
10042                                   size, i.op[n].disps, pcrel,
10043                                   reloc_type);
10044
10045               if (flag_code == CODE_64BIT && size == 4 && pcrel
10046                   && !i.prefix[ADDR_PREFIX])
10047                 fixP->fx_signed = 1;
10048
10049               /* Check for "call/jmp *mem", "mov mem, %reg",
10050                  "test %reg, mem" and "binop mem, %reg" where binop
10051                  is one of adc, add, and, cmp, or, sbb, sub, xor
10052                  instructions without data prefix.  Always generate
10053                  R_386_GOT32X for "sym*GOT" operand in 32-bit mode.  */
10054               if (i.prefix[DATA_PREFIX] == 0
10055                   && (generate_relax_relocations
10056                       || (!object_64bit
10057                           && i.rm.mode == 0
10058                           && i.rm.regmem == 5))
10059                   && (i.rm.mode == 2
10060                       || (i.rm.mode == 0 && i.rm.regmem == 5))
10061                   && i.tm.opcode_modifier.opcodespace == SPACE_BASE
10062                   && ((i.operands == 1
10063                        && i.tm.base_opcode == 0xff
10064                        && (i.rm.reg == 2 || i.rm.reg == 4))
10065                       || (i.operands == 2
10066                           && (i.tm.base_opcode == 0x8b
10067                               || i.tm.base_opcode == 0x85
10068                               || (i.tm.base_opcode & ~0x38) == 0x03))))
10069                 {
10070                   if (object_64bit)
10071                     {
10072                       fixP->fx_tcbit = i.rex != 0;
10073                       if (i.base_reg
10074                           && (i.base_reg->reg_num == RegIP))
10075                       fixP->fx_tcbit2 = 1;
10076                     }
10077                   else
10078                     fixP->fx_tcbit2 = 1;
10079                 }
10080             }
10081         }
10082     }
10083 }
10084
10085 static void
10086 output_imm (fragS *insn_start_frag, offsetT insn_start_off)
10087 {
10088   char *p;
10089   unsigned int n;
10090
10091   for (n = 0; n < i.operands; n++)
10092     {
10093       /* Skip SAE/RC Imm operand in EVEX.  They are already handled.  */
10094       if (i.rounding.type != rc_none && n == i.rounding.operand)
10095         continue;
10096
10097       if (operand_type_check (i.types[n], imm))
10098         {
10099           int size = imm_size (n);
10100
10101           if (now_seg == absolute_section)
10102             abs_section_offset += size;
10103           else if (i.op[n].imms->X_op == O_constant)
10104             {
10105               offsetT val;
10106
10107               val = offset_in_range (i.op[n].imms->X_add_number,
10108                                      size);
10109               p = frag_more (size);
10110               md_number_to_chars (p, val, size);
10111             }
10112           else
10113             {
10114               /* Not absolute_section.
10115                  Need a 32-bit fixup (don't support 8bit
10116                  non-absolute imms).  Try to support other
10117                  sizes ...  */
10118               enum bfd_reloc_code_real reloc_type;
10119               int sign;
10120
10121               if (i.types[n].bitfield.imm32s
10122                   && (i.suffix == QWORD_MNEM_SUFFIX
10123                       || (!i.suffix && i.tm.opcode_modifier.no_lsuf)))
10124                 sign = 1;
10125               else
10126                 sign = 0;
10127
10128               p = frag_more (size);
10129               reloc_type = reloc (size, 0, sign, i.reloc[n]);
10130
10131               /*   This is tough to explain.  We end up with this one if we
10132                * have operands that look like
10133                * "_GLOBAL_OFFSET_TABLE_+[.-.L284]".  The goal here is to
10134                * obtain the absolute address of the GOT, and it is strongly
10135                * preferable from a performance point of view to avoid using
10136                * a runtime relocation for this.  The actual sequence of
10137                * instructions often look something like:
10138                *
10139                *        call    .L66
10140                * .L66:
10141                *        popl    %ebx
10142                *        addl    $_GLOBAL_OFFSET_TABLE_+[.-.L66],%ebx
10143                *
10144                *   The call and pop essentially return the absolute address
10145                * of the label .L66 and store it in %ebx.  The linker itself
10146                * will ultimately change the first operand of the addl so
10147                * that %ebx points to the GOT, but to keep things simple, the
10148                * .o file must have this operand set so that it generates not
10149                * the absolute address of .L66, but the absolute address of
10150                * itself.  This allows the linker itself simply treat a GOTPC
10151                * relocation as asking for a pcrel offset to the GOT to be
10152                * added in, and the addend of the relocation is stored in the
10153                * operand field for the instruction itself.
10154                *
10155                *   Our job here is to fix the operand so that it would add
10156                * the correct offset so that %ebx would point to itself.  The
10157                * thing that is tricky is that .-.L66 will point to the
10158                * beginning of the instruction, so we need to further modify
10159                * the operand so that it will point to itself.  There are
10160                * other cases where you have something like:
10161                *
10162                *        .long   $_GLOBAL_OFFSET_TABLE_+[.-.L66]
10163                *
10164                * and here no correction would be required.  Internally in
10165                * the assembler we treat operands of this form as not being
10166                * pcrel since the '.' is explicitly mentioned, and I wonder
10167                * whether it would simplify matters to do it this way.  Who
10168                * knows.  In earlier versions of the PIC patches, the
10169                * pcrel_adjust field was used to store the correction, but
10170                * since the expression is not pcrel, I felt it would be
10171                * confusing to do it this way.  */
10172
10173               if ((reloc_type == BFD_RELOC_32
10174                    || reloc_type == BFD_RELOC_X86_64_32S
10175                    || reloc_type == BFD_RELOC_64)
10176                   && GOT_symbol
10177                   && GOT_symbol == i.op[n].imms->X_add_symbol
10178                   && (i.op[n].imms->X_op == O_symbol
10179                       || (i.op[n].imms->X_op == O_add
10180                           && ((symbol_get_value_expression
10181                                (i.op[n].imms->X_op_symbol)->X_op)
10182                               == O_subtract))))
10183                 {
10184                   if (!object_64bit)
10185                     reloc_type = BFD_RELOC_386_GOTPC;
10186                   else if (size == 4)
10187                     reloc_type = BFD_RELOC_X86_64_GOTPC32;
10188                   else if (size == 8)
10189                     reloc_type = BFD_RELOC_X86_64_GOTPC64;
10190                   i.has_gotpc_tls_reloc = true;
10191                   i.op[n].imms->X_add_number +=
10192                     encoding_length (insn_start_frag, insn_start_off, p);
10193                 }
10194               fix_new_exp (frag_now, p - frag_now->fr_literal, size,
10195                            i.op[n].imms, 0, reloc_type);
10196             }
10197         }
10198     }
10199 }
10200 \f
10201 /* x86_cons_fix_new is called via the expression parsing code when a
10202    reloc is needed.  We use this hook to get the correct .got reloc.  */
10203 static int cons_sign = -1;
10204
10205 void
10206 x86_cons_fix_new (fragS *frag, unsigned int off, unsigned int len,
10207                   expressionS *exp, bfd_reloc_code_real_type r)
10208 {
10209   r = reloc (len, 0, cons_sign, r);
10210
10211 #ifdef TE_PE
10212   if (exp->X_op == O_secrel)
10213     {
10214       exp->X_op = O_symbol;
10215       r = BFD_RELOC_32_SECREL;
10216     }
10217 #endif
10218
10219   fix_new_exp (frag, off, len, exp, 0, r);
10220 }
10221
10222 /* Export the ABI address size for use by TC_ADDRESS_BYTES for the
10223    purpose of the `.dc.a' internal pseudo-op.  */
10224
10225 int
10226 x86_address_bytes (void)
10227 {
10228   if ((stdoutput->arch_info->mach & bfd_mach_x64_32))
10229     return 4;
10230   return stdoutput->arch_info->bits_per_address / 8;
10231 }
10232
10233 #if (!(defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) || defined (OBJ_MACH_O)) \
10234      || defined (LEX_AT)) && !defined (TE_PE)
10235 # define lex_got(reloc, adjust, types) NULL
10236 #else
10237 /* Parse operands of the form
10238    <symbol>@GOTOFF+<nnn>
10239    and similar .plt or .got references.
10240
10241    If we find one, set up the correct relocation in RELOC and copy the
10242    input string, minus the `@GOTOFF' into a malloc'd buffer for
10243    parsing by the calling routine.  Return this buffer, and if ADJUST
10244    is non-null set it to the length of the string we removed from the
10245    input line.  Otherwise return NULL.  */
10246 static char *
10247 lex_got (enum bfd_reloc_code_real *rel,
10248          int *adjust,
10249          i386_operand_type *types)
10250 {
10251   /* Some of the relocations depend on the size of what field is to
10252      be relocated.  But in our callers i386_immediate and i386_displacement
10253      we don't yet know the operand size (this will be set by insn
10254      matching).  Hence we record the word32 relocation here,
10255      and adjust the reloc according to the real size in reloc().  */
10256   static const struct {
10257     const char *str;
10258     int len;
10259     const enum bfd_reloc_code_real rel[2];
10260     const i386_operand_type types64;
10261     bool need_GOT_symbol;
10262   } gotrel[] = {
10263 #ifndef TE_PE
10264 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
10265     { STRING_COMMA_LEN ("SIZE"),      { BFD_RELOC_SIZE32,
10266                                         BFD_RELOC_SIZE32 },
10267       OPERAND_TYPE_IMM32_64, false },
10268 #endif
10269     { STRING_COMMA_LEN ("PLTOFF"),   { _dummy_first_bfd_reloc_code_real,
10270                                        BFD_RELOC_X86_64_PLTOFF64 },
10271       OPERAND_TYPE_IMM64, true },
10272     { STRING_COMMA_LEN ("PLT"),      { BFD_RELOC_386_PLT32,
10273                                        BFD_RELOC_X86_64_PLT32    },
10274       OPERAND_TYPE_IMM32_32S_DISP32, false },
10275     { STRING_COMMA_LEN ("GOTPLT"),   { _dummy_first_bfd_reloc_code_real,
10276                                        BFD_RELOC_X86_64_GOTPLT64 },
10277       OPERAND_TYPE_IMM64_DISP64, true },
10278     { STRING_COMMA_LEN ("GOTOFF"),   { BFD_RELOC_386_GOTOFF,
10279                                        BFD_RELOC_X86_64_GOTOFF64 },
10280       OPERAND_TYPE_IMM64_DISP64, true },
10281     { STRING_COMMA_LEN ("GOTPCREL"), { _dummy_first_bfd_reloc_code_real,
10282                                        BFD_RELOC_X86_64_GOTPCREL },
10283       OPERAND_TYPE_IMM32_32S_DISP32, true },
10284     { STRING_COMMA_LEN ("TLSGD"),    { BFD_RELOC_386_TLS_GD,
10285                                        BFD_RELOC_X86_64_TLSGD    },
10286       OPERAND_TYPE_IMM32_32S_DISP32, true },
10287     { STRING_COMMA_LEN ("TLSLDM"),   { BFD_RELOC_386_TLS_LDM,
10288                                        _dummy_first_bfd_reloc_code_real },
10289       OPERAND_TYPE_NONE, true },
10290     { STRING_COMMA_LEN ("TLSLD"),    { _dummy_first_bfd_reloc_code_real,
10291                                        BFD_RELOC_X86_64_TLSLD    },
10292       OPERAND_TYPE_IMM32_32S_DISP32, true },
10293     { STRING_COMMA_LEN ("GOTTPOFF"), { BFD_RELOC_386_TLS_IE_32,
10294                                        BFD_RELOC_X86_64_GOTTPOFF },
10295       OPERAND_TYPE_IMM32_32S_DISP32, true },
10296     { STRING_COMMA_LEN ("TPOFF"),    { BFD_RELOC_386_TLS_LE_32,
10297                                        BFD_RELOC_X86_64_TPOFF32  },
10298       OPERAND_TYPE_IMM32_32S_64_DISP32_64, true },
10299     { STRING_COMMA_LEN ("NTPOFF"),   { BFD_RELOC_386_TLS_LE,
10300                                        _dummy_first_bfd_reloc_code_real },
10301       OPERAND_TYPE_NONE, true },
10302     { STRING_COMMA_LEN ("DTPOFF"),   { BFD_RELOC_386_TLS_LDO_32,
10303                                        BFD_RELOC_X86_64_DTPOFF32 },
10304       OPERAND_TYPE_IMM32_32S_64_DISP32_64, true },
10305     { STRING_COMMA_LEN ("GOTNTPOFF"),{ BFD_RELOC_386_TLS_GOTIE,
10306                                        _dummy_first_bfd_reloc_code_real },
10307       OPERAND_TYPE_NONE, true },
10308     { STRING_COMMA_LEN ("INDNTPOFF"),{ BFD_RELOC_386_TLS_IE,
10309                                        _dummy_first_bfd_reloc_code_real },
10310       OPERAND_TYPE_NONE, true },
10311     { STRING_COMMA_LEN ("GOT"),      { BFD_RELOC_386_GOT32,
10312                                        BFD_RELOC_X86_64_GOT32    },
10313       OPERAND_TYPE_IMM32_32S_64_DISP32, true },
10314     { STRING_COMMA_LEN ("TLSDESC"),  { BFD_RELOC_386_TLS_GOTDESC,
10315                                        BFD_RELOC_X86_64_GOTPC32_TLSDESC },
10316       OPERAND_TYPE_IMM32_32S_DISP32, true },
10317     { STRING_COMMA_LEN ("TLSCALL"),  { BFD_RELOC_386_TLS_DESC_CALL,
10318                                        BFD_RELOC_X86_64_TLSDESC_CALL },
10319       OPERAND_TYPE_IMM32_32S_DISP32, true },
10320 #else /* TE_PE */
10321     { STRING_COMMA_LEN ("SECREL32"), { BFD_RELOC_32_SECREL,
10322                                        BFD_RELOC_32_SECREL },
10323       OPERAND_TYPE_IMM32_32S_64_DISP32_64, false },
10324 #endif
10325   };
10326   char *cp;
10327   unsigned int j;
10328
10329 #if defined (OBJ_MAYBE_ELF) && !defined (TE_PE)
10330   if (!IS_ELF)
10331     return NULL;
10332 #endif
10333
10334   for (cp = input_line_pointer; *cp != '@'; cp++)
10335     if (is_end_of_line[(unsigned char) *cp] || *cp == ',')
10336       return NULL;
10337
10338   for (j = 0; j < ARRAY_SIZE (gotrel); j++)
10339     {
10340       int len = gotrel[j].len;
10341       if (strncasecmp (cp + 1, gotrel[j].str, len) == 0)
10342         {
10343           if (gotrel[j].rel[object_64bit] != 0)
10344             {
10345               int first, second;
10346               char *tmpbuf, *past_reloc;
10347
10348               *rel = gotrel[j].rel[object_64bit];
10349
10350               if (types)
10351                 {
10352                   if (flag_code != CODE_64BIT)
10353                     {
10354                       types->bitfield.imm32 = 1;
10355                       types->bitfield.disp32 = 1;
10356                     }
10357                   else
10358                     *types = gotrel[j].types64;
10359                 }
10360
10361               if (gotrel[j].need_GOT_symbol && GOT_symbol == NULL)
10362                 GOT_symbol = symbol_find_or_make (GLOBAL_OFFSET_TABLE_NAME);
10363
10364               /* The length of the first part of our input line.  */
10365               first = cp - input_line_pointer;
10366
10367               /* The second part goes from after the reloc token until
10368                  (and including) an end_of_line char or comma.  */
10369               past_reloc = cp + 1 + len;
10370               cp = past_reloc;
10371               while (!is_end_of_line[(unsigned char) *cp] && *cp != ',')
10372                 ++cp;
10373               second = cp + 1 - past_reloc;
10374
10375               /* Allocate and copy string.  The trailing NUL shouldn't
10376                  be necessary, but be safe.  */
10377               tmpbuf = XNEWVEC (char, first + second + 2);
10378               memcpy (tmpbuf, input_line_pointer, first);
10379               if (second != 0 && *past_reloc != ' ')
10380                 /* Replace the relocation token with ' ', so that
10381                    errors like foo@GOTOFF1 will be detected.  */
10382                 tmpbuf[first++] = ' ';
10383               else
10384                 /* Increment length by 1 if the relocation token is
10385                    removed.  */
10386                 len++;
10387               if (adjust)
10388                 *adjust = len;
10389               memcpy (tmpbuf + first, past_reloc, second);
10390               tmpbuf[first + second] = '\0';
10391               return tmpbuf;
10392             }
10393
10394           as_bad (_("@%s reloc is not supported with %d-bit output format"),
10395                   gotrel[j].str, 1 << (5 + object_64bit));
10396           return NULL;
10397         }
10398     }
10399
10400   /* Might be a symbol version string.  Don't as_bad here.  */
10401   return NULL;
10402 }
10403 #endif
10404
10405 bfd_reloc_code_real_type
10406 x86_cons (expressionS *exp, int size)
10407 {
10408   bfd_reloc_code_real_type got_reloc = NO_RELOC;
10409
10410 #if ((defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)) \
10411       && !defined (LEX_AT)) \
10412     || defined (TE_PE)
10413   intel_syntax = -intel_syntax;
10414
10415   exp->X_md = 0;
10416   if (size == 4 || (object_64bit && size == 8))
10417     {
10418       /* Handle @GOTOFF and the like in an expression.  */
10419       char *save;
10420       char *gotfree_input_line;
10421       int adjust = 0;
10422
10423       save = input_line_pointer;
10424       gotfree_input_line = lex_got (&got_reloc, &adjust, NULL);
10425       if (gotfree_input_line)
10426         input_line_pointer = gotfree_input_line;
10427
10428       expression (exp);
10429
10430       if (gotfree_input_line)
10431         {
10432           /* expression () has merrily parsed up to the end of line,
10433              or a comma - in the wrong buffer.  Transfer how far
10434              input_line_pointer has moved to the right buffer.  */
10435           input_line_pointer = (save
10436                                 + (input_line_pointer - gotfree_input_line)
10437                                 + adjust);
10438           free (gotfree_input_line);
10439           if (exp->X_op == O_constant
10440               || exp->X_op == O_absent
10441               || exp->X_op == O_illegal
10442               || exp->X_op == O_register
10443               || exp->X_op == O_big)
10444             {
10445               char c = *input_line_pointer;
10446               *input_line_pointer = 0;
10447               as_bad (_("missing or invalid expression `%s'"), save);
10448               *input_line_pointer = c;
10449             }
10450           else if ((got_reloc == BFD_RELOC_386_PLT32
10451                     || got_reloc == BFD_RELOC_X86_64_PLT32)
10452                    && exp->X_op != O_symbol)
10453             {
10454               char c = *input_line_pointer;
10455               *input_line_pointer = 0;
10456               as_bad (_("invalid PLT expression `%s'"), save);
10457               *input_line_pointer = c;
10458             }
10459         }
10460     }
10461   else
10462     expression (exp);
10463
10464   intel_syntax = -intel_syntax;
10465
10466   if (intel_syntax)
10467     i386_intel_simplify (exp);
10468 #else
10469   expression (exp);
10470 #endif
10471
10472   /* If not 64bit, massage value, to account for wraparound when !BFD64.  */
10473   if (size == 4 && exp->X_op == O_constant && !object_64bit)
10474     exp->X_add_number = extend_to_32bit_address (exp->X_add_number);
10475
10476   return got_reloc;
10477 }
10478
10479 static void
10480 signed_cons (int size)
10481 {
10482   if (object_64bit)
10483     cons_sign = 1;
10484   cons (size);
10485   cons_sign = -1;
10486 }
10487
10488 #ifdef TE_PE
10489 static void
10490 pe_directive_secrel (int dummy ATTRIBUTE_UNUSED)
10491 {
10492   expressionS exp;
10493
10494   do
10495     {
10496       expression (&exp);
10497       if (exp.X_op == O_symbol)
10498         exp.X_op = O_secrel;
10499
10500       emit_expr (&exp, 4);
10501     }
10502   while (*input_line_pointer++ == ',');
10503
10504   input_line_pointer--;
10505   demand_empty_rest_of_line ();
10506 }
10507 #endif
10508
10509 /* Handle Vector operations.  */
10510
10511 static char *
10512 check_VecOperations (char *op_string)
10513 {
10514   const reg_entry *mask;
10515   const char *saved;
10516   char *end_op;
10517
10518   while (*op_string)
10519     {
10520       saved = op_string;
10521       if (*op_string == '{')
10522         {
10523           op_string++;
10524
10525           /* Check broadcasts.  */
10526           if (startswith (op_string, "1to"))
10527             {
10528               unsigned int bcst_type;
10529
10530               if (i.broadcast.type)
10531                 goto duplicated_vec_op;
10532
10533               op_string += 3;
10534               if (*op_string == '8')
10535                 bcst_type = 8;
10536               else if (*op_string == '4')
10537                 bcst_type = 4;
10538               else if (*op_string == '2')
10539                 bcst_type = 2;
10540               else if (*op_string == '1'
10541                        && *(op_string+1) == '6')
10542                 {
10543                   bcst_type = 16;
10544                   op_string++;
10545                 }
10546               else
10547                 {
10548                   as_bad (_("Unsupported broadcast: `%s'"), saved);
10549                   return NULL;
10550                 }
10551               op_string++;
10552
10553               i.broadcast.type = bcst_type;
10554               i.broadcast.operand = this_operand;
10555             }
10556           /* Check masking operation.  */
10557           else if ((mask = parse_register (op_string, &end_op)) != NULL)
10558             {
10559               if (mask == &bad_reg)
10560                 return NULL;
10561
10562               /* k0 can't be used for write mask.  */
10563               if (mask->reg_type.bitfield.class != RegMask || !mask->reg_num)
10564                 {
10565                   as_bad (_("`%s%s' can't be used for write mask"),
10566                           register_prefix, mask->reg_name);
10567                   return NULL;
10568                 }
10569
10570               if (!i.mask.reg)
10571                 {
10572                   i.mask.reg = mask;
10573                   i.mask.operand = this_operand;
10574                 }
10575               else if (i.mask.reg->reg_num)
10576                 goto duplicated_vec_op;
10577               else
10578                 {
10579                   i.mask.reg = mask;
10580
10581                   /* Only "{z}" is allowed here.  No need to check
10582                      zeroing mask explicitly.  */
10583                   if (i.mask.operand != (unsigned int) this_operand)
10584                     {
10585                       as_bad (_("invalid write mask `%s'"), saved);
10586                       return NULL;
10587                     }
10588                 }
10589
10590               op_string = end_op;
10591             }
10592           /* Check zeroing-flag for masking operation.  */
10593           else if (*op_string == 'z')
10594             {
10595               if (!i.mask.reg)
10596                 {
10597                   i.mask.reg = reg_k0;
10598                   i.mask.zeroing = 1;
10599                   i.mask.operand = this_operand;
10600                 }
10601               else
10602                 {
10603                   if (i.mask.zeroing)
10604                     {
10605                     duplicated_vec_op:
10606                       as_bad (_("duplicated `%s'"), saved);
10607                       return NULL;
10608                     }
10609
10610                   i.mask.zeroing = 1;
10611
10612                   /* Only "{%k}" is allowed here.  No need to check mask
10613                      register explicitly.  */
10614                   if (i.mask.operand != (unsigned int) this_operand)
10615                     {
10616                       as_bad (_("invalid zeroing-masking `%s'"),
10617                               saved);
10618                       return NULL;
10619                     }
10620                 }
10621
10622               op_string++;
10623             }
10624           else
10625             goto unknown_vec_op;
10626
10627           if (*op_string != '}')
10628             {
10629               as_bad (_("missing `}' in `%s'"), saved);
10630               return NULL;
10631             }
10632           op_string++;
10633
10634           /* Strip whitespace since the addition of pseudo prefixes
10635              changed how the scrubber treats '{'.  */
10636           if (is_space_char (*op_string))
10637             ++op_string;
10638
10639           continue;
10640         }
10641     unknown_vec_op:
10642       /* We don't know this one.  */
10643       as_bad (_("unknown vector operation: `%s'"), saved);
10644       return NULL;
10645     }
10646
10647   if (i.mask.reg && i.mask.zeroing && !i.mask.reg->reg_num)
10648     {
10649       as_bad (_("zeroing-masking only allowed with write mask"));
10650       return NULL;
10651     }
10652
10653   return op_string;
10654 }
10655
10656 static int
10657 i386_immediate (char *imm_start)
10658 {
10659   char *save_input_line_pointer;
10660   char *gotfree_input_line;
10661   segT exp_seg = 0;
10662   expressionS *exp;
10663   i386_operand_type types;
10664
10665   operand_type_set (&types, ~0);
10666
10667   if (i.imm_operands == MAX_IMMEDIATE_OPERANDS)
10668     {
10669       as_bad (_("at most %d immediate operands are allowed"),
10670               MAX_IMMEDIATE_OPERANDS);
10671       return 0;
10672     }
10673
10674   exp = &im_expressions[i.imm_operands++];
10675   i.op[this_operand].imms = exp;
10676
10677   if (is_space_char (*imm_start))
10678     ++imm_start;
10679
10680   save_input_line_pointer = input_line_pointer;
10681   input_line_pointer = imm_start;
10682
10683   gotfree_input_line = lex_got (&i.reloc[this_operand], NULL, &types);
10684   if (gotfree_input_line)
10685     input_line_pointer = gotfree_input_line;
10686
10687   exp_seg = expression (exp);
10688
10689   SKIP_WHITESPACE ();
10690   if (*input_line_pointer)
10691     as_bad (_("junk `%s' after expression"), input_line_pointer);
10692
10693   input_line_pointer = save_input_line_pointer;
10694   if (gotfree_input_line)
10695     {
10696       free (gotfree_input_line);
10697
10698       if (exp->X_op == O_constant)
10699         exp->X_op = O_illegal;
10700     }
10701
10702   if (exp_seg == reg_section)
10703     {
10704       as_bad (_("illegal immediate register operand %s"), imm_start);
10705       return 0;
10706     }
10707
10708   return i386_finalize_immediate (exp_seg, exp, types, imm_start);
10709 }
10710
10711 static int
10712 i386_finalize_immediate (segT exp_seg ATTRIBUTE_UNUSED, expressionS *exp,
10713                          i386_operand_type types, const char *imm_start)
10714 {
10715   if (exp->X_op == O_absent || exp->X_op == O_illegal || exp->X_op == O_big)
10716     {
10717       if (imm_start)
10718         as_bad (_("missing or invalid immediate expression `%s'"),
10719                 imm_start);
10720       return 0;
10721     }
10722   else if (exp->X_op == O_constant)
10723     {
10724       /* Size it properly later.  */
10725       i.types[this_operand].bitfield.imm64 = 1;
10726
10727       /* If not 64bit, sign/zero extend val, to account for wraparound
10728          when !BFD64.  */
10729       if (flag_code != CODE_64BIT)
10730         exp->X_add_number = extend_to_32bit_address (exp->X_add_number);
10731     }
10732 #if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
10733   else if (OUTPUT_FLAVOR == bfd_target_aout_flavour
10734            && exp_seg != absolute_section
10735            && exp_seg != text_section
10736            && exp_seg != data_section
10737            && exp_seg != bss_section
10738            && exp_seg != undefined_section
10739            && !bfd_is_com_section (exp_seg))
10740     {
10741       as_bad (_("unimplemented segment %s in operand"), exp_seg->name);
10742       return 0;
10743     }
10744 #endif
10745   else
10746     {
10747       /* This is an address.  The size of the address will be
10748          determined later, depending on destination register,
10749          suffix, or the default for the section.  */
10750       i.types[this_operand].bitfield.imm8 = 1;
10751       i.types[this_operand].bitfield.imm16 = 1;
10752       i.types[this_operand].bitfield.imm32 = 1;
10753       i.types[this_operand].bitfield.imm32s = 1;
10754       i.types[this_operand].bitfield.imm64 = 1;
10755       i.types[this_operand] = operand_type_and (i.types[this_operand],
10756                                                 types);
10757     }
10758
10759   return 1;
10760 }
10761
10762 static char *
10763 i386_scale (char *scale)
10764 {
10765   offsetT val;
10766   char *save = input_line_pointer;
10767
10768   input_line_pointer = scale;
10769   val = get_absolute_expression ();
10770
10771   switch (val)
10772     {
10773     case 1:
10774       i.log2_scale_factor = 0;
10775       break;
10776     case 2:
10777       i.log2_scale_factor = 1;
10778       break;
10779     case 4:
10780       i.log2_scale_factor = 2;
10781       break;
10782     case 8:
10783       i.log2_scale_factor = 3;
10784       break;
10785     default:
10786       {
10787         char sep = *input_line_pointer;
10788
10789         *input_line_pointer = '\0';
10790         as_bad (_("expecting scale factor of 1, 2, 4, or 8: got `%s'"),
10791                 scale);
10792         *input_line_pointer = sep;
10793         input_line_pointer = save;
10794         return NULL;
10795       }
10796     }
10797   if (i.log2_scale_factor != 0 && i.index_reg == 0)
10798     {
10799       as_warn (_("scale factor of %d without an index register"),
10800                1 << i.log2_scale_factor);
10801       i.log2_scale_factor = 0;
10802     }
10803   scale = input_line_pointer;
10804   input_line_pointer = save;
10805   return scale;
10806 }
10807
10808 static int
10809 i386_displacement (char *disp_start, char *disp_end)
10810 {
10811   expressionS *exp;
10812   segT exp_seg = 0;
10813   char *save_input_line_pointer;
10814   char *gotfree_input_line;
10815   int override;
10816   i386_operand_type bigdisp, types = anydisp;
10817   int ret;
10818
10819   if (i.disp_operands == MAX_MEMORY_OPERANDS)
10820     {
10821       as_bad (_("at most %d displacement operands are allowed"),
10822               MAX_MEMORY_OPERANDS);
10823       return 0;
10824     }
10825
10826   operand_type_set (&bigdisp, 0);
10827   if (i.jumpabsolute
10828       || i.types[this_operand].bitfield.baseindex
10829       || (current_templates->start->opcode_modifier.jump != JUMP
10830           && current_templates->start->opcode_modifier.jump != JUMP_DWORD))
10831     {
10832       i386_addressing_mode ();
10833       override = (i.prefix[ADDR_PREFIX] != 0);
10834       if (flag_code == CODE_64BIT)
10835         {
10836           if (!override)
10837             {
10838               bigdisp.bitfield.disp32s = 1;
10839               bigdisp.bitfield.disp64 = 1;
10840             }
10841           else
10842             bigdisp.bitfield.disp32 = 1;
10843         }
10844       else if ((flag_code == CODE_16BIT) ^ override)
10845           bigdisp.bitfield.disp16 = 1;
10846       else
10847           bigdisp.bitfield.disp32 = 1;
10848     }
10849   else
10850     {
10851       /* For PC-relative branches, the width of the displacement may be
10852          dependent upon data size, but is never dependent upon address size.
10853          Also make sure to not unintentionally match against a non-PC-relative
10854          branch template.  */
10855       static templates aux_templates;
10856       const insn_template *t = current_templates->start;
10857       bool has_intel64 = false;
10858
10859       aux_templates.start = t;
10860       while (++t < current_templates->end)
10861         {
10862           if (t->opcode_modifier.jump
10863               != current_templates->start->opcode_modifier.jump)
10864             break;
10865           if ((t->opcode_modifier.isa64 >= INTEL64))
10866             has_intel64 = true;
10867         }
10868       if (t < current_templates->end)
10869         {
10870           aux_templates.end = t;
10871           current_templates = &aux_templates;
10872         }
10873
10874       override = (i.prefix[DATA_PREFIX] != 0);
10875       if (flag_code == CODE_64BIT)
10876         {
10877           if ((override || i.suffix == WORD_MNEM_SUFFIX)
10878               && (!intel64 || !has_intel64))
10879             bigdisp.bitfield.disp16 = 1;
10880           else
10881             bigdisp.bitfield.disp32s = 1;
10882         }
10883       else
10884         {
10885           if (!override)
10886             override = (i.suffix == (flag_code != CODE_16BIT
10887                                      ? WORD_MNEM_SUFFIX
10888                                      : LONG_MNEM_SUFFIX));
10889           bigdisp.bitfield.disp32 = 1;
10890           if ((flag_code == CODE_16BIT) ^ override)
10891             {
10892               bigdisp.bitfield.disp32 = 0;
10893               bigdisp.bitfield.disp16 = 1;
10894             }
10895         }
10896     }
10897   i.types[this_operand] = operand_type_or (i.types[this_operand],
10898                                            bigdisp);
10899
10900   exp = &disp_expressions[i.disp_operands];
10901   i.op[this_operand].disps = exp;
10902   i.disp_operands++;
10903   save_input_line_pointer = input_line_pointer;
10904   input_line_pointer = disp_start;
10905   END_STRING_AND_SAVE (disp_end);
10906
10907 #ifndef GCC_ASM_O_HACK
10908 #define GCC_ASM_O_HACK 0
10909 #endif
10910 #if GCC_ASM_O_HACK
10911   END_STRING_AND_SAVE (disp_end + 1);
10912   if (i.types[this_operand].bitfield.baseIndex
10913       && displacement_string_end[-1] == '+')
10914     {
10915       /* This hack is to avoid a warning when using the "o"
10916          constraint within gcc asm statements.
10917          For instance:
10918
10919          #define _set_tssldt_desc(n,addr,limit,type) \
10920          __asm__ __volatile__ ( \
10921          "movw %w2,%0\n\t" \
10922          "movw %w1,2+%0\n\t" \
10923          "rorl $16,%1\n\t" \
10924          "movb %b1,4+%0\n\t" \
10925          "movb %4,5+%0\n\t" \
10926          "movb $0,6+%0\n\t" \
10927          "movb %h1,7+%0\n\t" \
10928          "rorl $16,%1" \
10929          : "=o"(*(n)) : "q" (addr), "ri"(limit), "i"(type))
10930
10931          This works great except that the output assembler ends
10932          up looking a bit weird if it turns out that there is
10933          no offset.  You end up producing code that looks like:
10934
10935          #APP
10936          movw $235,(%eax)
10937          movw %dx,2+(%eax)
10938          rorl $16,%edx
10939          movb %dl,4+(%eax)
10940          movb $137,5+(%eax)
10941          movb $0,6+(%eax)
10942          movb %dh,7+(%eax)
10943          rorl $16,%edx
10944          #NO_APP
10945
10946          So here we provide the missing zero.  */
10947
10948       *displacement_string_end = '0';
10949     }
10950 #endif
10951   gotfree_input_line = lex_got (&i.reloc[this_operand], NULL, &types);
10952   if (gotfree_input_line)
10953     input_line_pointer = gotfree_input_line;
10954
10955   exp_seg = expression (exp);
10956
10957   SKIP_WHITESPACE ();
10958   if (*input_line_pointer)
10959     as_bad (_("junk `%s' after expression"), input_line_pointer);
10960 #if GCC_ASM_O_HACK
10961   RESTORE_END_STRING (disp_end + 1);
10962 #endif
10963   input_line_pointer = save_input_line_pointer;
10964   if (gotfree_input_line)
10965     {
10966       free (gotfree_input_line);
10967
10968       if (exp->X_op == O_constant || exp->X_op == O_register)
10969         exp->X_op = O_illegal;
10970     }
10971
10972   ret = i386_finalize_displacement (exp_seg, exp, types, disp_start);
10973
10974   RESTORE_END_STRING (disp_end);
10975
10976   return ret;
10977 }
10978
10979 static int
10980 i386_finalize_displacement (segT exp_seg ATTRIBUTE_UNUSED, expressionS *exp,
10981                             i386_operand_type types, const char *disp_start)
10982 {
10983   i386_operand_type bigdisp;
10984   int ret = 1;
10985
10986   /* We do this to make sure that the section symbol is in
10987      the symbol table.  We will ultimately change the relocation
10988      to be relative to the beginning of the section.  */
10989   if (i.reloc[this_operand] == BFD_RELOC_386_GOTOFF
10990       || i.reloc[this_operand] == BFD_RELOC_X86_64_GOTPCREL
10991       || i.reloc[this_operand] == BFD_RELOC_X86_64_GOTOFF64)
10992     {
10993       if (exp->X_op != O_symbol)
10994         goto inv_disp;
10995
10996       if (S_IS_LOCAL (exp->X_add_symbol)
10997           && S_GET_SEGMENT (exp->X_add_symbol) != undefined_section
10998           && S_GET_SEGMENT (exp->X_add_symbol) != expr_section)
10999         section_symbol (S_GET_SEGMENT (exp->X_add_symbol));
11000       exp->X_op = O_subtract;
11001       exp->X_op_symbol = GOT_symbol;
11002       if (i.reloc[this_operand] == BFD_RELOC_X86_64_GOTPCREL)
11003         i.reloc[this_operand] = BFD_RELOC_32_PCREL;
11004       else if (i.reloc[this_operand] == BFD_RELOC_X86_64_GOTOFF64)
11005         i.reloc[this_operand] = BFD_RELOC_64;
11006       else
11007         i.reloc[this_operand] = BFD_RELOC_32;
11008     }
11009
11010   else if (exp->X_op == O_absent
11011            || exp->X_op == O_illegal
11012            || exp->X_op == O_big)
11013     {
11014     inv_disp:
11015       as_bad (_("missing or invalid displacement expression `%s'"),
11016               disp_start);
11017       ret = 0;
11018     }
11019
11020   else if (exp->X_op == O_constant)
11021     {
11022       /* Sizing gets taken care of by optimize_disp().
11023
11024          If not 64bit, sign/zero extend val, to account for wraparound
11025          when !BFD64.  */
11026       if (flag_code != CODE_64BIT)
11027         exp->X_add_number = extend_to_32bit_address (exp->X_add_number);
11028     }
11029
11030 #if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
11031   else if (OUTPUT_FLAVOR == bfd_target_aout_flavour
11032            && exp_seg != absolute_section
11033            && exp_seg != text_section
11034            && exp_seg != data_section
11035            && exp_seg != bss_section
11036            && exp_seg != undefined_section
11037            && !bfd_is_com_section (exp_seg))
11038     {
11039       as_bad (_("unimplemented segment %s in operand"), exp_seg->name);
11040       ret = 0;
11041     }
11042 #endif
11043
11044   else if (current_templates->start->opcode_modifier.jump == JUMP_BYTE)
11045     i.types[this_operand].bitfield.disp8 = 1;
11046
11047   /* Check if this is a displacement only operand.  */
11048   bigdisp = i.types[this_operand];
11049   bigdisp.bitfield.disp8 = 0;
11050   bigdisp.bitfield.disp16 = 0;
11051   bigdisp.bitfield.disp32 = 0;
11052   bigdisp.bitfield.disp32s = 0;
11053   bigdisp.bitfield.disp64 = 0;
11054   if (operand_type_all_zero (&bigdisp))
11055     i.types[this_operand] = operand_type_and (i.types[this_operand],
11056                                               types);
11057
11058   return ret;
11059 }
11060
11061 /* Return the active addressing mode, taking address override and
11062    registers forming the address into consideration.  Update the
11063    address override prefix if necessary.  */
11064
11065 static enum flag_code
11066 i386_addressing_mode (void)
11067 {
11068   enum flag_code addr_mode;
11069
11070   if (i.prefix[ADDR_PREFIX])
11071     addr_mode = flag_code == CODE_32BIT ? CODE_16BIT : CODE_32BIT;
11072   else if (flag_code == CODE_16BIT
11073            && current_templates->start->cpu_flags.bitfield.cpumpx
11074            /* Avoid replacing the "16-bit addressing not allowed" diagnostic
11075               from md_assemble() by "is not a valid base/index expression"
11076               when there is a base and/or index.  */
11077            && !i.types[this_operand].bitfield.baseindex)
11078     {
11079       /* MPX insn memory operands with neither base nor index must be forced
11080          to use 32-bit addressing in 16-bit mode.  */
11081       addr_mode = CODE_32BIT;
11082       i.prefix[ADDR_PREFIX] = ADDR_PREFIX_OPCODE;
11083       ++i.prefixes;
11084       gas_assert (!i.types[this_operand].bitfield.disp16);
11085       gas_assert (!i.types[this_operand].bitfield.disp32);
11086     }
11087   else
11088     {
11089       addr_mode = flag_code;
11090
11091 #if INFER_ADDR_PREFIX
11092       if (i.mem_operands == 0)
11093         {
11094           /* Infer address prefix from the first memory operand.  */
11095           const reg_entry *addr_reg = i.base_reg;
11096
11097           if (addr_reg == NULL)
11098             addr_reg = i.index_reg;
11099
11100           if (addr_reg)
11101             {
11102               if (addr_reg->reg_type.bitfield.dword)
11103                 addr_mode = CODE_32BIT;
11104               else if (flag_code != CODE_64BIT
11105                        && addr_reg->reg_type.bitfield.word)
11106                 addr_mode = CODE_16BIT;
11107
11108               if (addr_mode != flag_code)
11109                 {
11110                   i.prefix[ADDR_PREFIX] = ADDR_PREFIX_OPCODE;
11111                   i.prefixes += 1;
11112                   /* Change the size of any displacement too.  At most one
11113                      of Disp16 or Disp32 is set.
11114                      FIXME.  There doesn't seem to be any real need for
11115                      separate Disp16 and Disp32 flags.  The same goes for
11116                      Imm16 and Imm32.  Removing them would probably clean
11117                      up the code quite a lot.  */
11118                   if (flag_code != CODE_64BIT
11119                       && (i.types[this_operand].bitfield.disp16
11120                           || i.types[this_operand].bitfield.disp32))
11121                     i.types[this_operand]
11122                       = operand_type_xor (i.types[this_operand], disp16_32);
11123                 }
11124             }
11125         }
11126 #endif
11127     }
11128
11129   return addr_mode;
11130 }
11131
11132 /* Make sure the memory operand we've been dealt is valid.
11133    Return 1 on success, 0 on a failure.  */
11134
11135 static int
11136 i386_index_check (const char *operand_string)
11137 {
11138   const char *kind = "base/index";
11139   enum flag_code addr_mode = i386_addressing_mode ();
11140   const insn_template *t = current_templates->start;
11141
11142   if (t->opcode_modifier.isstring
11143       && !t->cpu_flags.bitfield.cpupadlock
11144       && (current_templates->end[-1].opcode_modifier.isstring
11145           || i.mem_operands))
11146     {
11147       /* Memory operands of string insns are special in that they only allow
11148          a single register (rDI, rSI, or rBX) as their memory address.  */
11149       const reg_entry *expected_reg;
11150       static const char *di_si[][2] =
11151         {
11152           { "esi", "edi" },
11153           { "si", "di" },
11154           { "rsi", "rdi" }
11155         };
11156       static const char *bx[] = { "ebx", "bx", "rbx" };
11157
11158       kind = "string address";
11159
11160       if (t->opcode_modifier.prefixok == PrefixRep)
11161         {
11162           int es_op = current_templates->end[-1].opcode_modifier.isstring
11163                       - IS_STRING_ES_OP0;
11164           int op = 0;
11165
11166           if (!current_templates->end[-1].operand_types[0].bitfield.baseindex
11167               || ((!i.mem_operands != !intel_syntax)
11168                   && current_templates->end[-1].operand_types[1]
11169                      .bitfield.baseindex))
11170             op = 1;
11171           expected_reg
11172             = (const reg_entry *) str_hash_find (reg_hash,
11173                                                  di_si[addr_mode][op == es_op]);
11174         }
11175       else
11176         expected_reg
11177           = (const reg_entry *)str_hash_find (reg_hash, bx[addr_mode]);
11178
11179       if (i.base_reg != expected_reg
11180           || i.index_reg
11181           || operand_type_check (i.types[this_operand], disp))
11182         {
11183           /* The second memory operand must have the same size as
11184              the first one.  */
11185           if (i.mem_operands
11186               && i.base_reg
11187               && !((addr_mode == CODE_64BIT
11188                     && i.base_reg->reg_type.bitfield.qword)
11189                    || (addr_mode == CODE_32BIT
11190                        ? i.base_reg->reg_type.bitfield.dword
11191                        : i.base_reg->reg_type.bitfield.word)))
11192             goto bad_address;
11193
11194           as_warn (_("`%s' is not valid here (expected `%c%s%s%c')"),
11195                    operand_string,
11196                    intel_syntax ? '[' : '(',
11197                    register_prefix,
11198                    expected_reg->reg_name,
11199                    intel_syntax ? ']' : ')');
11200           return 1;
11201         }
11202       else
11203         return 1;
11204
11205     bad_address:
11206       as_bad (_("`%s' is not a valid %s expression"),
11207               operand_string, kind);
11208       return 0;
11209     }
11210   else
11211     {
11212       if (addr_mode != CODE_16BIT)
11213         {
11214           /* 32-bit/64-bit checks.  */
11215           if (i.disp_encoding == disp_encoding_16bit)
11216             {
11217             bad_disp:
11218               as_bad (_("invalid `%s' prefix"),
11219                       addr_mode == CODE_16BIT ? "{disp32}" : "{disp16}");
11220               return 0;
11221             }
11222
11223           if ((i.base_reg
11224                && ((addr_mode == CODE_64BIT
11225                     ? !i.base_reg->reg_type.bitfield.qword
11226                     : !i.base_reg->reg_type.bitfield.dword)
11227                    || (i.index_reg && i.base_reg->reg_num == RegIP)
11228                    || i.base_reg->reg_num == RegIZ))
11229               || (i.index_reg
11230                   && !i.index_reg->reg_type.bitfield.xmmword
11231                   && !i.index_reg->reg_type.bitfield.ymmword
11232                   && !i.index_reg->reg_type.bitfield.zmmword
11233                   && ((addr_mode == CODE_64BIT
11234                        ? !i.index_reg->reg_type.bitfield.qword
11235                        : !i.index_reg->reg_type.bitfield.dword)
11236                       || !i.index_reg->reg_type.bitfield.baseindex)))
11237             goto bad_address;
11238
11239           /* bndmk, bndldx, bndstx and mandatory non-vector SIB have special restrictions. */
11240           if ((t->opcode_modifier.opcodeprefix == PREFIX_0XF3
11241                && t->opcode_modifier.opcodespace == SPACE_0F
11242                && t->base_opcode == 0x1b)
11243               || (t->opcode_modifier.opcodeprefix == PREFIX_NONE
11244                   && t->opcode_modifier.opcodespace == SPACE_0F
11245                   && (t->base_opcode & ~1) == 0x1a)
11246               || t->opcode_modifier.sib == SIBMEM)
11247             {
11248               /* They cannot use RIP-relative addressing. */
11249               if (i.base_reg && i.base_reg->reg_num == RegIP)
11250                 {
11251                   as_bad (_("`%s' cannot be used here"), operand_string);
11252                   return 0;
11253                 }
11254
11255               /* bndldx and bndstx ignore their scale factor. */
11256               if (t->opcode_modifier.opcodeprefix == PREFIX_NONE
11257                   && t->opcode_modifier.opcodespace == SPACE_0F
11258                   && (t->base_opcode & ~1) == 0x1a
11259                   && i.log2_scale_factor)
11260                 as_warn (_("register scaling is being ignored here"));
11261             }
11262         }
11263       else
11264         {
11265           /* 16-bit checks.  */
11266           if (i.disp_encoding == disp_encoding_32bit)
11267             goto bad_disp;
11268
11269           if ((i.base_reg
11270                && (!i.base_reg->reg_type.bitfield.word
11271                    || !i.base_reg->reg_type.bitfield.baseindex))
11272               || (i.index_reg
11273                   && (!i.index_reg->reg_type.bitfield.word
11274                       || !i.index_reg->reg_type.bitfield.baseindex
11275                       || !(i.base_reg
11276                            && i.base_reg->reg_num < 6
11277                            && i.index_reg->reg_num >= 6
11278                            && i.log2_scale_factor == 0))))
11279             goto bad_address;
11280         }
11281     }
11282   return 1;
11283 }
11284
11285 /* Handle vector immediates.  */
11286
11287 static int
11288 RC_SAE_immediate (const char *imm_start)
11289 {
11290   unsigned int match_found, j;
11291   const char *pstr = imm_start;
11292   expressionS *exp;
11293
11294   if (*pstr != '{')
11295     return 0;
11296
11297   pstr++;
11298   match_found = 0;
11299   for (j = 0; j < ARRAY_SIZE (RC_NamesTable); j++)
11300     {
11301       if (!strncmp (pstr, RC_NamesTable[j].name, RC_NamesTable[j].len))
11302         {
11303           if (i.rounding.type != rc_none)
11304             {
11305               as_bad (_("duplicated `%s'"), imm_start);
11306               return 0;
11307             }
11308
11309           i.rounding.type = RC_NamesTable[j].type;
11310           i.rounding.operand = this_operand;
11311
11312           pstr += RC_NamesTable[j].len;
11313           match_found = 1;
11314           break;
11315         }
11316     }
11317   if (!match_found)
11318     return 0;
11319
11320   if (*pstr++ != '}')
11321     {
11322       as_bad (_("Missing '}': '%s'"), imm_start);
11323       return 0;
11324     }
11325   /* RC/SAE immediate string should contain nothing more.  */;
11326   if (*pstr != 0)
11327     {
11328       as_bad (_("Junk after '}': '%s'"), imm_start);
11329       return 0;
11330     }
11331
11332   exp = &im_expressions[i.imm_operands++];
11333   i.op[this_operand].imms = exp;
11334
11335   exp->X_op = O_constant;
11336   exp->X_add_number = 0;
11337   exp->X_add_symbol = (symbolS *) 0;
11338   exp->X_op_symbol = (symbolS *) 0;
11339
11340   i.types[this_operand].bitfield.imm8 = 1;
11341   return 1;
11342 }
11343
11344 /* Only string instructions can have a second memory operand, so
11345    reduce current_templates to just those if it contains any.  */
11346 static int
11347 maybe_adjust_templates (void)
11348 {
11349   const insn_template *t;
11350
11351   gas_assert (i.mem_operands == 1);
11352
11353   for (t = current_templates->start; t < current_templates->end; ++t)
11354     if (t->opcode_modifier.isstring)
11355       break;
11356
11357   if (t < current_templates->end)
11358     {
11359       static templates aux_templates;
11360       bool recheck;
11361
11362       aux_templates.start = t;
11363       for (; t < current_templates->end; ++t)
11364         if (!t->opcode_modifier.isstring)
11365           break;
11366       aux_templates.end = t;
11367
11368       /* Determine whether to re-check the first memory operand.  */
11369       recheck = (aux_templates.start != current_templates->start
11370                  || t != current_templates->end);
11371
11372       current_templates = &aux_templates;
11373
11374       if (recheck)
11375         {
11376           i.mem_operands = 0;
11377           if (i.memop1_string != NULL
11378               && i386_index_check (i.memop1_string) == 0)
11379             return 0;
11380           i.mem_operands = 1;
11381         }
11382     }
11383
11384   return 1;
11385 }
11386
11387 static INLINE bool starts_memory_operand (char c)
11388 {
11389   return ISDIGIT (c)
11390          || is_identifier_char (c)
11391          || strchr ("([\"+-!~", c);
11392 }
11393
11394 /* Parse OPERAND_STRING into the i386_insn structure I.  Returns zero
11395    on error.  */
11396
11397 static int
11398 i386_att_operand (char *operand_string)
11399 {
11400   const reg_entry *r;
11401   char *end_op;
11402   char *op_string = operand_string;
11403
11404   if (is_space_char (*op_string))
11405     ++op_string;
11406
11407   /* We check for an absolute prefix (differentiating,
11408      for example, 'jmp pc_relative_label' from 'jmp *absolute_label'.  */
11409   if (*op_string == ABSOLUTE_PREFIX)
11410     {
11411       ++op_string;
11412       if (is_space_char (*op_string))
11413         ++op_string;
11414       i.jumpabsolute = true;
11415     }
11416
11417   /* Check if operand is a register.  */
11418   if ((r = parse_register (op_string, &end_op)) != NULL)
11419     {
11420       i386_operand_type temp;
11421
11422       if (r == &bad_reg)
11423         return 0;
11424
11425       /* Check for a segment override by searching for ':' after a
11426          segment register.  */
11427       op_string = end_op;
11428       if (is_space_char (*op_string))
11429         ++op_string;
11430       if (*op_string == ':' && r->reg_type.bitfield.class == SReg)
11431         {
11432           i.seg[i.mem_operands] = r;
11433
11434           /* Skip the ':' and whitespace.  */
11435           ++op_string;
11436           if (is_space_char (*op_string))
11437             ++op_string;
11438
11439           /* Handle case of %es:*foo.  */
11440           if (!i.jumpabsolute && *op_string == ABSOLUTE_PREFIX)
11441             {
11442               ++op_string;
11443               if (is_space_char (*op_string))
11444                 ++op_string;
11445               i.jumpabsolute = true;
11446             }
11447
11448           if (!starts_memory_operand (*op_string))
11449             {
11450               as_bad (_("bad memory operand `%s'"), op_string);
11451               return 0;
11452             }
11453           goto do_memory_reference;
11454         }
11455
11456       /* Handle vector operations.  */
11457       if (*op_string == '{')
11458         {
11459           op_string = check_VecOperations (op_string);
11460           if (op_string == NULL)
11461             return 0;
11462         }
11463
11464       if (*op_string)
11465         {
11466           as_bad (_("junk `%s' after register"), op_string);
11467           return 0;
11468         }
11469       temp = r->reg_type;
11470       temp.bitfield.baseindex = 0;
11471       i.types[this_operand] = operand_type_or (i.types[this_operand],
11472                                                temp);
11473       i.types[this_operand].bitfield.unspecified = 0;
11474       i.op[this_operand].regs = r;
11475       i.reg_operands++;
11476     }
11477   else if (*op_string == REGISTER_PREFIX)
11478     {
11479       as_bad (_("bad register name `%s'"), op_string);
11480       return 0;
11481     }
11482   else if (*op_string == IMMEDIATE_PREFIX)
11483     {
11484       ++op_string;
11485       if (i.jumpabsolute)
11486         {
11487           as_bad (_("immediate operand illegal with absolute jump"));
11488           return 0;
11489         }
11490       if (!i386_immediate (op_string))
11491         return 0;
11492     }
11493   else if (RC_SAE_immediate (operand_string))
11494     {
11495       /* If it is a RC or SAE immediate, do nothing.  */
11496       ;
11497     }
11498   else if (starts_memory_operand (*op_string))
11499     {
11500       /* This is a memory reference of some sort.  */
11501       char *base_string;
11502
11503       /* Start and end of displacement string expression (if found).  */
11504       char *displacement_string_start;
11505       char *displacement_string_end;
11506
11507     do_memory_reference:
11508       if (i.mem_operands == 1 && !maybe_adjust_templates ())
11509         return 0;
11510       if ((i.mem_operands == 1
11511            && !current_templates->start->opcode_modifier.isstring)
11512           || i.mem_operands == 2)
11513         {
11514           as_bad (_("too many memory references for `%s'"),
11515                   current_templates->start->name);
11516           return 0;
11517         }
11518
11519       /* Check for base index form.  We detect the base index form by
11520          looking for an ')' at the end of the operand, searching
11521          for the '(' matching it, and finding a REGISTER_PREFIX or ','
11522          after the '('.  */
11523       base_string = op_string + strlen (op_string);
11524
11525       /* Handle vector operations.  */
11526       --base_string;
11527       if (is_space_char (*base_string))
11528         --base_string;
11529
11530       if (*base_string == '}')
11531         {
11532           char *vop_start = NULL;
11533
11534           while (base_string-- > op_string)
11535             {
11536               if (*base_string == '"')
11537                 break;
11538               if (*base_string != '{')
11539                 continue;
11540
11541               vop_start = base_string;
11542
11543               --base_string;
11544               if (is_space_char (*base_string))
11545                 --base_string;
11546
11547               if (*base_string != '}')
11548                 break;
11549
11550               vop_start = NULL;
11551             }
11552
11553           if (!vop_start)
11554             {
11555               as_bad (_("unbalanced figure braces"));
11556               return 0;
11557             }
11558
11559           if (check_VecOperations (vop_start) == NULL)
11560             return 0;
11561         }
11562
11563       /* If we only have a displacement, set-up for it to be parsed later.  */
11564       displacement_string_start = op_string;
11565       displacement_string_end = base_string + 1;
11566
11567       if (*base_string == ')')
11568         {
11569           char *temp_string;
11570           unsigned int parens_not_balanced = 1;
11571
11572           /* We've already checked that the number of left & right ()'s are
11573              equal, so this loop will not be infinite.  */
11574           do
11575             {
11576               base_string--;
11577               if (*base_string == ')')
11578                 parens_not_balanced++;
11579               if (*base_string == '(')
11580                 parens_not_balanced--;
11581             }
11582           while (parens_not_balanced && *base_string != '"');
11583
11584           temp_string = base_string;
11585
11586           /* Skip past '(' and whitespace.  */
11587           if (*base_string == '(')
11588             ++base_string;
11589           if (is_space_char (*base_string))
11590             ++base_string;
11591
11592           if (*base_string == ','
11593               || ((i.base_reg = parse_register (base_string, &end_op))
11594                   != NULL))
11595             {
11596               displacement_string_end = temp_string;
11597
11598               i.types[this_operand].bitfield.baseindex = 1;
11599
11600               if (i.base_reg)
11601                 {
11602                   if (i.base_reg == &bad_reg)
11603                     return 0;
11604                   base_string = end_op;
11605                   if (is_space_char (*base_string))
11606                     ++base_string;
11607                 }
11608
11609               /* There may be an index reg or scale factor here.  */
11610               if (*base_string == ',')
11611                 {
11612                   ++base_string;
11613                   if (is_space_char (*base_string))
11614                     ++base_string;
11615
11616                   if ((i.index_reg = parse_register (base_string, &end_op))
11617                       != NULL)
11618                     {
11619                       if (i.index_reg == &bad_reg)
11620                         return 0;
11621                       base_string = end_op;
11622                       if (is_space_char (*base_string))
11623                         ++base_string;
11624                       if (*base_string == ',')
11625                         {
11626                           ++base_string;
11627                           if (is_space_char (*base_string))
11628                             ++base_string;
11629                         }
11630                       else if (*base_string != ')')
11631                         {
11632                           as_bad (_("expecting `,' or `)' "
11633                                     "after index register in `%s'"),
11634                                   operand_string);
11635                           return 0;
11636                         }
11637                     }
11638                   else if (*base_string == REGISTER_PREFIX)
11639                     {
11640                       end_op = strchr (base_string, ',');
11641                       if (end_op)
11642                         *end_op = '\0';
11643                       as_bad (_("bad register name `%s'"), base_string);
11644                       return 0;
11645                     }
11646
11647                   /* Check for scale factor.  */
11648                   if (*base_string != ')')
11649                     {
11650                       char *end_scale = i386_scale (base_string);
11651
11652                       if (!end_scale)
11653                         return 0;
11654
11655                       base_string = end_scale;
11656                       if (is_space_char (*base_string))
11657                         ++base_string;
11658                       if (*base_string != ')')
11659                         {
11660                           as_bad (_("expecting `)' "
11661                                     "after scale factor in `%s'"),
11662                                   operand_string);
11663                           return 0;
11664                         }
11665                     }
11666                   else if (!i.index_reg)
11667                     {
11668                       as_bad (_("expecting index register or scale factor "
11669                                 "after `,'; got '%c'"),
11670                               *base_string);
11671                       return 0;
11672                     }
11673                 }
11674               else if (*base_string != ')')
11675                 {
11676                   as_bad (_("expecting `,' or `)' "
11677                             "after base register in `%s'"),
11678                           operand_string);
11679                   return 0;
11680                 }
11681             }
11682           else if (*base_string == REGISTER_PREFIX)
11683             {
11684               end_op = strchr (base_string, ',');
11685               if (end_op)
11686                 *end_op = '\0';
11687               as_bad (_("bad register name `%s'"), base_string);
11688               return 0;
11689             }
11690         }
11691
11692       /* If there's an expression beginning the operand, parse it,
11693          assuming displacement_string_start and
11694          displacement_string_end are meaningful.  */
11695       if (displacement_string_start != displacement_string_end)
11696         {
11697           if (!i386_displacement (displacement_string_start,
11698                                   displacement_string_end))
11699             return 0;
11700         }
11701
11702       /* Special case for (%dx) while doing input/output op.  */
11703       if (i.base_reg
11704           && i.base_reg->reg_type.bitfield.instance == RegD
11705           && i.base_reg->reg_type.bitfield.word
11706           && i.index_reg == 0
11707           && i.log2_scale_factor == 0
11708           && i.seg[i.mem_operands] == 0
11709           && !operand_type_check (i.types[this_operand], disp))
11710         {
11711           i.types[this_operand] = i.base_reg->reg_type;
11712           return 1;
11713         }
11714
11715       if (i386_index_check (operand_string) == 0)
11716         return 0;
11717       i.flags[this_operand] |= Operand_Mem;
11718       if (i.mem_operands == 0)
11719         i.memop1_string = xstrdup (operand_string);
11720       i.mem_operands++;
11721     }
11722   else
11723     {
11724       /* It's not a memory operand; argh!  */
11725       as_bad (_("invalid char %s beginning operand %d `%s'"),
11726               output_invalid (*op_string),
11727               this_operand + 1,
11728               op_string);
11729       return 0;
11730     }
11731   return 1;                     /* Normal return.  */
11732 }
11733 \f
11734 /* Calculate the maximum variable size (i.e., excluding fr_fix)
11735    that an rs_machine_dependent frag may reach.  */
11736
11737 unsigned int
11738 i386_frag_max_var (fragS *frag)
11739 {
11740   /* The only relaxable frags are for jumps.
11741      Unconditional jumps can grow by 4 bytes and others by 5 bytes.  */
11742   gas_assert (frag->fr_type == rs_machine_dependent);
11743   return TYPE_FROM_RELAX_STATE (frag->fr_subtype) == UNCOND_JUMP ? 4 : 5;
11744 }
11745
11746 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
11747 static int
11748 elf_symbol_resolved_in_segment_p (symbolS *fr_symbol, offsetT fr_var)
11749 {
11750   /* STT_GNU_IFUNC symbol must go through PLT.  */
11751   if ((symbol_get_bfdsym (fr_symbol)->flags
11752        & BSF_GNU_INDIRECT_FUNCTION) != 0)
11753     return 0;
11754
11755   if (!S_IS_EXTERNAL (fr_symbol))
11756     /* Symbol may be weak or local.  */
11757     return !S_IS_WEAK (fr_symbol);
11758
11759   /* Global symbols with non-default visibility can't be preempted. */
11760   if (ELF_ST_VISIBILITY (S_GET_OTHER (fr_symbol)) != STV_DEFAULT)
11761     return 1;
11762
11763   if (fr_var != NO_RELOC)
11764     switch ((enum bfd_reloc_code_real) fr_var)
11765       {
11766       case BFD_RELOC_386_PLT32:
11767       case BFD_RELOC_X86_64_PLT32:
11768         /* Symbol with PLT relocation may be preempted. */
11769         return 0;
11770       default:
11771         abort ();
11772       }
11773
11774   /* Global symbols with default visibility in a shared library may be
11775      preempted by another definition.  */
11776   return !shared;
11777 }
11778 #endif
11779
11780 /* Table 3-2. Macro-Fusible Instructions in Haswell Microarchitecture
11781    Note also work for Skylake and Cascadelake.
11782 ---------------------------------------------------------------------
11783 |   JCC   | ADD/SUB/CMP | INC/DEC | TEST/AND |
11784 | ------  | ----------- | ------- | -------- |
11785 |   Jo    |      N      |    N    |     Y    |
11786 |   Jno   |      N      |    N    |     Y    |
11787 |  Jc/Jb  |      Y      |    N    |     Y    |
11788 | Jae/Jnb |      Y      |    N    |     Y    |
11789 |  Je/Jz  |      Y      |    Y    |     Y    |
11790 | Jne/Jnz |      Y      |    Y    |     Y    |
11791 | Jna/Jbe |      Y      |    N    |     Y    |
11792 | Ja/Jnbe |      Y      |    N    |     Y    |
11793 |   Js    |      N      |    N    |     Y    |
11794 |   Jns   |      N      |    N    |     Y    |
11795 |  Jp/Jpe |      N      |    N    |     Y    |
11796 | Jnp/Jpo |      N      |    N    |     Y    |
11797 | Jl/Jnge |      Y      |    Y    |     Y    |
11798 | Jge/Jnl |      Y      |    Y    |     Y    |
11799 | Jle/Jng |      Y      |    Y    |     Y    |
11800 | Jg/Jnle |      Y      |    Y    |     Y    |
11801 ---------------------------------------------------------------------  */
11802 static int
11803 i386_macro_fusible_p (enum mf_cmp_kind mf_cmp, enum mf_jcc_kind mf_jcc)
11804 {
11805   if (mf_cmp == mf_cmp_alu_cmp)
11806     return ((mf_jcc >= mf_jcc_jc && mf_jcc <= mf_jcc_jna)
11807             || mf_jcc == mf_jcc_jl || mf_jcc == mf_jcc_jle);
11808   if (mf_cmp == mf_cmp_incdec)
11809     return (mf_jcc == mf_jcc_je || mf_jcc == mf_jcc_jl
11810             || mf_jcc == mf_jcc_jle);
11811   if (mf_cmp == mf_cmp_test_and)
11812     return 1;
11813   return 0;
11814 }
11815
11816 /* Return the next non-empty frag.  */
11817
11818 static fragS *
11819 i386_next_non_empty_frag (fragS *fragP)
11820 {
11821   /* There may be a frag with a ".fill 0" when there is no room in
11822      the current frag for frag_grow in output_insn.  */
11823   for (fragP = fragP->fr_next;
11824        (fragP != NULL
11825         && fragP->fr_type == rs_fill
11826         && fragP->fr_fix == 0);
11827        fragP = fragP->fr_next)
11828     ;
11829   return fragP;
11830 }
11831
11832 /* Return the next jcc frag after BRANCH_PADDING.  */
11833
11834 static fragS *
11835 i386_next_fusible_jcc_frag (fragS *maybe_cmp_fragP, fragS *pad_fragP)
11836 {
11837   fragS *branch_fragP;
11838   if (!pad_fragP)
11839     return NULL;
11840
11841   if (pad_fragP->fr_type == rs_machine_dependent
11842       && (TYPE_FROM_RELAX_STATE (pad_fragP->fr_subtype)
11843           == BRANCH_PADDING))
11844     {
11845       branch_fragP = i386_next_non_empty_frag (pad_fragP);
11846       if (branch_fragP->fr_type != rs_machine_dependent)
11847         return NULL;
11848       if (TYPE_FROM_RELAX_STATE (branch_fragP->fr_subtype) == COND_JUMP
11849           && i386_macro_fusible_p (maybe_cmp_fragP->tc_frag_data.mf_type,
11850                                    pad_fragP->tc_frag_data.mf_type))
11851         return branch_fragP;
11852     }
11853
11854   return NULL;
11855 }
11856
11857 /* Classify BRANCH_PADDING, BRANCH_PREFIX and FUSED_JCC_PADDING frags.  */
11858
11859 static void
11860 i386_classify_machine_dependent_frag (fragS *fragP)
11861 {
11862   fragS *cmp_fragP;
11863   fragS *pad_fragP;
11864   fragS *branch_fragP;
11865   fragS *next_fragP;
11866   unsigned int max_prefix_length;
11867
11868   if (fragP->tc_frag_data.classified)
11869     return;
11870
11871   /* First scan for BRANCH_PADDING and FUSED_JCC_PADDING.  Convert
11872      FUSED_JCC_PADDING and merge BRANCH_PADDING.  */
11873   for (next_fragP = fragP;
11874        next_fragP != NULL;
11875        next_fragP = next_fragP->fr_next)
11876     {
11877       next_fragP->tc_frag_data.classified = 1;
11878       if (next_fragP->fr_type == rs_machine_dependent)
11879         switch (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype))
11880           {
11881           case BRANCH_PADDING:
11882             /* The BRANCH_PADDING frag must be followed by a branch
11883                frag.  */
11884             branch_fragP = i386_next_non_empty_frag (next_fragP);
11885             next_fragP->tc_frag_data.u.branch_fragP = branch_fragP;
11886             break;
11887           case FUSED_JCC_PADDING:
11888             /* Check if this is a fused jcc:
11889                FUSED_JCC_PADDING
11890                CMP like instruction
11891                BRANCH_PADDING
11892                COND_JUMP
11893                */
11894             cmp_fragP = i386_next_non_empty_frag (next_fragP);
11895             pad_fragP = i386_next_non_empty_frag (cmp_fragP);
11896             branch_fragP = i386_next_fusible_jcc_frag (next_fragP, pad_fragP);
11897             if (branch_fragP)
11898               {
11899                 /* The BRANCH_PADDING frag is merged with the
11900                    FUSED_JCC_PADDING frag.  */
11901                 next_fragP->tc_frag_data.u.branch_fragP = branch_fragP;
11902                 /* CMP like instruction size.  */
11903                 next_fragP->tc_frag_data.cmp_size = cmp_fragP->fr_fix;
11904                 frag_wane (pad_fragP);
11905                 /* Skip to branch_fragP.  */
11906                 next_fragP = branch_fragP;
11907               }
11908             else if (next_fragP->tc_frag_data.max_prefix_length)
11909               {
11910                 /* Turn FUSED_JCC_PADDING into BRANCH_PREFIX if it isn't
11911                    a fused jcc.  */
11912                 next_fragP->fr_subtype
11913                   = ENCODE_RELAX_STATE (BRANCH_PREFIX, 0);
11914                 next_fragP->tc_frag_data.max_bytes
11915                   = next_fragP->tc_frag_data.max_prefix_length;
11916                 /* This will be updated in the BRANCH_PREFIX scan.  */
11917                 next_fragP->tc_frag_data.max_prefix_length = 0;
11918               }
11919             else
11920               frag_wane (next_fragP);
11921             break;
11922           }
11923     }
11924
11925   /* Stop if there is no BRANCH_PREFIX.  */
11926   if (!align_branch_prefix_size)
11927     return;
11928
11929   /* Scan for BRANCH_PREFIX.  */
11930   for (; fragP != NULL; fragP = fragP->fr_next)
11931     {
11932       if (fragP->fr_type != rs_machine_dependent
11933           || (TYPE_FROM_RELAX_STATE (fragP->fr_subtype)
11934               != BRANCH_PREFIX))
11935         continue;
11936
11937       /* Count all BRANCH_PREFIX frags before BRANCH_PADDING and
11938          COND_JUMP_PREFIX.  */
11939       max_prefix_length = 0;
11940       for (next_fragP = fragP;
11941            next_fragP != NULL;
11942            next_fragP = next_fragP->fr_next)
11943         {
11944           if (next_fragP->fr_type == rs_fill)
11945             /* Skip rs_fill frags.  */
11946             continue;
11947           else if (next_fragP->fr_type != rs_machine_dependent)
11948             /* Stop for all other frags.  */
11949             break;
11950
11951           /* rs_machine_dependent frags.  */
11952           if (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
11953               == BRANCH_PREFIX)
11954             {
11955               /* Count BRANCH_PREFIX frags.  */
11956               if (max_prefix_length >= MAX_FUSED_JCC_PADDING_SIZE)
11957                 {
11958                   max_prefix_length = MAX_FUSED_JCC_PADDING_SIZE;
11959                   frag_wane (next_fragP);
11960                 }
11961               else
11962                 max_prefix_length
11963                   += next_fragP->tc_frag_data.max_bytes;
11964             }
11965           else if ((TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
11966                     == BRANCH_PADDING)
11967                    || (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
11968                        == FUSED_JCC_PADDING))
11969             {
11970               /* Stop at BRANCH_PADDING and FUSED_JCC_PADDING.  */
11971               fragP->tc_frag_data.u.padding_fragP = next_fragP;
11972               break;
11973             }
11974           else
11975             /* Stop for other rs_machine_dependent frags.  */
11976             break;
11977         }
11978
11979       fragP->tc_frag_data.max_prefix_length = max_prefix_length;
11980
11981       /* Skip to the next frag.  */
11982       fragP = next_fragP;
11983     }
11984 }
11985
11986 /* Compute padding size for
11987
11988         FUSED_JCC_PADDING
11989         CMP like instruction
11990         BRANCH_PADDING
11991         COND_JUMP/UNCOND_JUMP
11992
11993    or
11994
11995         BRANCH_PADDING
11996         COND_JUMP/UNCOND_JUMP
11997  */
11998
11999 static int
12000 i386_branch_padding_size (fragS *fragP, offsetT address)
12001 {
12002   unsigned int offset, size, padding_size;
12003   fragS *branch_fragP = fragP->tc_frag_data.u.branch_fragP;
12004
12005   /* The start address of the BRANCH_PADDING or FUSED_JCC_PADDING frag.  */
12006   if (!address)
12007     address = fragP->fr_address;
12008   address += fragP->fr_fix;
12009
12010   /* CMP like instrunction size.  */
12011   size = fragP->tc_frag_data.cmp_size;
12012
12013   /* The base size of the branch frag.  */
12014   size += branch_fragP->fr_fix;
12015
12016   /* Add opcode and displacement bytes for the rs_machine_dependent
12017      branch frag.  */
12018   if (branch_fragP->fr_type == rs_machine_dependent)
12019     size += md_relax_table[branch_fragP->fr_subtype].rlx_length;
12020
12021   /* Check if branch is within boundary and doesn't end at the last
12022      byte.  */
12023   offset = address & ((1U << align_branch_power) - 1);
12024   if ((offset + size) >= (1U << align_branch_power))
12025     /* Padding needed to avoid crossing boundary.  */
12026     padding_size = (1U << align_branch_power) - offset;
12027   else
12028     /* No padding needed.  */
12029     padding_size = 0;
12030
12031   /* The return value may be saved in tc_frag_data.length which is
12032      unsigned byte.  */
12033   if (!fits_in_unsigned_byte (padding_size))
12034     abort ();
12035
12036   return padding_size;
12037 }
12038
12039 /* i386_generic_table_relax_frag()
12040
12041    Handle BRANCH_PADDING, BRANCH_PREFIX and FUSED_JCC_PADDING frags to
12042    grow/shrink padding to align branch frags.  Hand others to
12043    relax_frag().  */
12044
12045 long
12046 i386_generic_table_relax_frag (segT segment, fragS *fragP, long stretch)
12047 {
12048   if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PADDING
12049       || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == FUSED_JCC_PADDING)
12050     {
12051       long padding_size = i386_branch_padding_size (fragP, 0);
12052       long grow = padding_size - fragP->tc_frag_data.length;
12053
12054       /* When the BRANCH_PREFIX frag is used, the computed address
12055          must match the actual address and there should be no padding.  */
12056       if (fragP->tc_frag_data.padding_address
12057           && (fragP->tc_frag_data.padding_address != fragP->fr_address
12058               || padding_size))
12059         abort ();
12060
12061       /* Update the padding size.  */
12062       if (grow)
12063         fragP->tc_frag_data.length = padding_size;
12064
12065       return grow;
12066     }
12067   else if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PREFIX)
12068     {
12069       fragS *padding_fragP, *next_fragP;
12070       long padding_size, left_size, last_size;
12071
12072       padding_fragP = fragP->tc_frag_data.u.padding_fragP;
12073       if (!padding_fragP)
12074         /* Use the padding set by the leading BRANCH_PREFIX frag.  */
12075         return (fragP->tc_frag_data.length
12076                 - fragP->tc_frag_data.last_length);
12077
12078       /* Compute the relative address of the padding frag in the very
12079         first time where the BRANCH_PREFIX frag sizes are zero.  */
12080       if (!fragP->tc_frag_data.padding_address)
12081         fragP->tc_frag_data.padding_address
12082           = padding_fragP->fr_address - (fragP->fr_address - stretch);
12083
12084       /* First update the last length from the previous interation.  */
12085       left_size = fragP->tc_frag_data.prefix_length;
12086       for (next_fragP = fragP;
12087            next_fragP != padding_fragP;
12088            next_fragP = next_fragP->fr_next)
12089         if (next_fragP->fr_type == rs_machine_dependent
12090             && (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
12091                 == BRANCH_PREFIX))
12092           {
12093             if (left_size)
12094               {
12095                 int max = next_fragP->tc_frag_data.max_bytes;
12096                 if (max)
12097                   {
12098                     int size;
12099                     if (max > left_size)
12100                       size = left_size;
12101                     else
12102                       size = max;
12103                     left_size -= size;
12104                     next_fragP->tc_frag_data.last_length = size;
12105                   }
12106               }
12107             else
12108               next_fragP->tc_frag_data.last_length = 0;
12109           }
12110
12111       /* Check the padding size for the padding frag.  */
12112       padding_size = i386_branch_padding_size
12113         (padding_fragP, (fragP->fr_address
12114                          + fragP->tc_frag_data.padding_address));
12115
12116       last_size = fragP->tc_frag_data.prefix_length;
12117       /* Check if there is change from the last interation.  */
12118       if (padding_size == last_size)
12119         {
12120           /* Update the expected address of the padding frag.  */
12121           padding_fragP->tc_frag_data.padding_address
12122             = (fragP->fr_address + padding_size
12123                + fragP->tc_frag_data.padding_address);
12124           return 0;
12125         }
12126
12127       if (padding_size > fragP->tc_frag_data.max_prefix_length)
12128         {
12129           /* No padding if there is no sufficient room.  Clear the
12130              expected address of the padding frag.  */
12131           padding_fragP->tc_frag_data.padding_address = 0;
12132           padding_size = 0;
12133         }
12134       else
12135         /* Store the expected address of the padding frag.  */
12136         padding_fragP->tc_frag_data.padding_address
12137           = (fragP->fr_address + padding_size
12138              + fragP->tc_frag_data.padding_address);
12139
12140       fragP->tc_frag_data.prefix_length = padding_size;
12141
12142       /* Update the length for the current interation.  */
12143       left_size = padding_size;
12144       for (next_fragP = fragP;
12145            next_fragP != padding_fragP;
12146            next_fragP = next_fragP->fr_next)
12147         if (next_fragP->fr_type == rs_machine_dependent
12148             && (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
12149                 == BRANCH_PREFIX))
12150           {
12151             if (left_size)
12152               {
12153                 int max = next_fragP->tc_frag_data.max_bytes;
12154                 if (max)
12155                   {
12156                     int size;
12157                     if (max > left_size)
12158                       size = left_size;
12159                     else
12160                       size = max;
12161                     left_size -= size;
12162                     next_fragP->tc_frag_data.length = size;
12163                   }
12164               }
12165             else
12166               next_fragP->tc_frag_data.length = 0;
12167           }
12168
12169       return (fragP->tc_frag_data.length
12170               - fragP->tc_frag_data.last_length);
12171     }
12172   return relax_frag (segment, fragP, stretch);
12173 }
12174
12175 /* md_estimate_size_before_relax()
12176
12177    Called just before relax() for rs_machine_dependent frags.  The x86
12178    assembler uses these frags to handle variable size jump
12179    instructions.
12180
12181    Any symbol that is now undefined will not become defined.
12182    Return the correct fr_subtype in the frag.
12183    Return the initial "guess for variable size of frag" to caller.
12184    The guess is actually the growth beyond the fixed part.  Whatever
12185    we do to grow the fixed or variable part contributes to our
12186    returned value.  */
12187
12188 int
12189 md_estimate_size_before_relax (fragS *fragP, segT segment)
12190 {
12191   if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PADDING
12192       || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PREFIX
12193       || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == FUSED_JCC_PADDING)
12194     {
12195       i386_classify_machine_dependent_frag (fragP);
12196       return fragP->tc_frag_data.length;
12197     }
12198
12199   /* We've already got fragP->fr_subtype right;  all we have to do is
12200      check for un-relaxable symbols.  On an ELF system, we can't relax
12201      an externally visible symbol, because it may be overridden by a
12202      shared library.  */
12203   if (S_GET_SEGMENT (fragP->fr_symbol) != segment
12204 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12205       || (IS_ELF
12206           && !elf_symbol_resolved_in_segment_p (fragP->fr_symbol,
12207                                                 fragP->fr_var))
12208 #endif
12209 #if defined (OBJ_COFF) && defined (TE_PE)
12210       || (OUTPUT_FLAVOR == bfd_target_coff_flavour
12211           && S_IS_WEAK (fragP->fr_symbol))
12212 #endif
12213       )
12214     {
12215       /* Symbol is undefined in this segment, or we need to keep a
12216          reloc so that weak symbols can be overridden.  */
12217       int size = (fragP->fr_subtype & CODE16) ? 2 : 4;
12218       enum bfd_reloc_code_real reloc_type;
12219       unsigned char *opcode;
12220       int old_fr_fix;
12221       fixS *fixP = NULL;
12222
12223       if (fragP->fr_var != NO_RELOC)
12224         reloc_type = (enum bfd_reloc_code_real) fragP->fr_var;
12225       else if (size == 2)
12226         reloc_type = BFD_RELOC_16_PCREL;
12227 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12228       else if (need_plt32_p (fragP->fr_symbol))
12229         reloc_type = BFD_RELOC_X86_64_PLT32;
12230 #endif
12231       else
12232         reloc_type = BFD_RELOC_32_PCREL;
12233
12234       old_fr_fix = fragP->fr_fix;
12235       opcode = (unsigned char *) fragP->fr_opcode;
12236
12237       switch (TYPE_FROM_RELAX_STATE (fragP->fr_subtype))
12238         {
12239         case UNCOND_JUMP:
12240           /* Make jmp (0xeb) a (d)word displacement jump.  */
12241           opcode[0] = 0xe9;
12242           fragP->fr_fix += size;
12243           fixP = fix_new (fragP, old_fr_fix, size,
12244                           fragP->fr_symbol,
12245                           fragP->fr_offset, 1,
12246                           reloc_type);
12247           break;
12248
12249         case COND_JUMP86:
12250           if (size == 2
12251               && (!no_cond_jump_promotion || fragP->fr_var != NO_RELOC))
12252             {
12253               /* Negate the condition, and branch past an
12254                  unconditional jump.  */
12255               opcode[0] ^= 1;
12256               opcode[1] = 3;
12257               /* Insert an unconditional jump.  */
12258               opcode[2] = 0xe9;
12259               /* We added two extra opcode bytes, and have a two byte
12260                  offset.  */
12261               fragP->fr_fix += 2 + 2;
12262               fix_new (fragP, old_fr_fix + 2, 2,
12263                        fragP->fr_symbol,
12264                        fragP->fr_offset, 1,
12265                        reloc_type);
12266               break;
12267             }
12268           /* Fall through.  */
12269
12270         case COND_JUMP:
12271           if (no_cond_jump_promotion && fragP->fr_var == NO_RELOC)
12272             {
12273               fragP->fr_fix += 1;
12274               fixP = fix_new (fragP, old_fr_fix, 1,
12275                               fragP->fr_symbol,
12276                               fragP->fr_offset, 1,
12277                               BFD_RELOC_8_PCREL);
12278               fixP->fx_signed = 1;
12279               break;
12280             }
12281
12282           /* This changes the byte-displacement jump 0x7N
12283              to the (d)word-displacement jump 0x0f,0x8N.  */
12284           opcode[1] = opcode[0] + 0x10;
12285           opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
12286           /* We've added an opcode byte.  */
12287           fragP->fr_fix += 1 + size;
12288           fixP = fix_new (fragP, old_fr_fix + 1, size,
12289                           fragP->fr_symbol,
12290                           fragP->fr_offset, 1,
12291                           reloc_type);
12292           break;
12293
12294         default:
12295           BAD_CASE (fragP->fr_subtype);
12296           break;
12297         }
12298
12299       /* All jumps handled here are signed, but don't unconditionally use a
12300          signed limit check for 32 and 16 bit jumps as we want to allow wrap
12301          around at 4G (outside of 64-bit mode) and 64k.  */
12302       if (size == 4 && flag_code == CODE_64BIT)
12303         fixP->fx_signed = 1;
12304
12305       frag_wane (fragP);
12306       return fragP->fr_fix - old_fr_fix;
12307     }
12308
12309   /* Guess size depending on current relax state.  Initially the relax
12310      state will correspond to a short jump and we return 1, because
12311      the variable part of the frag (the branch offset) is one byte
12312      long.  However, we can relax a section more than once and in that
12313      case we must either set fr_subtype back to the unrelaxed state,
12314      or return the value for the appropriate branch.  */
12315   return md_relax_table[fragP->fr_subtype].rlx_length;
12316 }
12317
12318 /* Called after relax() is finished.
12319
12320    In:  Address of frag.
12321         fr_type == rs_machine_dependent.
12322         fr_subtype is what the address relaxed to.
12323
12324    Out: Any fixSs and constants are set up.
12325         Caller will turn frag into a ".space 0".  */
12326
12327 void
12328 md_convert_frag (bfd *abfd ATTRIBUTE_UNUSED, segT sec ATTRIBUTE_UNUSED,
12329                  fragS *fragP)
12330 {
12331   unsigned char *opcode;
12332   unsigned char *where_to_put_displacement = NULL;
12333   offsetT target_address;
12334   offsetT opcode_address;
12335   unsigned int extension = 0;
12336   offsetT displacement_from_opcode_start;
12337
12338   if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PADDING
12339       || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == FUSED_JCC_PADDING
12340       || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PREFIX)
12341     {
12342       /* Generate nop padding.  */
12343       unsigned int size = fragP->tc_frag_data.length;
12344       if (size)
12345         {
12346           if (size > fragP->tc_frag_data.max_bytes)
12347             abort ();
12348
12349           if (flag_debug)
12350             {
12351               const char *msg;
12352               const char *branch = "branch";
12353               const char *prefix = "";
12354               fragS *padding_fragP;
12355               if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype)
12356                   == BRANCH_PREFIX)
12357                 {
12358                   padding_fragP = fragP->tc_frag_data.u.padding_fragP;
12359                   switch (fragP->tc_frag_data.default_prefix)
12360                     {
12361                     default:
12362                       abort ();
12363                       break;
12364                     case CS_PREFIX_OPCODE:
12365                       prefix = " cs";
12366                       break;
12367                     case DS_PREFIX_OPCODE:
12368                       prefix = " ds";
12369                       break;
12370                     case ES_PREFIX_OPCODE:
12371                       prefix = " es";
12372                       break;
12373                     case FS_PREFIX_OPCODE:
12374                       prefix = " fs";
12375                       break;
12376                     case GS_PREFIX_OPCODE:
12377                       prefix = " gs";
12378                       break;
12379                     case SS_PREFIX_OPCODE:
12380                       prefix = " ss";
12381                       break;
12382                     }
12383                   if (padding_fragP)
12384                     msg = _("%s:%u: add %d%s at 0x%llx to align "
12385                             "%s within %d-byte boundary\n");
12386                   else
12387                     msg = _("%s:%u: add additional %d%s at 0x%llx to "
12388                             "align %s within %d-byte boundary\n");
12389                 }
12390               else
12391                 {
12392                   padding_fragP = fragP;
12393                   msg = _("%s:%u: add %d%s-byte nop at 0x%llx to align "
12394                           "%s within %d-byte boundary\n");
12395                 }
12396
12397               if (padding_fragP)
12398                 switch (padding_fragP->tc_frag_data.branch_type)
12399                   {
12400                   case align_branch_jcc:
12401                     branch = "jcc";
12402                     break;
12403                   case align_branch_fused:
12404                     branch = "fused jcc";
12405                     break;
12406                   case align_branch_jmp:
12407                     branch = "jmp";
12408                     break;
12409                   case align_branch_call:
12410                     branch = "call";
12411                     break;
12412                   case align_branch_indirect:
12413                     branch = "indiret branch";
12414                     break;
12415                   case align_branch_ret:
12416                     branch = "ret";
12417                     break;
12418                   default:
12419                     break;
12420                   }
12421
12422               fprintf (stdout, msg,
12423                        fragP->fr_file, fragP->fr_line, size, prefix,
12424                        (long long) fragP->fr_address, branch,
12425                        1 << align_branch_power);
12426             }
12427           if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PREFIX)
12428             memset (fragP->fr_opcode,
12429                     fragP->tc_frag_data.default_prefix, size);
12430           else
12431             i386_generate_nops (fragP, (char *) fragP->fr_opcode,
12432                                 size, 0);
12433           fragP->fr_fix += size;
12434         }
12435       return;
12436     }
12437
12438   opcode = (unsigned char *) fragP->fr_opcode;
12439
12440   /* Address we want to reach in file space.  */
12441   target_address = S_GET_VALUE (fragP->fr_symbol) + fragP->fr_offset;
12442
12443   /* Address opcode resides at in file space.  */
12444   opcode_address = fragP->fr_address + fragP->fr_fix;
12445
12446   /* Displacement from opcode start to fill into instruction.  */
12447   displacement_from_opcode_start = target_address - opcode_address;
12448
12449   if ((fragP->fr_subtype & BIG) == 0)
12450     {
12451       /* Don't have to change opcode.  */
12452       extension = 1;            /* 1 opcode + 1 displacement  */
12453       where_to_put_displacement = &opcode[1];
12454     }
12455   else
12456     {
12457       if (no_cond_jump_promotion
12458           && TYPE_FROM_RELAX_STATE (fragP->fr_subtype) != UNCOND_JUMP)
12459         as_warn_where (fragP->fr_file, fragP->fr_line,
12460                        _("long jump required"));
12461
12462       switch (fragP->fr_subtype)
12463         {
12464         case ENCODE_RELAX_STATE (UNCOND_JUMP, BIG):
12465           extension = 4;                /* 1 opcode + 4 displacement  */
12466           opcode[0] = 0xe9;
12467           where_to_put_displacement = &opcode[1];
12468           break;
12469
12470         case ENCODE_RELAX_STATE (UNCOND_JUMP, BIG16):
12471           extension = 2;                /* 1 opcode + 2 displacement  */
12472           opcode[0] = 0xe9;
12473           where_to_put_displacement = &opcode[1];
12474           break;
12475
12476         case ENCODE_RELAX_STATE (COND_JUMP, BIG):
12477         case ENCODE_RELAX_STATE (COND_JUMP86, BIG):
12478           extension = 5;                /* 2 opcode + 4 displacement  */
12479           opcode[1] = opcode[0] + 0x10;
12480           opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
12481           where_to_put_displacement = &opcode[2];
12482           break;
12483
12484         case ENCODE_RELAX_STATE (COND_JUMP, BIG16):
12485           extension = 3;                /* 2 opcode + 2 displacement  */
12486           opcode[1] = opcode[0] + 0x10;
12487           opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
12488           where_to_put_displacement = &opcode[2];
12489           break;
12490
12491         case ENCODE_RELAX_STATE (COND_JUMP86, BIG16):
12492           extension = 4;
12493           opcode[0] ^= 1;
12494           opcode[1] = 3;
12495           opcode[2] = 0xe9;
12496           where_to_put_displacement = &opcode[3];
12497           break;
12498
12499         default:
12500           BAD_CASE (fragP->fr_subtype);
12501           break;
12502         }
12503     }
12504
12505   /* If size if less then four we are sure that the operand fits,
12506      but if it's 4, then it could be that the displacement is larger
12507      then -/+ 2GB.  */
12508   if (DISP_SIZE_FROM_RELAX_STATE (fragP->fr_subtype) == 4
12509       && object_64bit
12510       && ((addressT) (displacement_from_opcode_start - extension
12511                       + ((addressT) 1 << 31))
12512           > (((addressT) 2 << 31) - 1)))
12513     {
12514       as_bad_where (fragP->fr_file, fragP->fr_line,
12515                     _("jump target out of range"));
12516       /* Make us emit 0.  */
12517       displacement_from_opcode_start = extension;
12518     }
12519   /* Now put displacement after opcode.  */
12520   md_number_to_chars ((char *) where_to_put_displacement,
12521                       (valueT) (displacement_from_opcode_start - extension),
12522                       DISP_SIZE_FROM_RELAX_STATE (fragP->fr_subtype));
12523   fragP->fr_fix += extension;
12524 }
12525 \f
12526 /* Apply a fixup (fixP) to segment data, once it has been determined
12527    by our caller that we have all the info we need to fix it up.
12528
12529    Parameter valP is the pointer to the value of the bits.
12530
12531    On the 386, immediates, displacements, and data pointers are all in
12532    the same (little-endian) format, so we don't need to care about which
12533    we are handling.  */
12534
12535 void
12536 md_apply_fix (fixS *fixP, valueT *valP, segT seg ATTRIBUTE_UNUSED)
12537 {
12538   char *p = fixP->fx_where + fixP->fx_frag->fr_literal;
12539   valueT value = *valP;
12540
12541 #if !defined (TE_Mach)
12542   if (fixP->fx_pcrel)
12543     {
12544       switch (fixP->fx_r_type)
12545         {
12546         default:
12547           break;
12548
12549         case BFD_RELOC_64:
12550           fixP->fx_r_type = BFD_RELOC_64_PCREL;
12551           break;
12552         case BFD_RELOC_32:
12553         case BFD_RELOC_X86_64_32S:
12554           fixP->fx_r_type = BFD_RELOC_32_PCREL;
12555           break;
12556         case BFD_RELOC_16:
12557           fixP->fx_r_type = BFD_RELOC_16_PCREL;
12558           break;
12559         case BFD_RELOC_8:
12560           fixP->fx_r_type = BFD_RELOC_8_PCREL;
12561           break;
12562         }
12563     }
12564
12565   if (fixP->fx_addsy != NULL
12566       && (fixP->fx_r_type == BFD_RELOC_32_PCREL
12567           || fixP->fx_r_type == BFD_RELOC_64_PCREL
12568           || fixP->fx_r_type == BFD_RELOC_16_PCREL
12569           || fixP->fx_r_type == BFD_RELOC_8_PCREL)
12570       && !use_rela_relocations)
12571     {
12572       /* This is a hack.  There should be a better way to handle this.
12573          This covers for the fact that bfd_install_relocation will
12574          subtract the current location (for partial_inplace, PC relative
12575          relocations); see more below.  */
12576 #ifndef OBJ_AOUT
12577       if (IS_ELF
12578 #ifdef TE_PE
12579           || OUTPUT_FLAVOR == bfd_target_coff_flavour
12580 #endif
12581           )
12582         value += fixP->fx_where + fixP->fx_frag->fr_address;
12583 #endif
12584 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12585       if (IS_ELF)
12586         {
12587           segT sym_seg = S_GET_SEGMENT (fixP->fx_addsy);
12588
12589           if ((sym_seg == seg
12590                || (symbol_section_p (fixP->fx_addsy)
12591                    && sym_seg != absolute_section))
12592               && !generic_force_reloc (fixP))
12593             {
12594               /* Yes, we add the values in twice.  This is because
12595                  bfd_install_relocation subtracts them out again.  I think
12596                  bfd_install_relocation is broken, but I don't dare change
12597                  it.  FIXME.  */
12598               value += fixP->fx_where + fixP->fx_frag->fr_address;
12599             }
12600         }
12601 #endif
12602 #if defined (OBJ_COFF) && defined (TE_PE)
12603       /* For some reason, the PE format does not store a
12604          section address offset for a PC relative symbol.  */
12605       if (S_GET_SEGMENT (fixP->fx_addsy) != seg
12606           || S_IS_WEAK (fixP->fx_addsy))
12607         value += md_pcrel_from (fixP);
12608 #endif
12609     }
12610 #if defined (OBJ_COFF) && defined (TE_PE)
12611   if (fixP->fx_addsy != NULL
12612       && S_IS_WEAK (fixP->fx_addsy)
12613       /* PR 16858: Do not modify weak function references.  */
12614       && ! fixP->fx_pcrel)
12615     {
12616 #if !defined (TE_PEP)
12617       /* For x86 PE weak function symbols are neither PC-relative
12618          nor do they set S_IS_FUNCTION.  So the only reliable way
12619          to detect them is to check the flags of their containing
12620          section.  */
12621       if (S_GET_SEGMENT (fixP->fx_addsy) != NULL
12622           && S_GET_SEGMENT (fixP->fx_addsy)->flags & SEC_CODE)
12623         ;
12624       else
12625 #endif
12626       value -= S_GET_VALUE (fixP->fx_addsy);
12627     }
12628 #endif
12629
12630   /* Fix a few things - the dynamic linker expects certain values here,
12631      and we must not disappoint it.  */
12632 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12633   if (IS_ELF && fixP->fx_addsy)
12634     switch (fixP->fx_r_type)
12635       {
12636       case BFD_RELOC_386_PLT32:
12637       case BFD_RELOC_X86_64_PLT32:
12638         /* Make the jump instruction point to the address of the operand.
12639            At runtime we merely add the offset to the actual PLT entry.
12640            NB: Subtract the offset size only for jump instructions.  */
12641         if (fixP->fx_pcrel)
12642           value = -4;
12643         break;
12644
12645       case BFD_RELOC_386_TLS_GD:
12646       case BFD_RELOC_386_TLS_LDM:
12647       case BFD_RELOC_386_TLS_IE_32:
12648       case BFD_RELOC_386_TLS_IE:
12649       case BFD_RELOC_386_TLS_GOTIE:
12650       case BFD_RELOC_386_TLS_GOTDESC:
12651       case BFD_RELOC_X86_64_TLSGD:
12652       case BFD_RELOC_X86_64_TLSLD:
12653       case BFD_RELOC_X86_64_GOTTPOFF:
12654       case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
12655         value = 0; /* Fully resolved at runtime.  No addend.  */
12656         /* Fallthrough */
12657       case BFD_RELOC_386_TLS_LE:
12658       case BFD_RELOC_386_TLS_LDO_32:
12659       case BFD_RELOC_386_TLS_LE_32:
12660       case BFD_RELOC_X86_64_DTPOFF32:
12661       case BFD_RELOC_X86_64_DTPOFF64:
12662       case BFD_RELOC_X86_64_TPOFF32:
12663       case BFD_RELOC_X86_64_TPOFF64:
12664         S_SET_THREAD_LOCAL (fixP->fx_addsy);
12665         break;
12666
12667       case BFD_RELOC_386_TLS_DESC_CALL:
12668       case BFD_RELOC_X86_64_TLSDESC_CALL:
12669         value = 0; /* Fully resolved at runtime.  No addend.  */
12670         S_SET_THREAD_LOCAL (fixP->fx_addsy);
12671         fixP->fx_done = 0;
12672         return;
12673
12674       case BFD_RELOC_VTABLE_INHERIT:
12675       case BFD_RELOC_VTABLE_ENTRY:
12676         fixP->fx_done = 0;
12677         return;
12678
12679       default:
12680         break;
12681       }
12682 #endif /* defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)  */
12683
12684   /* If not 64bit, massage value, to account for wraparound when !BFD64.  */
12685   if (!object_64bit)
12686     value = extend_to_32bit_address (value);
12687
12688   *valP = value;
12689 #endif /* !defined (TE_Mach)  */
12690
12691   /* Are we finished with this relocation now?  */
12692   if (fixP->fx_addsy == NULL)
12693     {
12694       fixP->fx_done = 1;
12695       switch (fixP->fx_r_type)
12696         {
12697         case BFD_RELOC_X86_64_32S:
12698           fixP->fx_signed = 1;
12699           break;
12700
12701         default:
12702           break;
12703         }
12704     }
12705 #if defined (OBJ_COFF) && defined (TE_PE)
12706   else if (fixP->fx_addsy != NULL && S_IS_WEAK (fixP->fx_addsy))
12707     {
12708       fixP->fx_done = 0;
12709       /* Remember value for tc_gen_reloc.  */
12710       fixP->fx_addnumber = value;
12711       /* Clear out the frag for now.  */
12712       value = 0;
12713     }
12714 #endif
12715   else if (use_rela_relocations)
12716     {
12717       fixP->fx_no_overflow = 1;
12718       /* Remember value for tc_gen_reloc.  */
12719       fixP->fx_addnumber = value;
12720       value = 0;
12721     }
12722
12723   md_number_to_chars (p, value, fixP->fx_size);
12724 }
12725 \f
12726 const char *
12727 md_atof (int type, char *litP, int *sizeP)
12728 {
12729   /* This outputs the LITTLENUMs in REVERSE order;
12730      in accord with the bigendian 386.  */
12731   return ieee_md_atof (type, litP, sizeP, false);
12732 }
12733 \f
12734 static char output_invalid_buf[sizeof (unsigned char) * 2 + 6];
12735
12736 static char *
12737 output_invalid (int c)
12738 {
12739   if (ISPRINT (c))
12740     snprintf (output_invalid_buf, sizeof (output_invalid_buf),
12741               "'%c'", c);
12742   else
12743     snprintf (output_invalid_buf, sizeof (output_invalid_buf),
12744               "(0x%x)", (unsigned char) c);
12745   return output_invalid_buf;
12746 }
12747
12748 /* Verify that @r can be used in the current context.  */
12749
12750 static bool check_register (const reg_entry *r)
12751 {
12752   if (allow_pseudo_reg)
12753     return true;
12754
12755   if (operand_type_all_zero (&r->reg_type))
12756     return false;
12757
12758   if ((r->reg_type.bitfield.dword
12759        || (r->reg_type.bitfield.class == SReg && r->reg_num > 3)
12760        || r->reg_type.bitfield.class == RegCR
12761        || r->reg_type.bitfield.class == RegDR)
12762       && !cpu_arch_flags.bitfield.cpui386)
12763     return false;
12764
12765   if (r->reg_type.bitfield.class == RegTR
12766       && (flag_code == CODE_64BIT
12767           || !cpu_arch_flags.bitfield.cpui386
12768           || cpu_arch_isa_flags.bitfield.cpui586
12769           || cpu_arch_isa_flags.bitfield.cpui686))
12770     return false;
12771
12772   if (r->reg_type.bitfield.class == RegMMX && !cpu_arch_flags.bitfield.cpummx)
12773     return false;
12774
12775   if (!cpu_arch_flags.bitfield.cpuavx512f)
12776     {
12777       if (r->reg_type.bitfield.zmmword
12778           || r->reg_type.bitfield.class == RegMask)
12779         return false;
12780
12781       if (!cpu_arch_flags.bitfield.cpuavx)
12782         {
12783           if (r->reg_type.bitfield.ymmword)
12784             return false;
12785
12786           if (!cpu_arch_flags.bitfield.cpusse && r->reg_type.bitfield.xmmword)
12787             return false;
12788         }
12789     }
12790
12791   if (r->reg_type.bitfield.tmmword
12792       && (!cpu_arch_flags.bitfield.cpuamx_tile
12793           || flag_code != CODE_64BIT))
12794     return false;
12795
12796   if (r->reg_type.bitfield.class == RegBND && !cpu_arch_flags.bitfield.cpumpx)
12797     return false;
12798
12799   /* Don't allow fake index register unless allow_index_reg isn't 0. */
12800   if (!allow_index_reg && r->reg_num == RegIZ)
12801     return false;
12802
12803   /* Upper 16 vector registers are only available with VREX in 64bit
12804      mode, and require EVEX encoding.  */
12805   if (r->reg_flags & RegVRex)
12806     {
12807       if (!cpu_arch_flags.bitfield.cpuavx512f
12808           || flag_code != CODE_64BIT)
12809         return false;
12810
12811       if (i.vec_encoding == vex_encoding_default)
12812         i.vec_encoding = vex_encoding_evex;
12813       else if (i.vec_encoding != vex_encoding_evex)
12814         i.vec_encoding = vex_encoding_error;
12815     }
12816
12817   if (((r->reg_flags & (RegRex64 | RegRex)) || r->reg_type.bitfield.qword)
12818       && (!cpu_arch_flags.bitfield.cpulm || r->reg_type.bitfield.class != RegCR)
12819       && flag_code != CODE_64BIT)
12820     return false;
12821
12822   if (r->reg_type.bitfield.class == SReg && r->reg_num == RegFlat
12823       && !intel_syntax)
12824     return false;
12825
12826   return true;
12827 }
12828
12829 /* REG_STRING starts *before* REGISTER_PREFIX.  */
12830
12831 static const reg_entry *
12832 parse_real_register (char *reg_string, char **end_op)
12833 {
12834   char *s = reg_string;
12835   char *p;
12836   char reg_name_given[MAX_REG_NAME_SIZE + 1];
12837   const reg_entry *r;
12838
12839   /* Skip possible REGISTER_PREFIX and possible whitespace.  */
12840   if (*s == REGISTER_PREFIX)
12841     ++s;
12842
12843   if (is_space_char (*s))
12844     ++s;
12845
12846   p = reg_name_given;
12847   while ((*p++ = register_chars[(unsigned char) *s]) != '\0')
12848     {
12849       if (p >= reg_name_given + MAX_REG_NAME_SIZE)
12850         return (const reg_entry *) NULL;
12851       s++;
12852     }
12853
12854   /* For naked regs, make sure that we are not dealing with an identifier.
12855      This prevents confusing an identifier like `eax_var' with register
12856      `eax'.  */
12857   if (allow_naked_reg && identifier_chars[(unsigned char) *s])
12858     return (const reg_entry *) NULL;
12859
12860   *end_op = s;
12861
12862   r = (const reg_entry *) str_hash_find (reg_hash, reg_name_given);
12863
12864   /* Handle floating point regs, allowing spaces in the (i) part.  */
12865   if (r == reg_st0)
12866     {
12867       if (!cpu_arch_flags.bitfield.cpu8087
12868           && !cpu_arch_flags.bitfield.cpu287
12869           && !cpu_arch_flags.bitfield.cpu387
12870           && !allow_pseudo_reg)
12871         return (const reg_entry *) NULL;
12872
12873       if (is_space_char (*s))
12874         ++s;
12875       if (*s == '(')
12876         {
12877           ++s;
12878           if (is_space_char (*s))
12879             ++s;
12880           if (*s >= '0' && *s <= '7')
12881             {
12882               int fpr = *s - '0';
12883               ++s;
12884               if (is_space_char (*s))
12885                 ++s;
12886               if (*s == ')')
12887                 {
12888                   *end_op = s + 1;
12889                   know (r[fpr].reg_num == fpr);
12890                   return r + fpr;
12891                 }
12892             }
12893           /* We have "%st(" then garbage.  */
12894           return (const reg_entry *) NULL;
12895         }
12896     }
12897
12898   return r && check_register (r) ? r : NULL;
12899 }
12900
12901 /* REG_STRING starts *before* REGISTER_PREFIX.  */
12902
12903 static const reg_entry *
12904 parse_register (char *reg_string, char **end_op)
12905 {
12906   const reg_entry *r;
12907
12908   if (*reg_string == REGISTER_PREFIX || allow_naked_reg)
12909     r = parse_real_register (reg_string, end_op);
12910   else
12911     r = NULL;
12912   if (!r)
12913     {
12914       char *save = input_line_pointer;
12915       char c;
12916       symbolS *symbolP;
12917
12918       input_line_pointer = reg_string;
12919       c = get_symbol_name (&reg_string);
12920       symbolP = symbol_find (reg_string);
12921       if (symbolP && S_GET_SEGMENT (symbolP) == reg_section)
12922         {
12923           const expressionS *e = symbol_get_value_expression (symbolP);
12924
12925           know (e->X_op == O_register);
12926           know (e->X_add_number >= 0
12927                 && (valueT) e->X_add_number < i386_regtab_size);
12928           r = i386_regtab + e->X_add_number;
12929           if (!check_register (r))
12930             {
12931               as_bad (_("register '%s%s' cannot be used here"),
12932                       register_prefix, r->reg_name);
12933               r = &bad_reg;
12934             }
12935           *end_op = input_line_pointer;
12936         }
12937       *input_line_pointer = c;
12938       input_line_pointer = save;
12939     }
12940   return r;
12941 }
12942
12943 int
12944 i386_parse_name (char *name, expressionS *e, char *nextcharP)
12945 {
12946   const reg_entry *r;
12947   char *end = input_line_pointer;
12948
12949   *end = *nextcharP;
12950   r = parse_register (name, &input_line_pointer);
12951   if (r && end <= input_line_pointer)
12952     {
12953       *nextcharP = *input_line_pointer;
12954       *input_line_pointer = 0;
12955       if (r != &bad_reg)
12956         {
12957           e->X_op = O_register;
12958           e->X_add_number = r - i386_regtab;
12959         }
12960       else
12961           e->X_op = O_illegal;
12962       return 1;
12963     }
12964   input_line_pointer = end;
12965   *end = 0;
12966   return intel_syntax ? i386_intel_parse_name (name, e) : 0;
12967 }
12968
12969 void
12970 md_operand (expressionS *e)
12971 {
12972   char *end;
12973   const reg_entry *r;
12974
12975   switch (*input_line_pointer)
12976     {
12977     case REGISTER_PREFIX:
12978       r = parse_real_register (input_line_pointer, &end);
12979       if (r)
12980         {
12981           e->X_op = O_register;
12982           e->X_add_number = r - i386_regtab;
12983           input_line_pointer = end;
12984         }
12985       break;
12986
12987     case '[':
12988       gas_assert (intel_syntax);
12989       end = input_line_pointer++;
12990       expression (e);
12991       if (*input_line_pointer == ']')
12992         {
12993           ++input_line_pointer;
12994           e->X_op_symbol = make_expr_symbol (e);
12995           e->X_add_symbol = NULL;
12996           e->X_add_number = 0;
12997           e->X_op = O_index;
12998         }
12999       else
13000         {
13001           e->X_op = O_absent;
13002           input_line_pointer = end;
13003         }
13004       break;
13005     }
13006 }
13007
13008 \f
13009 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13010 const char *md_shortopts = "kVQ:sqnO::";
13011 #else
13012 const char *md_shortopts = "qnO::";
13013 #endif
13014
13015 #define OPTION_32 (OPTION_MD_BASE + 0)
13016 #define OPTION_64 (OPTION_MD_BASE + 1)
13017 #define OPTION_DIVIDE (OPTION_MD_BASE + 2)
13018 #define OPTION_MARCH (OPTION_MD_BASE + 3)
13019 #define OPTION_MTUNE (OPTION_MD_BASE + 4)
13020 #define OPTION_MMNEMONIC (OPTION_MD_BASE + 5)
13021 #define OPTION_MSYNTAX (OPTION_MD_BASE + 6)
13022 #define OPTION_MINDEX_REG (OPTION_MD_BASE + 7)
13023 #define OPTION_MNAKED_REG (OPTION_MD_BASE + 8)
13024 #define OPTION_MRELAX_RELOCATIONS (OPTION_MD_BASE + 9)
13025 #define OPTION_MSSE2AVX (OPTION_MD_BASE + 10)
13026 #define OPTION_MSSE_CHECK (OPTION_MD_BASE + 11)
13027 #define OPTION_MOPERAND_CHECK (OPTION_MD_BASE + 12)
13028 #define OPTION_MAVXSCALAR (OPTION_MD_BASE + 13)
13029 #define OPTION_X32 (OPTION_MD_BASE + 14)
13030 #define OPTION_MADD_BND_PREFIX (OPTION_MD_BASE + 15)
13031 #define OPTION_MEVEXLIG (OPTION_MD_BASE + 16)
13032 #define OPTION_MEVEXWIG (OPTION_MD_BASE + 17)
13033 #define OPTION_MBIG_OBJ (OPTION_MD_BASE + 18)
13034 #define OPTION_MOMIT_LOCK_PREFIX (OPTION_MD_BASE + 19)
13035 #define OPTION_MEVEXRCIG (OPTION_MD_BASE + 20)
13036 #define OPTION_MSHARED (OPTION_MD_BASE + 21)
13037 #define OPTION_MAMD64 (OPTION_MD_BASE + 22)
13038 #define OPTION_MINTEL64 (OPTION_MD_BASE + 23)
13039 #define OPTION_MFENCE_AS_LOCK_ADD (OPTION_MD_BASE + 24)
13040 #define OPTION_X86_USED_NOTE (OPTION_MD_BASE + 25)
13041 #define OPTION_MVEXWIG (OPTION_MD_BASE + 26)
13042 #define OPTION_MALIGN_BRANCH_BOUNDARY (OPTION_MD_BASE + 27)
13043 #define OPTION_MALIGN_BRANCH_PREFIX_SIZE (OPTION_MD_BASE + 28)
13044 #define OPTION_MALIGN_BRANCH (OPTION_MD_BASE + 29)
13045 #define OPTION_MBRANCHES_WITH_32B_BOUNDARIES (OPTION_MD_BASE + 30)
13046 #define OPTION_MLFENCE_AFTER_LOAD (OPTION_MD_BASE + 31)
13047 #define OPTION_MLFENCE_BEFORE_INDIRECT_BRANCH (OPTION_MD_BASE + 32)
13048 #define OPTION_MLFENCE_BEFORE_RET (OPTION_MD_BASE + 33)
13049
13050 struct option md_longopts[] =
13051 {
13052   {"32", no_argument, NULL, OPTION_32},
13053 #if (defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
13054      || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
13055   {"64", no_argument, NULL, OPTION_64},
13056 #endif
13057 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13058   {"x32", no_argument, NULL, OPTION_X32},
13059   {"mshared", no_argument, NULL, OPTION_MSHARED},
13060   {"mx86-used-note", required_argument, NULL, OPTION_X86_USED_NOTE},
13061 #endif
13062   {"divide", no_argument, NULL, OPTION_DIVIDE},
13063   {"march", required_argument, NULL, OPTION_MARCH},
13064   {"mtune", required_argument, NULL, OPTION_MTUNE},
13065   {"mmnemonic", required_argument, NULL, OPTION_MMNEMONIC},
13066   {"msyntax", required_argument, NULL, OPTION_MSYNTAX},
13067   {"mindex-reg", no_argument, NULL, OPTION_MINDEX_REG},
13068   {"mnaked-reg", no_argument, NULL, OPTION_MNAKED_REG},
13069   {"msse2avx", no_argument, NULL, OPTION_MSSE2AVX},
13070   {"msse-check", required_argument, NULL, OPTION_MSSE_CHECK},
13071   {"moperand-check", required_argument, NULL, OPTION_MOPERAND_CHECK},
13072   {"mavxscalar", required_argument, NULL, OPTION_MAVXSCALAR},
13073   {"mvexwig", required_argument, NULL, OPTION_MVEXWIG},
13074   {"madd-bnd-prefix", no_argument, NULL, OPTION_MADD_BND_PREFIX},
13075   {"mevexlig", required_argument, NULL, OPTION_MEVEXLIG},
13076   {"mevexwig", required_argument, NULL, OPTION_MEVEXWIG},
13077 # if defined (TE_PE) || defined (TE_PEP)
13078   {"mbig-obj", no_argument, NULL, OPTION_MBIG_OBJ},
13079 #endif
13080   {"momit-lock-prefix", required_argument, NULL, OPTION_MOMIT_LOCK_PREFIX},
13081   {"mfence-as-lock-add", required_argument, NULL, OPTION_MFENCE_AS_LOCK_ADD},
13082   {"mrelax-relocations", required_argument, NULL, OPTION_MRELAX_RELOCATIONS},
13083   {"mevexrcig", required_argument, NULL, OPTION_MEVEXRCIG},
13084   {"malign-branch-boundary", required_argument, NULL, OPTION_MALIGN_BRANCH_BOUNDARY},
13085   {"malign-branch-prefix-size", required_argument, NULL, OPTION_MALIGN_BRANCH_PREFIX_SIZE},
13086   {"malign-branch", required_argument, NULL, OPTION_MALIGN_BRANCH},
13087   {"mbranches-within-32B-boundaries", no_argument, NULL, OPTION_MBRANCHES_WITH_32B_BOUNDARIES},
13088   {"mlfence-after-load", required_argument, NULL, OPTION_MLFENCE_AFTER_LOAD},
13089   {"mlfence-before-indirect-branch", required_argument, NULL,
13090    OPTION_MLFENCE_BEFORE_INDIRECT_BRANCH},
13091   {"mlfence-before-ret", required_argument, NULL, OPTION_MLFENCE_BEFORE_RET},
13092   {"mamd64", no_argument, NULL, OPTION_MAMD64},
13093   {"mintel64", no_argument, NULL, OPTION_MINTEL64},
13094   {NULL, no_argument, NULL, 0}
13095 };
13096 size_t md_longopts_size = sizeof (md_longopts);
13097
13098 int
13099 md_parse_option (int c, const char *arg)
13100 {
13101   unsigned int j;
13102   char *arch, *next, *saved, *type;
13103
13104   switch (c)
13105     {
13106     case 'n':
13107       optimize_align_code = 0;
13108       break;
13109
13110     case 'q':
13111       quiet_warnings = 1;
13112       break;
13113
13114 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13115       /* -Qy, -Qn: SVR4 arguments controlling whether a .comment section
13116          should be emitted or not.  FIXME: Not implemented.  */
13117     case 'Q':
13118       if ((arg[0] != 'y' && arg[0] != 'n') || arg[1])
13119         return 0;
13120       break;
13121
13122       /* -V: SVR4 argument to print version ID.  */
13123     case 'V':
13124       print_version_id ();
13125       break;
13126
13127       /* -k: Ignore for FreeBSD compatibility.  */
13128     case 'k':
13129       break;
13130
13131     case 's':
13132       /* -s: On i386 Solaris, this tells the native assembler to use
13133          .stab instead of .stab.excl.  We always use .stab anyhow.  */
13134       break;
13135
13136     case OPTION_MSHARED:
13137       shared = 1;
13138       break;
13139
13140     case OPTION_X86_USED_NOTE:
13141       if (strcasecmp (arg, "yes") == 0)
13142         x86_used_note = 1;
13143       else if (strcasecmp (arg, "no") == 0)
13144         x86_used_note = 0;
13145       else
13146         as_fatal (_("invalid -mx86-used-note= option: `%s'"), arg);
13147       break;
13148
13149
13150 #endif
13151 #if (defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
13152      || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
13153     case OPTION_64:
13154       {
13155         const char **list, **l;
13156
13157         list = bfd_target_list ();
13158         for (l = list; *l != NULL; l++)
13159           if (startswith (*l, "elf64-x86-64")
13160               || strcmp (*l, "coff-x86-64") == 0
13161               || strcmp (*l, "pe-x86-64") == 0
13162               || strcmp (*l, "pei-x86-64") == 0
13163               || strcmp (*l, "mach-o-x86-64") == 0)
13164             {
13165               default_arch = "x86_64";
13166               break;
13167             }
13168         if (*l == NULL)
13169           as_fatal (_("no compiled in support for x86_64"));
13170         free (list);
13171       }
13172       break;
13173 #endif
13174
13175 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13176     case OPTION_X32:
13177       if (IS_ELF)
13178         {
13179           const char **list, **l;
13180
13181           list = bfd_target_list ();
13182           for (l = list; *l != NULL; l++)
13183             if (startswith (*l, "elf32-x86-64"))
13184               {
13185                 default_arch = "x86_64:32";
13186                 break;
13187               }
13188           if (*l == NULL)
13189             as_fatal (_("no compiled in support for 32bit x86_64"));
13190           free (list);
13191         }
13192       else
13193         as_fatal (_("32bit x86_64 is only supported for ELF"));
13194       break;
13195 #endif
13196
13197     case OPTION_32:
13198       default_arch = "i386";
13199       break;
13200
13201     case OPTION_DIVIDE:
13202 #ifdef SVR4_COMMENT_CHARS
13203       {
13204         char *n, *t;
13205         const char *s;
13206
13207         n = XNEWVEC (char, strlen (i386_comment_chars) + 1);
13208         t = n;
13209         for (s = i386_comment_chars; *s != '\0'; s++)
13210           if (*s != '/')
13211             *t++ = *s;
13212         *t = '\0';
13213         i386_comment_chars = n;
13214       }
13215 #endif
13216       break;
13217
13218     case OPTION_MARCH:
13219       saved = xstrdup (arg);
13220       arch = saved;
13221       /* Allow -march=+nosse.  */
13222       if (*arch == '+')
13223         arch++;
13224       do
13225         {
13226           if (*arch == '.')
13227             as_fatal (_("invalid -march= option: `%s'"), arg);
13228           next = strchr (arch, '+');
13229           if (next)
13230             *next++ = '\0';
13231           for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
13232             {
13233               if (strcmp (arch, cpu_arch [j].name) == 0)
13234                 {
13235                   /* Processor.  */
13236                   if (! cpu_arch[j].flags.bitfield.cpui386)
13237                     continue;
13238
13239                   cpu_arch_name = cpu_arch[j].name;
13240                   cpu_sub_arch_name = NULL;
13241                   cpu_arch_flags = cpu_arch[j].flags;
13242                   cpu_arch_isa = cpu_arch[j].type;
13243                   cpu_arch_isa_flags = cpu_arch[j].flags;
13244                   if (!cpu_arch_tune_set)
13245                     {
13246                       cpu_arch_tune = cpu_arch_isa;
13247                       cpu_arch_tune_flags = cpu_arch_isa_flags;
13248                     }
13249                   break;
13250                 }
13251               else if (*cpu_arch [j].name == '.'
13252                        && strcmp (arch, cpu_arch [j].name + 1) == 0)
13253                 {
13254                   /* ISA extension.  */
13255                   i386_cpu_flags flags;
13256
13257                   flags = cpu_flags_or (cpu_arch_flags,
13258                                         cpu_arch[j].flags);
13259
13260                   if (!cpu_flags_equal (&flags, &cpu_arch_flags))
13261                     {
13262                       if (cpu_sub_arch_name)
13263                         {
13264                           char *name = cpu_sub_arch_name;
13265                           cpu_sub_arch_name = concat (name,
13266                                                       cpu_arch[j].name,
13267                                                       (const char *) NULL);
13268                           free (name);
13269                         }
13270                       else
13271                         cpu_sub_arch_name = xstrdup (cpu_arch[j].name);
13272                       cpu_arch_flags = flags;
13273                       cpu_arch_isa_flags = flags;
13274                     }
13275                   else
13276                     cpu_arch_isa_flags
13277                       = cpu_flags_or (cpu_arch_isa_flags,
13278                                       cpu_arch[j].flags);
13279                   break;
13280                 }
13281             }
13282
13283           if (j >= ARRAY_SIZE (cpu_arch))
13284             {
13285               /* Disable an ISA extension.  */
13286               for (j = 0; j < ARRAY_SIZE (cpu_noarch); j++)
13287                 if (strcmp (arch, cpu_noarch [j].name) == 0)
13288                   {
13289                     i386_cpu_flags flags;
13290
13291                     flags = cpu_flags_and_not (cpu_arch_flags,
13292                                                cpu_noarch[j].flags);
13293                     if (!cpu_flags_equal (&flags, &cpu_arch_flags))
13294                       {
13295                         if (cpu_sub_arch_name)
13296                           {
13297                             char *name = cpu_sub_arch_name;
13298                             cpu_sub_arch_name = concat (arch,
13299                                                         (const char *) NULL);
13300                             free (name);
13301                           }
13302                         else
13303                           cpu_sub_arch_name = xstrdup (arch);
13304                         cpu_arch_flags = flags;
13305                         cpu_arch_isa_flags = flags;
13306                       }
13307                     break;
13308                   }
13309
13310               if (j >= ARRAY_SIZE (cpu_noarch))
13311                 j = ARRAY_SIZE (cpu_arch);
13312             }
13313
13314           if (j >= ARRAY_SIZE (cpu_arch))
13315             as_fatal (_("invalid -march= option: `%s'"), arg);
13316
13317           arch = next;
13318         }
13319       while (next != NULL);
13320       free (saved);
13321       break;
13322
13323     case OPTION_MTUNE:
13324       if (*arg == '.')
13325         as_fatal (_("invalid -mtune= option: `%s'"), arg);
13326       for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
13327         {
13328           if (strcmp (arg, cpu_arch [j].name) == 0)
13329             {
13330               cpu_arch_tune_set = 1;
13331               cpu_arch_tune = cpu_arch [j].type;
13332               cpu_arch_tune_flags = cpu_arch[j].flags;
13333               break;
13334             }
13335         }
13336       if (j >= ARRAY_SIZE (cpu_arch))
13337         as_fatal (_("invalid -mtune= option: `%s'"), arg);
13338       break;
13339
13340     case OPTION_MMNEMONIC:
13341       if (strcasecmp (arg, "att") == 0)
13342         intel_mnemonic = 0;
13343       else if (strcasecmp (arg, "intel") == 0)
13344         intel_mnemonic = 1;
13345       else
13346         as_fatal (_("invalid -mmnemonic= option: `%s'"), arg);
13347       break;
13348
13349     case OPTION_MSYNTAX:
13350       if (strcasecmp (arg, "att") == 0)
13351         intel_syntax = 0;
13352       else if (strcasecmp (arg, "intel") == 0)
13353         intel_syntax = 1;
13354       else
13355         as_fatal (_("invalid -msyntax= option: `%s'"), arg);
13356       break;
13357
13358     case OPTION_MINDEX_REG:
13359       allow_index_reg = 1;
13360       break;
13361
13362     case OPTION_MNAKED_REG:
13363       allow_naked_reg = 1;
13364       break;
13365
13366     case OPTION_MSSE2AVX:
13367       sse2avx = 1;
13368       break;
13369
13370     case OPTION_MSSE_CHECK:
13371       if (strcasecmp (arg, "error") == 0)
13372         sse_check = check_error;
13373       else if (strcasecmp (arg, "warning") == 0)
13374         sse_check = check_warning;
13375       else if (strcasecmp (arg, "none") == 0)
13376         sse_check = check_none;
13377       else
13378         as_fatal (_("invalid -msse-check= option: `%s'"), arg);
13379       break;
13380
13381     case OPTION_MOPERAND_CHECK:
13382       if (strcasecmp (arg, "error") == 0)
13383         operand_check = check_error;
13384       else if (strcasecmp (arg, "warning") == 0)
13385         operand_check = check_warning;
13386       else if (strcasecmp (arg, "none") == 0)
13387         operand_check = check_none;
13388       else
13389         as_fatal (_("invalid -moperand-check= option: `%s'"), arg);
13390       break;
13391
13392     case OPTION_MAVXSCALAR:
13393       if (strcasecmp (arg, "128") == 0)
13394         avxscalar = vex128;
13395       else if (strcasecmp (arg, "256") == 0)
13396         avxscalar = vex256;
13397       else
13398         as_fatal (_("invalid -mavxscalar= option: `%s'"), arg);
13399       break;
13400
13401     case OPTION_MVEXWIG:
13402       if (strcmp (arg, "0") == 0)
13403         vexwig = vexw0;
13404       else if (strcmp (arg, "1") == 0)
13405         vexwig = vexw1;
13406       else
13407         as_fatal (_("invalid -mvexwig= option: `%s'"), arg);
13408       break;
13409
13410     case OPTION_MADD_BND_PREFIX:
13411       add_bnd_prefix = 1;
13412       break;
13413
13414     case OPTION_MEVEXLIG:
13415       if (strcmp (arg, "128") == 0)
13416         evexlig = evexl128;
13417       else if (strcmp (arg, "256") == 0)
13418         evexlig = evexl256;
13419       else  if (strcmp (arg, "512") == 0)
13420         evexlig = evexl512;
13421       else
13422         as_fatal (_("invalid -mevexlig= option: `%s'"), arg);
13423       break;
13424
13425     case OPTION_MEVEXRCIG:
13426       if (strcmp (arg, "rne") == 0)
13427         evexrcig = rne;
13428       else if (strcmp (arg, "rd") == 0)
13429         evexrcig = rd;
13430       else if (strcmp (arg, "ru") == 0)
13431         evexrcig = ru;
13432       else if (strcmp (arg, "rz") == 0)
13433         evexrcig = rz;
13434       else
13435         as_fatal (_("invalid -mevexrcig= option: `%s'"), arg);
13436       break;
13437
13438     case OPTION_MEVEXWIG:
13439       if (strcmp (arg, "0") == 0)
13440         evexwig = evexw0;
13441       else if (strcmp (arg, "1") == 0)
13442         evexwig = evexw1;
13443       else
13444         as_fatal (_("invalid -mevexwig= option: `%s'"), arg);
13445       break;
13446
13447 # if defined (TE_PE) || defined (TE_PEP)
13448     case OPTION_MBIG_OBJ:
13449       use_big_obj = 1;
13450       break;
13451 #endif
13452
13453     case OPTION_MOMIT_LOCK_PREFIX:
13454       if (strcasecmp (arg, "yes") == 0)
13455         omit_lock_prefix = 1;
13456       else if (strcasecmp (arg, "no") == 0)
13457         omit_lock_prefix = 0;
13458       else
13459         as_fatal (_("invalid -momit-lock-prefix= option: `%s'"), arg);
13460       break;
13461
13462     case OPTION_MFENCE_AS_LOCK_ADD:
13463       if (strcasecmp (arg, "yes") == 0)
13464         avoid_fence = 1;
13465       else if (strcasecmp (arg, "no") == 0)
13466         avoid_fence = 0;
13467       else
13468         as_fatal (_("invalid -mfence-as-lock-add= option: `%s'"), arg);
13469       break;
13470
13471     case OPTION_MLFENCE_AFTER_LOAD:
13472       if (strcasecmp (arg, "yes") == 0)
13473         lfence_after_load = 1;
13474       else if (strcasecmp (arg, "no") == 0)
13475         lfence_after_load = 0;
13476       else
13477         as_fatal (_("invalid -mlfence-after-load= option: `%s'"), arg);
13478       break;
13479
13480     case OPTION_MLFENCE_BEFORE_INDIRECT_BRANCH:
13481       if (strcasecmp (arg, "all") == 0)
13482         {
13483           lfence_before_indirect_branch = lfence_branch_all;
13484           if (lfence_before_ret == lfence_before_ret_none)
13485             lfence_before_ret = lfence_before_ret_shl;
13486         }
13487       else if (strcasecmp (arg, "memory") == 0)
13488         lfence_before_indirect_branch = lfence_branch_memory;
13489       else if (strcasecmp (arg, "register") == 0)
13490         lfence_before_indirect_branch = lfence_branch_register;
13491       else if (strcasecmp (arg, "none") == 0)
13492         lfence_before_indirect_branch = lfence_branch_none;
13493       else
13494         as_fatal (_("invalid -mlfence-before-indirect-branch= option: `%s'"),
13495                   arg);
13496       break;
13497
13498     case OPTION_MLFENCE_BEFORE_RET:
13499       if (strcasecmp (arg, "or") == 0)
13500         lfence_before_ret = lfence_before_ret_or;
13501       else if (strcasecmp (arg, "not") == 0)
13502         lfence_before_ret = lfence_before_ret_not;
13503       else if (strcasecmp (arg, "shl") == 0 || strcasecmp (arg, "yes") == 0)
13504         lfence_before_ret = lfence_before_ret_shl;
13505       else if (strcasecmp (arg, "none") == 0)
13506         lfence_before_ret = lfence_before_ret_none;
13507       else
13508         as_fatal (_("invalid -mlfence-before-ret= option: `%s'"),
13509                   arg);
13510       break;
13511
13512     case OPTION_MRELAX_RELOCATIONS:
13513       if (strcasecmp (arg, "yes") == 0)
13514         generate_relax_relocations = 1;
13515       else if (strcasecmp (arg, "no") == 0)
13516         generate_relax_relocations = 0;
13517       else
13518         as_fatal (_("invalid -mrelax-relocations= option: `%s'"), arg);
13519       break;
13520
13521     case OPTION_MALIGN_BRANCH_BOUNDARY:
13522       {
13523         char *end;
13524         long int align = strtoul (arg, &end, 0);
13525         if (*end == '\0')
13526           {
13527             if (align == 0)
13528               {
13529                 align_branch_power = 0;
13530                 break;
13531               }
13532             else if (align >= 16)
13533               {
13534                 int align_power;
13535                 for (align_power = 0;
13536                      (align & 1) == 0;
13537                      align >>= 1, align_power++)
13538                   continue;
13539                 /* Limit alignment power to 31.  */
13540                 if (align == 1 && align_power < 32)
13541                   {
13542                     align_branch_power = align_power;
13543                     break;
13544                   }
13545               }
13546           }
13547         as_fatal (_("invalid -malign-branch-boundary= value: %s"), arg);
13548       }
13549       break;
13550
13551     case OPTION_MALIGN_BRANCH_PREFIX_SIZE:
13552       {
13553         char *end;
13554         int align = strtoul (arg, &end, 0);
13555         /* Some processors only support 5 prefixes.  */
13556         if (*end == '\0' && align >= 0 && align < 6)
13557           {
13558             align_branch_prefix_size = align;
13559             break;
13560           }
13561         as_fatal (_("invalid -malign-branch-prefix-size= value: %s"),
13562                   arg);
13563       }
13564       break;
13565
13566     case OPTION_MALIGN_BRANCH:
13567       align_branch = 0;
13568       saved = xstrdup (arg);
13569       type = saved;
13570       do
13571         {
13572           next = strchr (type, '+');
13573           if (next)
13574             *next++ = '\0';
13575           if (strcasecmp (type, "jcc") == 0)
13576             align_branch |= align_branch_jcc_bit;
13577           else if (strcasecmp (type, "fused") == 0)
13578             align_branch |= align_branch_fused_bit;
13579           else if (strcasecmp (type, "jmp") == 0)
13580             align_branch |= align_branch_jmp_bit;
13581           else if (strcasecmp (type, "call") == 0)
13582             align_branch |= align_branch_call_bit;
13583           else if (strcasecmp (type, "ret") == 0)
13584             align_branch |= align_branch_ret_bit;
13585           else if (strcasecmp (type, "indirect") == 0)
13586             align_branch |= align_branch_indirect_bit;
13587           else
13588             as_fatal (_("invalid -malign-branch= option: `%s'"), arg);
13589           type = next;
13590         }
13591       while (next != NULL);
13592       free (saved);
13593       break;
13594
13595     case OPTION_MBRANCHES_WITH_32B_BOUNDARIES:
13596       align_branch_power = 5;
13597       align_branch_prefix_size = 5;
13598       align_branch = (align_branch_jcc_bit
13599                       | align_branch_fused_bit
13600                       | align_branch_jmp_bit);
13601       break;
13602
13603     case OPTION_MAMD64:
13604       isa64 = amd64;
13605       break;
13606
13607     case OPTION_MINTEL64:
13608       isa64 = intel64;
13609       break;
13610
13611     case 'O':
13612       if (arg == NULL)
13613         {
13614           optimize = 1;
13615           /* Turn off -Os.  */
13616           optimize_for_space = 0;
13617         }
13618       else if (*arg == 's')
13619         {
13620           optimize_for_space = 1;
13621           /* Turn on all encoding optimizations.  */
13622           optimize = INT_MAX;
13623         }
13624       else
13625         {
13626           optimize = atoi (arg);
13627           /* Turn off -Os.  */
13628           optimize_for_space = 0;
13629         }
13630       break;
13631
13632     default:
13633       return 0;
13634     }
13635   return 1;
13636 }
13637
13638 #define MESSAGE_TEMPLATE \
13639 "                                                                                "
13640
13641 static char *
13642 output_message (FILE *stream, char *p, char *message, char *start,
13643                 int *left_p, const char *name, int len)
13644 {
13645   int size = sizeof (MESSAGE_TEMPLATE);
13646   int left = *left_p;
13647
13648   /* Reserve 2 spaces for ", " or ",\0" */
13649   left -= len + 2;
13650
13651   /* Check if there is any room.  */
13652   if (left >= 0)
13653     {
13654       if (p != start)
13655         {
13656           *p++ = ',';
13657           *p++ = ' ';
13658         }
13659       p = mempcpy (p, name, len);
13660     }
13661   else
13662     {
13663       /* Output the current message now and start a new one.  */
13664       *p++ = ',';
13665       *p = '\0';
13666       fprintf (stream, "%s\n", message);
13667       p = start;
13668       left = size - (start - message) - len - 2;
13669
13670       gas_assert (left >= 0);
13671
13672       p = mempcpy (p, name, len);
13673     }
13674
13675   *left_p = left;
13676   return p;
13677 }
13678
13679 static void
13680 show_arch (FILE *stream, int ext, int check)
13681 {
13682   static char message[] = MESSAGE_TEMPLATE;
13683   char *start = message + 27;
13684   char *p;
13685   int size = sizeof (MESSAGE_TEMPLATE);
13686   int left;
13687   const char *name;
13688   int len;
13689   unsigned int j;
13690
13691   p = start;
13692   left = size - (start - message);
13693   for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
13694     {
13695       /* Should it be skipped?  */
13696       if (cpu_arch [j].skip)
13697         continue;
13698
13699       name = cpu_arch [j].name;
13700       len = cpu_arch [j].len;
13701       if (*name == '.')
13702         {
13703           /* It is an extension.  Skip if we aren't asked to show it.  */
13704           if (ext)
13705             {
13706               name++;
13707               len--;
13708             }
13709           else
13710             continue;
13711         }
13712       else if (ext)
13713         {
13714           /* It is an processor.  Skip if we show only extension.  */
13715           continue;
13716         }
13717       else if (check && ! cpu_arch[j].flags.bitfield.cpui386)
13718         {
13719           /* It is an impossible processor - skip.  */
13720           continue;
13721         }
13722
13723       p = output_message (stream, p, message, start, &left, name, len);
13724     }
13725
13726   /* Display disabled extensions.  */
13727   if (ext)
13728     for (j = 0; j < ARRAY_SIZE (cpu_noarch); j++)
13729       {
13730         name = cpu_noarch [j].name;
13731         len = cpu_noarch [j].len;
13732         p = output_message (stream, p, message, start, &left, name,
13733                             len);
13734       }
13735
13736   *p = '\0';
13737   fprintf (stream, "%s\n", message);
13738 }
13739
13740 void
13741 md_show_usage (FILE *stream)
13742 {
13743 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13744   fprintf (stream, _("\
13745   -Qy, -Qn                ignored\n\
13746   -V                      print assembler version number\n\
13747   -k                      ignored\n"));
13748 #endif
13749   fprintf (stream, _("\
13750   -n                      Do not optimize code alignment\n\
13751   -q                      quieten some warnings\n"));
13752 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13753   fprintf (stream, _("\
13754   -s                      ignored\n"));
13755 #endif
13756 #if defined BFD64 && (defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
13757                       || defined (TE_PE) || defined (TE_PEP))
13758   fprintf (stream, _("\
13759   --32/--64/--x32         generate 32bit/64bit/x32 code\n"));
13760 #endif
13761 #ifdef SVR4_COMMENT_CHARS
13762   fprintf (stream, _("\
13763   --divide                do not treat `/' as a comment character\n"));
13764 #else
13765   fprintf (stream, _("\
13766   --divide                ignored\n"));
13767 #endif
13768   fprintf (stream, _("\
13769   -march=CPU[,+EXTENSION...]\n\
13770                           generate code for CPU and EXTENSION, CPU is one of:\n"));
13771   show_arch (stream, 0, 1);
13772   fprintf (stream, _("\
13773                           EXTENSION is combination of:\n"));
13774   show_arch (stream, 1, 0);
13775   fprintf (stream, _("\
13776   -mtune=CPU              optimize for CPU, CPU is one of:\n"));
13777   show_arch (stream, 0, 0);
13778   fprintf (stream, _("\
13779   -msse2avx               encode SSE instructions with VEX prefix\n"));
13780   fprintf (stream, _("\
13781   -msse-check=[none|error|warning] (default: warning)\n\
13782                           check SSE instructions\n"));
13783   fprintf (stream, _("\
13784   -moperand-check=[none|error|warning] (default: warning)\n\
13785                           check operand combinations for validity\n"));
13786   fprintf (stream, _("\
13787   -mavxscalar=[128|256] (default: 128)\n\
13788                           encode scalar AVX instructions with specific vector\n\
13789                            length\n"));
13790   fprintf (stream, _("\
13791   -mvexwig=[0|1] (default: 0)\n\
13792                           encode VEX instructions with specific VEX.W value\n\
13793                            for VEX.W bit ignored instructions\n"));
13794   fprintf (stream, _("\
13795   -mevexlig=[128|256|512] (default: 128)\n\
13796                           encode scalar EVEX instructions with specific vector\n\
13797                            length\n"));
13798   fprintf (stream, _("\
13799   -mevexwig=[0|1] (default: 0)\n\
13800                           encode EVEX instructions with specific EVEX.W value\n\
13801                            for EVEX.W bit ignored instructions\n"));
13802   fprintf (stream, _("\
13803   -mevexrcig=[rne|rd|ru|rz] (default: rne)\n\
13804                           encode EVEX instructions with specific EVEX.RC value\n\
13805                            for SAE-only ignored instructions\n"));
13806   fprintf (stream, _("\
13807   -mmnemonic=[att|intel] "));
13808   if (SYSV386_COMPAT)
13809     fprintf (stream, _("(default: att)\n"));
13810   else
13811     fprintf (stream, _("(default: intel)\n"));
13812   fprintf (stream, _("\
13813                           use AT&T/Intel mnemonic\n"));
13814   fprintf (stream, _("\
13815   -msyntax=[att|intel] (default: att)\n\
13816                           use AT&T/Intel syntax\n"));
13817   fprintf (stream, _("\
13818   -mindex-reg             support pseudo index registers\n"));
13819   fprintf (stream, _("\
13820   -mnaked-reg             don't require `%%' prefix for registers\n"));
13821   fprintf (stream, _("\
13822   -madd-bnd-prefix        add BND prefix for all valid branches\n"));
13823 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13824   fprintf (stream, _("\
13825   -mshared                disable branch optimization for shared code\n"));
13826   fprintf (stream, _("\
13827   -mx86-used-note=[no|yes] "));
13828   if (DEFAULT_X86_USED_NOTE)
13829     fprintf (stream, _("(default: yes)\n"));
13830   else
13831     fprintf (stream, _("(default: no)\n"));
13832   fprintf (stream, _("\
13833                           generate x86 used ISA and feature properties\n"));
13834 #endif
13835 #if defined (TE_PE) || defined (TE_PEP)
13836   fprintf (stream, _("\
13837   -mbig-obj               generate big object files\n"));
13838 #endif
13839   fprintf (stream, _("\
13840   -momit-lock-prefix=[no|yes] (default: no)\n\
13841                           strip all lock prefixes\n"));
13842   fprintf (stream, _("\
13843   -mfence-as-lock-add=[no|yes] (default: no)\n\
13844                           encode lfence, mfence and sfence as\n\
13845                            lock addl $0x0, (%%{re}sp)\n"));
13846   fprintf (stream, _("\
13847   -mrelax-relocations=[no|yes] "));
13848   if (DEFAULT_GENERATE_X86_RELAX_RELOCATIONS)
13849     fprintf (stream, _("(default: yes)\n"));
13850   else
13851     fprintf (stream, _("(default: no)\n"));
13852   fprintf (stream, _("\
13853                           generate relax relocations\n"));
13854   fprintf (stream, _("\
13855   -malign-branch-boundary=NUM (default: 0)\n\
13856                           align branches within NUM byte boundary\n"));
13857   fprintf (stream, _("\
13858   -malign-branch=TYPE[+TYPE...] (default: jcc+fused+jmp)\n\
13859                           TYPE is combination of jcc, fused, jmp, call, ret,\n\
13860                            indirect\n\
13861                           specify types of branches to align\n"));
13862   fprintf (stream, _("\
13863   -malign-branch-prefix-size=NUM (default: 5)\n\
13864                           align branches with NUM prefixes per instruction\n"));
13865   fprintf (stream, _("\
13866   -mbranches-within-32B-boundaries\n\
13867                           align branches within 32 byte boundary\n"));
13868   fprintf (stream, _("\
13869   -mlfence-after-load=[no|yes] (default: no)\n\
13870                           generate lfence after load\n"));
13871   fprintf (stream, _("\
13872   -mlfence-before-indirect-branch=[none|all|register|memory] (default: none)\n\
13873                           generate lfence before indirect near branch\n"));
13874   fprintf (stream, _("\
13875   -mlfence-before-ret=[none|or|not|shl|yes] (default: none)\n\
13876                           generate lfence before ret\n"));
13877   fprintf (stream, _("\
13878   -mamd64                 accept only AMD64 ISA [default]\n"));
13879   fprintf (stream, _("\
13880   -mintel64               accept only Intel64 ISA\n"));
13881 }
13882
13883 #if ((defined (OBJ_MAYBE_COFF) && defined (OBJ_MAYBE_AOUT)) \
13884      || defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
13885      || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
13886
13887 /* Pick the target format to use.  */
13888
13889 const char *
13890 i386_target_format (void)
13891 {
13892   if (startswith (default_arch, "x86_64"))
13893     {
13894       update_code_flag (CODE_64BIT, 1);
13895       if (default_arch[6] == '\0')
13896         x86_elf_abi = X86_64_ABI;
13897       else
13898         x86_elf_abi = X86_64_X32_ABI;
13899     }
13900   else if (!strcmp (default_arch, "i386"))
13901     update_code_flag (CODE_32BIT, 1);
13902   else if (!strcmp (default_arch, "iamcu"))
13903     {
13904       update_code_flag (CODE_32BIT, 1);
13905       if (cpu_arch_isa == PROCESSOR_UNKNOWN)
13906         {
13907           static const i386_cpu_flags iamcu_flags = CPU_IAMCU_FLAGS;
13908           cpu_arch_name = "iamcu";
13909           cpu_sub_arch_name = NULL;
13910           cpu_arch_flags = iamcu_flags;
13911           cpu_arch_isa = PROCESSOR_IAMCU;
13912           cpu_arch_isa_flags = iamcu_flags;
13913           if (!cpu_arch_tune_set)
13914             {
13915               cpu_arch_tune = cpu_arch_isa;
13916               cpu_arch_tune_flags = cpu_arch_isa_flags;
13917             }
13918         }
13919       else if (cpu_arch_isa != PROCESSOR_IAMCU)
13920         as_fatal (_("Intel MCU doesn't support `%s' architecture"),
13921                   cpu_arch_name);
13922     }
13923   else
13924     as_fatal (_("unknown architecture"));
13925
13926   if (cpu_flags_all_zero (&cpu_arch_isa_flags))
13927     cpu_arch_isa_flags = cpu_arch[flag_code == CODE_64BIT].flags;
13928   if (cpu_flags_all_zero (&cpu_arch_tune_flags))
13929     cpu_arch_tune_flags = cpu_arch[flag_code == CODE_64BIT].flags;
13930
13931   switch (OUTPUT_FLAVOR)
13932     {
13933 #if defined (OBJ_MAYBE_AOUT) || defined (OBJ_AOUT)
13934     case bfd_target_aout_flavour:
13935       return AOUT_TARGET_FORMAT;
13936 #endif
13937 #if defined (OBJ_MAYBE_COFF) || defined (OBJ_COFF)
13938 # if defined (TE_PE) || defined (TE_PEP)
13939     case bfd_target_coff_flavour:
13940       if (flag_code == CODE_64BIT)
13941         {
13942           object_64bit = 1;
13943           return use_big_obj ? "pe-bigobj-x86-64" : "pe-x86-64";
13944         }
13945       return use_big_obj ? "pe-bigobj-i386" : "pe-i386";
13946 # elif defined (TE_GO32)
13947     case bfd_target_coff_flavour:
13948       return "coff-go32";
13949 # else
13950     case bfd_target_coff_flavour:
13951       return "coff-i386";
13952 # endif
13953 #endif
13954 #if defined (OBJ_MAYBE_ELF) || defined (OBJ_ELF)
13955     case bfd_target_elf_flavour:
13956       {
13957         const char *format;
13958
13959         switch (x86_elf_abi)
13960           {
13961           default:
13962             format = ELF_TARGET_FORMAT;
13963 #ifndef TE_SOLARIS
13964             tls_get_addr = "___tls_get_addr";
13965 #endif
13966             break;
13967           case X86_64_ABI:
13968             use_rela_relocations = 1;
13969             object_64bit = 1;
13970 #ifndef TE_SOLARIS
13971             tls_get_addr = "__tls_get_addr";
13972 #endif
13973             format = ELF_TARGET_FORMAT64;
13974             break;
13975           case X86_64_X32_ABI:
13976             use_rela_relocations = 1;
13977             object_64bit = 1;
13978 #ifndef TE_SOLARIS
13979             tls_get_addr = "__tls_get_addr";
13980 #endif
13981             disallow_64bit_reloc = 1;
13982             format = ELF_TARGET_FORMAT32;
13983             break;
13984           }
13985         if (cpu_arch_isa == PROCESSOR_L1OM)
13986           {
13987             if (x86_elf_abi != X86_64_ABI)
13988               as_fatal (_("Intel L1OM is 64bit only"));
13989             return ELF_TARGET_L1OM_FORMAT;
13990           }
13991         else if (cpu_arch_isa == PROCESSOR_K1OM)
13992           {
13993             if (x86_elf_abi != X86_64_ABI)
13994               as_fatal (_("Intel K1OM is 64bit only"));
13995             return ELF_TARGET_K1OM_FORMAT;
13996           }
13997         else if (cpu_arch_isa == PROCESSOR_IAMCU)
13998           {
13999             if (x86_elf_abi != I386_ABI)
14000               as_fatal (_("Intel MCU is 32bit only"));
14001             return ELF_TARGET_IAMCU_FORMAT;
14002           }
14003         else
14004           return format;
14005       }
14006 #endif
14007 #if defined (OBJ_MACH_O)
14008     case bfd_target_mach_o_flavour:
14009       if (flag_code == CODE_64BIT)
14010         {
14011           use_rela_relocations = 1;
14012           object_64bit = 1;
14013           return "mach-o-x86-64";
14014         }
14015       else
14016         return "mach-o-i386";
14017 #endif
14018     default:
14019       abort ();
14020       return NULL;
14021     }
14022 }
14023
14024 #endif /* OBJ_MAYBE_ more than one  */
14025 \f
14026 symbolS *
14027 md_undefined_symbol (char *name)
14028 {
14029   if (name[0] == GLOBAL_OFFSET_TABLE_NAME[0]
14030       && name[1] == GLOBAL_OFFSET_TABLE_NAME[1]
14031       && name[2] == GLOBAL_OFFSET_TABLE_NAME[2]
14032       && strcmp (name, GLOBAL_OFFSET_TABLE_NAME) == 0)
14033     {
14034       if (!GOT_symbol)
14035         {
14036           if (symbol_find (name))
14037             as_bad (_("GOT already in symbol table"));
14038           GOT_symbol = symbol_new (name, undefined_section,
14039                                    &zero_address_frag, 0);
14040         };
14041       return GOT_symbol;
14042     }
14043   return 0;
14044 }
14045
14046 /* Round up a section size to the appropriate boundary.  */
14047
14048 valueT
14049 md_section_align (segT segment ATTRIBUTE_UNUSED, valueT size)
14050 {
14051 #if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
14052   if (OUTPUT_FLAVOR == bfd_target_aout_flavour)
14053     {
14054       /* For a.out, force the section size to be aligned.  If we don't do
14055          this, BFD will align it for us, but it will not write out the
14056          final bytes of the section.  This may be a bug in BFD, but it is
14057          easier to fix it here since that is how the other a.out targets
14058          work.  */
14059       int align;
14060
14061       align = bfd_section_alignment (segment);
14062       size = ((size + (1 << align) - 1) & (-((valueT) 1 << align)));
14063     }
14064 #endif
14065
14066   return size;
14067 }
14068
14069 /* On the i386, PC-relative offsets are relative to the start of the
14070    next instruction.  That is, the address of the offset, plus its
14071    size, since the offset is always the last part of the insn.  */
14072
14073 long
14074 md_pcrel_from (fixS *fixP)
14075 {
14076   return fixP->fx_size + fixP->fx_where + fixP->fx_frag->fr_address;
14077 }
14078
14079 #ifndef I386COFF
14080
14081 static void
14082 s_bss (int ignore ATTRIBUTE_UNUSED)
14083 {
14084   int temp;
14085
14086 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
14087   if (IS_ELF)
14088     obj_elf_section_change_hook ();
14089 #endif
14090   temp = get_absolute_expression ();
14091   subseg_set (bss_section, (subsegT) temp);
14092   demand_empty_rest_of_line ();
14093 }
14094
14095 #endif
14096
14097 /* Remember constant directive.  */
14098
14099 void
14100 i386_cons_align (int ignore ATTRIBUTE_UNUSED)
14101 {
14102   if (last_insn.kind != last_insn_directive
14103       && (bfd_section_flags (now_seg) & SEC_CODE))
14104     {
14105       last_insn.seg = now_seg;
14106       last_insn.kind = last_insn_directive;
14107       last_insn.name = "constant directive";
14108       last_insn.file = as_where (&last_insn.line);
14109       if (lfence_before_ret != lfence_before_ret_none)
14110         {
14111           if (lfence_before_indirect_branch != lfence_branch_none)
14112             as_warn (_("constant directive skips -mlfence-before-ret "
14113                        "and -mlfence-before-indirect-branch"));
14114           else
14115             as_warn (_("constant directive skips -mlfence-before-ret"));
14116         }
14117       else if (lfence_before_indirect_branch != lfence_branch_none)
14118         as_warn (_("constant directive skips -mlfence-before-indirect-branch"));
14119     }
14120 }
14121
14122 int
14123 i386_validate_fix (fixS *fixp)
14124 {
14125 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
14126   if (fixp->fx_r_type == BFD_RELOC_SIZE32
14127       || fixp->fx_r_type == BFD_RELOC_SIZE64)
14128     return IS_ELF && fixp->fx_addsy
14129            && (!S_IS_DEFINED (fixp->fx_addsy)
14130                || S_IS_EXTERNAL (fixp->fx_addsy));
14131 #endif
14132
14133   if (fixp->fx_subsy)
14134     {
14135       if (fixp->fx_subsy == GOT_symbol)
14136         {
14137           if (fixp->fx_r_type == BFD_RELOC_32_PCREL)
14138             {
14139               if (!object_64bit)
14140                 abort ();
14141 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
14142               if (fixp->fx_tcbit2)
14143                 fixp->fx_r_type = (fixp->fx_tcbit
14144                                    ? BFD_RELOC_X86_64_REX_GOTPCRELX
14145                                    : BFD_RELOC_X86_64_GOTPCRELX);
14146               else
14147 #endif
14148                 fixp->fx_r_type = BFD_RELOC_X86_64_GOTPCREL;
14149             }
14150           else
14151             {
14152               if (!object_64bit)
14153                 fixp->fx_r_type = BFD_RELOC_386_GOTOFF;
14154               else
14155                 fixp->fx_r_type = BFD_RELOC_X86_64_GOTOFF64;
14156             }
14157           fixp->fx_subsy = 0;
14158         }
14159     }
14160 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
14161   else
14162     {
14163       /* NB: Commit 292676c1 resolved PLT32 reloc aganst local symbol
14164          to section.  Since PLT32 relocation must be against symbols,
14165          turn such PLT32 relocation into PC32 relocation.  */
14166       if (fixp->fx_addsy
14167           && (fixp->fx_r_type == BFD_RELOC_386_PLT32
14168               || fixp->fx_r_type == BFD_RELOC_X86_64_PLT32)
14169           && symbol_section_p (fixp->fx_addsy))
14170         fixp->fx_r_type = BFD_RELOC_32_PCREL;
14171       if (!object_64bit)
14172         {
14173           if (fixp->fx_r_type == BFD_RELOC_386_GOT32
14174               && fixp->fx_tcbit2)
14175             fixp->fx_r_type = BFD_RELOC_386_GOT32X;
14176         }
14177     }
14178 #endif
14179
14180   return 1;
14181 }
14182
14183 arelent *
14184 tc_gen_reloc (asection *section ATTRIBUTE_UNUSED, fixS *fixp)
14185 {
14186   arelent *rel;
14187   bfd_reloc_code_real_type code;
14188
14189   switch (fixp->fx_r_type)
14190     {
14191 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
14192       symbolS *sym;
14193
14194     case BFD_RELOC_SIZE32:
14195     case BFD_RELOC_SIZE64:
14196       if (fixp->fx_addsy
14197           && !bfd_is_abs_section (S_GET_SEGMENT (fixp->fx_addsy))
14198           && (!fixp->fx_subsy
14199               || bfd_is_abs_section (S_GET_SEGMENT (fixp->fx_subsy))))
14200         sym = fixp->fx_addsy;
14201       else if (fixp->fx_subsy
14202                && !bfd_is_abs_section (S_GET_SEGMENT (fixp->fx_subsy))
14203                && (!fixp->fx_addsy
14204                    || bfd_is_abs_section (S_GET_SEGMENT (fixp->fx_addsy))))
14205         sym = fixp->fx_subsy;
14206       else
14207         sym = NULL;
14208       if (IS_ELF && sym && S_IS_DEFINED (sym) && !S_IS_EXTERNAL (sym))
14209         {
14210           /* Resolve size relocation against local symbol to size of
14211              the symbol plus addend.  */
14212           valueT value = S_GET_SIZE (sym);
14213
14214           if (symbol_get_bfdsym (sym)->flags & BSF_SECTION_SYM)
14215             value = bfd_section_size (S_GET_SEGMENT (sym));
14216           if (sym == fixp->fx_subsy)
14217             {
14218               value = -value;
14219               if (fixp->fx_addsy)
14220                 value += S_GET_VALUE (fixp->fx_addsy);
14221             }
14222           else if (fixp->fx_subsy)
14223             value -= S_GET_VALUE (fixp->fx_subsy);
14224           value += fixp->fx_offset;
14225           if (fixp->fx_r_type == BFD_RELOC_SIZE32
14226               && object_64bit
14227               && !fits_in_unsigned_long (value))
14228             as_bad_where (fixp->fx_file, fixp->fx_line,
14229                           _("symbol size computation overflow"));
14230           fixp->fx_addsy = NULL;
14231           fixp->fx_subsy = NULL;
14232           md_apply_fix (fixp, (valueT *) &value, NULL);
14233           return NULL;
14234         }
14235       if (!fixp->fx_addsy || fixp->fx_subsy)
14236         {
14237           as_bad_where (fixp->fx_file, fixp->fx_line,
14238                         "unsupported expression involving @size");
14239           return NULL;
14240         }
14241 #endif
14242       /* Fall through.  */
14243
14244     case BFD_RELOC_X86_64_PLT32:
14245     case BFD_RELOC_X86_64_GOT32:
14246     case BFD_RELOC_X86_64_GOTPCREL:
14247     case BFD_RELOC_X86_64_GOTPCRELX:
14248     case BFD_RELOC_X86_64_REX_GOTPCRELX:
14249     case BFD_RELOC_386_PLT32:
14250     case BFD_RELOC_386_GOT32:
14251     case BFD_RELOC_386_GOT32X:
14252     case BFD_RELOC_386_GOTOFF:
14253     case BFD_RELOC_386_GOTPC:
14254     case BFD_RELOC_386_TLS_GD:
14255     case BFD_RELOC_386_TLS_LDM:
14256     case BFD_RELOC_386_TLS_LDO_32:
14257     case BFD_RELOC_386_TLS_IE_32:
14258     case BFD_RELOC_386_TLS_IE:
14259     case BFD_RELOC_386_TLS_GOTIE:
14260     case BFD_RELOC_386_TLS_LE_32:
14261     case BFD_RELOC_386_TLS_LE:
14262     case BFD_RELOC_386_TLS_GOTDESC:
14263     case BFD_RELOC_386_TLS_DESC_CALL:
14264     case BFD_RELOC_X86_64_TLSGD:
14265     case BFD_RELOC_X86_64_TLSLD:
14266     case BFD_RELOC_X86_64_DTPOFF32:
14267     case BFD_RELOC_X86_64_DTPOFF64:
14268     case BFD_RELOC_X86_64_GOTTPOFF:
14269     case BFD_RELOC_X86_64_TPOFF32:
14270     case BFD_RELOC_X86_64_TPOFF64:
14271     case BFD_RELOC_X86_64_GOTOFF64:
14272     case BFD_RELOC_X86_64_GOTPC32:
14273     case BFD_RELOC_X86_64_GOT64:
14274     case BFD_RELOC_X86_64_GOTPCREL64:
14275     case BFD_RELOC_X86_64_GOTPC64:
14276     case BFD_RELOC_X86_64_GOTPLT64:
14277     case BFD_RELOC_X86_64_PLTOFF64:
14278     case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
14279     case BFD_RELOC_X86_64_TLSDESC_CALL:
14280     case BFD_RELOC_RVA:
14281     case BFD_RELOC_VTABLE_ENTRY:
14282     case BFD_RELOC_VTABLE_INHERIT:
14283 #ifdef TE_PE
14284     case BFD_RELOC_32_SECREL:
14285 #endif
14286       code = fixp->fx_r_type;
14287       break;
14288     case BFD_RELOC_X86_64_32S:
14289       if (!fixp->fx_pcrel)
14290         {
14291           /* Don't turn BFD_RELOC_X86_64_32S into BFD_RELOC_32.  */
14292           code = fixp->fx_r_type;
14293           break;
14294         }
14295       /* Fall through.  */
14296     default:
14297       if (fixp->fx_pcrel)
14298         {
14299           switch (fixp->fx_size)
14300             {
14301             default:
14302               as_bad_where (fixp->fx_file, fixp->fx_line,
14303                             _("can not do %d byte pc-relative relocation"),
14304                             fixp->fx_size);
14305               code = BFD_RELOC_32_PCREL;
14306               break;
14307             case 1: code = BFD_RELOC_8_PCREL;  break;
14308             case 2: code = BFD_RELOC_16_PCREL; break;
14309             case 4: code = BFD_RELOC_32_PCREL; break;
14310 #ifdef BFD64
14311             case 8: code = BFD_RELOC_64_PCREL; break;
14312 #endif
14313             }
14314         }
14315       else
14316         {
14317           switch (fixp->fx_size)
14318             {
14319             default:
14320               as_bad_where (fixp->fx_file, fixp->fx_line,
14321                             _("can not do %d byte relocation"),
14322                             fixp->fx_size);
14323               code = BFD_RELOC_32;
14324               break;
14325             case 1: code = BFD_RELOC_8;  break;
14326             case 2: code = BFD_RELOC_16; break;
14327             case 4: code = BFD_RELOC_32; break;
14328 #ifdef BFD64
14329             case 8: code = BFD_RELOC_64; break;
14330 #endif
14331             }
14332         }
14333       break;
14334     }
14335
14336   if ((code == BFD_RELOC_32
14337        || code == BFD_RELOC_32_PCREL
14338        || code == BFD_RELOC_X86_64_32S)
14339       && GOT_symbol
14340       && fixp->fx_addsy == GOT_symbol)
14341     {
14342       if (!object_64bit)
14343         code = BFD_RELOC_386_GOTPC;
14344       else
14345         code = BFD_RELOC_X86_64_GOTPC32;
14346     }
14347   if ((code == BFD_RELOC_64 || code == BFD_RELOC_64_PCREL)
14348       && GOT_symbol
14349       && fixp->fx_addsy == GOT_symbol)
14350     {
14351       code = BFD_RELOC_X86_64_GOTPC64;
14352     }
14353
14354   rel = XNEW (arelent);
14355   rel->sym_ptr_ptr = XNEW (asymbol *);
14356   *rel->sym_ptr_ptr = symbol_get_bfdsym (fixp->fx_addsy);
14357
14358   rel->address = fixp->fx_frag->fr_address + fixp->fx_where;
14359
14360   if (!use_rela_relocations)
14361     {
14362       /* HACK: Since i386 ELF uses Rel instead of Rela, encode the
14363          vtable entry to be used in the relocation's section offset.  */
14364       if (fixp->fx_r_type == BFD_RELOC_VTABLE_ENTRY)
14365         rel->address = fixp->fx_offset;
14366 #if defined (OBJ_COFF) && defined (TE_PE)
14367       else if (fixp->fx_addsy && S_IS_WEAK (fixp->fx_addsy))
14368         rel->addend = fixp->fx_addnumber - (S_GET_VALUE (fixp->fx_addsy) * 2);
14369       else
14370 #endif
14371       rel->addend = 0;
14372     }
14373   /* Use the rela in 64bit mode.  */
14374   else
14375     {
14376       if (disallow_64bit_reloc)
14377         switch (code)
14378           {
14379           case BFD_RELOC_X86_64_DTPOFF64:
14380           case BFD_RELOC_X86_64_TPOFF64:
14381           case BFD_RELOC_64_PCREL:
14382           case BFD_RELOC_X86_64_GOTOFF64:
14383           case BFD_RELOC_X86_64_GOT64:
14384           case BFD_RELOC_X86_64_GOTPCREL64:
14385           case BFD_RELOC_X86_64_GOTPC64:
14386           case BFD_RELOC_X86_64_GOTPLT64:
14387           case BFD_RELOC_X86_64_PLTOFF64:
14388             as_bad_where (fixp->fx_file, fixp->fx_line,
14389                           _("cannot represent relocation type %s in x32 mode"),
14390                           bfd_get_reloc_code_name (code));
14391             break;
14392           default:
14393             break;
14394           }
14395
14396       if (!fixp->fx_pcrel)
14397         rel->addend = fixp->fx_offset;
14398       else
14399         switch (code)
14400           {
14401           case BFD_RELOC_X86_64_PLT32:
14402           case BFD_RELOC_X86_64_GOT32:
14403           case BFD_RELOC_X86_64_GOTPCREL:
14404           case BFD_RELOC_X86_64_GOTPCRELX:
14405           case BFD_RELOC_X86_64_REX_GOTPCRELX:
14406           case BFD_RELOC_X86_64_TLSGD:
14407           case BFD_RELOC_X86_64_TLSLD:
14408           case BFD_RELOC_X86_64_GOTTPOFF:
14409           case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
14410           case BFD_RELOC_X86_64_TLSDESC_CALL:
14411             rel->addend = fixp->fx_offset - fixp->fx_size;
14412             break;
14413           default:
14414             rel->addend = (section->vma
14415                            - fixp->fx_size
14416                            + fixp->fx_addnumber
14417                            + md_pcrel_from (fixp));
14418             break;
14419           }
14420     }
14421
14422   rel->howto = bfd_reloc_type_lookup (stdoutput, code);
14423   if (rel->howto == NULL)
14424     {
14425       as_bad_where (fixp->fx_file, fixp->fx_line,
14426                     _("cannot represent relocation type %s"),
14427                     bfd_get_reloc_code_name (code));
14428       /* Set howto to a garbage value so that we can keep going.  */
14429       rel->howto = bfd_reloc_type_lookup (stdoutput, BFD_RELOC_32);
14430       gas_assert (rel->howto != NULL);
14431     }
14432
14433   return rel;
14434 }
14435
14436 #include "tc-i386-intel.c"
14437
14438 void
14439 tc_x86_parse_to_dw2regnum (expressionS *exp)
14440 {
14441   int saved_naked_reg;
14442   char saved_register_dot;
14443
14444   saved_naked_reg = allow_naked_reg;
14445   allow_naked_reg = 1;
14446   saved_register_dot = register_chars['.'];
14447   register_chars['.'] = '.';
14448   allow_pseudo_reg = 1;
14449   expression_and_evaluate (exp);
14450   allow_pseudo_reg = 0;
14451   register_chars['.'] = saved_register_dot;
14452   allow_naked_reg = saved_naked_reg;
14453
14454   if (exp->X_op == O_register && exp->X_add_number >= 0)
14455     {
14456       if ((addressT) exp->X_add_number < i386_regtab_size)
14457         {
14458           exp->X_op = O_constant;
14459           exp->X_add_number = i386_regtab[exp->X_add_number]
14460                               .dw2_regnum[flag_code >> 1];
14461         }
14462       else
14463         exp->X_op = O_illegal;
14464     }
14465 }
14466
14467 void
14468 tc_x86_frame_initial_instructions (void)
14469 {
14470   static unsigned int sp_regno[2];
14471
14472   if (!sp_regno[flag_code >> 1])
14473     {
14474       char *saved_input = input_line_pointer;
14475       char sp[][4] = {"esp", "rsp"};
14476       expressionS exp;
14477
14478       input_line_pointer = sp[flag_code >> 1];
14479       tc_x86_parse_to_dw2regnum (&exp);
14480       gas_assert (exp.X_op == O_constant);
14481       sp_regno[flag_code >> 1] = exp.X_add_number;
14482       input_line_pointer = saved_input;
14483     }
14484
14485   cfi_add_CFA_def_cfa (sp_regno[flag_code >> 1], -x86_cie_data_alignment);
14486   cfi_add_CFA_offset (x86_dwarf2_return_column, x86_cie_data_alignment);
14487 }
14488
14489 int
14490 x86_dwarf2_addr_size (void)
14491 {
14492 #if defined (OBJ_MAYBE_ELF) || defined (OBJ_ELF)
14493   if (x86_elf_abi == X86_64_X32_ABI)
14494     return 4;
14495 #endif
14496   return bfd_arch_bits_per_address (stdoutput) / 8;
14497 }
14498
14499 int
14500 i386_elf_section_type (const char *str, size_t len)
14501 {
14502   if (flag_code == CODE_64BIT
14503       && len == sizeof ("unwind") - 1
14504       && startswith (str, "unwind"))
14505     return SHT_X86_64_UNWIND;
14506
14507   return -1;
14508 }
14509
14510 #ifdef TE_SOLARIS
14511 void
14512 i386_solaris_fix_up_eh_frame (segT sec)
14513 {
14514   if (flag_code == CODE_64BIT)
14515     elf_section_type (sec) = SHT_X86_64_UNWIND;
14516 }
14517 #endif
14518
14519 #ifdef TE_PE
14520 void
14521 tc_pe_dwarf2_emit_offset (symbolS *symbol, unsigned int size)
14522 {
14523   expressionS exp;
14524
14525   exp.X_op = O_secrel;
14526   exp.X_add_symbol = symbol;
14527   exp.X_add_number = 0;
14528   emit_expr (&exp, size);
14529 }
14530 #endif
14531
14532 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
14533 /* For ELF on x86-64, add support for SHF_X86_64_LARGE.  */
14534
14535 bfd_vma
14536 x86_64_section_letter (int letter, const char **ptr_msg)
14537 {
14538   if (flag_code == CODE_64BIT)
14539     {
14540       if (letter == 'l')
14541         return SHF_X86_64_LARGE;
14542
14543       *ptr_msg = _("bad .section directive: want a,l,w,x,M,S,G,T in string");
14544     }
14545   else
14546     *ptr_msg = _("bad .section directive: want a,w,x,M,S,G,T in string");
14547   return -1;
14548 }
14549
14550 bfd_vma
14551 x86_64_section_word (char *str, size_t len)
14552 {
14553   if (len == 5 && flag_code == CODE_64BIT && startswith (str, "large"))
14554     return SHF_X86_64_LARGE;
14555
14556   return -1;
14557 }
14558
14559 static void
14560 handle_large_common (int small ATTRIBUTE_UNUSED)
14561 {
14562   if (flag_code != CODE_64BIT)
14563     {
14564       s_comm_internal (0, elf_common_parse);
14565       as_warn (_(".largecomm supported only in 64bit mode, producing .comm"));
14566     }
14567   else
14568     {
14569       static segT lbss_section;
14570       asection *saved_com_section_ptr = elf_com_section_ptr;
14571       asection *saved_bss_section = bss_section;
14572
14573       if (lbss_section == NULL)
14574         {
14575           flagword applicable;
14576           segT seg = now_seg;
14577           subsegT subseg = now_subseg;
14578
14579           /* The .lbss section is for local .largecomm symbols.  */
14580           lbss_section = subseg_new (".lbss", 0);
14581           applicable = bfd_applicable_section_flags (stdoutput);
14582           bfd_set_section_flags (lbss_section, applicable & SEC_ALLOC);
14583           seg_info (lbss_section)->bss = 1;
14584
14585           subseg_set (seg, subseg);
14586         }
14587
14588       elf_com_section_ptr = &_bfd_elf_large_com_section;
14589       bss_section = lbss_section;
14590
14591       s_comm_internal (0, elf_common_parse);
14592
14593       elf_com_section_ptr = saved_com_section_ptr;
14594       bss_section = saved_bss_section;
14595     }
14596 }
14597 #endif /* OBJ_ELF || OBJ_MAYBE_ELF */