gas/config/tc-i386.c

   1 /* tc-i386.c -- Assemble code for the Intel 80386
   2    Copyright (C) 1989-2021 Free Software Foundation, Inc.
   3
   4    This file is part of GAS, the GNU Assembler.
   5
   6    GAS is free software; you can redistribute it and/or modify
   7    it under the terms of the GNU General Public License as published by
   8    the Free Software Foundation; either version 3, or (at your option)
   9    any later version.
  10
  11    GAS is distributed in the hope that it will be useful,
  12    but WITHOUT ANY WARRANTY; without even the implied warranty of
  13    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
  14    GNU General Public License for more details.
  15
  16    You should have received a copy of the GNU General Public License
  17    along with GAS; see the file COPYING.  If not, write to the Free
  18    Software Foundation, 51 Franklin Street - Fifth Floor, Boston, MA
  19    02110-1301, USA.  */
  20
  21 /* Intel 80386 machine specific gas.
  22    Written by Eliot Dresselhaus (eliot@mgm.mit.edu).
  23    x86_64 support by Jan Hubicka (jh@suse.cz)
  24    VIA PadLock support by Michal Ludvig (mludvig@suse.cz)
  25    Bugs & suggestions are completely welcome.  This is free software.
  26    Please help us make it better.  */
  27
  28 #include "as.h"
  29 #include "safe-ctype.h"
  30 #include "subsegs.h"
  31 #include "dwarf2dbg.h"
  32 #include "dw2gencfi.h"
  33 #include "elf/x86-64.h"
  34 #include "opcodes/i386-init.h"
  35
  36 #ifdef HAVE_LIMITS_H
  37 #include <limits.h>
  38 #else
  39 #ifdef HAVE_SYS_PARAM_H
  40 #include <sys/param.h>
  41 #endif
  42 #ifndef INT_MAX
  43 #define INT_MAX (int) (((unsigned) (-1)) >> 1)
  44 #endif
  45 #endif
  46
  47 #ifndef INFER_ADDR_PREFIX
  48 #define INFER_ADDR_PREFIX 1
  49 #endif
  50
  51 #ifndef DEFAULT_ARCH
  52 #define DEFAULT_ARCH "i386"
  53 #endif
  54
  55 #ifndef INLINE
  56 #if __GNUC__ >= 2
  57 #define INLINE __inline__
  58 #else
  59 #define INLINE
  60 #endif
  61 #endif
  62
  63 /* Prefixes will be emitted in the order defined below.
  64    WAIT_PREFIX must be the first prefix since FWAIT is really is an
  65    instruction, and so must come before any prefixes.
  66    The preferred prefix order is SEG_PREFIX, ADDR_PREFIX, DATA_PREFIX,
  67    REP_PREFIX/HLE_PREFIX, LOCK_PREFIX.  */
  68 #define WAIT_PREFIX     0
  69 #define SEG_PREFIX      1
  70 #define ADDR_PREFIX     2
  71 #define DATA_PREFIX     3
  72 #define REP_PREFIX      4
  73 #define HLE_PREFIX      REP_PREFIX
  74 #define BND_PREFIX      REP_PREFIX
  75 #define LOCK_PREFIX     5
  76 #define REX_PREFIX      6       /* must come last.  */
  77 #define MAX_PREFIXES    7       /* max prefixes per opcode */
  78
  79 /* we define the syntax here (modulo base,index,scale syntax) */
  80 #define REGISTER_PREFIX '%'
  81 #define IMMEDIATE_PREFIX '$'
  82 #define ABSOLUTE_PREFIX '*'
  83
  84 /* these are the instruction mnemonic suffixes in AT&T syntax or
  85    memory operand size in Intel syntax.  */
  86 #define WORD_MNEM_SUFFIX  'w'
  87 #define BYTE_MNEM_SUFFIX  'b'
  88 #define SHORT_MNEM_SUFFIX 's'
  89 #define LONG_MNEM_SUFFIX  'l'
  90 #define QWORD_MNEM_SUFFIX  'q'
  91 /* Intel Syntax.  Use a non-ascii letter since since it never appears
  92    in instructions.  */
  93 #define LONG_DOUBLE_MNEM_SUFFIX '\1'
  94
  95 #define END_OF_INSN '\0'
  96
  97 /* This matches the C -> StaticRounding alias in the opcode table.  */
  98 #define commutative staticrounding
  99
 100 /*
 101   'templates' is for grouping together 'template' structures for opcodes
 102   of the same name.  This is only used for storing the insns in the grand
 103   ole hash table of insns.
 104   The templates themselves start at START and range up to (but not including)
 105   END.
 106   */
 107 typedef struct
 108 {
 109   const insn_template *start;
 110   const insn_template *end;
 111 }
 112 templates;
 113
 114 /* 386 operand encoding bytes:  see 386 book for details of this.  */
 115 typedef struct
 116 {
 117   unsigned int regmem;  /* codes register or memory operand */
 118   unsigned int reg;     /* codes register operand (or extended opcode) */
 119   unsigned int mode;    /* how to interpret regmem & reg */
 120 }
 121 modrm_byte;
 122
 123 /* x86-64 extension prefix.  */
 124 typedef int rex_byte;
 125
 126 /* 386 opcode byte to code indirect addressing.  */
 127 typedef struct
 128 {
 129   unsigned base;
 130   unsigned index;
 131   unsigned scale;
 132 }
 133 sib_byte;
 134
 135 /* x86 arch names, types and features */
 136 typedef struct
 137 {
 138   const char *name;             /* arch name */
 139   unsigned int len;             /* arch string length */
 140   enum processor_type type;     /* arch type */
 141   i386_cpu_flags flags;         /* cpu feature flags */
 142   unsigned int skip;            /* show_arch should skip this. */
 143 }
 144 arch_entry;
 145
 146 /* Used to turn off indicated flags.  */
 147 typedef struct
 148 {
 149   const char *name;             /* arch name */
 150   unsigned int len;             /* arch string length */
 151   i386_cpu_flags flags;         /* cpu feature flags */
 152 }
 153 noarch_entry;
 154
 155 static void update_code_flag (int, int);
 156 static void set_code_flag (int);
 157 static void set_16bit_gcc_code_flag (int);
 158 static void set_intel_syntax (int);
 159 static void set_intel_mnemonic (int);
 160 static void set_allow_index_reg (int);
 161 static void set_check (int);
 162 static void set_cpu_arch (int);
 163 #ifdef TE_PE
 164 static void pe_directive_secrel (int);
 165 #endif
 166 static void signed_cons (int);
 167 static char *output_invalid (int c);
 168 static int i386_finalize_immediate (segT, expressionS *, i386_operand_type,
 169                                     const char *);
 170 static int i386_finalize_displacement (segT, expressionS *, i386_operand_type,
 171                                        const char *);
 172 static int i386_att_operand (char *);
 173 static int i386_intel_operand (char *, int);
 174 static int i386_intel_simplify (expressionS *);
 175 static int i386_intel_parse_name (const char *, expressionS *);
 176 static const reg_entry *parse_register (char *, char **);
 177 static char *parse_insn (char *, char *);
 178 static char *parse_operands (char *, const char *);
 179 static void swap_operands (void);
 180 static void swap_2_operands (int, int);
 181 static enum flag_code i386_addressing_mode (void);
 182 static void optimize_imm (void);
 183 static void optimize_disp (void);
 184 static const insn_template *match_template (char);
 185 static int check_string (void);
 186 static int process_suffix (void);
 187 static int check_byte_reg (void);
 188 static int check_long_reg (void);
 189 static int check_qword_reg (void);
 190 static int check_word_reg (void);
 191 static int finalize_imm (void);
 192 static int process_operands (void);
 193 static const seg_entry *build_modrm_byte (void);
 194 static void output_insn (void);
 195 static void output_imm (fragS *, offsetT);
 196 static void output_disp (fragS *, offsetT);
 197 #ifndef I386COFF
 198 static void s_bss (int);
 199 #endif
 200 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
 201 static void handle_large_common (int small ATTRIBUTE_UNUSED);
 202
 203 /* GNU_PROPERTY_X86_ISA_1_USED.  */
 204 static unsigned int x86_isa_1_used;
 205 /* GNU_PROPERTY_X86_FEATURE_2_USED.  */
 206 static unsigned int x86_feature_2_used;
 207 /* Generate x86 used ISA and feature properties.  */
 208 static unsigned int x86_used_note = DEFAULT_X86_USED_NOTE;
 209 #endif
 210
 211 static const char *default_arch = DEFAULT_ARCH;
 212
 213 /* parse_register() returns this when a register alias cannot be used.  */
 214 static const reg_entry bad_reg = { "<bad>", OPERAND_TYPE_NONE, 0, 0,
 215                                    { Dw2Inval, Dw2Inval } };
 216
 217 /* This struct describes rounding control and SAE in the instruction.  */
 218 struct RC_Operation
 219 {
 220   enum rc_type
 221     {
 222       rne = 0,
 223       rd,
 224       ru,
 225       rz,
 226       saeonly
 227     } type;
 228   int operand;
 229 };
 230
 231 static struct RC_Operation rc_op;
 232
 233 /* The struct describes masking, applied to OPERAND in the instruction.
 234    MASK is a pointer to the corresponding mask register.  ZEROING tells
 235    whether merging or zeroing mask is used.  */
 236 struct Mask_Operation
 237 {
 238   const reg_entry *mask;
 239   unsigned int zeroing;
 240   /* The operand where this operation is associated.  */
 241   int operand;
 242 };
 243
 244 static struct Mask_Operation mask_op;
 245
 246 /* The struct describes broadcasting, applied to OPERAND.  FACTOR is
 247    broadcast factor.  */
 248 struct Broadcast_Operation
 249 {
 250   /* Type of broadcast: {1to2}, {1to4}, {1to8}, or {1to16}.  */
 251   int type;
 252
 253   /* Index of broadcasted operand.  */
 254   int operand;
 255
 256   /* Number of bytes to broadcast.  */
 257   int bytes;
 258 };
 259
 260 static struct Broadcast_Operation broadcast_op;
 261
 262 /* VEX prefix.  */
 263 typedef struct
 264 {
 265   /* VEX prefix is either 2 byte or 3 byte.  EVEX is 4 byte.  */
 266   unsigned char bytes[4];
 267   unsigned int length;
 268   /* Destination or source register specifier.  */
 269   const reg_entry *register_specifier;
 270 } vex_prefix;
 271
 272 /* 'md_assemble ()' gathers together information and puts it into a
 273    i386_insn.  */
 274
 275 union i386_op
 276   {
 277     expressionS *disps;
 278     expressionS *imms;
 279     const reg_entry *regs;
 280   };
 281
 282 enum i386_error
 283   {
 284     operand_size_mismatch,
 285     operand_type_mismatch,
 286     register_type_mismatch,
 287     number_of_operands_mismatch,
 288     invalid_instruction_suffix,
 289     bad_imm4,
 290     unsupported_with_intel_mnemonic,
 291     unsupported_syntax,
 292     unsupported,
 293     invalid_sib_address,
 294     invalid_vsib_address,
 295     invalid_vector_register_set,
 296     invalid_tmm_register_set,
 297     unsupported_vector_index_register,
 298     unsupported_broadcast,
 299     broadcast_needed,
 300     unsupported_masking,
 301     mask_not_on_destination,
 302     no_default_mask,
 303     unsupported_rc_sae,
 304     rc_sae_operand_not_last_imm,
 305     invalid_register_operand,
 306   };
 307
 308 struct _i386_insn
 309   {
 310     /* TM holds the template for the insn were currently assembling.  */
 311     insn_template tm;
 312
 313     /* SUFFIX holds the instruction size suffix for byte, word, dword
 314        or qword, if given.  */
 315     char suffix;
 316
 317     /* OPCODE_LENGTH holds the number of base opcode bytes.  */
 318     unsigned char opcode_length;
 319
 320     /* OPERANDS gives the number of given operands.  */
 321     unsigned int operands;
 322
 323     /* REG_OPERANDS, DISP_OPERANDS, MEM_OPERANDS, IMM_OPERANDS give the number
 324        of given register, displacement, memory operands and immediate
 325        operands.  */
 326     unsigned int reg_operands, disp_operands, mem_operands, imm_operands;
 327
 328     /* TYPES [i] is the type (see above #defines) which tells us how to
 329        use OP[i] for the corresponding operand.  */
 330     i386_operand_type types[MAX_OPERANDS];
 331
 332     /* Displacement expression, immediate expression, or register for each
 333        operand.  */
 334     union i386_op op[MAX_OPERANDS];
 335
 336     /* Flags for operands.  */
 337     unsigned int flags[MAX_OPERANDS];
 338 #define Operand_PCrel 1
 339 #define Operand_Mem   2
 340
 341     /* Relocation type for operand */
 342     enum bfd_reloc_code_real reloc[MAX_OPERANDS];
 343
 344     /* BASE_REG, INDEX_REG, and LOG2_SCALE_FACTOR are used to encode
 345        the base index byte below.  */
 346     const reg_entry *base_reg;
 347     const reg_entry *index_reg;
 348     unsigned int log2_scale_factor;
 349
 350     /* SEG gives the seg_entries of this insn.  They are zero unless
 351        explicit segment overrides are given.  */
 352     const seg_entry *seg[2];
 353
 354     /* Copied first memory operand string, for re-checking.  */
 355     char *memop1_string;
 356
 357     /* PREFIX holds all the given prefix opcodes (usually null).
 358        PREFIXES is the number of prefix opcodes.  */
 359     unsigned int prefixes;
 360     unsigned char prefix[MAX_PREFIXES];
 361
 362     /* Register is in low 3 bits of opcode.  */
 363     bfd_boolean short_form;
 364
 365     /* The operand to a branch insn indicates an absolute branch.  */
 366     bfd_boolean jumpabsolute;
 367
 368     /* Extended states.  */
 369     enum
 370       {
 371         /* Use MMX state.  */
 372         xstate_mmx = 1 << 0,
 373         /* Use XMM state.  */
 374         xstate_xmm = 1 << 1,
 375         /* Use YMM state.  */
 376         xstate_ymm = 1 << 2 | xstate_xmm,
 377         /* Use ZMM state.  */
 378         xstate_zmm = 1 << 3 | xstate_ymm,
 379         /* Use TMM state.  */
 380         xstate_tmm = 1 << 4,
 381         /* Use MASK state.  */
 382         xstate_mask = 1 << 5
 383       } xstate;
 384
 385     /* Has GOTPC or TLS relocation.  */
 386     bfd_boolean has_gotpc_tls_reloc;
 387
 388     /* RM and SIB are the modrm byte and the sib byte where the
 389        addressing modes of this insn are encoded.  */
 390     modrm_byte rm;
 391     rex_byte rex;
 392     rex_byte vrex;
 393     sib_byte sib;
 394     vex_prefix vex;
 395
 396     /* Masking attributes.  */
 397     struct Mask_Operation *mask;
 398
 399     /* Rounding control and SAE attributes.  */
 400     struct RC_Operation *rounding;
 401
 402     /* Broadcasting attributes.  */
 403     struct Broadcast_Operation *broadcast;
 404
 405     /* Compressed disp8*N attribute.  */
 406     unsigned int memshift;
 407
 408     /* Prefer load or store in encoding.  */
 409     enum
 410       {
 411         dir_encoding_default = 0,
 412         dir_encoding_load,
 413         dir_encoding_store,
 414         dir_encoding_swap
 415       } dir_encoding;
 416
 417     /* Prefer 8bit, 16bit, 32bit displacement in encoding.  */
 418     enum
 419       {
 420         disp_encoding_default = 0,
 421         disp_encoding_8bit,
 422         disp_encoding_16bit,
 423         disp_encoding_32bit
 424       } disp_encoding;
 425
 426     /* Prefer the REX byte in encoding.  */
 427     bfd_boolean rex_encoding;
 428
 429     /* Disable instruction size optimization.  */
 430     bfd_boolean no_optimize;
 431
 432     /* How to encode vector instructions.  */
 433     enum
 434       {
 435         vex_encoding_default = 0,
 436         vex_encoding_vex,
 437         vex_encoding_vex3,
 438         vex_encoding_evex,
 439         vex_encoding_error
 440       } vec_encoding;
 441
 442     /* REP prefix.  */
 443     const char *rep_prefix;
 444
 445     /* HLE prefix.  */
 446     const char *hle_prefix;
 447
 448     /* Have BND prefix.  */
 449     const char *bnd_prefix;
 450
 451     /* Have NOTRACK prefix.  */
 452     const char *notrack_prefix;
 453
 454     /* Error message.  */
 455     enum i386_error error;
 456   };
 457
 458 typedef struct _i386_insn i386_insn;
 459
 460 /* Link RC type with corresponding string, that'll be looked for in
 461    asm.  */
 462 struct RC_name
 463 {
 464   enum rc_type type;
 465   const char *name;
 466   unsigned int len;
 467 };
 468
 469 static const struct RC_name RC_NamesTable[] =
 470 {
 471   {  rne, STRING_COMMA_LEN ("rn-sae") },
 472   {  rd,  STRING_COMMA_LEN ("rd-sae") },
 473   {  ru,  STRING_COMMA_LEN ("ru-sae") },
 474   {  rz,  STRING_COMMA_LEN ("rz-sae") },
 475   {  saeonly,  STRING_COMMA_LEN ("sae") },
 476 };
 477
 478 /* List of chars besides those in app.c:symbol_chars that can start an
 479    operand.  Used to prevent the scrubber eating vital white-space.  */
 480 const char extra_symbol_chars[] = "*%-([{}"
 481 #ifdef LEX_AT
 482         "@"
 483 #endif
 484 #ifdef LEX_QM
 485         "?"
 486 #endif
 487         ;
 488
 489 #if ((defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF))     \
 490      && !defined (TE_GNU)                               \
 491      && !defined (TE_LINUX)                             \
 492      && !defined (TE_FreeBSD)                           \
 493      && !defined (TE_DragonFly)                         \
 494      && !defined (TE_NetBSD))
 495 /* This array holds the chars that always start a comment.  If the
 496    pre-processor is disabled, these aren't very useful.  The option
 497    --divide will remove '/' from this list.  */
 498 const char *i386_comment_chars = "#/";
 499 #define SVR4_COMMENT_CHARS 1
 500 #define PREFIX_SEPARATOR '\\'
 501
 502 #else
 503 const char *i386_comment_chars = "#";
 504 #define PREFIX_SEPARATOR '/'
 505 #endif
 506
 507 /* This array holds the chars that only start a comment at the beginning of
 508    a line.  If the line seems to have the form '# 123 filename'
 509    .line and .file directives will appear in the pre-processed output.
 510    Note that input_file.c hand checks for '#' at the beginning of the
 511    first line of the input file.  This is because the compiler outputs
 512    #NO_APP at the beginning of its output.
 513    Also note that comments started like this one will always work if
 514    '/' isn't otherwise defined.  */
 515 const char line_comment_chars[] = "#/";
 516
 517 const char line_separator_chars[] = ";";
 518
 519 /* Chars that can be used to separate mant from exp in floating point
 520    nums.  */
 521 const char EXP_CHARS[] = "eE";
 522
 523 /* Chars that mean this number is a floating point constant
 524    As in 0f12.456
 525    or    0d1.2345e12.  */
 526 const char FLT_CHARS[] = "fFdDxX";
 527
 528 /* Tables for lexical analysis.  */
 529 static char mnemonic_chars[256];
 530 static char register_chars[256];
 531 static char operand_chars[256];
 532 static char identifier_chars[256];
 533 static char digit_chars[256];
 534
 535 /* Lexical macros.  */
 536 #define is_mnemonic_char(x) (mnemonic_chars[(unsigned char) x])
 537 #define is_operand_char(x) (operand_chars[(unsigned char) x])
 538 #define is_register_char(x) (register_chars[(unsigned char) x])
 539 #define is_space_char(x) ((x) == ' ')
 540 #define is_identifier_char(x) (identifier_chars[(unsigned char) x])
 541 #define is_digit_char(x) (digit_chars[(unsigned char) x])
 542
 543 /* All non-digit non-letter characters that may occur in an operand.  */
 544 static char operand_special_chars[] = "%$-+(,)*._~/<>|&^!:[@]";
 545
 546 /* md_assemble() always leaves the strings it's passed unaltered.  To
 547    effect this we maintain a stack of saved characters that we've smashed
 548    with '\0's (indicating end of strings for various sub-fields of the
 549    assembler instruction).  */
 550 static char save_stack[32];
 551 static char *save_stack_p;
 552 #define END_STRING_AND_SAVE(s) \
 553         do { *save_stack_p++ = *(s); *(s) = '\0'; } while (0)
 554 #define RESTORE_END_STRING(s) \
 555         do { *(s) = *--save_stack_p; } while (0)
 556
 557 /* The instruction we're assembling.  */
 558 static i386_insn i;
 559
 560 /* Possible templates for current insn.  */
 561 static const templates *current_templates;
 562
 563 /* Per instruction expressionS buffers: max displacements & immediates.  */
 564 static expressionS disp_expressions[MAX_MEMORY_OPERANDS];
 565 static expressionS im_expressions[MAX_IMMEDIATE_OPERANDS];
 566
 567 /* Current operand we are working on.  */
 568 static int this_operand = -1;
 569
 570 /* We support four different modes.  FLAG_CODE variable is used to distinguish
 571    these.  */
 572
 573 enum flag_code {
 574         CODE_32BIT,
 575         CODE_16BIT,
 576         CODE_64BIT };
 577
 578 static enum flag_code flag_code;
 579 static unsigned int object_64bit;
 580 static unsigned int disallow_64bit_reloc;
 581 static int use_rela_relocations = 0;
 582 /* __tls_get_addr/___tls_get_addr symbol for TLS.  */
 583 static const char *tls_get_addr;
 584
 585 #if ((defined (OBJ_MAYBE_COFF) && defined (OBJ_MAYBE_AOUT)) \
 586      || defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
 587      || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
 588
 589 /* The ELF ABI to use.  */
 590 enum x86_elf_abi
 591 {
 592   I386_ABI,
 593   X86_64_ABI,
 594   X86_64_X32_ABI
 595 };
 596
 597 static enum x86_elf_abi x86_elf_abi = I386_ABI;
 598 #endif
 599
 600 #if defined (TE_PE) || defined (TE_PEP)
 601 /* Use big object file format.  */
 602 static int use_big_obj = 0;
 603 #endif
 604
 605 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
 606 /* 1 if generating code for a shared library.  */
 607 static int shared = 0;
 608 #endif
 609
 610 /* 1 for intel syntax,
 611    0 if att syntax.  */
 612 static int intel_syntax = 0;
 613
 614 static enum x86_64_isa
 615 {
 616   amd64 = 1,    /* AMD64 ISA.  */
 617   intel64       /* Intel64 ISA.  */
 618 } isa64;
 619
 620 /* 1 for intel mnemonic,
 621    0 if att mnemonic.  */
 622 static int intel_mnemonic = !SYSV386_COMPAT;
 623
 624 /* 1 if pseudo registers are permitted.  */
 625 static int allow_pseudo_reg = 0;
 626
 627 /* 1 if register prefix % not required.  */
 628 static int allow_naked_reg = 0;
 629
 630 /* 1 if the assembler should add BND prefix for all control-transferring
 631    instructions supporting it, even if this prefix wasn't specified
 632    explicitly.  */
 633 static int add_bnd_prefix = 0;
 634
 635 /* 1 if pseudo index register, eiz/riz, is allowed .  */
 636 static int allow_index_reg = 0;
 637
 638 /* 1 if the assembler should ignore LOCK prefix, even if it was
 639    specified explicitly.  */
 640 static int omit_lock_prefix = 0;
 641
 642 /* 1 if the assembler should encode lfence, mfence, and sfence as
 643    "lock addl $0, (%{re}sp)".  */
 644 static int avoid_fence = 0;
 645
 646 /* 1 if lfence should be inserted after every load.  */
 647 static int lfence_after_load = 0;
 648
 649 /* Non-zero if lfence should be inserted before indirect branch.  */
 650 static enum lfence_before_indirect_branch_kind
 651   {
 652     lfence_branch_none = 0,
 653     lfence_branch_register,
 654     lfence_branch_memory,
 655     lfence_branch_all
 656   }
 657 lfence_before_indirect_branch;
 658
 659 /* Non-zero if lfence should be inserted before ret.  */
 660 static enum lfence_before_ret_kind
 661   {
 662     lfence_before_ret_none = 0,
 663     lfence_before_ret_not,
 664     lfence_before_ret_or,
 665     lfence_before_ret_shl
 666   }
 667 lfence_before_ret;
 668
 669 /* Types of previous instruction is .byte or prefix.  */
 670 static struct
 671   {
 672     segT seg;
 673     const char *file;
 674     const char *name;
 675     unsigned int line;
 676     enum last_insn_kind
 677       {
 678         last_insn_other = 0,
 679         last_insn_directive,
 680         last_insn_prefix
 681       } kind;
 682   } last_insn;
 683
 684 /* 1 if the assembler should generate relax relocations.  */
 685
 686 static int generate_relax_relocations
 687   = DEFAULT_GENERATE_X86_RELAX_RELOCATIONS;
 688
 689 static enum check_kind
 690   {
 691     check_none = 0,
 692     check_warning,
 693     check_error
 694   }
 695 sse_check, operand_check = check_warning;
 696
 697 /* Non-zero if branches should be aligned within power of 2 boundary.  */
 698 static int align_branch_power = 0;
 699
 700 /* Types of branches to align.  */
 701 enum align_branch_kind
 702   {
 703     align_branch_none = 0,
 704     align_branch_jcc = 1,
 705     align_branch_fused = 2,
 706     align_branch_jmp = 3,
 707     align_branch_call = 4,
 708     align_branch_indirect = 5,
 709     align_branch_ret = 6
 710   };
 711
 712 /* Type bits of branches to align.  */
 713 enum align_branch_bit
 714   {
 715     align_branch_jcc_bit = 1 << align_branch_jcc,
 716     align_branch_fused_bit = 1 << align_branch_fused,
 717     align_branch_jmp_bit = 1 << align_branch_jmp,
 718     align_branch_call_bit = 1 << align_branch_call,
 719     align_branch_indirect_bit = 1 << align_branch_indirect,
 720     align_branch_ret_bit = 1 << align_branch_ret
 721   };
 722
 723 static unsigned int align_branch = (align_branch_jcc_bit
 724                                     | align_branch_fused_bit
 725                                     | align_branch_jmp_bit);
 726
 727 /* Types of condition jump used by macro-fusion.  */
 728 enum mf_jcc_kind
 729   {
 730     mf_jcc_jo = 0,  /* base opcode 0x70  */
 731     mf_jcc_jc,      /* base opcode 0x72  */
 732     mf_jcc_je,      /* base opcode 0x74  */
 733     mf_jcc_jna,     /* base opcode 0x76  */
 734     mf_jcc_js,      /* base opcode 0x78  */
 735     mf_jcc_jp,      /* base opcode 0x7a  */
 736     mf_jcc_jl,      /* base opcode 0x7c  */
 737     mf_jcc_jle,     /* base opcode 0x7e  */
 738   };
 739
 740 /* Types of compare flag-modifying insntructions used by macro-fusion.  */
 741 enum mf_cmp_kind
 742   {
 743     mf_cmp_test_and,  /* test/cmp */
 744     mf_cmp_alu_cmp,  /* add/sub/cmp */
 745     mf_cmp_incdec  /* inc/dec */
 746   };
 747
 748 /* The maximum padding size for fused jcc.  CMP like instruction can
 749    be 9 bytes and jcc can be 6 bytes.  Leave room just in case for
 750    prefixes.   */
 751 #define MAX_FUSED_JCC_PADDING_SIZE 20
 752
 753 /* The maximum number of prefixes added for an instruction.  */
 754 static unsigned int align_branch_prefix_size = 5;
 755
 756 /* Optimization:
 757    1. Clear the REX_W bit with register operand if possible.
 758    2. Above plus use 128bit vector instruction to clear the full vector
 759       register.
 760  */
 761 static int optimize = 0;
 762
 763 /* Optimization:
 764    1. Clear the REX_W bit with register operand if possible.
 765    2. Above plus use 128bit vector instruction to clear the full vector
 766       register.
 767    3. Above plus optimize "test{q,l,w} $imm8,%r{64,32,16}" to
 768       "testb $imm7,%r8".
 769  */
 770 static int optimize_for_space = 0;
 771
 772 /* Register prefix used for error message.  */
 773 static const char *register_prefix = "%";
 774
 775 /* Used in 16 bit gcc mode to add an l suffix to call, ret, enter,
 776    leave, push, and pop instructions so that gcc has the same stack
 777    frame as in 32 bit mode.  */
 778 static char stackop_size = '\0';
 779
 780 /* Non-zero to optimize code alignment.  */
 781 int optimize_align_code = 1;
 782
 783 /* Non-zero to quieten some warnings.  */
 784 static int quiet_warnings = 0;
 785
 786 /* CPU name.  */
 787 static const char *cpu_arch_name = NULL;
 788 static char *cpu_sub_arch_name = NULL;
 789
 790 /* CPU feature flags.  */
 791 static i386_cpu_flags cpu_arch_flags = CPU_UNKNOWN_FLAGS;
 792
 793 /* If we have selected a cpu we are generating instructions for.  */
 794 static int cpu_arch_tune_set = 0;
 795
 796 /* Cpu we are generating instructions for.  */
 797 enum processor_type cpu_arch_tune = PROCESSOR_UNKNOWN;
 798
 799 /* CPU feature flags of cpu we are generating instructions for.  */
 800 static i386_cpu_flags cpu_arch_tune_flags;
 801
 802 /* CPU instruction set architecture used.  */
 803 enum processor_type cpu_arch_isa = PROCESSOR_UNKNOWN;
 804
 805 /* CPU feature flags of instruction set architecture used.  */
 806 i386_cpu_flags cpu_arch_isa_flags;
 807
 808 /* If set, conditional jumps are not automatically promoted to handle
 809    larger than a byte offset.  */
 810 static unsigned int no_cond_jump_promotion = 0;
 811
 812 /* Encode SSE instructions with VEX prefix.  */
 813 static unsigned int sse2avx;
 814
 815 /* Encode scalar AVX instructions with specific vector length.  */
 816 static enum
 817   {
 818     vex128 = 0,
 819     vex256
 820   } avxscalar;
 821
 822 /* Encode VEX WIG instructions with specific vex.w.  */
 823 static enum
 824   {
 825     vexw0 = 0,
 826     vexw1
 827   } vexwig;
 828
 829 /* Encode scalar EVEX LIG instructions with specific vector length.  */
 830 static enum
 831   {
 832     evexl128 = 0,
 833     evexl256,
 834     evexl512
 835   } evexlig;
 836
 837 /* Encode EVEX WIG instructions with specific evex.w.  */
 838 static enum
 839   {
 840     evexw0 = 0,
 841     evexw1
 842   } evexwig;
 843
 844 /* Value to encode in EVEX RC bits, for SAE-only instructions.  */
 845 static enum rc_type evexrcig = rne;
 846
 847 /* Pre-defined "_GLOBAL_OFFSET_TABLE_".  */
 848 static symbolS *GOT_symbol;
 849
 850 /* The dwarf2 return column, adjusted for 32 or 64 bit.  */
 851 unsigned int x86_dwarf2_return_column;
 852
 853 /* The dwarf2 data alignment, adjusted for 32 or 64 bit.  */
 854 int x86_cie_data_alignment;
 855
 856 /* Interface to relax_segment.
 857    There are 3 major relax states for 386 jump insns because the
 858    different types of jumps add different sizes to frags when we're
 859    figuring out what sort of jump to choose to reach a given label.
 860
 861    BRANCH_PADDING, BRANCH_PREFIX and FUSED_JCC_PADDING are used to align
 862    branches which are handled by md_estimate_size_before_relax() and
 863    i386_generic_table_relax_frag().  */
 864
 865 /* Types.  */
 866 #define UNCOND_JUMP 0
 867 #define COND_JUMP 1
 868 #define COND_JUMP86 2
 869 #define BRANCH_PADDING 3
 870 #define BRANCH_PREFIX 4
 871 #define FUSED_JCC_PADDING 5
 872
 873 /* Sizes.  */
 874 #define CODE16  1
 875 #define SMALL   0
 876 #define SMALL16 (SMALL | CODE16)
 877 #define BIG     2
 878 #define BIG16   (BIG | CODE16)
 879
 880 #ifndef INLINE
 881 #ifdef __GNUC__
 882 #define INLINE __inline__
 883 #else
 884 #define INLINE
 885 #endif
 886 #endif
 887
 888 #define ENCODE_RELAX_STATE(type, size) \
 889   ((relax_substateT) (((type) << 2) | (size)))
 890 #define TYPE_FROM_RELAX_STATE(s) \
 891   ((s) >> 2)
 892 #define DISP_SIZE_FROM_RELAX_STATE(s) \
 893     ((((s) & 3) == BIG ? 4 : (((s) & 3) == BIG16 ? 2 : 1)))
 894
 895 /* This table is used by relax_frag to promote short jumps to long
 896    ones where necessary.  SMALL (short) jumps may be promoted to BIG
 897    (32 bit long) ones, and SMALL16 jumps to BIG16 (16 bit long).  We
 898    don't allow a short jump in a 32 bit code segment to be promoted to
 899    a 16 bit offset jump because it's slower (requires data size
 900    prefix), and doesn't work, unless the destination is in the bottom
 901    64k of the code segment (The top 16 bits of eip are zeroed).  */
 902
 903 const relax_typeS md_relax_table[] =
 904 {
 905   /* The fields are:
 906      1) most positive reach of this state,
 907      2) most negative reach of this state,
 908      3) how many bytes this mode will have in the variable part of the frag
 909      4) which index into the table to try if we can't fit into this one.  */
 910
 911   /* UNCOND_JUMP states.  */
 912   {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (UNCOND_JUMP, BIG)},
 913   {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (UNCOND_JUMP, BIG16)},
 914   /* dword jmp adds 4 bytes to frag:
 915      0 extra opcode bytes, 4 displacement bytes.  */
 916   {0, 0, 4, 0},
 917   /* word jmp adds 2 byte2 to frag:
 918      0 extra opcode bytes, 2 displacement bytes.  */
 919   {0, 0, 2, 0},
 920
 921   /* COND_JUMP states.  */
 922   {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP, BIG)},
 923   {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP, BIG16)},
 924   /* dword conditionals adds 5 bytes to frag:
 925      1 extra opcode byte, 4 displacement bytes.  */
 926   {0, 0, 5, 0},
 927   /* word conditionals add 3 bytes to frag:
 928      1 extra opcode byte, 2 displacement bytes.  */
 929   {0, 0, 3, 0},
 930
 931   /* COND_JUMP86 states.  */
 932   {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP86, BIG)},
 933   {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP86, BIG16)},
 934   /* dword conditionals adds 5 bytes to frag:
 935      1 extra opcode byte, 4 displacement bytes.  */
 936   {0, 0, 5, 0},
 937   /* word conditionals add 4 bytes to frag:
 938      1 displacement byte and a 3 byte long branch insn.  */
 939   {0, 0, 4, 0}
 940 };
 941
 942 static const arch_entry cpu_arch[] =
 943 {
 944   /* Do not replace the first two entries - i386_target_format()
 945      relies on them being there in this order.  */
 946   { STRING_COMMA_LEN ("generic32"), PROCESSOR_GENERIC32,
 947     CPU_GENERIC32_FLAGS, 0 },
 948   { STRING_COMMA_LEN ("generic64"), PROCESSOR_GENERIC64,
 949     CPU_GENERIC64_FLAGS, 0 },
 950   { STRING_COMMA_LEN ("i8086"), PROCESSOR_UNKNOWN,
 951     CPU_NONE_FLAGS, 0 },
 952   { STRING_COMMA_LEN ("i186"), PROCESSOR_UNKNOWN,
 953     CPU_I186_FLAGS, 0 },
 954   { STRING_COMMA_LEN ("i286"), PROCESSOR_UNKNOWN,
 955     CPU_I286_FLAGS, 0 },
 956   { STRING_COMMA_LEN ("i386"), PROCESSOR_I386,
 957     CPU_I386_FLAGS, 0 },
 958   { STRING_COMMA_LEN ("i486"), PROCESSOR_I486,
 959     CPU_I486_FLAGS, 0 },
 960   { STRING_COMMA_LEN ("i586"), PROCESSOR_PENTIUM,
 961     CPU_I586_FLAGS, 0 },
 962   { STRING_COMMA_LEN ("i686"), PROCESSOR_PENTIUMPRO,
 963     CPU_I686_FLAGS, 0 },
 964   { STRING_COMMA_LEN ("pentium"), PROCESSOR_PENTIUM,
 965     CPU_I586_FLAGS, 0 },
 966   { STRING_COMMA_LEN ("pentiumpro"), PROCESSOR_PENTIUMPRO,
 967     CPU_PENTIUMPRO_FLAGS, 0 },
 968   { STRING_COMMA_LEN ("pentiumii"), PROCESSOR_PENTIUMPRO,
 969     CPU_P2_FLAGS, 0 },
 970   { STRING_COMMA_LEN ("pentiumiii"),PROCESSOR_PENTIUMPRO,
 971     CPU_P3_FLAGS, 0 },
 972   { STRING_COMMA_LEN ("pentium4"), PROCESSOR_PENTIUM4,
 973     CPU_P4_FLAGS, 0 },
 974   { STRING_COMMA_LEN ("prescott"), PROCESSOR_NOCONA,
 975     CPU_CORE_FLAGS, 0 },
 976   { STRING_COMMA_LEN ("nocona"), PROCESSOR_NOCONA,
 977     CPU_NOCONA_FLAGS, 0 },
 978   { STRING_COMMA_LEN ("yonah"), PROCESSOR_CORE,
 979     CPU_CORE_FLAGS, 1 },
 980   { STRING_COMMA_LEN ("core"), PROCESSOR_CORE,
 981     CPU_CORE_FLAGS, 0 },
 982   { STRING_COMMA_LEN ("merom"), PROCESSOR_CORE2,
 983     CPU_CORE2_FLAGS, 1 },
 984   { STRING_COMMA_LEN ("core2"), PROCESSOR_CORE2,
 985     CPU_CORE2_FLAGS, 0 },
 986   { STRING_COMMA_LEN ("corei7"), PROCESSOR_COREI7,
 987     CPU_COREI7_FLAGS, 0 },
 988   { STRING_COMMA_LEN ("l1om"), PROCESSOR_L1OM,
 989     CPU_L1OM_FLAGS, 0 },
 990   { STRING_COMMA_LEN ("k1om"), PROCESSOR_K1OM,
 991     CPU_K1OM_FLAGS, 0 },
 992   { STRING_COMMA_LEN ("iamcu"), PROCESSOR_IAMCU,
 993     CPU_IAMCU_FLAGS, 0 },
 994   { STRING_COMMA_LEN ("k6"), PROCESSOR_K6,
 995     CPU_K6_FLAGS, 0 },
 996   { STRING_COMMA_LEN ("k6_2"), PROCESSOR_K6,
 997     CPU_K6_2_FLAGS, 0 },
 998   { STRING_COMMA_LEN ("athlon"), PROCESSOR_ATHLON,
 999     CPU_ATHLON_FLAGS, 0 },
1000   { STRING_COMMA_LEN ("sledgehammer"), PROCESSOR_K8,
1001     CPU_K8_FLAGS, 1 },
1002   { STRING_COMMA_LEN ("opteron"), PROCESSOR_K8,
1003     CPU_K8_FLAGS, 0 },
1004   { STRING_COMMA_LEN ("k8"), PROCESSOR_K8,
1005     CPU_K8_FLAGS, 0 },
1006   { STRING_COMMA_LEN ("amdfam10"), PROCESSOR_AMDFAM10,
1007     CPU_AMDFAM10_FLAGS, 0 },
1008   { STRING_COMMA_LEN ("bdver1"), PROCESSOR_BD,
1009     CPU_BDVER1_FLAGS, 0 },
1010   { STRING_COMMA_LEN ("bdver2"), PROCESSOR_BD,
1011     CPU_BDVER2_FLAGS, 0 },
1012   { STRING_COMMA_LEN ("bdver3"), PROCESSOR_BD,
1013     CPU_BDVER3_FLAGS, 0 },
1014   { STRING_COMMA_LEN ("bdver4"), PROCESSOR_BD,
1015     CPU_BDVER4_FLAGS, 0 },
1016   { STRING_COMMA_LEN ("znver1"), PROCESSOR_ZNVER,
1017     CPU_ZNVER1_FLAGS, 0 },
1018   { STRING_COMMA_LEN ("znver2"), PROCESSOR_ZNVER,
1019     CPU_ZNVER2_FLAGS, 0 },
1020   { STRING_COMMA_LEN ("znver3"), PROCESSOR_ZNVER,
1021     CPU_ZNVER3_FLAGS, 0 },
1022   { STRING_COMMA_LEN ("btver1"), PROCESSOR_BT,
1023     CPU_BTVER1_FLAGS, 0 },
1024   { STRING_COMMA_LEN ("btver2"), PROCESSOR_BT,
1025     CPU_BTVER2_FLAGS, 0 },
1026   { STRING_COMMA_LEN (".8087"), PROCESSOR_UNKNOWN,
1027     CPU_8087_FLAGS, 0 },
1028   { STRING_COMMA_LEN (".287"), PROCESSOR_UNKNOWN,
1029     CPU_287_FLAGS, 0 },
1030   { STRING_COMMA_LEN (".387"), PROCESSOR_UNKNOWN,
1031     CPU_387_FLAGS, 0 },
1032   { STRING_COMMA_LEN (".687"), PROCESSOR_UNKNOWN,
1033     CPU_687_FLAGS, 0 },
1034   { STRING_COMMA_LEN (".cmov"), PROCESSOR_UNKNOWN,
1035     CPU_CMOV_FLAGS, 0 },
1036   { STRING_COMMA_LEN (".fxsr"), PROCESSOR_UNKNOWN,
1037     CPU_FXSR_FLAGS, 0 },
1038   { STRING_COMMA_LEN (".mmx"), PROCESSOR_UNKNOWN,
1039     CPU_MMX_FLAGS, 0 },
1040   { STRING_COMMA_LEN (".sse"), PROCESSOR_UNKNOWN,
1041     CPU_SSE_FLAGS, 0 },
1042   { STRING_COMMA_LEN (".sse2"), PROCESSOR_UNKNOWN,
1043     CPU_SSE2_FLAGS, 0 },
1044   { STRING_COMMA_LEN (".sse3"), PROCESSOR_UNKNOWN,
1045     CPU_SSE3_FLAGS, 0 },
1046   { STRING_COMMA_LEN (".sse4a"), PROCESSOR_UNKNOWN,
1047     CPU_SSE4A_FLAGS, 0 },
1048   { STRING_COMMA_LEN (".ssse3"), PROCESSOR_UNKNOWN,
1049     CPU_SSSE3_FLAGS, 0 },
1050   { STRING_COMMA_LEN (".sse4.1"), PROCESSOR_UNKNOWN,
1051     CPU_SSE4_1_FLAGS, 0 },
1052   { STRING_COMMA_LEN (".sse4.2"), PROCESSOR_UNKNOWN,
1053     CPU_SSE4_2_FLAGS, 0 },
1054   { STRING_COMMA_LEN (".sse4"), PROCESSOR_UNKNOWN,
1055     CPU_SSE4_2_FLAGS, 0 },
1056   { STRING_COMMA_LEN (".avx"), PROCESSOR_UNKNOWN,
1057     CPU_AVX_FLAGS, 0 },
1058   { STRING_COMMA_LEN (".avx2"), PROCESSOR_UNKNOWN,
1059     CPU_AVX2_FLAGS, 0 },
1060   { STRING_COMMA_LEN (".avx512f"), PROCESSOR_UNKNOWN,
1061     CPU_AVX512F_FLAGS, 0 },
1062   { STRING_COMMA_LEN (".avx512cd"), PROCESSOR_UNKNOWN,
1063     CPU_AVX512CD_FLAGS, 0 },
1064   { STRING_COMMA_LEN (".avx512er"), PROCESSOR_UNKNOWN,
1065     CPU_AVX512ER_FLAGS, 0 },
1066   { STRING_COMMA_LEN (".avx512pf"), PROCESSOR_UNKNOWN,
1067     CPU_AVX512PF_FLAGS, 0 },
1068   { STRING_COMMA_LEN (".avx512dq"), PROCESSOR_UNKNOWN,
1069     CPU_AVX512DQ_FLAGS, 0 },
1070   { STRING_COMMA_LEN (".avx512bw"), PROCESSOR_UNKNOWN,
1071     CPU_AVX512BW_FLAGS, 0 },
1072   { STRING_COMMA_LEN (".avx512vl"), PROCESSOR_UNKNOWN,
1073     CPU_AVX512VL_FLAGS, 0 },
1074   { STRING_COMMA_LEN (".vmx"), PROCESSOR_UNKNOWN,
1075     CPU_VMX_FLAGS, 0 },
1076   { STRING_COMMA_LEN (".vmfunc"), PROCESSOR_UNKNOWN,
1077     CPU_VMFUNC_FLAGS, 0 },
1078   { STRING_COMMA_LEN (".smx"), PROCESSOR_UNKNOWN,
1079     CPU_SMX_FLAGS, 0 },
1080   { STRING_COMMA_LEN (".xsave"), PROCESSOR_UNKNOWN,
1081     CPU_XSAVE_FLAGS, 0 },
1082   { STRING_COMMA_LEN (".xsaveopt"), PROCESSOR_UNKNOWN,
1083     CPU_XSAVEOPT_FLAGS, 0 },
1084   { STRING_COMMA_LEN (".xsavec"), PROCESSOR_UNKNOWN,
1085     CPU_XSAVEC_FLAGS, 0 },
1086   { STRING_COMMA_LEN (".xsaves"), PROCESSOR_UNKNOWN,
1087     CPU_XSAVES_FLAGS, 0 },
1088   { STRING_COMMA_LEN (".aes"), PROCESSOR_UNKNOWN,
1089     CPU_AES_FLAGS, 0 },
1090   { STRING_COMMA_LEN (".pclmul"), PROCESSOR_UNKNOWN,
1091     CPU_PCLMUL_FLAGS, 0 },
1092   { STRING_COMMA_LEN (".clmul"), PROCESSOR_UNKNOWN,
1093     CPU_PCLMUL_FLAGS, 1 },
1094   { STRING_COMMA_LEN (".fsgsbase"), PROCESSOR_UNKNOWN,
1095     CPU_FSGSBASE_FLAGS, 0 },
1096   { STRING_COMMA_LEN (".rdrnd"), PROCESSOR_UNKNOWN,
1097     CPU_RDRND_FLAGS, 0 },
1098   { STRING_COMMA_LEN (".f16c"), PROCESSOR_UNKNOWN,
1099     CPU_F16C_FLAGS, 0 },
1100   { STRING_COMMA_LEN (".bmi2"), PROCESSOR_UNKNOWN,
1101     CPU_BMI2_FLAGS, 0 },
1102   { STRING_COMMA_LEN (".fma"), PROCESSOR_UNKNOWN,
1103     CPU_FMA_FLAGS, 0 },
1104   { STRING_COMMA_LEN (".fma4"), PROCESSOR_UNKNOWN,
1105     CPU_FMA4_FLAGS, 0 },
1106   { STRING_COMMA_LEN (".xop"), PROCESSOR_UNKNOWN,
1107     CPU_XOP_FLAGS, 0 },
1108   { STRING_COMMA_LEN (".lwp"), PROCESSOR_UNKNOWN,
1109     CPU_LWP_FLAGS, 0 },
1110   { STRING_COMMA_LEN (".movbe"), PROCESSOR_UNKNOWN,
1111     CPU_MOVBE_FLAGS, 0 },
1112   { STRING_COMMA_LEN (".cx16"), PROCESSOR_UNKNOWN,
1113     CPU_CX16_FLAGS, 0 },
1114   { STRING_COMMA_LEN (".ept"), PROCESSOR_UNKNOWN,
1115     CPU_EPT_FLAGS, 0 },
1116   { STRING_COMMA_LEN (".lzcnt"), PROCESSOR_UNKNOWN,
1117     CPU_LZCNT_FLAGS, 0 },
1118   { STRING_COMMA_LEN (".popcnt"), PROCESSOR_UNKNOWN,
1119     CPU_POPCNT_FLAGS, 0 },
1120   { STRING_COMMA_LEN (".hle"), PROCESSOR_UNKNOWN,
1121     CPU_HLE_FLAGS, 0 },
1122   { STRING_COMMA_LEN (".rtm"), PROCESSOR_UNKNOWN,
1123     CPU_RTM_FLAGS, 0 },
1124   { STRING_COMMA_LEN (".invpcid"), PROCESSOR_UNKNOWN,
1125     CPU_INVPCID_FLAGS, 0 },
1126   { STRING_COMMA_LEN (".clflush"), PROCESSOR_UNKNOWN,
1127     CPU_CLFLUSH_FLAGS, 0 },
1128   { STRING_COMMA_LEN (".nop"), PROCESSOR_UNKNOWN,
1129     CPU_NOP_FLAGS, 0 },
1130   { STRING_COMMA_LEN (".syscall"), PROCESSOR_UNKNOWN,
1131     CPU_SYSCALL_FLAGS, 0 },
1132   { STRING_COMMA_LEN (".rdtscp"), PROCESSOR_UNKNOWN,
1133     CPU_RDTSCP_FLAGS, 0 },
1134   { STRING_COMMA_LEN (".3dnow"), PROCESSOR_UNKNOWN,
1135     CPU_3DNOW_FLAGS, 0 },
1136   { STRING_COMMA_LEN (".3dnowa"), PROCESSOR_UNKNOWN,
1137     CPU_3DNOWA_FLAGS, 0 },
1138   { STRING_COMMA_LEN (".padlock"), PROCESSOR_UNKNOWN,
1139     CPU_PADLOCK_FLAGS, 0 },
1140   { STRING_COMMA_LEN (".pacifica"), PROCESSOR_UNKNOWN,
1141     CPU_SVME_FLAGS, 1 },
1142   { STRING_COMMA_LEN (".svme"), PROCESSOR_UNKNOWN,
1143     CPU_SVME_FLAGS, 0 },
1144   { STRING_COMMA_LEN (".sse4a"), PROCESSOR_UNKNOWN,
1145     CPU_SSE4A_FLAGS, 0 },
1146   { STRING_COMMA_LEN (".abm"), PROCESSOR_UNKNOWN,
1147     CPU_ABM_FLAGS, 0 },
1148   { STRING_COMMA_LEN (".bmi"), PROCESSOR_UNKNOWN,
1149     CPU_BMI_FLAGS, 0 },
1150   { STRING_COMMA_LEN (".tbm"), PROCESSOR_UNKNOWN,
1151     CPU_TBM_FLAGS, 0 },
1152   { STRING_COMMA_LEN (".adx"), PROCESSOR_UNKNOWN,
1153     CPU_ADX_FLAGS, 0 },
1154   { STRING_COMMA_LEN (".rdseed"), PROCESSOR_UNKNOWN,
1155     CPU_RDSEED_FLAGS, 0 },
1156   { STRING_COMMA_LEN (".prfchw"), PROCESSOR_UNKNOWN,
1157     CPU_PRFCHW_FLAGS, 0 },
1158   { STRING_COMMA_LEN (".smap"), PROCESSOR_UNKNOWN,
1159     CPU_SMAP_FLAGS, 0 },
1160   { STRING_COMMA_LEN (".mpx"), PROCESSOR_UNKNOWN,
1161     CPU_MPX_FLAGS, 0 },
1162   { STRING_COMMA_LEN (".sha"), PROCESSOR_UNKNOWN,
1163     CPU_SHA_FLAGS, 0 },
1164   { STRING_COMMA_LEN (".clflushopt"), PROCESSOR_UNKNOWN,
1165     CPU_CLFLUSHOPT_FLAGS, 0 },
1166   { STRING_COMMA_LEN (".prefetchwt1"), PROCESSOR_UNKNOWN,
1167     CPU_PREFETCHWT1_FLAGS, 0 },
1168   { STRING_COMMA_LEN (".se1"), PROCESSOR_UNKNOWN,
1169     CPU_SE1_FLAGS, 0 },
1170   { STRING_COMMA_LEN (".clwb"), PROCESSOR_UNKNOWN,
1171     CPU_CLWB_FLAGS, 0 },
1172   { STRING_COMMA_LEN (".avx512ifma"), PROCESSOR_UNKNOWN,
1173     CPU_AVX512IFMA_FLAGS, 0 },
1174   { STRING_COMMA_LEN (".avx512vbmi"), PROCESSOR_UNKNOWN,
1175     CPU_AVX512VBMI_FLAGS, 0 },
1176   { STRING_COMMA_LEN (".avx512_4fmaps"), PROCESSOR_UNKNOWN,
1177     CPU_AVX512_4FMAPS_FLAGS, 0 },
1178   { STRING_COMMA_LEN (".avx512_4vnniw"), PROCESSOR_UNKNOWN,
1179     CPU_AVX512_4VNNIW_FLAGS, 0 },
1180   { STRING_COMMA_LEN (".avx512_vpopcntdq"), PROCESSOR_UNKNOWN,
1181     CPU_AVX512_VPOPCNTDQ_FLAGS, 0 },
1182   { STRING_COMMA_LEN (".avx512_vbmi2"), PROCESSOR_UNKNOWN,
1183     CPU_AVX512_VBMI2_FLAGS, 0 },
1184   { STRING_COMMA_LEN (".avx512_vnni"), PROCESSOR_UNKNOWN,
1185     CPU_AVX512_VNNI_FLAGS, 0 },
1186   { STRING_COMMA_LEN (".avx512_bitalg"), PROCESSOR_UNKNOWN,
1187     CPU_AVX512_BITALG_FLAGS, 0 },
1188   { STRING_COMMA_LEN (".avx_vnni"), PROCESSOR_UNKNOWN,
1189     CPU_AVX_VNNI_FLAGS, 0 },
1190   { STRING_COMMA_LEN (".clzero"), PROCESSOR_UNKNOWN,
1191     CPU_CLZERO_FLAGS, 0 },
1192   { STRING_COMMA_LEN (".mwaitx"), PROCESSOR_UNKNOWN,
1193     CPU_MWAITX_FLAGS, 0 },
1194   { STRING_COMMA_LEN (".ospke"), PROCESSOR_UNKNOWN,
1195     CPU_OSPKE_FLAGS, 0 },
1196   { STRING_COMMA_LEN (".rdpid"), PROCESSOR_UNKNOWN,
1197     CPU_RDPID_FLAGS, 0 },
1198   { STRING_COMMA_LEN (".ptwrite"), PROCESSOR_UNKNOWN,
1199     CPU_PTWRITE_FLAGS, 0 },
1200   { STRING_COMMA_LEN (".ibt"), PROCESSOR_UNKNOWN,
1201     CPU_IBT_FLAGS, 0 },
1202   { STRING_COMMA_LEN (".shstk"), PROCESSOR_UNKNOWN,
1203     CPU_SHSTK_FLAGS, 0 },
1204   { STRING_COMMA_LEN (".gfni"), PROCESSOR_UNKNOWN,
1205     CPU_GFNI_FLAGS, 0 },
1206   { STRING_COMMA_LEN (".vaes"), PROCESSOR_UNKNOWN,
1207     CPU_VAES_FLAGS, 0 },
1208   { STRING_COMMA_LEN (".vpclmulqdq"), PROCESSOR_UNKNOWN,
1209     CPU_VPCLMULQDQ_FLAGS, 0 },
1210   { STRING_COMMA_LEN (".wbnoinvd"), PROCESSOR_UNKNOWN,
1211     CPU_WBNOINVD_FLAGS, 0 },
1212   { STRING_COMMA_LEN (".pconfig"), PROCESSOR_UNKNOWN,
1213     CPU_PCONFIG_FLAGS, 0 },
1214   { STRING_COMMA_LEN (".waitpkg"), PROCESSOR_UNKNOWN,
1215     CPU_WAITPKG_FLAGS, 0 },
1216   { STRING_COMMA_LEN (".cldemote"), PROCESSOR_UNKNOWN,
1217     CPU_CLDEMOTE_FLAGS, 0 },
1218   { STRING_COMMA_LEN (".amx_int8"), PROCESSOR_UNKNOWN,
1219     CPU_AMX_INT8_FLAGS, 0 },
1220   { STRING_COMMA_LEN (".amx_bf16"), PROCESSOR_UNKNOWN,
1221     CPU_AMX_BF16_FLAGS, 0 },
1222   { STRING_COMMA_LEN (".amx_tile"), PROCESSOR_UNKNOWN,
1223     CPU_AMX_TILE_FLAGS, 0 },
1224   { STRING_COMMA_LEN (".movdiri"), PROCESSOR_UNKNOWN,
1225     CPU_MOVDIRI_FLAGS, 0 },
1226   { STRING_COMMA_LEN (".movdir64b"), PROCESSOR_UNKNOWN,
1227     CPU_MOVDIR64B_FLAGS, 0 },
1228   { STRING_COMMA_LEN (".avx512_bf16"), PROCESSOR_UNKNOWN,
1229     CPU_AVX512_BF16_FLAGS, 0 },
1230   { STRING_COMMA_LEN (".avx512_vp2intersect"), PROCESSOR_UNKNOWN,
1231     CPU_AVX512_VP2INTERSECT_FLAGS, 0 },
1232   { STRING_COMMA_LEN (".tdx"), PROCESSOR_UNKNOWN,
1233     CPU_TDX_FLAGS, 0 },
1234   { STRING_COMMA_LEN (".enqcmd"), PROCESSOR_UNKNOWN,
1235     CPU_ENQCMD_FLAGS, 0 },
1236   { STRING_COMMA_LEN (".serialize"), PROCESSOR_UNKNOWN,
1237     CPU_SERIALIZE_FLAGS, 0 },
1238   { STRING_COMMA_LEN (".rdpru"), PROCESSOR_UNKNOWN,
1239     CPU_RDPRU_FLAGS, 0 },
1240   { STRING_COMMA_LEN (".mcommit"), PROCESSOR_UNKNOWN,
1241     CPU_MCOMMIT_FLAGS, 0 },
1242   { STRING_COMMA_LEN (".sev_es"), PROCESSOR_UNKNOWN,
1243     CPU_SEV_ES_FLAGS, 0 },
1244   { STRING_COMMA_LEN (".tsxldtrk"), PROCESSOR_UNKNOWN,
1245     CPU_TSXLDTRK_FLAGS, 0 },
1246   { STRING_COMMA_LEN (".kl"), PROCESSOR_UNKNOWN,
1247     CPU_KL_FLAGS, 0 },
1248   { STRING_COMMA_LEN (".widekl"), PROCESSOR_UNKNOWN,
1249     CPU_WIDEKL_FLAGS, 0 },
1250   { STRING_COMMA_LEN (".uintr"), PROCESSOR_UNKNOWN,
1251     CPU_UINTR_FLAGS, 0 },
1252   { STRING_COMMA_LEN (".hreset"), PROCESSOR_UNKNOWN,
1253     CPU_HRESET_FLAGS, 0 },
1254 };
1255
1256 static const noarch_entry cpu_noarch[] =
1257 {
1258   { STRING_COMMA_LEN ("no87"),  CPU_ANY_X87_FLAGS },
1259   { STRING_COMMA_LEN ("no287"),  CPU_ANY_287_FLAGS },
1260   { STRING_COMMA_LEN ("no387"),  CPU_ANY_387_FLAGS },
1261   { STRING_COMMA_LEN ("no687"),  CPU_ANY_687_FLAGS },
1262   { STRING_COMMA_LEN ("nocmov"),  CPU_ANY_CMOV_FLAGS },
1263   { STRING_COMMA_LEN ("nofxsr"),  CPU_ANY_FXSR_FLAGS },
1264   { STRING_COMMA_LEN ("nommx"),  CPU_ANY_MMX_FLAGS },
1265   { STRING_COMMA_LEN ("nosse"),  CPU_ANY_SSE_FLAGS },
1266   { STRING_COMMA_LEN ("nosse2"),  CPU_ANY_SSE2_FLAGS },
1267   { STRING_COMMA_LEN ("nosse3"),  CPU_ANY_SSE3_FLAGS },
1268   { STRING_COMMA_LEN ("nosse4a"),  CPU_ANY_SSE4A_FLAGS },
1269   { STRING_COMMA_LEN ("nossse3"),  CPU_ANY_SSSE3_FLAGS },
1270   { STRING_COMMA_LEN ("nosse4.1"),  CPU_ANY_SSE4_1_FLAGS },
1271   { STRING_COMMA_LEN ("nosse4.2"),  CPU_ANY_SSE4_2_FLAGS },
1272   { STRING_COMMA_LEN ("nosse4"),  CPU_ANY_SSE4_1_FLAGS },
1273   { STRING_COMMA_LEN ("noavx"),  CPU_ANY_AVX_FLAGS },
1274   { STRING_COMMA_LEN ("noavx2"),  CPU_ANY_AVX2_FLAGS },
1275   { STRING_COMMA_LEN ("noavx512f"), CPU_ANY_AVX512F_FLAGS },
1276   { STRING_COMMA_LEN ("noavx512cd"), CPU_ANY_AVX512CD_FLAGS },
1277   { STRING_COMMA_LEN ("noavx512er"), CPU_ANY_AVX512ER_FLAGS },
1278   { STRING_COMMA_LEN ("noavx512pf"), CPU_ANY_AVX512PF_FLAGS },
1279   { STRING_COMMA_LEN ("noavx512dq"), CPU_ANY_AVX512DQ_FLAGS },
1280   { STRING_COMMA_LEN ("noavx512bw"), CPU_ANY_AVX512BW_FLAGS },
1281   { STRING_COMMA_LEN ("noavx512vl"), CPU_ANY_AVX512VL_FLAGS },
1282   { STRING_COMMA_LEN ("noavx512ifma"), CPU_ANY_AVX512IFMA_FLAGS },
1283   { STRING_COMMA_LEN ("noavx512vbmi"), CPU_ANY_AVX512VBMI_FLAGS },
1284   { STRING_COMMA_LEN ("noavx512_4fmaps"), CPU_ANY_AVX512_4FMAPS_FLAGS },
1285   { STRING_COMMA_LEN ("noavx512_4vnniw"), CPU_ANY_AVX512_4VNNIW_FLAGS },
1286   { STRING_COMMA_LEN ("noavx512_vpopcntdq"), CPU_ANY_AVX512_VPOPCNTDQ_FLAGS },
1287   { STRING_COMMA_LEN ("noavx512_vbmi2"), CPU_ANY_AVX512_VBMI2_FLAGS },
1288   { STRING_COMMA_LEN ("noavx512_vnni"), CPU_ANY_AVX512_VNNI_FLAGS },
1289   { STRING_COMMA_LEN ("noavx512_bitalg"), CPU_ANY_AVX512_BITALG_FLAGS },
1290   { STRING_COMMA_LEN ("noavx_vnni"), CPU_ANY_AVX_VNNI_FLAGS },
1291   { STRING_COMMA_LEN ("noibt"), CPU_ANY_IBT_FLAGS },
1292   { STRING_COMMA_LEN ("noshstk"), CPU_ANY_SHSTK_FLAGS },
1293   { STRING_COMMA_LEN ("noamx_int8"), CPU_ANY_AMX_INT8_FLAGS },
1294   { STRING_COMMA_LEN ("noamx_bf16"), CPU_ANY_AMX_BF16_FLAGS },
1295   { STRING_COMMA_LEN ("noamx_tile"), CPU_ANY_AMX_TILE_FLAGS },
1296   { STRING_COMMA_LEN ("nomovdiri"), CPU_ANY_MOVDIRI_FLAGS },
1297   { STRING_COMMA_LEN ("nomovdir64b"), CPU_ANY_MOVDIR64B_FLAGS },
1298   { STRING_COMMA_LEN ("noavx512_bf16"), CPU_ANY_AVX512_BF16_FLAGS },
1299   { STRING_COMMA_LEN ("noavx512_vp2intersect"),
1300     CPU_ANY_AVX512_VP2INTERSECT_FLAGS },
1301   { STRING_COMMA_LEN ("notdx"), CPU_ANY_TDX_FLAGS },
1302   { STRING_COMMA_LEN ("noenqcmd"), CPU_ANY_ENQCMD_FLAGS },
1303   { STRING_COMMA_LEN ("noserialize"), CPU_ANY_SERIALIZE_FLAGS },
1304   { STRING_COMMA_LEN ("notsxldtrk"), CPU_ANY_TSXLDTRK_FLAGS },
1305   { STRING_COMMA_LEN ("nokl"), CPU_ANY_KL_FLAGS },
1306   { STRING_COMMA_LEN ("nowidekl"), CPU_ANY_WIDEKL_FLAGS },
1307   { STRING_COMMA_LEN ("nouintr"), CPU_ANY_UINTR_FLAGS },
1308   { STRING_COMMA_LEN ("nohreset"), CPU_ANY_HRESET_FLAGS },
1309 };
1310
1311 #ifdef I386COFF
1312 /* Like s_lcomm_internal in gas/read.c but the alignment string
1313    is allowed to be optional.  */
1314
1315 static symbolS *
1316 pe_lcomm_internal (int needs_align, symbolS *symbolP, addressT size)
1317 {
1318   addressT align = 0;
1319
1320   SKIP_WHITESPACE ();
1321
1322   if (needs_align
1323       && *input_line_pointer == ',')
1324     {
1325       align = parse_align (needs_align - 1);
1326
1327       if (align == (addressT) -1)
1328         return NULL;
1329     }
1330   else
1331     {
1332       if (size >= 8)
1333         align = 3;
1334       else if (size >= 4)
1335         align = 2;
1336       else if (size >= 2)
1337         align = 1;
1338       else
1339         align = 0;
1340     }
1341
1342   bss_alloc (symbolP, size, align);
1343   return symbolP;
1344 }
1345
1346 static void
1347 pe_lcomm (int needs_align)
1348 {
1349   s_comm_internal (needs_align * 2, pe_lcomm_internal);
1350 }
1351 #endif
1352
1353 const pseudo_typeS md_pseudo_table[] =
1354 {
1355 #if !defined(OBJ_AOUT) && !defined(USE_ALIGN_PTWO)
1356   {"align", s_align_bytes, 0},
1357 #else
1358   {"align", s_align_ptwo, 0},
1359 #endif
1360   {"arch", set_cpu_arch, 0},
1361 #ifndef I386COFF
1362   {"bss", s_bss, 0},
1363 #else
1364   {"lcomm", pe_lcomm, 1},
1365 #endif
1366   {"ffloat", float_cons, 'f'},
1367   {"dfloat", float_cons, 'd'},
1368   {"tfloat", float_cons, 'x'},
1369   {"value", cons, 2},
1370   {"slong", signed_cons, 4},
1371   {"noopt", s_ignore, 0},
1372   {"optim", s_ignore, 0},
1373   {"code16gcc", set_16bit_gcc_code_flag, CODE_16BIT},
1374   {"code16", set_code_flag, CODE_16BIT},
1375   {"code32", set_code_flag, CODE_32BIT},
1376 #ifdef BFD64
1377   {"code64", set_code_flag, CODE_64BIT},
1378 #endif
1379   {"intel_syntax", set_intel_syntax, 1},
1380   {"att_syntax", set_intel_syntax, 0},
1381   {"intel_mnemonic", set_intel_mnemonic, 1},
1382   {"att_mnemonic", set_intel_mnemonic, 0},
1383   {"allow_index_reg", set_allow_index_reg, 1},
1384   {"disallow_index_reg", set_allow_index_reg, 0},
1385   {"sse_check", set_check, 0},
1386   {"operand_check", set_check, 1},
1387 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
1388   {"largecomm", handle_large_common, 0},
1389 #else
1390   {"file", dwarf2_directive_file, 0},
1391   {"loc", dwarf2_directive_loc, 0},
1392   {"loc_mark_labels", dwarf2_directive_loc_mark_labels, 0},
1393 #endif
1394 #ifdef TE_PE
1395   {"secrel32", pe_directive_secrel, 0},
1396 #endif
1397   {0, 0, 0}
1398 };
1399
1400 /* For interface with expression ().  */
1401 extern char *input_line_pointer;
1402
1403 /* Hash table for instruction mnemonic lookup.  */
1404 static htab_t op_hash;
1405
1406 /* Hash table for register lookup.  */
1407 static htab_t reg_hash;
1408 \f
1409   /* Various efficient no-op patterns for aligning code labels.
1410      Note: Don't try to assemble the instructions in the comments.
1411      0L and 0w are not legal.  */
1412 static const unsigned char f32_1[] =
1413   {0x90};                               /* nop                  */
1414 static const unsigned char f32_2[] =
1415   {0x66,0x90};                          /* xchg %ax,%ax         */
1416 static const unsigned char f32_3[] =
1417   {0x8d,0x76,0x00};                     /* leal 0(%esi),%esi    */
1418 static const unsigned char f32_4[] =
1419   {0x8d,0x74,0x26,0x00};                /* leal 0(%esi,1),%esi  */
1420 static const unsigned char f32_6[] =
1421   {0x8d,0xb6,0x00,0x00,0x00,0x00};      /* leal 0L(%esi),%esi   */
1422 static const unsigned char f32_7[] =
1423   {0x8d,0xb4,0x26,0x00,0x00,0x00,0x00}; /* leal 0L(%esi,1),%esi */
1424 static const unsigned char f16_3[] =
1425   {0x8d,0x74,0x00};                     /* lea 0(%si),%si       */
1426 static const unsigned char f16_4[] =
1427   {0x8d,0xb4,0x00,0x00};                /* lea 0W(%si),%si      */
1428 static const unsigned char jump_disp8[] =
1429   {0xeb};                               /* jmp disp8           */
1430 static const unsigned char jump32_disp32[] =
1431   {0xe9};                               /* jmp disp32          */
1432 static const unsigned char jump16_disp32[] =
1433   {0x66,0xe9};                          /* jmp disp32          */
1434 /* 32-bit NOPs patterns.  */
1435 static const unsigned char *const f32_patt[] = {
1436   f32_1, f32_2, f32_3, f32_4, NULL, f32_6, f32_7
1437 };
1438 /* 16-bit NOPs patterns.  */
1439 static const unsigned char *const f16_patt[] = {
1440   f32_1, f32_2, f16_3, f16_4
1441 };
1442 /* nopl (%[re]ax) */
1443 static const unsigned char alt_3[] =
1444   {0x0f,0x1f,0x00};
1445 /* nopl 0(%[re]ax) */
1446 static const unsigned char alt_4[] =
1447   {0x0f,0x1f,0x40,0x00};
1448 /* nopl 0(%[re]ax,%[re]ax,1) */
1449 static const unsigned char alt_5[] =
1450   {0x0f,0x1f,0x44,0x00,0x00};
1451 /* nopw 0(%[re]ax,%[re]ax,1) */
1452 static const unsigned char alt_6[] =
1453   {0x66,0x0f,0x1f,0x44,0x00,0x00};
1454 /* nopl 0L(%[re]ax) */
1455 static const unsigned char alt_7[] =
1456   {0x0f,0x1f,0x80,0x00,0x00,0x00,0x00};
1457 /* nopl 0L(%[re]ax,%[re]ax,1) */
1458 static const unsigned char alt_8[] =
1459   {0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1460 /* nopw 0L(%[re]ax,%[re]ax,1) */
1461 static const unsigned char alt_9[] =
1462   {0x66,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1463 /* nopw %cs:0L(%[re]ax,%[re]ax,1) */
1464 static const unsigned char alt_10[] =
1465   {0x66,0x2e,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1466 /* data16 nopw %cs:0L(%eax,%eax,1) */
1467 static const unsigned char alt_11[] =
1468   {0x66,0x66,0x2e,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1469 /* 32-bit and 64-bit NOPs patterns.  */
1470 static const unsigned char *const alt_patt[] = {
1471   f32_1, f32_2, alt_3, alt_4, alt_5, alt_6, alt_7, alt_8,
1472   alt_9, alt_10, alt_11
1473 };
1474
1475 /* Genenerate COUNT bytes of NOPs to WHERE from PATT with the maximum
1476    size of a single NOP instruction MAX_SINGLE_NOP_SIZE.  */
1477
1478 static void
1479 i386_output_nops (char *where, const unsigned char *const *patt,
1480                   int count, int max_single_nop_size)
1481
1482 {
1483   /* Place the longer NOP first.  */
1484   int last;
1485   int offset;
1486   const unsigned char *nops;
1487
1488   if (max_single_nop_size < 1)
1489     {
1490       as_fatal (_("i386_output_nops called to generate nops of at most %d bytes!"),
1491                 max_single_nop_size);
1492       return;
1493     }
1494
1495   nops = patt[max_single_nop_size - 1];
1496
1497   /* Use the smaller one if the requsted one isn't available.  */
1498   if (nops == NULL)
1499     {
1500       max_single_nop_size--;
1501       nops = patt[max_single_nop_size - 1];
1502     }
1503
1504   last = count % max_single_nop_size;
1505
1506   count -= last;
1507   for (offset = 0; offset < count; offset += max_single_nop_size)
1508     memcpy (where + offset, nops, max_single_nop_size);
1509
1510   if (last)
1511     {
1512       nops = patt[last - 1];
1513       if (nops == NULL)
1514         {
1515           /* Use the smaller one plus one-byte NOP if the needed one
1516              isn't available.  */
1517           last--;
1518           nops = patt[last - 1];
1519           memcpy (where + offset, nops, last);
1520           where[offset + last] = *patt[0];
1521         }
1522       else
1523         memcpy (where + offset, nops, last);
1524     }
1525 }
1526
1527 static INLINE int
1528 fits_in_imm7 (offsetT num)
1529 {
1530   return (num & 0x7f) == num;
1531 }
1532
1533 static INLINE int
1534 fits_in_imm31 (offsetT num)
1535 {
1536   return (num & 0x7fffffff) == num;
1537 }
1538
1539 /* Genenerate COUNT bytes of NOPs to WHERE with the maximum size of a
1540    single NOP instruction LIMIT.  */
1541
1542 void
1543 i386_generate_nops (fragS *fragP, char *where, offsetT count, int limit)
1544 {
1545   const unsigned char *const *patt = NULL;
1546   int max_single_nop_size;
1547   /* Maximum number of NOPs before switching to jump over NOPs.  */
1548   int max_number_of_nops;
1549
1550   switch (fragP->fr_type)
1551     {
1552     case rs_fill_nop:
1553     case rs_align_code:
1554       break;
1555     case rs_machine_dependent:
1556       /* Allow NOP padding for jumps and calls.  */
1557       if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PADDING
1558           || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == FUSED_JCC_PADDING)
1559         break;
1560       /* Fall through.  */
1561     default:
1562       return;
1563     }
1564
1565   /* We need to decide which NOP sequence to use for 32bit and
1566      64bit. When -mtune= is used:
1567
1568      1. For PROCESSOR_I386, PROCESSOR_I486, PROCESSOR_PENTIUM and
1569      PROCESSOR_GENERIC32, f32_patt will be used.
1570      2. For the rest, alt_patt will be used.
1571
1572      When -mtune= isn't used, alt_patt will be used if
1573      cpu_arch_isa_flags has CpuNop.  Otherwise, f32_patt will
1574      be used.
1575
1576      When -march= or .arch is used, we can't use anything beyond
1577      cpu_arch_isa_flags.   */
1578
1579   if (flag_code == CODE_16BIT)
1580     {
1581       patt = f16_patt;
1582       max_single_nop_size = sizeof (f16_patt) / sizeof (f16_patt[0]);
1583       /* Limit number of NOPs to 2 in 16-bit mode.  */
1584       max_number_of_nops = 2;
1585     }
1586   else
1587     {
1588       if (fragP->tc_frag_data.isa == PROCESSOR_UNKNOWN)
1589         {
1590           /* PROCESSOR_UNKNOWN means that all ISAs may be used.  */
1591           switch (cpu_arch_tune)
1592             {
1593             case PROCESSOR_UNKNOWN:
1594               /* We use cpu_arch_isa_flags to check if we SHOULD
1595                  optimize with nops.  */
1596               if (fragP->tc_frag_data.isa_flags.bitfield.cpunop)
1597                 patt = alt_patt;
1598               else
1599                 patt = f32_patt;
1600               break;
1601             case PROCESSOR_PENTIUM4:
1602             case PROCESSOR_NOCONA:
1603             case PROCESSOR_CORE:
1604             case PROCESSOR_CORE2:
1605             case PROCESSOR_COREI7:
1606             case PROCESSOR_L1OM:
1607             case PROCESSOR_K1OM:
1608             case PROCESSOR_GENERIC64:
1609             case PROCESSOR_K6:
1610             case PROCESSOR_ATHLON:
1611             case PROCESSOR_K8:
1612             case PROCESSOR_AMDFAM10:
1613             case PROCESSOR_BD:
1614             case PROCESSOR_ZNVER:
1615             case PROCESSOR_BT:
1616               patt = alt_patt;
1617               break;
1618             case PROCESSOR_I386:
1619             case PROCESSOR_I486:
1620             case PROCESSOR_PENTIUM:
1621             case PROCESSOR_PENTIUMPRO:
1622             case PROCESSOR_IAMCU:
1623             case PROCESSOR_GENERIC32:
1624               patt = f32_patt;
1625               break;
1626             }
1627         }
1628       else
1629         {
1630           switch (fragP->tc_frag_data.tune)
1631             {
1632             case PROCESSOR_UNKNOWN:
1633               /* When cpu_arch_isa is set, cpu_arch_tune shouldn't be
1634                  PROCESSOR_UNKNOWN.  */
1635               abort ();
1636               break;
1637
1638             case PROCESSOR_I386:
1639             case PROCESSOR_I486:
1640             case PROCESSOR_PENTIUM:
1641             case PROCESSOR_IAMCU:
1642             case PROCESSOR_K6:
1643             case PROCESSOR_ATHLON:
1644             case PROCESSOR_K8:
1645             case PROCESSOR_AMDFAM10:
1646             case PROCESSOR_BD:
1647             case PROCESSOR_ZNVER:
1648             case PROCESSOR_BT:
1649             case PROCESSOR_GENERIC32:
1650               /* We use cpu_arch_isa_flags to check if we CAN optimize
1651                  with nops.  */
1652               if (fragP->tc_frag_data.isa_flags.bitfield.cpunop)
1653                 patt = alt_patt;
1654               else
1655                 patt = f32_patt;
1656               break;
1657             case PROCESSOR_PENTIUMPRO:
1658             case PROCESSOR_PENTIUM4:
1659             case PROCESSOR_NOCONA:
1660             case PROCESSOR_CORE:
1661             case PROCESSOR_CORE2:
1662             case PROCESSOR_COREI7:
1663             case PROCESSOR_L1OM:
1664             case PROCESSOR_K1OM:
1665               if (fragP->tc_frag_data.isa_flags.bitfield.cpunop)
1666                 patt = alt_patt;
1667               else
1668                 patt = f32_patt;
1669               break;
1670             case PROCESSOR_GENERIC64:
1671               patt = alt_patt;
1672               break;
1673             }
1674         }
1675
1676       if (patt == f32_patt)
1677         {
1678           max_single_nop_size = sizeof (f32_patt) / sizeof (f32_patt[0]);
1679           /* Limit number of NOPs to 2 for older processors.  */
1680           max_number_of_nops = 2;
1681         }
1682       else
1683         {
1684           max_single_nop_size = sizeof (alt_patt) / sizeof (alt_patt[0]);
1685           /* Limit number of NOPs to 7 for newer processors.  */
1686           max_number_of_nops = 7;
1687         }
1688     }
1689
1690   if (limit == 0)
1691     limit = max_single_nop_size;
1692
1693   if (fragP->fr_type == rs_fill_nop)
1694     {
1695       /* Output NOPs for .nop directive.  */
1696       if (limit > max_single_nop_size)
1697         {
1698           as_bad_where (fragP->fr_file, fragP->fr_line,
1699                         _("invalid single nop size: %d "
1700                           "(expect within [0, %d])"),
1701                         limit, max_single_nop_size);
1702           return;
1703         }
1704     }
1705   else if (fragP->fr_type != rs_machine_dependent)
1706     fragP->fr_var = count;
1707
1708   if ((count / max_single_nop_size) > max_number_of_nops)
1709     {
1710       /* Generate jump over NOPs.  */
1711       offsetT disp = count - 2;
1712       if (fits_in_imm7 (disp))
1713         {
1714           /* Use "jmp disp8" if possible.  */
1715           count = disp;
1716           where[0] = jump_disp8[0];
1717           where[1] = count;
1718           where += 2;
1719         }
1720       else
1721         {
1722           unsigned int size_of_jump;
1723
1724           if (flag_code == CODE_16BIT)
1725             {
1726               where[0] = jump16_disp32[0];
1727               where[1] = jump16_disp32[1];
1728               size_of_jump = 2;
1729             }
1730           else
1731             {
1732               where[0] = jump32_disp32[0];
1733               size_of_jump = 1;
1734             }
1735
1736           count -= size_of_jump + 4;
1737           if (!fits_in_imm31 (count))
1738             {
1739               as_bad_where (fragP->fr_file, fragP->fr_line,
1740                             _("jump over nop padding out of range"));
1741               return;
1742             }
1743
1744           md_number_to_chars (where + size_of_jump, count, 4);
1745           where += size_of_jump + 4;
1746         }
1747     }
1748
1749   /* Generate multiple NOPs.  */
1750   i386_output_nops (where, patt, count, limit);
1751 }
1752
1753 static INLINE int
1754 operand_type_all_zero (const union i386_operand_type *x)
1755 {
1756   switch (ARRAY_SIZE(x->array))
1757     {
1758     case 3:
1759       if (x->array[2])
1760         return 0;
1761       /* Fall through.  */
1762     case 2:
1763       if (x->array[1])
1764         return 0;
1765       /* Fall through.  */
1766     case 1:
1767       return !x->array[0];
1768     default:
1769       abort ();
1770     }
1771 }
1772
1773 static INLINE void
1774 operand_type_set (union i386_operand_type *x, unsigned int v)
1775 {
1776   switch (ARRAY_SIZE(x->array))
1777     {
1778     case 3:
1779       x->array[2] = v;
1780       /* Fall through.  */
1781     case 2:
1782       x->array[1] = v;
1783       /* Fall through.  */
1784     case 1:
1785       x->array[0] = v;
1786       /* Fall through.  */
1787       break;
1788     default:
1789       abort ();
1790     }
1791
1792   x->bitfield.class = ClassNone;
1793   x->bitfield.instance = InstanceNone;
1794 }
1795
1796 static INLINE int
1797 operand_type_equal (const union i386_operand_type *x,
1798                     const union i386_operand_type *y)
1799 {
1800   switch (ARRAY_SIZE(x->array))
1801     {
1802     case 3:
1803       if (x->array[2] != y->array[2])
1804         return 0;
1805       /* Fall through.  */
1806     case 2:
1807       if (x->array[1] != y->array[1])
1808         return 0;
1809       /* Fall through.  */
1810     case 1:
1811       return x->array[0] == y->array[0];
1812       break;
1813     default:
1814       abort ();
1815     }
1816 }
1817
1818 static INLINE int
1819 cpu_flags_all_zero (const union i386_cpu_flags *x)
1820 {
1821   switch (ARRAY_SIZE(x->array))
1822     {
1823     case 4:
1824       if (x->array[3])
1825         return 0;
1826       /* Fall through.  */
1827     case 3:
1828       if (x->array[2])
1829         return 0;
1830       /* Fall through.  */
1831     case 2:
1832       if (x->array[1])
1833         return 0;
1834       /* Fall through.  */
1835     case 1:
1836       return !x->array[0];
1837     default:
1838       abort ();
1839     }
1840 }
1841
1842 static INLINE int
1843 cpu_flags_equal (const union i386_cpu_flags *x,
1844                  const union i386_cpu_flags *y)
1845 {
1846   switch (ARRAY_SIZE(x->array))
1847     {
1848     case 4:
1849       if (x->array[3] != y->array[3])
1850         return 0;
1851       /* Fall through.  */
1852     case 3:
1853       if (x->array[2] != y->array[2])
1854         return 0;
1855       /* Fall through.  */
1856     case 2:
1857       if (x->array[1] != y->array[1])
1858         return 0;
1859       /* Fall through.  */
1860     case 1:
1861       return x->array[0] == y->array[0];
1862       break;
1863     default:
1864       abort ();
1865     }
1866 }
1867
1868 static INLINE int
1869 cpu_flags_check_cpu64 (i386_cpu_flags f)
1870 {
1871   return !((flag_code == CODE_64BIT && f.bitfield.cpuno64)
1872            || (flag_code != CODE_64BIT && f.bitfield.cpu64));
1873 }
1874
1875 static INLINE i386_cpu_flags
1876 cpu_flags_and (i386_cpu_flags x, i386_cpu_flags y)
1877 {
1878   switch (ARRAY_SIZE (x.array))
1879     {
1880     case 4:
1881       x.array [3] &= y.array [3];
1882       /* Fall through.  */
1883     case 3:
1884       x.array [2] &= y.array [2];
1885       /* Fall through.  */
1886     case 2:
1887       x.array [1] &= y.array [1];
1888       /* Fall through.  */
1889     case 1:
1890       x.array [0] &= y.array [0];
1891       break;
1892     default:
1893       abort ();
1894     }
1895   return x;
1896 }
1897
1898 static INLINE i386_cpu_flags
1899 cpu_flags_or (i386_cpu_flags x, i386_cpu_flags y)
1900 {
1901   switch (ARRAY_SIZE (x.array))
1902     {
1903     case 4:
1904       x.array [3] |= y.array [3];
1905       /* Fall through.  */
1906     case 3:
1907       x.array [2] |= y.array [2];
1908       /* Fall through.  */
1909     case 2:
1910       x.array [1] |= y.array [1];
1911       /* Fall through.  */
1912     case 1:
1913       x.array [0] |= y.array [0];
1914       break;
1915     default:
1916       abort ();
1917     }
1918   return x;
1919 }
1920
1921 static INLINE i386_cpu_flags
1922 cpu_flags_and_not (i386_cpu_flags x, i386_cpu_flags y)
1923 {
1924   switch (ARRAY_SIZE (x.array))
1925     {
1926     case 4:
1927       x.array [3] &= ~y.array [3];
1928       /* Fall through.  */
1929     case 3:
1930       x.array [2] &= ~y.array [2];
1931       /* Fall through.  */
1932     case 2:
1933       x.array [1] &= ~y.array [1];
1934       /* Fall through.  */
1935     case 1:
1936       x.array [0] &= ~y.array [0];
1937       break;
1938     default:
1939       abort ();
1940     }
1941   return x;
1942 }
1943
1944 static const i386_cpu_flags avx512 = CPU_ANY_AVX512F_FLAGS;
1945
1946 #define CPU_FLAGS_ARCH_MATCH            0x1
1947 #define CPU_FLAGS_64BIT_MATCH           0x2
1948
1949 #define CPU_FLAGS_PERFECT_MATCH \
1950   (CPU_FLAGS_ARCH_MATCH | CPU_FLAGS_64BIT_MATCH)
1951
1952 /* Return CPU flags match bits. */
1953
1954 static int
1955 cpu_flags_match (const insn_template *t)
1956 {
1957   i386_cpu_flags x = t->cpu_flags;
1958   int match = cpu_flags_check_cpu64 (x) ? CPU_FLAGS_64BIT_MATCH : 0;
1959
1960   x.bitfield.cpu64 = 0;
1961   x.bitfield.cpuno64 = 0;
1962
1963   if (cpu_flags_all_zero (&x))
1964     {
1965       /* This instruction is available on all archs.  */
1966       match |= CPU_FLAGS_ARCH_MATCH;
1967     }
1968   else
1969     {
1970       /* This instruction is available only on some archs.  */
1971       i386_cpu_flags cpu = cpu_arch_flags;
1972
1973       /* AVX512VL is no standalone feature - match it and then strip it.  */
1974       if (x.bitfield.cpuavx512vl && !cpu.bitfield.cpuavx512vl)
1975         return match;
1976       x.bitfield.cpuavx512vl = 0;
1977
1978       cpu = cpu_flags_and (x, cpu);
1979       if (!cpu_flags_all_zero (&cpu))
1980         {
1981           if (x.bitfield.cpuavx)
1982             {
1983               /* We need to check a few extra flags with AVX.  */
1984               if (cpu.bitfield.cpuavx
1985                   && (!t->opcode_modifier.sse2avx
1986                       || (sse2avx && !i.prefix[DATA_PREFIX]))
1987                   && (!x.bitfield.cpuaes || cpu.bitfield.cpuaes)
1988                   && (!x.bitfield.cpugfni || cpu.bitfield.cpugfni)
1989                   && (!x.bitfield.cpupclmul || cpu.bitfield.cpupclmul))
1990                 match |= CPU_FLAGS_ARCH_MATCH;
1991             }
1992           else if (x.bitfield.cpuavx512f)
1993             {
1994               /* We need to check a few extra flags with AVX512F.  */
1995               if (cpu.bitfield.cpuavx512f
1996                   && (!x.bitfield.cpugfni || cpu.bitfield.cpugfni)
1997                   && (!x.bitfield.cpuvaes || cpu.bitfield.cpuvaes)
1998                   && (!x.bitfield.cpuvpclmulqdq || cpu.bitfield.cpuvpclmulqdq))
1999                 match |= CPU_FLAGS_ARCH_MATCH;
2000             }
2001           else
2002             match |= CPU_FLAGS_ARCH_MATCH;
2003         }
2004     }
2005   return match;
2006 }
2007
2008 static INLINE i386_operand_type
2009 operand_type_and (i386_operand_type x, i386_operand_type y)
2010 {
2011   if (x.bitfield.class != y.bitfield.class)
2012     x.bitfield.class = ClassNone;
2013   if (x.bitfield.instance != y.bitfield.instance)
2014     x.bitfield.instance = InstanceNone;
2015
2016   switch (ARRAY_SIZE (x.array))
2017     {
2018     case 3:
2019       x.array [2] &= y.array [2];
2020       /* Fall through.  */
2021     case 2:
2022       x.array [1] &= y.array [1];
2023       /* Fall through.  */
2024     case 1:
2025       x.array [0] &= y.array [0];
2026       break;
2027     default:
2028       abort ();
2029     }
2030   return x;
2031 }
2032
2033 static INLINE i386_operand_type
2034 operand_type_and_not (i386_operand_type x, i386_operand_type y)
2035 {
2036   gas_assert (y.bitfield.class == ClassNone);
2037   gas_assert (y.bitfield.instance == InstanceNone);
2038
2039   switch (ARRAY_SIZE (x.array))
2040     {
2041     case 3:
2042       x.array [2] &= ~y.array [2];
2043       /* Fall through.  */
2044     case 2:
2045       x.array [1] &= ~y.array [1];
2046       /* Fall through.  */
2047     case 1:
2048       x.array [0] &= ~y.array [0];
2049       break;
2050     default:
2051       abort ();
2052     }
2053   return x;
2054 }
2055
2056 static INLINE i386_operand_type
2057 operand_type_or (i386_operand_type x, i386_operand_type y)
2058 {
2059   gas_assert (x.bitfield.class == ClassNone ||
2060               y.bitfield.class == ClassNone ||
2061               x.bitfield.class == y.bitfield.class);
2062   gas_assert (x.bitfield.instance == InstanceNone ||
2063               y.bitfield.instance == InstanceNone ||
2064               x.bitfield.instance == y.bitfield.instance);
2065
2066   switch (ARRAY_SIZE (x.array))
2067     {
2068     case 3:
2069       x.array [2] |= y.array [2];
2070       /* Fall through.  */
2071     case 2:
2072       x.array [1] |= y.array [1];
2073       /* Fall through.  */
2074     case 1:
2075       x.array [0] |= y.array [0];
2076       break;
2077     default:
2078       abort ();
2079     }
2080   return x;
2081 }
2082
2083 static INLINE i386_operand_type
2084 operand_type_xor (i386_operand_type x, i386_operand_type y)
2085 {
2086   gas_assert (y.bitfield.class == ClassNone);
2087   gas_assert (y.bitfield.instance == InstanceNone);
2088
2089   switch (ARRAY_SIZE (x.array))
2090     {
2091     case 3:
2092       x.array [2] ^= y.array [2];
2093       /* Fall through.  */
2094     case 2:
2095       x.array [1] ^= y.array [1];
2096       /* Fall through.  */
2097     case 1:
2098       x.array [0] ^= y.array [0];
2099       break;
2100     default:
2101       abort ();
2102     }
2103   return x;
2104 }
2105
2106 static const i386_operand_type disp16 = OPERAND_TYPE_DISP16;
2107 static const i386_operand_type disp32 = OPERAND_TYPE_DISP32;
2108 static const i386_operand_type disp32s = OPERAND_TYPE_DISP32S;
2109 static const i386_operand_type disp16_32 = OPERAND_TYPE_DISP16_32;
2110 static const i386_operand_type anydisp = OPERAND_TYPE_ANYDISP;
2111 static const i386_operand_type anyimm = OPERAND_TYPE_ANYIMM;
2112 static const i386_operand_type regxmm = OPERAND_TYPE_REGXMM;
2113 static const i386_operand_type regmask = OPERAND_TYPE_REGMASK;
2114 static const i386_operand_type imm8 = OPERAND_TYPE_IMM8;
2115 static const i386_operand_type imm8s = OPERAND_TYPE_IMM8S;
2116 static const i386_operand_type imm16 = OPERAND_TYPE_IMM16;
2117 static const i386_operand_type imm32 = OPERAND_TYPE_IMM32;
2118 static const i386_operand_type imm32s = OPERAND_TYPE_IMM32S;
2119 static const i386_operand_type imm64 = OPERAND_TYPE_IMM64;
2120 static const i386_operand_type imm16_32 = OPERAND_TYPE_IMM16_32;
2121 static const i386_operand_type imm16_32s = OPERAND_TYPE_IMM16_32S;
2122 static const i386_operand_type imm16_32_32s = OPERAND_TYPE_IMM16_32_32S;
2123
2124 enum operand_type
2125 {
2126   reg,
2127   imm,
2128   disp,
2129   anymem
2130 };
2131
2132 static INLINE int
2133 operand_type_check (i386_operand_type t, enum operand_type c)
2134 {
2135   switch (c)
2136     {
2137     case reg:
2138       return t.bitfield.class == Reg;
2139
2140     case imm:
2141       return (t.bitfield.imm8
2142               || t.bitfield.imm8s
2143               || t.bitfield.imm16
2144               || t.bitfield.imm32
2145               || t.bitfield.imm32s
2146               || t.bitfield.imm64);
2147
2148     case disp:
2149       return (t.bitfield.disp8
2150               || t.bitfield.disp16
2151               || t.bitfield.disp32
2152               || t.bitfield.disp32s
2153               || t.bitfield.disp64);
2154
2155     case anymem:
2156       return (t.bitfield.disp8
2157               || t.bitfield.disp16
2158               || t.bitfield.disp32
2159               || t.bitfield.disp32s
2160               || t.bitfield.disp64
2161               || t.bitfield.baseindex);
2162
2163     default:
2164       abort ();
2165     }
2166
2167   return 0;
2168 }
2169
2170 /* Return 1 if there is no conflict in 8bit/16bit/32bit/64bit/80bit size
2171    between operand GIVEN and opeand WANTED for instruction template T.  */
2172
2173 static INLINE int
2174 match_operand_size (const insn_template *t, unsigned int wanted,
2175                     unsigned int given)
2176 {
2177   return !((i.types[given].bitfield.byte
2178             && !t->operand_types[wanted].bitfield.byte)
2179            || (i.types[given].bitfield.word
2180                && !t->operand_types[wanted].bitfield.word)
2181            || (i.types[given].bitfield.dword
2182                && !t->operand_types[wanted].bitfield.dword)
2183            || (i.types[given].bitfield.qword
2184                && !t->operand_types[wanted].bitfield.qword)
2185            || (i.types[given].bitfield.tbyte
2186                && !t->operand_types[wanted].bitfield.tbyte));
2187 }
2188
2189 /* Return 1 if there is no conflict in SIMD register between operand
2190    GIVEN and opeand WANTED for instruction template T.  */
2191
2192 static INLINE int
2193 match_simd_size (const insn_template *t, unsigned int wanted,
2194                  unsigned int given)
2195 {
2196   return !((i.types[given].bitfield.xmmword
2197             && !t->operand_types[wanted].bitfield.xmmword)
2198            || (i.types[given].bitfield.ymmword
2199                && !t->operand_types[wanted].bitfield.ymmword)
2200            || (i.types[given].bitfield.zmmword
2201                && !t->operand_types[wanted].bitfield.zmmword)
2202            || (i.types[given].bitfield.tmmword
2203                && !t->operand_types[wanted].bitfield.tmmword));
2204 }
2205
2206 /* Return 1 if there is no conflict in any size between operand GIVEN
2207    and opeand WANTED for instruction template T.  */
2208
2209 static INLINE int
2210 match_mem_size (const insn_template *t, unsigned int wanted,
2211                 unsigned int given)
2212 {
2213   return (match_operand_size (t, wanted, given)
2214           && !((i.types[given].bitfield.unspecified
2215                 && !i.broadcast
2216                 && !t->operand_types[wanted].bitfield.unspecified)
2217                || (i.types[given].bitfield.fword
2218                    && !t->operand_types[wanted].bitfield.fword)
2219                /* For scalar opcode templates to allow register and memory
2220                   operands at the same time, some special casing is needed
2221                   here.  Also for v{,p}broadcast*, {,v}pmov{s,z}*, and
2222                   down-conversion vpmov*.  */
2223                || ((t->operand_types[wanted].bitfield.class == RegSIMD
2224                     && t->operand_types[wanted].bitfield.byte
2225                        + t->operand_types[wanted].bitfield.word
2226                        + t->operand_types[wanted].bitfield.dword
2227                        + t->operand_types[wanted].bitfield.qword
2228                        > !!t->opcode_modifier.broadcast)
2229                    ? (i.types[given].bitfield.xmmword
2230                       || i.types[given].bitfield.ymmword
2231                       || i.types[given].bitfield.zmmword)
2232                    : !match_simd_size(t, wanted, given))));
2233 }
2234
2235 /* Return value has MATCH_STRAIGHT set if there is no size conflict on any
2236    operands for instruction template T, and it has MATCH_REVERSE set if there
2237    is no size conflict on any operands for the template with operands reversed
2238    (and the template allows for reversing in the first place).  */
2239
2240 #define MATCH_STRAIGHT 1
2241 #define MATCH_REVERSE  2
2242
2243 static INLINE unsigned int
2244 operand_size_match (const insn_template *t)
2245 {
2246   unsigned int j, match = MATCH_STRAIGHT;
2247
2248   /* Don't check non-absolute jump instructions.  */
2249   if (t->opcode_modifier.jump
2250       && t->opcode_modifier.jump != JUMP_ABSOLUTE)
2251     return match;
2252
2253   /* Check memory and accumulator operand size.  */
2254   for (j = 0; j < i.operands; j++)
2255     {
2256       if (i.types[j].bitfield.class != Reg
2257           && i.types[j].bitfield.class != RegSIMD
2258           && t->opcode_modifier.anysize)
2259         continue;
2260
2261       if (t->operand_types[j].bitfield.class == Reg
2262           && !match_operand_size (t, j, j))
2263         {
2264           match = 0;
2265           break;
2266         }
2267
2268       if (t->operand_types[j].bitfield.class == RegSIMD
2269           && !match_simd_size (t, j, j))
2270         {
2271           match = 0;
2272           break;
2273         }
2274
2275       if (t->operand_types[j].bitfield.instance == Accum
2276           && (!match_operand_size (t, j, j) || !match_simd_size (t, j, j)))
2277         {
2278           match = 0;
2279           break;
2280         }
2281
2282       if ((i.flags[j] & Operand_Mem) && !match_mem_size (t, j, j))
2283         {
2284           match = 0;
2285           break;
2286         }
2287     }
2288
2289   if (!t->opcode_modifier.d)
2290     {
2291     mismatch:
2292       if (!match)
2293         i.error = operand_size_mismatch;
2294       return match;
2295     }
2296
2297   /* Check reverse.  */
2298   gas_assert (i.operands >= 2 && i.operands <= 3);
2299
2300   for (j = 0; j < i.operands; j++)
2301     {
2302       unsigned int given = i.operands - j - 1;
2303
2304       if (t->operand_types[j].bitfield.class == Reg
2305           && !match_operand_size (t, j, given))
2306         goto mismatch;
2307
2308       if (t->operand_types[j].bitfield.class == RegSIMD
2309           && !match_simd_size (t, j, given))
2310         goto mismatch;
2311
2312       if (t->operand_types[j].bitfield.instance == Accum
2313           && (!match_operand_size (t, j, given)
2314               || !match_simd_size (t, j, given)))
2315         goto mismatch;
2316
2317       if ((i.flags[given] & Operand_Mem) && !match_mem_size (t, j, given))
2318         goto mismatch;
2319     }
2320
2321   return match | MATCH_REVERSE;
2322 }
2323
2324 static INLINE int
2325 operand_type_match (i386_operand_type overlap,
2326                     i386_operand_type given)
2327 {
2328   i386_operand_type temp = overlap;
2329
2330   temp.bitfield.unspecified = 0;
2331   temp.bitfield.byte = 0;
2332   temp.bitfield.word = 0;
2333   temp.bitfield.dword = 0;
2334   temp.bitfield.fword = 0;
2335   temp.bitfield.qword = 0;
2336   temp.bitfield.tbyte = 0;
2337   temp.bitfield.xmmword = 0;
2338   temp.bitfield.ymmword = 0;
2339   temp.bitfield.zmmword = 0;
2340   temp.bitfield.tmmword = 0;
2341   if (operand_type_all_zero (&temp))
2342     goto mismatch;
2343
2344   if (given.bitfield.baseindex == overlap.bitfield.baseindex)
2345     return 1;
2346
2347  mismatch:
2348   i.error = operand_type_mismatch;
2349   return 0;
2350 }
2351
2352 /* If given types g0 and g1 are registers they must be of the same type
2353    unless the expected operand type register overlap is null.
2354    Some Intel syntax memory operand size checking also happens here.  */
2355
2356 static INLINE int
2357 operand_type_register_match (i386_operand_type g0,
2358                              i386_operand_type t0,
2359                              i386_operand_type g1,
2360                              i386_operand_type t1)
2361 {
2362   if (g0.bitfield.class != Reg
2363       && g0.bitfield.class != RegSIMD
2364       && (!operand_type_check (g0, anymem)
2365           || g0.bitfield.unspecified
2366           || (t0.bitfield.class != Reg
2367               && t0.bitfield.class != RegSIMD)))
2368     return 1;
2369
2370   if (g1.bitfield.class != Reg
2371       && g1.bitfield.class != RegSIMD
2372       && (!operand_type_check (g1, anymem)
2373           || g1.bitfield.unspecified
2374           || (t1.bitfield.class != Reg
2375               && t1.bitfield.class != RegSIMD)))
2376     return 1;
2377
2378   if (g0.bitfield.byte == g1.bitfield.byte
2379       && g0.bitfield.word == g1.bitfield.word
2380       && g0.bitfield.dword == g1.bitfield.dword
2381       && g0.bitfield.qword == g1.bitfield.qword
2382       && g0.bitfield.xmmword == g1.bitfield.xmmword
2383       && g0.bitfield.ymmword == g1.bitfield.ymmword
2384       && g0.bitfield.zmmword == g1.bitfield.zmmword)
2385     return 1;
2386
2387   if (!(t0.bitfield.byte & t1.bitfield.byte)
2388       && !(t0.bitfield.word & t1.bitfield.word)
2389       && !(t0.bitfield.dword & t1.bitfield.dword)
2390       && !(t0.bitfield.qword & t1.bitfield.qword)
2391       && !(t0.bitfield.xmmword & t1.bitfield.xmmword)
2392       && !(t0.bitfield.ymmword & t1.bitfield.ymmword)
2393       && !(t0.bitfield.zmmword & t1.bitfield.zmmword))
2394     return 1;
2395
2396   i.error = register_type_mismatch;
2397
2398   return 0;
2399 }
2400
2401 static INLINE unsigned int
2402 register_number (const reg_entry *r)
2403 {
2404   unsigned int nr = r->reg_num;
2405
2406   if (r->reg_flags & RegRex)
2407     nr += 8;
2408
2409   if (r->reg_flags & RegVRex)
2410     nr += 16;
2411
2412   return nr;
2413 }
2414
2415 static INLINE unsigned int
2416 mode_from_disp_size (i386_operand_type t)
2417 {
2418   if (t.bitfield.disp8)
2419     return 1;
2420   else if (t.bitfield.disp16
2421            || t.bitfield.disp32
2422            || t.bitfield.disp32s)
2423     return 2;
2424   else
2425     return 0;
2426 }
2427
2428 static INLINE int
2429 fits_in_signed_byte (addressT num)
2430 {
2431   return num + 0x80 <= 0xff;
2432 }
2433
2434 static INLINE int
2435 fits_in_unsigned_byte (addressT num)
2436 {
2437   return num <= 0xff;
2438 }
2439
2440 static INLINE int
2441 fits_in_unsigned_word (addressT num)
2442 {
2443   return num <= 0xffff;
2444 }
2445
2446 static INLINE int
2447 fits_in_signed_word (addressT num)
2448 {
2449   return num + 0x8000 <= 0xffff;
2450 }
2451
2452 static INLINE int
2453 fits_in_signed_long (addressT num ATTRIBUTE_UNUSED)
2454 {
2455 #ifndef BFD64
2456   return 1;
2457 #else
2458   return num + 0x80000000 <= 0xffffffff;
2459 #endif
2460 }                               /* fits_in_signed_long() */
2461
2462 static INLINE int
2463 fits_in_unsigned_long (addressT num ATTRIBUTE_UNUSED)
2464 {
2465 #ifndef BFD64
2466   return 1;
2467 #else
2468   return num <= 0xffffffff;
2469 #endif
2470 }                               /* fits_in_unsigned_long() */
2471
2472 static INLINE int
2473 fits_in_disp8 (offsetT num)
2474 {
2475   int shift = i.memshift;
2476   unsigned int mask;
2477
2478   if (shift == -1)
2479     abort ();
2480
2481   mask = (1 << shift) - 1;
2482
2483   /* Return 0 if NUM isn't properly aligned.  */
2484   if ((num & mask))
2485     return 0;
2486
2487   /* Check if NUM will fit in 8bit after shift.  */
2488   return fits_in_signed_byte (num >> shift);
2489 }
2490
2491 static INLINE int
2492 fits_in_imm4 (offsetT num)
2493 {
2494   return (num & 0xf) == num;
2495 }
2496
2497 static i386_operand_type
2498 smallest_imm_type (offsetT num)
2499 {
2500   i386_operand_type t;
2501
2502   operand_type_set (&t, 0);
2503   t.bitfield.imm64 = 1;
2504
2505   if (cpu_arch_tune != PROCESSOR_I486 && num == 1)
2506     {
2507       /* This code is disabled on the 486 because all the Imm1 forms
2508          in the opcode table are slower on the i486.  They're the
2509          versions with the implicitly specified single-position
2510          displacement, which has another syntax if you really want to
2511          use that form.  */
2512       t.bitfield.imm1 = 1;
2513       t.bitfield.imm8 = 1;
2514       t.bitfield.imm8s = 1;
2515       t.bitfield.imm16 = 1;
2516       t.bitfield.imm32 = 1;
2517       t.bitfield.imm32s = 1;
2518     }
2519   else if (fits_in_signed_byte (num))
2520     {
2521       t.bitfield.imm8 = 1;
2522       t.bitfield.imm8s = 1;
2523       t.bitfield.imm16 = 1;
2524       t.bitfield.imm32 = 1;
2525       t.bitfield.imm32s = 1;
2526     }
2527   else if (fits_in_unsigned_byte (num))
2528     {
2529       t.bitfield.imm8 = 1;
2530       t.bitfield.imm16 = 1;
2531       t.bitfield.imm32 = 1;
2532       t.bitfield.imm32s = 1;
2533     }
2534   else if (fits_in_signed_word (num) || fits_in_unsigned_word (num))
2535     {
2536       t.bitfield.imm16 = 1;
2537       t.bitfield.imm32 = 1;
2538       t.bitfield.imm32s = 1;
2539     }
2540   else if (fits_in_signed_long (num))
2541     {
2542       t.bitfield.imm32 = 1;
2543       t.bitfield.imm32s = 1;
2544     }
2545   else if (fits_in_unsigned_long (num))
2546     t.bitfield.imm32 = 1;
2547
2548   return t;
2549 }
2550
2551 static offsetT
2552 offset_in_range (offsetT val, int size)
2553 {
2554   addressT mask;
2555
2556   switch (size)
2557     {
2558     case 1: mask = ((addressT) 1 <<  8) - 1; break;
2559     case 2: mask = ((addressT) 1 << 16) - 1; break;
2560     case 4: mask = ((addressT) 2 << 31) - 1; break;
2561 #ifdef BFD64
2562     case 8: mask = ((addressT) 2 << 63) - 1; break;
2563 #endif
2564     default: abort ();
2565     }
2566
2567   if ((val & ~mask) != 0 && (val & ~mask) != ~mask)
2568     {
2569       char buf1[40], buf2[40];
2570
2571       sprint_value (buf1, val);
2572       sprint_value (buf2, val & mask);
2573       as_warn (_("%s shortened to %s"), buf1, buf2);
2574     }
2575   return val & mask;
2576 }
2577
2578 enum PREFIX_GROUP
2579 {
2580   PREFIX_EXIST = 0,
2581   PREFIX_LOCK,
2582   PREFIX_REP,
2583   PREFIX_DS,
2584   PREFIX_OTHER
2585 };
2586
2587 /* Returns
2588    a. PREFIX_EXIST if attempting to add a prefix where one from the
2589    same class already exists.
2590    b. PREFIX_LOCK if lock prefix is added.
2591    c. PREFIX_REP if rep/repne prefix is added.
2592    d. PREFIX_DS if ds prefix is added.
2593    e. PREFIX_OTHER if other prefix is added.
2594  */
2595
2596 static enum PREFIX_GROUP
2597 add_prefix (unsigned int prefix)
2598 {
2599   enum PREFIX_GROUP ret = PREFIX_OTHER;
2600   unsigned int q;
2601
2602   if (prefix >= REX_OPCODE && prefix < REX_OPCODE + 16
2603       && flag_code == CODE_64BIT)
2604     {
2605       if ((i.prefix[REX_PREFIX] & prefix & REX_W)
2606           || (i.prefix[REX_PREFIX] & prefix & REX_R)
2607           || (i.prefix[REX_PREFIX] & prefix & REX_X)
2608           || (i.prefix[REX_PREFIX] & prefix & REX_B))
2609         ret = PREFIX_EXIST;
2610       q = REX_PREFIX;
2611     }
2612   else
2613     {
2614       switch (prefix)
2615         {
2616         default:
2617           abort ();
2618
2619         case DS_PREFIX_OPCODE:
2620           ret = PREFIX_DS;
2621           /* Fall through.  */
2622         case CS_PREFIX_OPCODE:
2623         case ES_PREFIX_OPCODE:
2624         case FS_PREFIX_OPCODE:
2625         case GS_PREFIX_OPCODE:
2626         case SS_PREFIX_OPCODE:
2627           q = SEG_PREFIX;
2628           break;
2629
2630         case REPNE_PREFIX_OPCODE:
2631         case REPE_PREFIX_OPCODE:
2632           q = REP_PREFIX;
2633           ret = PREFIX_REP;
2634           break;
2635
2636         case LOCK_PREFIX_OPCODE:
2637           q = LOCK_PREFIX;
2638           ret = PREFIX_LOCK;
2639           break;
2640
2641         case FWAIT_OPCODE:
2642           q = WAIT_PREFIX;
2643           break;
2644
2645         case ADDR_PREFIX_OPCODE:
2646           q = ADDR_PREFIX;
2647           break;
2648
2649         case DATA_PREFIX_OPCODE:
2650           q = DATA_PREFIX;
2651           break;
2652         }
2653       if (i.prefix[q] != 0)
2654         ret = PREFIX_EXIST;
2655     }
2656
2657   if (ret)
2658     {
2659       if (!i.prefix[q])
2660         ++i.prefixes;
2661       i.prefix[q] |= prefix;
2662     }
2663   else
2664     as_bad (_("same type of prefix used twice"));
2665
2666   return ret;
2667 }
2668
2669 static void
2670 update_code_flag (int value, int check)
2671 {
2672   PRINTF_LIKE ((*as_error));
2673
2674   flag_code = (enum flag_code) value;
2675   if (flag_code == CODE_64BIT)
2676     {
2677       cpu_arch_flags.bitfield.cpu64 = 1;
2678       cpu_arch_flags.bitfield.cpuno64 = 0;
2679     }
2680   else
2681     {
2682       cpu_arch_flags.bitfield.cpu64 = 0;
2683       cpu_arch_flags.bitfield.cpuno64 = 1;
2684     }
2685   if (value == CODE_64BIT && !cpu_arch_flags.bitfield.cpulm )
2686     {
2687       if (check)
2688         as_error = as_fatal;
2689       else
2690         as_error = as_bad;
2691       (*as_error) (_("64bit mode not supported on `%s'."),
2692                    cpu_arch_name ? cpu_arch_name : default_arch);
2693     }
2694   if (value == CODE_32BIT && !cpu_arch_flags.bitfield.cpui386)
2695     {
2696       if (check)
2697         as_error = as_fatal;
2698       else
2699         as_error = as_bad;
2700       (*as_error) (_("32bit mode not supported on `%s'."),
2701                    cpu_arch_name ? cpu_arch_name : default_arch);
2702     }
2703   stackop_size = '\0';
2704 }
2705
2706 static void
2707 set_code_flag (int value)
2708 {
2709   update_code_flag (value, 0);
2710 }
2711
2712 static void
2713 set_16bit_gcc_code_flag (int new_code_flag)
2714 {
2715   flag_code = (enum flag_code) new_code_flag;
2716   if (flag_code != CODE_16BIT)
2717     abort ();
2718   cpu_arch_flags.bitfield.cpu64 = 0;
2719   cpu_arch_flags.bitfield.cpuno64 = 1;
2720   stackop_size = LONG_MNEM_SUFFIX;
2721 }
2722
2723 static void
2724 set_intel_syntax (int syntax_flag)
2725 {
2726   /* Find out if register prefixing is specified.  */
2727   int ask_naked_reg = 0;
2728
2729   SKIP_WHITESPACE ();
2730   if (!is_end_of_line[(unsigned char) *input_line_pointer])
2731     {
2732       char *string;
2733       int e = get_symbol_name (&string);
2734
2735       if (strcmp (string, "prefix") == 0)
2736         ask_naked_reg = 1;
2737       else if (strcmp (string, "noprefix") == 0)
2738         ask_naked_reg = -1;
2739       else
2740         as_bad (_("bad argument to syntax directive."));
2741       (void) restore_line_pointer (e);
2742     }
2743   demand_empty_rest_of_line ();
2744
2745   intel_syntax = syntax_flag;
2746
2747   if (ask_naked_reg == 0)
2748     allow_naked_reg = (intel_syntax
2749                        && (bfd_get_symbol_leading_char (stdoutput) != '\0'));
2750   else
2751     allow_naked_reg = (ask_naked_reg < 0);
2752
2753   expr_set_rank (O_full_ptr, syntax_flag ? 10 : 0);
2754
2755   identifier_chars['%'] = intel_syntax && allow_naked_reg ? '%' : 0;
2756   identifier_chars['$'] = intel_syntax ? '$' : 0;
2757   register_prefix = allow_naked_reg ? "" : "%";
2758 }
2759
2760 static void
2761 set_intel_mnemonic (int mnemonic_flag)
2762 {
2763   intel_mnemonic = mnemonic_flag;
2764 }
2765
2766 static void
2767 set_allow_index_reg (int flag)
2768 {
2769   allow_index_reg = flag;
2770 }
2771
2772 static void
2773 set_check (int what)
2774 {
2775   enum check_kind *kind;
2776   const char *str;
2777
2778   if (what)
2779     {
2780       kind = &operand_check;
2781       str = "operand";
2782     }
2783   else
2784     {
2785       kind = &sse_check;
2786       str = "sse";
2787     }
2788
2789   SKIP_WHITESPACE ();
2790
2791   if (!is_end_of_line[(unsigned char) *input_line_pointer])
2792     {
2793       char *string;
2794       int e = get_symbol_name (&string);
2795
2796       if (strcmp (string, "none") == 0)
2797         *kind = check_none;
2798       else if (strcmp (string, "warning") == 0)
2799         *kind = check_warning;
2800       else if (strcmp (string, "error") == 0)
2801         *kind = check_error;
2802       else
2803         as_bad (_("bad argument to %s_check directive."), str);
2804       (void) restore_line_pointer (e);
2805     }
2806   else
2807     as_bad (_("missing argument for %s_check directive"), str);
2808
2809   demand_empty_rest_of_line ();
2810 }
2811
2812 static void
2813 check_cpu_arch_compatible (const char *name ATTRIBUTE_UNUSED,
2814                            i386_cpu_flags new_flag ATTRIBUTE_UNUSED)
2815 {
2816 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
2817   static const char *arch;
2818
2819   /* Intel LIOM is only supported on ELF.  */
2820   if (!IS_ELF)
2821     return;
2822
2823   if (!arch)
2824     {
2825       /* Use cpu_arch_name if it is set in md_parse_option.  Otherwise
2826          use default_arch.  */
2827       arch = cpu_arch_name;
2828       if (!arch)
2829         arch = default_arch;
2830     }
2831
2832   /* If we are targeting Intel MCU, we must enable it.  */
2833   if (get_elf_backend_data (stdoutput)->elf_machine_code != EM_IAMCU
2834       || new_flag.bitfield.cpuiamcu)
2835     return;
2836
2837   /* If we are targeting Intel L1OM, we must enable it.  */
2838   if (get_elf_backend_data (stdoutput)->elf_machine_code != EM_L1OM
2839       || new_flag.bitfield.cpul1om)
2840     return;
2841
2842   /* If we are targeting Intel K1OM, we must enable it.  */
2843   if (get_elf_backend_data (stdoutput)->elf_machine_code != EM_K1OM
2844       || new_flag.bitfield.cpuk1om)
2845     return;
2846
2847   as_bad (_("`%s' is not supported on `%s'"), name, arch);
2848 #endif
2849 }
2850
2851 static void
2852 set_cpu_arch (int dummy ATTRIBUTE_UNUSED)
2853 {
2854   SKIP_WHITESPACE ();
2855
2856   if (!is_end_of_line[(unsigned char) *input_line_pointer])
2857     {
2858       char *string;
2859       int e = get_symbol_name (&string);
2860       unsigned int j;
2861       i386_cpu_flags flags;
2862
2863       for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
2864         {
2865           if (strcmp (string, cpu_arch[j].name) == 0)
2866             {
2867               check_cpu_arch_compatible (string, cpu_arch[j].flags);
2868
2869               if (*string != '.')
2870                 {
2871                   cpu_arch_name = cpu_arch[j].name;
2872                   cpu_sub_arch_name = NULL;
2873                   cpu_arch_flags = cpu_arch[j].flags;
2874                   if (flag_code == CODE_64BIT)
2875                     {
2876                       cpu_arch_flags.bitfield.cpu64 = 1;
2877                       cpu_arch_flags.bitfield.cpuno64 = 0;
2878                     }
2879                   else
2880                     {
2881                       cpu_arch_flags.bitfield.cpu64 = 0;
2882                       cpu_arch_flags.bitfield.cpuno64 = 1;
2883                     }
2884                   cpu_arch_isa = cpu_arch[j].type;
2885                   cpu_arch_isa_flags = cpu_arch[j].flags;
2886                   if (!cpu_arch_tune_set)
2887                     {
2888                       cpu_arch_tune = cpu_arch_isa;
2889                       cpu_arch_tune_flags = cpu_arch_isa_flags;
2890                     }
2891                   break;
2892                 }
2893
2894               flags = cpu_flags_or (cpu_arch_flags,
2895                                     cpu_arch[j].flags);
2896
2897               if (!cpu_flags_equal (&flags, &cpu_arch_flags))
2898                 {
2899                   if (cpu_sub_arch_name)
2900                     {
2901                       char *name = cpu_sub_arch_name;
2902                       cpu_sub_arch_name = concat (name,
2903                                                   cpu_arch[j].name,
2904                                                   (const char *) NULL);
2905                       free (name);
2906                     }
2907                   else
2908                     cpu_sub_arch_name = xstrdup (cpu_arch[j].name);
2909                   cpu_arch_flags = flags;
2910                   cpu_arch_isa_flags = flags;
2911                 }
2912               else
2913                 cpu_arch_isa_flags
2914                   = cpu_flags_or (cpu_arch_isa_flags,
2915                                   cpu_arch[j].flags);
2916               (void) restore_line_pointer (e);
2917               demand_empty_rest_of_line ();
2918               return;
2919             }
2920         }
2921
2922       if (*string == '.' && j >= ARRAY_SIZE (cpu_arch))
2923         {
2924           /* Disable an ISA extension.  */
2925           for (j = 0; j < ARRAY_SIZE (cpu_noarch); j++)
2926             if (strcmp (string + 1, cpu_noarch [j].name) == 0)
2927               {
2928                 flags = cpu_flags_and_not (cpu_arch_flags,
2929                                            cpu_noarch[j].flags);
2930                 if (!cpu_flags_equal (&flags, &cpu_arch_flags))
2931                   {
2932                     if (cpu_sub_arch_name)
2933                       {
2934                         char *name = cpu_sub_arch_name;
2935                         cpu_sub_arch_name = concat (name, string,
2936                                                     (const char *) NULL);
2937                         free (name);
2938                       }
2939                     else
2940                       cpu_sub_arch_name = xstrdup (string);
2941                     cpu_arch_flags = flags;
2942                     cpu_arch_isa_flags = flags;
2943                   }
2944                 (void) restore_line_pointer (e);
2945                 demand_empty_rest_of_line ();
2946                 return;
2947               }
2948
2949           j = ARRAY_SIZE (cpu_arch);
2950         }
2951
2952       if (j >= ARRAY_SIZE (cpu_arch))
2953         as_bad (_("no such architecture: `%s'"), string);
2954
2955       *input_line_pointer = e;
2956     }
2957   else
2958     as_bad (_("missing cpu architecture"));
2959
2960   no_cond_jump_promotion = 0;
2961   if (*input_line_pointer == ','
2962       && !is_end_of_line[(unsigned char) input_line_pointer[1]])
2963     {
2964       char *string;
2965       char e;
2966
2967       ++input_line_pointer;
2968       e = get_symbol_name (&string);
2969
2970       if (strcmp (string, "nojumps") == 0)
2971         no_cond_jump_promotion = 1;
2972       else if (strcmp (string, "jumps") == 0)
2973         ;
2974       else
2975         as_bad (_("no such architecture modifier: `%s'"), string);
2976
2977       (void) restore_line_pointer (e);
2978     }
2979
2980   demand_empty_rest_of_line ();
2981 }
2982
2983 enum bfd_architecture
2984 i386_arch (void)
2985 {
2986   if (cpu_arch_isa == PROCESSOR_L1OM)
2987     {
2988       if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2989           || flag_code != CODE_64BIT)
2990         as_fatal (_("Intel L1OM is 64bit ELF only"));
2991       return bfd_arch_l1om;
2992     }
2993   else if (cpu_arch_isa == PROCESSOR_K1OM)
2994     {
2995       if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2996           || flag_code != CODE_64BIT)
2997         as_fatal (_("Intel K1OM is 64bit ELF only"));
2998       return bfd_arch_k1om;
2999     }
3000   else if (cpu_arch_isa == PROCESSOR_IAMCU)
3001     {
3002       if (OUTPUT_FLAVOR != bfd_target_elf_flavour
3003           || flag_code == CODE_64BIT)
3004         as_fatal (_("Intel MCU is 32bit ELF only"));
3005       return bfd_arch_iamcu;
3006     }
3007   else
3008     return bfd_arch_i386;
3009 }
3010
3011 unsigned long
3012 i386_mach (void)
3013 {
3014   if (!strncmp (default_arch, "x86_64", 6))
3015     {
3016       if (cpu_arch_isa == PROCESSOR_L1OM)
3017         {
3018           if (OUTPUT_FLAVOR != bfd_target_elf_flavour
3019               || default_arch[6] != '\0')
3020             as_fatal (_("Intel L1OM is 64bit ELF only"));
3021           return bfd_mach_l1om;
3022         }
3023       else if (cpu_arch_isa == PROCESSOR_K1OM)
3024         {
3025           if (OUTPUT_FLAVOR != bfd_target_elf_flavour
3026               || default_arch[6] != '\0')
3027             as_fatal (_("Intel K1OM is 64bit ELF only"));
3028           return bfd_mach_k1om;
3029         }
3030       else if (default_arch[6] == '\0')
3031         return bfd_mach_x86_64;
3032       else
3033         return bfd_mach_x64_32;
3034     }
3035   else if (!strcmp (default_arch, "i386")
3036            || !strcmp (default_arch, "iamcu"))
3037     {
3038       if (cpu_arch_isa == PROCESSOR_IAMCU)
3039         {
3040           if (OUTPUT_FLAVOR != bfd_target_elf_flavour)
3041             as_fatal (_("Intel MCU is 32bit ELF only"));
3042           return bfd_mach_i386_iamcu;
3043         }
3044       else
3045         return bfd_mach_i386_i386;
3046     }
3047   else
3048     as_fatal (_("unknown architecture"));
3049 }
3050 \f
3051 void
3052 md_begin (void)
3053 {
3054   /* Support pseudo prefixes like {disp32}.  */
3055   lex_type ['{'] = LEX_BEGIN_NAME;
3056
3057   /* Initialize op_hash hash table.  */
3058   op_hash = str_htab_create ();
3059
3060   {
3061     const insn_template *optab;
3062     templates *core_optab;
3063
3064     /* Setup for loop.  */
3065     optab = i386_optab;
3066     core_optab = XNEW (templates);
3067     core_optab->start = optab;
3068
3069     while (1)
3070       {
3071         ++optab;
3072         if (optab->name == NULL
3073             || strcmp (optab->name, (optab - 1)->name) != 0)
3074           {
3075             /* different name --> ship out current template list;
3076                add to hash table; & begin anew.  */
3077             core_optab->end = optab;
3078             if (str_hash_insert (op_hash, (optab - 1)->name, core_optab, 0))
3079               as_fatal (_("duplicate %s"), (optab - 1)->name);
3080
3081             if (optab->name == NULL)
3082               break;
3083             core_optab = XNEW (templates);
3084             core_optab->start = optab;
3085           }
3086       }
3087   }
3088
3089   /* Initialize reg_hash hash table.  */
3090   reg_hash = str_htab_create ();
3091   {
3092     const reg_entry *regtab;
3093     unsigned int regtab_size = i386_regtab_size;
3094
3095     for (regtab = i386_regtab; regtab_size--; regtab++)
3096       if (str_hash_insert (reg_hash, regtab->reg_name, regtab, 0) != NULL)
3097         as_fatal (_("duplicate %s"), regtab->reg_name);
3098   }
3099
3100   /* Fill in lexical tables:  mnemonic_chars, operand_chars.  */
3101   {
3102     int c;
3103     char *p;
3104
3105     for (c = 0; c < 256; c++)
3106       {
3107         if (ISDIGIT (c))
3108           {
3109             digit_chars[c] = c;
3110             mnemonic_chars[c] = c;
3111             register_chars[c] = c;
3112             operand_chars[c] = c;
3113           }
3114         else if (ISLOWER (c))
3115           {
3116             mnemonic_chars[c] = c;
3117             register_chars[c] = c;
3118             operand_chars[c] = c;
3119           }
3120         else if (ISUPPER (c))
3121           {
3122             mnemonic_chars[c] = TOLOWER (c);
3123             register_chars[c] = mnemonic_chars[c];
3124             operand_chars[c] = c;
3125           }
3126         else if (c == '{' || c == '}')
3127           {
3128             mnemonic_chars[c] = c;
3129             operand_chars[c] = c;
3130           }
3131 #ifdef SVR4_COMMENT_CHARS
3132         else if (c == '\\' && strchr (i386_comment_chars, '/'))
3133           operand_chars[c] = c;
3134 #endif
3135
3136         if (ISALPHA (c) || ISDIGIT (c))
3137           identifier_chars[c] = c;
3138         else if (c >= 128)
3139           {
3140             identifier_chars[c] = c;
3141             operand_chars[c] = c;
3142           }
3143       }
3144
3145 #ifdef LEX_AT
3146     identifier_chars['@'] = '@';
3147 #endif
3148 #ifdef LEX_QM
3149     identifier_chars['?'] = '?';
3150     operand_chars['?'] = '?';
3151 #endif
3152     digit_chars['-'] = '-';
3153     mnemonic_chars['_'] = '_';
3154     mnemonic_chars['-'] = '-';
3155     mnemonic_chars['.'] = '.';
3156     identifier_chars['_'] = '_';
3157     identifier_chars['.'] = '.';
3158
3159     for (p = operand_special_chars; *p != '\0'; p++)
3160       operand_chars[(unsigned char) *p] = *p;
3161   }
3162
3163   if (flag_code == CODE_64BIT)
3164     {
3165 #if defined (OBJ_COFF) && defined (TE_PE)
3166       x86_dwarf2_return_column = (OUTPUT_FLAVOR == bfd_target_coff_flavour
3167                                   ? 32 : 16);
3168 #else
3169       x86_dwarf2_return_column = 16;
3170 #endif
3171       x86_cie_data_alignment = -8;
3172     }
3173   else
3174     {
3175       x86_dwarf2_return_column = 8;
3176       x86_cie_data_alignment = -4;
3177     }
3178
3179   /* NB: FUSED_JCC_PADDING frag must have sufficient room so that it
3180      can be turned into BRANCH_PREFIX frag.  */
3181   if (align_branch_prefix_size > MAX_FUSED_JCC_PADDING_SIZE)
3182     abort ();
3183 }
3184
3185 void
3186 i386_print_statistics (FILE *file)
3187 {
3188   htab_print_statistics (file, "i386 opcode", op_hash);
3189   htab_print_statistics (file, "i386 register", reg_hash);
3190 }
3191 \f
3192 #ifdef DEBUG386
3193
3194 /* Debugging routines for md_assemble.  */
3195 static void pte (insn_template *);
3196 static void pt (i386_operand_type);
3197 static void pe (expressionS *);
3198 static void ps (symbolS *);
3199
3200 static void
3201 pi (const char *line, i386_insn *x)
3202 {
3203   unsigned int j;
3204
3205   fprintf (stdout, "%s: template ", line);
3206   pte (&x->tm);
3207   fprintf (stdout, "  address: base %s  index %s  scale %x\n",
3208            x->base_reg ? x->base_reg->reg_name : "none",
3209            x->index_reg ? x->index_reg->reg_name : "none",
3210            x->log2_scale_factor);
3211   fprintf (stdout, "  modrm:  mode %x  reg %x  reg/mem %x\n",
3212            x->rm.mode, x->rm.reg, x->rm.regmem);
3213   fprintf (stdout, "  sib:  base %x  index %x  scale %x\n",
3214            x->sib.base, x->sib.index, x->sib.scale);
3215   fprintf (stdout, "  rex: 64bit %x  extX %x  extY %x  extZ %x\n",
3216            (x->rex & REX_W) != 0,
3217            (x->rex & REX_R) != 0,
3218            (x->rex & REX_X) != 0,
3219            (x->rex & REX_B) != 0);
3220   for (j = 0; j < x->operands; j++)
3221     {
3222       fprintf (stdout, "    #%d:  ", j + 1);
3223       pt (x->types[j]);
3224       fprintf (stdout, "\n");
3225       if (x->types[j].bitfield.class == Reg
3226           || x->types[j].bitfield.class == RegMMX
3227           || x->types[j].bitfield.class == RegSIMD
3228           || x->types[j].bitfield.class == RegMask
3229           || x->types[j].bitfield.class == SReg
3230           || x->types[j].bitfield.class == RegCR
3231           || x->types[j].bitfield.class == RegDR
3232           || x->types[j].bitfield.class == RegTR
3233           || x->types[j].bitfield.class == RegBND)
3234         fprintf (stdout, "%s\n", x->op[j].regs->reg_name);
3235       if (operand_type_check (x->types[j], imm))
3236         pe (x->op[j].imms);
3237       if (operand_type_check (x->types[j], disp))
3238         pe (x->op[j].disps);
3239     }
3240 }
3241
3242 static void
3243 pte (insn_template *t)
3244 {
3245   static const unsigned char opc_pfx[] = { 0, 0x66, 0xf3, 0xf2 };
3246   static const char *const opc_spc[] = {
3247     NULL, "0f", "0f38", "0f3a", NULL, NULL, NULL, NULL,
3248     "XOP08", "XOP09", "XOP0A",
3249   };
3250   unsigned int j;
3251
3252   fprintf (stdout, " %d operands ", t->operands);
3253   if (opc_pfx[t->opcode_modifier.opcodeprefix])
3254     fprintf (stdout, "pfx %x ", opc_pfx[t->opcode_modifier.opcodeprefix]);
3255   if (opc_spc[t->opcode_modifier.opcodespace])
3256     fprintf (stdout, "space %s ", opc_spc[t->opcode_modifier.opcodespace]);
3257   fprintf (stdout, "opcode %x ", t->base_opcode);
3258   if (t->extension_opcode != None)
3259     fprintf (stdout, "ext %x ", t->extension_opcode);
3260   if (t->opcode_modifier.d)
3261     fprintf (stdout, "D");
3262   if (t->opcode_modifier.w)
3263     fprintf (stdout, "W");
3264   fprintf (stdout, "\n");
3265   for (j = 0; j < t->operands; j++)
3266     {
3267       fprintf (stdout, "    #%d type ", j + 1);
3268       pt (t->operand_types[j]);
3269       fprintf (stdout, "\n");
3270     }
3271 }
3272
3273 static void
3274 pe (expressionS *e)
3275 {
3276   fprintf (stdout, "    operation     %d\n", e->X_op);
3277   fprintf (stdout, "    add_number    %ld (%lx)\n",
3278            (long) e->X_add_number, (long) e->X_add_number);
3279   if (e->X_add_symbol)
3280     {
3281       fprintf (stdout, "    add_symbol    ");
3282       ps (e->X_add_symbol);
3283       fprintf (stdout, "\n");
3284     }
3285   if (e->X_op_symbol)
3286     {
3287       fprintf (stdout, "    op_symbol    ");
3288       ps (e->X_op_symbol);
3289       fprintf (stdout, "\n");
3290     }
3291 }
3292
3293 static void
3294 ps (symbolS *s)
3295 {
3296   fprintf (stdout, "%s type %s%s",
3297            S_GET_NAME (s),
3298            S_IS_EXTERNAL (s) ? "EXTERNAL " : "",
3299            segment_name (S_GET_SEGMENT (s)));
3300 }
3301
3302 static struct type_name
3303   {
3304     i386_operand_type mask;
3305     const char *name;
3306   }
3307 const type_names[] =
3308 {
3309   { OPERAND_TYPE_REG8, "r8" },
3310   { OPERAND_TYPE_REG16, "r16" },
3311   { OPERAND_TYPE_REG32, "r32" },
3312   { OPERAND_TYPE_REG64, "r64" },
3313   { OPERAND_TYPE_ACC8, "acc8" },
3314   { OPERAND_TYPE_ACC16, "acc16" },
3315   { OPERAND_TYPE_ACC32, "acc32" },
3316   { OPERAND_TYPE_ACC64, "acc64" },
3317   { OPERAND_TYPE_IMM8, "i8" },
3318   { OPERAND_TYPE_IMM8, "i8s" },
3319   { OPERAND_TYPE_IMM16, "i16" },
3320   { OPERAND_TYPE_IMM32, "i32" },
3321   { OPERAND_TYPE_IMM32S, "i32s" },
3322   { OPERAND_TYPE_IMM64, "i64" },
3323   { OPERAND_TYPE_IMM1, "i1" },
3324   { OPERAND_TYPE_BASEINDEX, "BaseIndex" },
3325   { OPERAND_TYPE_DISP8, "d8" },
3326   { OPERAND_TYPE_DISP16, "d16" },
3327   { OPERAND_TYPE_DISP32, "d32" },
3328   { OPERAND_TYPE_DISP32S, "d32s" },
3329   { OPERAND_TYPE_DISP64, "d64" },
3330   { OPERAND_TYPE_INOUTPORTREG, "InOutPortReg" },
3331   { OPERAND_TYPE_SHIFTCOUNT, "ShiftCount" },
3332   { OPERAND_TYPE_CONTROL, "control reg" },
3333   { OPERAND_TYPE_TEST, "test reg" },
3334   { OPERAND_TYPE_DEBUG, "debug reg" },
3335   { OPERAND_TYPE_FLOATREG, "FReg" },
3336   { OPERAND_TYPE_FLOATACC, "FAcc" },
3337   { OPERAND_TYPE_SREG, "SReg" },
3338   { OPERAND_TYPE_REGMMX, "rMMX" },
3339   { OPERAND_TYPE_REGXMM, "rXMM" },
3340   { OPERAND_TYPE_REGYMM, "rYMM" },
3341   { OPERAND_TYPE_REGZMM, "rZMM" },
3342   { OPERAND_TYPE_REGTMM, "rTMM" },
3343   { OPERAND_TYPE_REGMASK, "Mask reg" },
3344 };
3345
3346 static void
3347 pt (i386_operand_type t)
3348 {
3349   unsigned int j;
3350   i386_operand_type a;
3351
3352   for (j = 0; j < ARRAY_SIZE (type_names); j++)
3353     {
3354       a = operand_type_and (t, type_names[j].mask);
3355       if (operand_type_equal (&a, &type_names[j].mask))
3356         fprintf (stdout, "%s, ",  type_names[j].name);
3357     }
3358   fflush (stdout);
3359 }
3360
3361 #endif /* DEBUG386 */
3362 \f
3363 static bfd_reloc_code_real_type
3364 reloc (unsigned int size,
3365        int pcrel,
3366        int sign,
3367        bfd_reloc_code_real_type other)
3368 {
3369   if (other != NO_RELOC)
3370     {
3371       reloc_howto_type *rel;
3372
3373       if (size == 8)
3374         switch (other)
3375           {
3376           case BFD_RELOC_X86_64_GOT32:
3377             return BFD_RELOC_X86_64_GOT64;
3378             break;
3379           case BFD_RELOC_X86_64_GOTPLT64:
3380             return BFD_RELOC_X86_64_GOTPLT64;
3381             break;
3382           case BFD_RELOC_X86_64_PLTOFF64:
3383             return BFD_RELOC_X86_64_PLTOFF64;
3384             break;
3385           case BFD_RELOC_X86_64_GOTPC32:
3386             other = BFD_RELOC_X86_64_GOTPC64;
3387             break;
3388           case BFD_RELOC_X86_64_GOTPCREL:
3389             other = BFD_RELOC_X86_64_GOTPCREL64;
3390             break;
3391           case BFD_RELOC_X86_64_TPOFF32:
3392             other = BFD_RELOC_X86_64_TPOFF64;
3393             break;
3394           case BFD_RELOC_X86_64_DTPOFF32:
3395             other = BFD_RELOC_X86_64_DTPOFF64;
3396             break;
3397           default:
3398             break;
3399           }
3400
3401 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
3402       if (other == BFD_RELOC_SIZE32)
3403         {
3404           if (size == 8)
3405             other = BFD_RELOC_SIZE64;
3406           if (pcrel)
3407             {
3408               as_bad (_("there are no pc-relative size relocations"));
3409               return NO_RELOC;
3410             }
3411         }
3412 #endif
3413
3414       /* Sign-checking 4-byte relocations in 16-/32-bit code is pointless.  */
3415       if (size == 4 && (flag_code != CODE_64BIT || disallow_64bit_reloc))
3416         sign = -1;
3417
3418       rel = bfd_reloc_type_lookup (stdoutput, other);
3419       if (!rel)
3420         as_bad (_("unknown relocation (%u)"), other);
3421       else if (size != bfd_get_reloc_size (rel))
3422         as_bad (_("%u-byte relocation cannot be applied to %u-byte field"),
3423                 bfd_get_reloc_size (rel),
3424                 size);
3425       else if (pcrel && !rel->pc_relative)
3426         as_bad (_("non-pc-relative relocation for pc-relative field"));
3427       else if ((rel->complain_on_overflow == complain_overflow_signed
3428                 && !sign)
3429                || (rel->complain_on_overflow == complain_overflow_unsigned
3430                    && sign > 0))
3431         as_bad (_("relocated field and relocation type differ in signedness"));
3432       else
3433         return other;
3434       return NO_RELOC;
3435     }
3436
3437   if (pcrel)
3438     {
3439       if (!sign)
3440         as_bad (_("there are no unsigned pc-relative relocations"));
3441       switch (size)
3442         {
3443         case 1: return BFD_RELOC_8_PCREL;
3444         case 2: return BFD_RELOC_16_PCREL;
3445         case 4: return BFD_RELOC_32_PCREL;
3446         case 8: return BFD_RELOC_64_PCREL;
3447         }
3448       as_bad (_("cannot do %u byte pc-relative relocation"), size);
3449     }
3450   else
3451     {
3452       if (sign > 0)
3453         switch (size)
3454           {
3455           case 4: return BFD_RELOC_X86_64_32S;
3456           }
3457       else
3458         switch (size)
3459           {
3460           case 1: return BFD_RELOC_8;
3461           case 2: return BFD_RELOC_16;
3462           case 4: return BFD_RELOC_32;
3463           case 8: return BFD_RELOC_64;
3464           }
3465       as_bad (_("cannot do %s %u byte relocation"),
3466               sign > 0 ? "signed" : "unsigned", size);
3467     }
3468
3469   return NO_RELOC;
3470 }
3471
3472 /* Here we decide which fixups can be adjusted to make them relative to
3473    the beginning of the section instead of the symbol.  Basically we need
3474    to make sure that the dynamic relocations are done correctly, so in
3475    some cases we force the original symbol to be used.  */
3476
3477 int
3478 tc_i386_fix_adjustable (fixS *fixP ATTRIBUTE_UNUSED)
3479 {
3480 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
3481   if (!IS_ELF)
3482     return 1;
3483
3484   /* Don't adjust pc-relative references to merge sections in 64-bit
3485      mode.  */
3486   if (use_rela_relocations
3487       && (S_GET_SEGMENT (fixP->fx_addsy)->flags & SEC_MERGE) != 0
3488       && fixP->fx_pcrel)
3489     return 0;
3490
3491   /* The x86_64 GOTPCREL are represented as 32bit PCrel relocations
3492      and changed later by validate_fix.  */
3493   if (GOT_symbol && fixP->fx_subsy == GOT_symbol
3494       && fixP->fx_r_type == BFD_RELOC_32_PCREL)
3495     return 0;
3496
3497   /* Adjust_reloc_syms doesn't know about the GOT.  Need to keep symbol
3498      for size relocations.  */
3499   if (fixP->fx_r_type == BFD_RELOC_SIZE32
3500       || fixP->fx_r_type == BFD_RELOC_SIZE64
3501       || fixP->fx_r_type == BFD_RELOC_386_GOTOFF
3502       || fixP->fx_r_type == BFD_RELOC_386_GOT32
3503       || fixP->fx_r_type == BFD_RELOC_386_GOT32X
3504       || fixP->fx_r_type == BFD_RELOC_386_TLS_GD
3505       || fixP->fx_r_type == BFD_RELOC_386_TLS_LDM
3506       || fixP->fx_r_type == BFD_RELOC_386_TLS_LDO_32
3507       || fixP->fx_r_type == BFD_RELOC_386_TLS_IE_32
3508       || fixP->fx_r_type == BFD_RELOC_386_TLS_IE
3509       || fixP->fx_r_type == BFD_RELOC_386_TLS_GOTIE
3510       || fixP->fx_r_type == BFD_RELOC_386_TLS_LE_32
3511       || fixP->fx_r_type == BFD_RELOC_386_TLS_LE
3512       || fixP->fx_r_type == BFD_RELOC_386_TLS_GOTDESC
3513       || fixP->fx_r_type == BFD_RELOC_386_TLS_DESC_CALL
3514       || fixP->fx_r_type == BFD_RELOC_X86_64_GOT32
3515       || fixP->fx_r_type == BFD_RELOC_X86_64_GOTPCREL
3516       || fixP->fx_r_type == BFD_RELOC_X86_64_GOTPCRELX
3517       || fixP->fx_r_type == BFD_RELOC_X86_64_REX_GOTPCRELX
3518       || fixP->fx_r_type == BFD_RELOC_X86_64_TLSGD
3519       || fixP->fx_r_type == BFD_RELOC_X86_64_TLSLD
3520       || fixP->fx_r_type == BFD_RELOC_X86_64_DTPOFF32
3521       || fixP->fx_r_type == BFD_RELOC_X86_64_DTPOFF64
3522       || fixP->fx_r_type == BFD_RELOC_X86_64_GOTTPOFF
3523       || fixP->fx_r_type == BFD_RELOC_X86_64_TPOFF32
3524       || fixP->fx_r_type == BFD_RELOC_X86_64_TPOFF64
3525       || fixP->fx_r_type == BFD_RELOC_X86_64_GOTOFF64
3526       || fixP->fx_r_type == BFD_RELOC_X86_64_GOTPC32_TLSDESC
3527       || fixP->fx_r_type == BFD_RELOC_X86_64_TLSDESC_CALL
3528       || fixP->fx_r_type == BFD_RELOC_VTABLE_INHERIT
3529       || fixP->fx_r_type == BFD_RELOC_VTABLE_ENTRY)
3530     return 0;
3531 #endif
3532   return 1;
3533 }
3534
3535 static int
3536 intel_float_operand (const char *mnemonic)
3537 {
3538   /* Note that the value returned is meaningful only for opcodes with (memory)
3539      operands, hence the code here is free to improperly handle opcodes that
3540      have no operands (for better performance and smaller code). */
3541
3542   if (mnemonic[0] != 'f')
3543     return 0; /* non-math */
3544
3545   switch (mnemonic[1])
3546     {
3547     /* fclex, fdecstp, fdisi, femms, feni, fincstp, finit, fsetpm, and
3548        the fs segment override prefix not currently handled because no
3549        call path can make opcodes without operands get here */
3550     case 'i':
3551       return 2 /* integer op */;
3552     case 'l':
3553       if (mnemonic[2] == 'd' && (mnemonic[3] == 'c' || mnemonic[3] == 'e'))
3554         return 3; /* fldcw/fldenv */
3555       break;
3556     case 'n':
3557       if (mnemonic[2] != 'o' /* fnop */)
3558         return 3; /* non-waiting control op */
3559       break;
3560     case 'r':
3561       if (mnemonic[2] == 's')
3562         return 3; /* frstor/frstpm */
3563       break;
3564     case 's':
3565       if (mnemonic[2] == 'a')
3566         return 3; /* fsave */
3567       if (mnemonic[2] == 't')
3568         {
3569           switch (mnemonic[3])
3570             {
3571             case 'c': /* fstcw */
3572             case 'd': /* fstdw */
3573             case 'e': /* fstenv */
3574             case 's': /* fsts[gw] */
3575               return 3;
3576             }
3577         }
3578       break;
3579     case 'x':
3580       if (mnemonic[2] == 'r' || mnemonic[2] == 's')
3581         return 0; /* fxsave/fxrstor are not really math ops */
3582       break;
3583     }
3584
3585   return 1;
3586 }
3587
3588 static INLINE void
3589 install_template (const insn_template *t)
3590 {
3591   unsigned int l;
3592
3593   i.tm = *t;
3594
3595   /* Note that for pseudo prefixes this produces a length of 1. But for them
3596      the length isn't interesting at all.  */
3597   for (l = 1; l < 4; ++l)
3598     if (!(t->base_opcode >> (8 * l)))
3599       break;
3600
3601   i.opcode_length = l;
3602 }
3603
3604 /* Build the VEX prefix.  */
3605
3606 static void
3607 build_vex_prefix (const insn_template *t)
3608 {
3609   unsigned int register_specifier;
3610   unsigned int vector_length;
3611   unsigned int w;
3612
3613   /* Check register specifier.  */
3614   if (i.vex.register_specifier)
3615     {
3616       register_specifier =
3617         ~register_number (i.vex.register_specifier) & 0xf;
3618       gas_assert ((i.vex.register_specifier->reg_flags & RegVRex) == 0);
3619     }
3620   else
3621     register_specifier = 0xf;
3622
3623   /* Use 2-byte VEX prefix by swapping destination and source operand
3624      if there are more than 1 register operand.  */
3625   if (i.reg_operands > 1
3626       && i.vec_encoding != vex_encoding_vex3
3627       && i.dir_encoding == dir_encoding_default
3628       && i.operands == i.reg_operands
3629       && operand_type_equal (&i.types[0], &i.types[i.operands - 1])
3630       && i.tm.opcode_modifier.opcodespace == SPACE_0F
3631       && (i.tm.opcode_modifier.load || i.tm.opcode_modifier.d)
3632       && i.rex == REX_B)
3633     {
3634       unsigned int xchg = i.operands - 1;
3635       union i386_op temp_op;
3636       i386_operand_type temp_type;
3637
3638       temp_type = i.types[xchg];
3639       i.types[xchg] = i.types[0];
3640       i.types[0] = temp_type;
3641       temp_op = i.op[xchg];
3642       i.op[xchg] = i.op[0];
3643       i.op[0] = temp_op;
3644
3645       gas_assert (i.rm.mode == 3);
3646
3647       i.rex = REX_R;
3648       xchg = i.rm.regmem;
3649       i.rm.regmem = i.rm.reg;
3650       i.rm.reg = xchg;
3651
3652       if (i.tm.opcode_modifier.d)
3653         i.tm.base_opcode ^= (i.tm.base_opcode & 0xee) != 0x6e
3654                             ? Opcode_SIMD_FloatD : Opcode_SIMD_IntD;
3655       else /* Use the next insn.  */
3656         install_template (&t[1]);
3657     }
3658
3659   /* Use 2-byte VEX prefix by swapping commutative source operands if there
3660      are no memory operands and at least 3 register ones.  */
3661   if (i.reg_operands >= 3
3662       && i.vec_encoding != vex_encoding_vex3
3663       && i.reg_operands == i.operands - i.imm_operands
3664       && i.tm.opcode_modifier.vex
3665       && i.tm.opcode_modifier.commutative
3666       && (i.tm.opcode_modifier.sse2avx || optimize > 1)
3667       && i.rex == REX_B
3668       && i.vex.register_specifier
3669       && !(i.vex.register_specifier->reg_flags & RegRex))
3670     {
3671       unsigned int xchg = i.operands - i.reg_operands;
3672       union i386_op temp_op;
3673       i386_operand_type temp_type;
3674
3675       gas_assert (i.tm.opcode_modifier.opcodespace == SPACE_0F);
3676       gas_assert (!i.tm.opcode_modifier.sae);
3677       gas_assert (operand_type_equal (&i.types[i.operands - 2],
3678                                       &i.types[i.operands - 3]));
3679       gas_assert (i.rm.mode == 3);
3680
3681       temp_type = i.types[xchg];
3682       i.types[xchg] = i.types[xchg + 1];
3683       i.types[xchg + 1] = temp_type;
3684       temp_op = i.op[xchg];
3685       i.op[xchg] = i.op[xchg + 1];
3686       i.op[xchg + 1] = temp_op;
3687
3688       i.rex = 0;
3689       xchg = i.rm.regmem | 8;
3690       i.rm.regmem = ~register_specifier & 0xf;
3691       gas_assert (!(i.rm.regmem & 8));
3692       i.vex.register_specifier += xchg - i.rm.regmem;
3693       register_specifier = ~xchg & 0xf;
3694     }
3695
3696   if (i.tm.opcode_modifier.vex == VEXScalar)
3697     vector_length = avxscalar;
3698   else if (i.tm.opcode_modifier.vex == VEX256)
3699     vector_length = 1;
3700   else
3701     {
3702       unsigned int op;
3703
3704       /* Determine vector length from the last multi-length vector
3705          operand.  */
3706       vector_length = 0;
3707       for (op = t->operands; op--;)
3708         if (t->operand_types[op].bitfield.xmmword
3709             && t->operand_types[op].bitfield.ymmword
3710             && i.types[op].bitfield.ymmword)
3711           {
3712             vector_length = 1;
3713             break;
3714           }
3715     }
3716
3717   /* Check the REX.W bit and VEXW.  */
3718   if (i.tm.opcode_modifier.vexw == VEXWIG)
3719     w = (vexwig == vexw1 || (i.rex & REX_W)) ? 1 : 0;
3720   else if (i.tm.opcode_modifier.vexw)
3721     w = i.tm.opcode_modifier.vexw == VEXW1 ? 1 : 0;
3722   else
3723     w = (flag_code == CODE_64BIT ? i.rex & REX_W : vexwig == vexw1) ? 1 : 0;
3724
3725   /* Use 2-byte VEX prefix if possible.  */
3726   if (w == 0
3727       && i.vec_encoding != vex_encoding_vex3
3728       && i.tm.opcode_modifier.opcodespace == SPACE_0F
3729       && (i.rex & (REX_W | REX_X | REX_B)) == 0)
3730     {
3731       /* 2-byte VEX prefix.  */
3732       unsigned int r;
3733
3734       i.vex.length = 2;
3735       i.vex.bytes[0] = 0xc5;
3736
3737       /* Check the REX.R bit.  */
3738       r = (i.rex & REX_R) ? 0 : 1;
3739       i.vex.bytes[1] = (r << 7
3740                         | register_specifier << 3
3741                         | vector_length << 2
3742                         | i.tm.opcode_modifier.opcodeprefix);
3743     }
3744   else
3745     {
3746       /* 3-byte VEX prefix.  */
3747       i.vex.length = 3;
3748
3749       switch (i.tm.opcode_modifier.opcodespace)
3750         {
3751         case SPACE_0F:
3752         case SPACE_0F38:
3753         case SPACE_0F3A:
3754           i.vex.bytes[0] = 0xc4;
3755           break;
3756         case SPACE_XOP08:
3757         case SPACE_XOP09:
3758         case SPACE_XOP0A:
3759           i.vex.bytes[0] = 0x8f;
3760           break;
3761         default:
3762           abort ();
3763         }
3764
3765       /* The high 3 bits of the second VEX byte are 1's compliment
3766          of RXB bits from REX.  */
3767       i.vex.bytes[1] = (~i.rex & 0x7) << 5 | i.tm.opcode_modifier.opcodespace;
3768
3769       i.vex.bytes[2] = (w << 7
3770                         | register_specifier << 3
3771                         | vector_length << 2
3772                         | i.tm.opcode_modifier.opcodeprefix);
3773     }
3774 }
3775
3776 static INLINE bfd_boolean
3777 is_evex_encoding (const insn_template *t)
3778 {
3779   return t->opcode_modifier.evex || t->opcode_modifier.disp8memshift
3780          || t->opcode_modifier.broadcast || t->opcode_modifier.masking
3781          || t->opcode_modifier.sae;
3782 }
3783
3784 static INLINE bfd_boolean
3785 is_any_vex_encoding (const insn_template *t)
3786 {
3787   return t->opcode_modifier.vex || is_evex_encoding (t);
3788 }
3789
3790 /* Build the EVEX prefix.  */
3791
3792 static void
3793 build_evex_prefix (void)
3794 {
3795   unsigned int register_specifier, w;
3796   rex_byte vrex_used = 0;
3797
3798   /* Check register specifier.  */
3799   if (i.vex.register_specifier)
3800     {
3801       gas_assert ((i.vrex & REX_X) == 0);
3802
3803       register_specifier = i.vex.register_specifier->reg_num;
3804       if ((i.vex.register_specifier->reg_flags & RegRex))
3805         register_specifier += 8;
3806       /* The upper 16 registers are encoded in the fourth byte of the
3807          EVEX prefix.  */
3808       if (!(i.vex.register_specifier->reg_flags & RegVRex))
3809         i.vex.bytes[3] = 0x8;
3810       register_specifier = ~register_specifier & 0xf;
3811     }
3812   else
3813     {
3814       register_specifier = 0xf;
3815
3816       /* Encode upper 16 vector index register in the fourth byte of
3817          the EVEX prefix.  */
3818       if (!(i.vrex & REX_X))
3819         i.vex.bytes[3] = 0x8;
3820       else
3821         vrex_used |= REX_X;
3822     }
3823
3824   /* 4 byte EVEX prefix.  */
3825   i.vex.length = 4;
3826   i.vex.bytes[0] = 0x62;
3827
3828   /* The high 3 bits of the second EVEX byte are 1's compliment of RXB
3829      bits from REX.  */
3830   gas_assert (i.tm.opcode_modifier.opcodespace >= SPACE_0F);
3831   gas_assert (i.tm.opcode_modifier.opcodespace <= SPACE_0F3A);
3832   i.vex.bytes[1] = (~i.rex & 0x7) << 5 | i.tm.opcode_modifier.opcodespace;
3833
3834   /* The fifth bit of the second EVEX byte is 1's compliment of the
3835      REX_R bit in VREX.  */
3836   if (!(i.vrex & REX_R))
3837     i.vex.bytes[1] |= 0x10;
3838   else
3839     vrex_used |= REX_R;
3840
3841   if ((i.reg_operands + i.imm_operands) == i.operands)
3842     {
3843       /* When all operands are registers, the REX_X bit in REX is not
3844          used.  We reuse it to encode the upper 16 registers, which is
3845          indicated by the REX_B bit in VREX.  The REX_X bit is encoded
3846          as 1's compliment.  */
3847       if ((i.vrex & REX_B))
3848         {
3849           vrex_used |= REX_B;
3850           i.vex.bytes[1] &= ~0x40;
3851         }
3852     }
3853
3854   /* EVEX instructions shouldn't need the REX prefix.  */
3855   i.vrex &= ~vrex_used;
3856   gas_assert (i.vrex == 0);
3857
3858   /* Check the REX.W bit and VEXW.  */
3859   if (i.tm.opcode_modifier.vexw == VEXWIG)
3860     w = (evexwig == evexw1 || (i.rex & REX_W)) ? 1 : 0;
3861   else if (i.tm.opcode_modifier.vexw)
3862     w = i.tm.opcode_modifier.vexw == VEXW1 ? 1 : 0;
3863   else
3864     w = (flag_code == CODE_64BIT ? i.rex & REX_W : evexwig == evexw1) ? 1 : 0;
3865
3866   /* The third byte of the EVEX prefix.  */
3867   i.vex.bytes[2] = ((w << 7)
3868                     | (register_specifier << 3)
3869                     | 4 /* Encode the U bit.  */
3870                     | i.tm.opcode_modifier.opcodeprefix);
3871
3872   /* The fourth byte of the EVEX prefix.  */
3873   /* The zeroing-masking bit.  */
3874   if (i.mask && i.mask->zeroing)
3875     i.vex.bytes[3] |= 0x80;
3876
3877   /* Don't always set the broadcast bit if there is no RC.  */
3878   if (!i.rounding)
3879     {
3880       /* Encode the vector length.  */
3881       unsigned int vec_length;
3882
3883       if (!i.tm.opcode_modifier.evex
3884           || i.tm.opcode_modifier.evex == EVEXDYN)
3885         {
3886           unsigned int op;
3887
3888           /* Determine vector length from the last multi-length vector
3889              operand.  */
3890           for (op = i.operands; op--;)
3891             if (i.tm.operand_types[op].bitfield.xmmword
3892                 + i.tm.operand_types[op].bitfield.ymmword
3893                 + i.tm.operand_types[op].bitfield.zmmword > 1)
3894               {
3895                 if (i.types[op].bitfield.zmmword)
3896                   {
3897                     i.tm.opcode_modifier.evex = EVEX512;
3898                     break;
3899                   }
3900                 else if (i.types[op].bitfield.ymmword)
3901                   {
3902                     i.tm.opcode_modifier.evex = EVEX256;
3903                     break;
3904                   }
3905                 else if (i.types[op].bitfield.xmmword)
3906                   {
3907                     i.tm.opcode_modifier.evex = EVEX128;
3908                     break;
3909                   }
3910                 else if (i.broadcast && (int) op == i.broadcast->operand)
3911                   {
3912                     switch (i.broadcast->bytes)
3913                       {
3914                         case 64:
3915                           i.tm.opcode_modifier.evex = EVEX512;
3916                           break;
3917                         case 32:
3918                           i.tm.opcode_modifier.evex = EVEX256;
3919                           break;
3920                         case 16:
3921                           i.tm.opcode_modifier.evex = EVEX128;
3922                           break;
3923                         default:
3924                           abort ();
3925                       }
3926                     break;
3927                   }
3928               }
3929
3930           if (op >= MAX_OPERANDS)
3931             abort ();
3932         }
3933
3934       switch (i.tm.opcode_modifier.evex)
3935         {
3936         case EVEXLIG: /* LL' is ignored */
3937           vec_length = evexlig << 5;
3938           break;
3939         case EVEX128:
3940           vec_length = 0 << 5;
3941           break;
3942         case EVEX256:
3943           vec_length = 1 << 5;
3944           break;
3945         case EVEX512:
3946           vec_length = 2 << 5;
3947           break;
3948         default:
3949           abort ();
3950           break;
3951         }
3952       i.vex.bytes[3] |= vec_length;
3953       /* Encode the broadcast bit.  */
3954       if (i.broadcast)
3955         i.vex.bytes[3] |= 0x10;
3956     }
3957   else
3958     {
3959       if (i.rounding->type != saeonly)
3960         i.vex.bytes[3] |= 0x10 | (i.rounding->type << 5);
3961       else
3962         i.vex.bytes[3] |= 0x10 | (evexrcig << 5);
3963     }
3964
3965   if (i.mask && i.mask->mask)
3966     i.vex.bytes[3] |= i.mask->mask->reg_num;
3967 }
3968
3969 static void
3970 process_immext (void)
3971 {
3972   expressionS *exp;
3973
3974   /* These AMD 3DNow! and SSE2 instructions have an opcode suffix
3975      which is coded in the same place as an 8-bit immediate field
3976      would be.  Here we fake an 8-bit immediate operand from the
3977      opcode suffix stored in tm.extension_opcode.
3978
3979      AVX instructions also use this encoding, for some of
3980      3 argument instructions.  */
3981
3982   gas_assert (i.imm_operands <= 1
3983               && (i.operands <= 2
3984                   || (is_any_vex_encoding (&i.tm)
3985                       && i.operands <= 4)));
3986
3987   exp = &im_expressions[i.imm_operands++];
3988   i.op[i.operands].imms = exp;
3989   i.types[i.operands] = imm8;
3990   i.operands++;
3991   exp->X_op = O_constant;
3992   exp->X_add_number = i.tm.extension_opcode;
3993   i.tm.extension_opcode = None;
3994 }
3995
3996
3997 static int
3998 check_hle (void)
3999 {
4000   switch (i.tm.opcode_modifier.prefixok)
4001     {
4002     default:
4003       abort ();
4004     case PrefixLock:
4005     case PrefixNone:
4006     case PrefixNoTrack:
4007     case PrefixRep:
4008       as_bad (_("invalid instruction `%s' after `%s'"),
4009               i.tm.name, i.hle_prefix);
4010       return 0;
4011     case PrefixHLELock:
4012       if (i.prefix[LOCK_PREFIX])
4013         return 1;
4014       as_bad (_("missing `lock' with `%s'"), i.hle_prefix);
4015       return 0;
4016     case PrefixHLEAny:
4017       return 1;
4018     case PrefixHLERelease:
4019       if (i.prefix[HLE_PREFIX] != XRELEASE_PREFIX_OPCODE)
4020         {
4021           as_bad (_("instruction `%s' after `xacquire' not allowed"),
4022                   i.tm.name);
4023           return 0;
4024         }
4025       if (i.mem_operands == 0 || !(i.flags[i.operands - 1] & Operand_Mem))
4026         {
4027           as_bad (_("memory destination needed for instruction `%s'"
4028                     " after `xrelease'"), i.tm.name);
4029           return 0;
4030         }
4031       return 1;
4032     }
4033 }
4034
4035 /* Try the shortest encoding by shortening operand size.  */
4036
4037 static void
4038 optimize_encoding (void)
4039 {
4040   unsigned int j;
4041
4042   if (optimize_for_space
4043       && !is_any_vex_encoding (&i.tm)
4044       && i.reg_operands == 1
4045       && i.imm_operands == 1
4046       && !i.types[1].bitfield.byte
4047       && i.op[0].imms->X_op == O_constant
4048       && fits_in_imm7 (i.op[0].imms->X_add_number)
4049       && (i.tm.base_opcode == 0xa8
4050           || (i.tm.base_opcode == 0xf6
4051               && i.tm.extension_opcode == 0x0)))
4052     {
4053       /* Optimize: -Os:
4054            test $imm7, %r64/%r32/%r16  -> test $imm7, %r8
4055        */
4056       unsigned int base_regnum = i.op[1].regs->reg_num;
4057       if (flag_code == CODE_64BIT || base_regnum < 4)
4058         {
4059           i.types[1].bitfield.byte = 1;
4060           /* Ignore the suffix.  */
4061           i.suffix = 0;
4062           /* Convert to byte registers.  */
4063           if (i.types[1].bitfield.word)
4064             j = 16;
4065           else if (i.types[1].bitfield.dword)
4066             j = 32;
4067           else
4068             j = 48;
4069           if (!(i.op[1].regs->reg_flags & RegRex) && base_regnum < 4)
4070             j += 8;
4071           i.op[1].regs -= j;
4072         }
4073     }
4074   else if (flag_code == CODE_64BIT
4075            && !is_any_vex_encoding (&i.tm)
4076            && ((i.types[1].bitfield.qword
4077                 && i.reg_operands == 1
4078                 && i.imm_operands == 1
4079                 && i.op[0].imms->X_op == O_constant
4080                 && ((i.tm.base_opcode == 0xb8
4081                      && i.tm.extension_opcode == None
4082                      && fits_in_unsigned_long (i.op[0].imms->X_add_number))
4083                     || (fits_in_imm31 (i.op[0].imms->X_add_number)
4084                         && ((i.tm.base_opcode == 0x24
4085                              || i.tm.base_opcode == 0xa8)
4086                             || (i.tm.base_opcode == 0x80
4087                                 && i.tm.extension_opcode == 0x4)
4088                             || ((i.tm.base_opcode == 0xf6
4089                                  || (i.tm.base_opcode | 1) == 0xc7)
4090                                 && i.tm.extension_opcode == 0x0)))
4091                     || (fits_in_imm7 (i.op[0].imms->X_add_number)
4092                         && i.tm.base_opcode == 0x83
4093                         && i.tm.extension_opcode == 0x4)))
4094                || (i.types[0].bitfield.qword
4095                    && ((i.reg_operands == 2
4096                         && i.op[0].regs == i.op[1].regs
4097                         && (i.tm.base_opcode == 0x30
4098                             || i.tm.base_opcode == 0x28))
4099                        || (i.reg_operands == 1
4100                            && i.operands == 1
4101                            && i.tm.base_opcode == 0x30)))))
4102     {
4103       /* Optimize: -O:
4104            andq $imm31, %r64   -> andl $imm31, %r32
4105            andq $imm7, %r64    -> andl $imm7, %r32
4106            testq $imm31, %r64  -> testl $imm31, %r32
4107            xorq %r64, %r64     -> xorl %r32, %r32
4108            subq %r64, %r64     -> subl %r32, %r32
4109            movq $imm31, %r64   -> movl $imm31, %r32
4110            movq $imm32, %r64   -> movl $imm32, %r32
4111         */
4112       i.tm.opcode_modifier.norex64 = 1;
4113       if (i.tm.base_opcode == 0xb8 || (i.tm.base_opcode | 1) == 0xc7)
4114         {
4115           /* Handle
4116                movq $imm31, %r64   -> movl $imm31, %r32
4117                movq $imm32, %r64   -> movl $imm32, %r32
4118            */
4119           i.tm.operand_types[0].bitfield.imm32 = 1;
4120           i.tm.operand_types[0].bitfield.imm32s = 0;
4121           i.tm.operand_types[0].bitfield.imm64 = 0;
4122           i.types[0].bitfield.imm32 = 1;
4123           i.types[0].bitfield.imm32s = 0;
4124           i.types[0].bitfield.imm64 = 0;
4125           i.types[1].bitfield.dword = 1;
4126           i.types[1].bitfield.qword = 0;
4127           if ((i.tm.base_opcode | 1) == 0xc7)
4128             {
4129               /* Handle
4130                    movq $imm31, %r64   -> movl $imm31, %r32
4131                */
4132               i.tm.base_opcode = 0xb8;
4133               i.tm.extension_opcode = None;
4134               i.tm.opcode_modifier.w = 0;
4135               i.tm.opcode_modifier.modrm = 0;
4136             }
4137         }
4138     }
4139   else if (optimize > 1
4140            && !optimize_for_space
4141            && !is_any_vex_encoding (&i.tm)
4142            && i.reg_operands == 2
4143            && i.op[0].regs == i.op[1].regs
4144            && ((i.tm.base_opcode & ~(Opcode_D | 1)) == 0x8
4145                || (i.tm.base_opcode & ~(Opcode_D | 1)) == 0x20)
4146            && (flag_code != CODE_64BIT || !i.types[0].bitfield.dword))
4147     {
4148       /* Optimize: -O2:
4149            andb %rN, %rN  -> testb %rN, %rN
4150            andw %rN, %rN  -> testw %rN, %rN
4151            andq %rN, %rN  -> testq %rN, %rN
4152            orb %rN, %rN   -> testb %rN, %rN
4153            orw %rN, %rN   -> testw %rN, %rN
4154            orq %rN, %rN   -> testq %rN, %rN
4155
4156            and outside of 64-bit mode
4157
4158            andl %rN, %rN  -> testl %rN, %rN
4159            orl %rN, %rN   -> testl %rN, %rN
4160        */
4161       i.tm.base_opcode = 0x84 | (i.tm.base_opcode & 1);
4162     }
4163   else if (i.reg_operands == 3
4164            && i.op[0].regs == i.op[1].regs
4165            && !i.types[2].bitfield.xmmword
4166            && (i.tm.opcode_modifier.vex
4167                || ((!i.mask || i.mask->zeroing)
4168                    && !i.rounding
4169                    && is_evex_encoding (&i.tm)
4170                    && (i.vec_encoding != vex_encoding_evex
4171                        || cpu_arch_isa_flags.bitfield.cpuavx512vl
4172                        || i.tm.cpu_flags.bitfield.cpuavx512vl
4173                        || (i.tm.operand_types[2].bitfield.zmmword
4174                            && i.types[2].bitfield.ymmword))))
4175            && ((i.tm.base_opcode == 0x55
4176                 || i.tm.base_opcode == 0x57
4177                 || i.tm.base_opcode == 0xdf
4178                 || i.tm.base_opcode == 0xef
4179                 || i.tm.base_opcode == 0xf8
4180                 || i.tm.base_opcode == 0xf9
4181                 || i.tm.base_opcode == 0xfa
4182                 || i.tm.base_opcode == 0xfb
4183                 || i.tm.base_opcode == 0x42
4184                 || i.tm.base_opcode == 0x47)
4185                && i.tm.extension_opcode == None))
4186     {
4187       /* Optimize: -O1:
4188            VOP, one of vandnps, vandnpd, vxorps, vxorpd, vpsubb, vpsubd,
4189            vpsubq and vpsubw:
4190              EVEX VOP %zmmM, %zmmM, %zmmN
4191                -> VEX VOP %xmmM, %xmmM, %xmmN (M and N < 16)
4192                -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4193              EVEX VOP %ymmM, %ymmM, %ymmN
4194                -> VEX VOP %xmmM, %xmmM, %xmmN (M and N < 16)
4195                -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4196              VEX VOP %ymmM, %ymmM, %ymmN
4197                -> VEX VOP %xmmM, %xmmM, %xmmN
4198            VOP, one of vpandn and vpxor:
4199              VEX VOP %ymmM, %ymmM, %ymmN
4200                -> VEX VOP %xmmM, %xmmM, %xmmN
4201            VOP, one of vpandnd and vpandnq:
4202              EVEX VOP %zmmM, %zmmM, %zmmN
4203                -> VEX vpandn %xmmM, %xmmM, %xmmN (M and N < 16)
4204                -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4205              EVEX VOP %ymmM, %ymmM, %ymmN
4206                -> VEX vpandn %xmmM, %xmmM, %xmmN (M and N < 16)
4207                -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4208            VOP, one of vpxord and vpxorq:
4209              EVEX VOP %zmmM, %zmmM, %zmmN
4210                -> VEX vpxor %xmmM, %xmmM, %xmmN (M and N < 16)
4211                -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4212              EVEX VOP %ymmM, %ymmM, %ymmN
4213                -> VEX vpxor %xmmM, %xmmM, %xmmN (M and N < 16)
4214                -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4215            VOP, one of kxord and kxorq:
4216              VEX VOP %kM, %kM, %kN
4217                -> VEX kxorw %kM, %kM, %kN
4218            VOP, one of kandnd and kandnq:
4219              VEX VOP %kM, %kM, %kN
4220                -> VEX kandnw %kM, %kM, %kN
4221        */
4222       if (is_evex_encoding (&i.tm))
4223         {
4224           if (i.vec_encoding != vex_encoding_evex)
4225             {
4226               i.tm.opcode_modifier.vex = VEX128;
4227               i.tm.opcode_modifier.vexw = VEXW0;
4228               i.tm.opcode_modifier.evex = 0;
4229             }
4230           else if (optimize > 1)
4231             i.tm.opcode_modifier.evex = EVEX128;
4232           else
4233             return;
4234         }
4235       else if (i.tm.operand_types[0].bitfield.class == RegMask)
4236         {
4237           i.tm.opcode_modifier.opcodeprefix = PREFIX_NONE;
4238           i.tm.opcode_modifier.vexw = VEXW0;
4239         }
4240       else
4241         i.tm.opcode_modifier.vex = VEX128;
4242
4243       if (i.tm.opcode_modifier.vex)
4244         for (j = 0; j < 3; j++)
4245           {
4246             i.types[j].bitfield.xmmword = 1;
4247             i.types[j].bitfield.ymmword = 0;
4248           }
4249     }
4250   else if (i.vec_encoding != vex_encoding_evex
4251            && !i.types[0].bitfield.zmmword
4252            && !i.types[1].bitfield.zmmword
4253            && !i.mask
4254            && !i.broadcast
4255            && is_evex_encoding (&i.tm)
4256            && ((i.tm.base_opcode & ~Opcode_SIMD_IntD) == 0x6f
4257                || (i.tm.base_opcode & ~4) == 0xdb
4258                || (i.tm.base_opcode & ~4) == 0xeb)
4259            && i.tm.extension_opcode == None)
4260     {
4261       /* Optimize: -O1:
4262            VOP, one of vmovdqa32, vmovdqa64, vmovdqu8, vmovdqu16,
4263            vmovdqu32 and vmovdqu64:
4264              EVEX VOP %xmmM, %xmmN
4265                -> VEX vmovdqa|vmovdqu %xmmM, %xmmN (M and N < 16)
4266              EVEX VOP %ymmM, %ymmN
4267                -> VEX vmovdqa|vmovdqu %ymmM, %ymmN (M and N < 16)
4268              EVEX VOP %xmmM, mem
4269                -> VEX vmovdqa|vmovdqu %xmmM, mem (M < 16)
4270              EVEX VOP %ymmM, mem
4271                -> VEX vmovdqa|vmovdqu %ymmM, mem (M < 16)
4272              EVEX VOP mem, %xmmN
4273                -> VEX mvmovdqa|vmovdquem, %xmmN (N < 16)
4274              EVEX VOP mem, %ymmN
4275                -> VEX vmovdqa|vmovdqu mem, %ymmN (N < 16)
4276            VOP, one of vpand, vpandn, vpor, vpxor:
4277              EVEX VOP{d,q} %xmmL, %xmmM, %xmmN
4278                -> VEX VOP %xmmL, %xmmM, %xmmN (L, M, and N < 16)
4279              EVEX VOP{d,q} %ymmL, %ymmM, %ymmN
4280                -> VEX VOP %ymmL, %ymmM, %ymmN (L, M, and N < 16)
4281              EVEX VOP{d,q} mem, %xmmM, %xmmN
4282                -> VEX VOP mem, %xmmM, %xmmN (M and N < 16)
4283              EVEX VOP{d,q} mem, %ymmM, %ymmN
4284                -> VEX VOP mem, %ymmM, %ymmN (M and N < 16)
4285        */
4286       for (j = 0; j < i.operands; j++)
4287         if (operand_type_check (i.types[j], disp)
4288             && i.op[j].disps->X_op == O_constant)
4289           {
4290             /* Since the VEX prefix has 2 or 3 bytes, the EVEX prefix
4291                has 4 bytes, EVEX Disp8 has 1 byte and VEX Disp32 has 4
4292                bytes, we choose EVEX Disp8 over VEX Disp32.  */
4293             int evex_disp8, vex_disp8;
4294             unsigned int memshift = i.memshift;
4295             offsetT n = i.op[j].disps->X_add_number;
4296
4297             evex_disp8 = fits_in_disp8 (n);
4298             i.memshift = 0;
4299             vex_disp8 = fits_in_disp8 (n);
4300             if (evex_disp8 != vex_disp8)
4301               {
4302                 i.memshift = memshift;
4303                 return;
4304               }
4305
4306             i.types[j].bitfield.disp8 = vex_disp8;
4307             break;
4308           }
4309       if ((i.tm.base_opcode & ~Opcode_SIMD_IntD) == 0x6f
4310           && i.tm.opcode_modifier.opcodeprefix == PREFIX_0XF2)
4311         i.tm.opcode_modifier.opcodeprefix = PREFIX_0XF3;
4312       i.tm.opcode_modifier.vex
4313         = i.types[0].bitfield.ymmword ? VEX256 : VEX128;
4314       i.tm.opcode_modifier.vexw = VEXW0;
4315       /* VPAND, VPOR, and VPXOR are commutative.  */
4316       if (i.reg_operands == 3 && i.tm.base_opcode != 0xdf)
4317         i.tm.opcode_modifier.commutative = 1;
4318       i.tm.opcode_modifier.evex = 0;
4319       i.tm.opcode_modifier.masking = 0;
4320       i.tm.opcode_modifier.broadcast = 0;
4321       i.tm.opcode_modifier.disp8memshift = 0;
4322       i.memshift = 0;
4323       if (j < i.operands)
4324         i.types[j].bitfield.disp8
4325           = fits_in_disp8 (i.op[j].disps->X_add_number);
4326     }
4327 }
4328
4329 /* Return non-zero for load instruction.  */
4330
4331 static int
4332 load_insn_p (void)
4333 {
4334   unsigned int dest;
4335   int any_vex_p = is_any_vex_encoding (&i.tm);
4336   unsigned int base_opcode = i.tm.base_opcode | 1;
4337
4338   if (!any_vex_p)
4339     {
4340       /* Anysize insns: lea, invlpg, clflush, prefetchnta, prefetcht0,
4341          prefetcht1, prefetcht2, prefetchtw, bndmk, bndcl, bndcu, bndcn,
4342          bndstx, bndldx, prefetchwt1, clflushopt, clwb, cldemote.  */
4343       if (i.tm.opcode_modifier.anysize)
4344         return 0;
4345
4346       /* pop, popf, popa.   */
4347       if (strcmp (i.tm.name, "pop") == 0
4348           || i.tm.base_opcode == 0x9d
4349           || i.tm.base_opcode == 0x61)
4350         return 1;
4351
4352       /* movs, cmps, lods, scas.  */
4353       if ((i.tm.base_opcode | 0xb) == 0xaf)
4354         return 1;
4355
4356       /* outs, xlatb.  */
4357       if (base_opcode == 0x6f
4358           || i.tm.base_opcode == 0xd7)
4359         return 1;
4360       /* NB: For AMD-specific insns with implicit memory operands,
4361          they're intentionally not covered.  */
4362     }
4363
4364   /* No memory operand.  */
4365   if (!i.mem_operands)
4366     return 0;
4367
4368   if (any_vex_p)
4369     {
4370       /* vldmxcsr.  */
4371       if (i.tm.base_opcode == 0xae
4372           && i.tm.opcode_modifier.vex
4373           && i.tm.opcode_modifier.opcodespace == SPACE_0F
4374           && i.tm.opcode_modifier.opcodeprefix == PREFIX_NONE
4375           && i.tm.extension_opcode == 2)
4376         return 1;
4377     }
4378   else
4379     {
4380       /* test, not, neg, mul, imul, div, idiv.  */
4381       if ((i.tm.base_opcode == 0xf6 || i.tm.base_opcode == 0xf7)
4382           && i.tm.extension_opcode != 1)
4383         return 1;
4384
4385       /* inc, dec.  */
4386       if (base_opcode == 0xff && i.tm.extension_opcode <= 1)
4387         return 1;
4388
4389       /* add, or, adc, sbb, and, sub, xor, cmp.  */
4390       if (i.tm.base_opcode >= 0x80 && i.tm.base_opcode <= 0x83)
4391         return 1;
4392
4393       /* bt, bts, btr, btc.  */
4394       if (i.tm.base_opcode == 0xfba
4395           && (i.tm.extension_opcode >= 4 && i.tm.extension_opcode <= 7))
4396         return 1;
4397
4398       /* rol, ror, rcl, rcr, shl/sal, shr, sar. */
4399       if ((base_opcode == 0xc1
4400            || (i.tm.base_opcode >= 0xd0 && i.tm.base_opcode <= 0xd3))
4401           && i.tm.extension_opcode != 6)
4402         return 1;
4403
4404       /* cmpxchg8b, cmpxchg16b, xrstors, vmptrld.  */
4405       if (i.tm.base_opcode == 0xfc7
4406           && i.tm.opcode_modifier.opcodeprefix == PREFIX_NONE
4407           && (i.tm.extension_opcode == 1 || i.tm.extension_opcode == 3
4408               || i.tm.extension_opcode == 6))
4409         return 1;
4410
4411       /* fxrstor, ldmxcsr, xrstor.  */
4412       if (i.tm.base_opcode == 0xfae
4413           && (i.tm.extension_opcode == 1
4414               || i.tm.extension_opcode == 2
4415               || i.tm.extension_opcode == 5))
4416         return 1;
4417
4418       /* lgdt, lidt, lmsw.  */
4419       if (i.tm.base_opcode == 0xf01
4420           && (i.tm.extension_opcode == 2
4421               || i.tm.extension_opcode == 3
4422               || i.tm.extension_opcode == 6))
4423         return 1;
4424
4425       /* Check for x87 instructions.  */
4426       if (i.tm.base_opcode >= 0xd8 && i.tm.base_opcode <= 0xdf)
4427         {
4428           /* Skip fst, fstp, fstenv, fstcw.  */
4429           if (i.tm.base_opcode == 0xd9
4430               && (i.tm.extension_opcode == 2
4431                   || i.tm.extension_opcode == 3
4432                   || i.tm.extension_opcode == 6
4433                   || i.tm.extension_opcode == 7))
4434             return 0;
4435
4436           /* Skip fisttp, fist, fistp, fstp.  */
4437           if (i.tm.base_opcode == 0xdb
4438               && (i.tm.extension_opcode == 1
4439                   || i.tm.extension_opcode == 2
4440                   || i.tm.extension_opcode == 3
4441                   || i.tm.extension_opcode == 7))
4442             return 0;
4443
4444           /* Skip fisttp, fst, fstp, fsave, fstsw.  */
4445           if (i.tm.base_opcode == 0xdd
4446               && (i.tm.extension_opcode == 1
4447                   || i.tm.extension_opcode == 2
4448                   || i.tm.extension_opcode == 3
4449                   || i.tm.extension_opcode == 6
4450                   || i.tm.extension_opcode == 7))
4451             return 0;
4452
4453           /* Skip fisttp, fist, fistp, fbstp, fistp.  */
4454           if (i.tm.base_opcode == 0xdf
4455               && (i.tm.extension_opcode == 1
4456                   || i.tm.extension_opcode == 2
4457                   || i.tm.extension_opcode == 3
4458                   || i.tm.extension_opcode == 6
4459                   || i.tm.extension_opcode == 7))
4460             return 0;
4461
4462           return 1;
4463         }
4464     }
4465
4466   dest = i.operands - 1;
4467
4468   /* Check fake imm8 operand and 3 source operands.  */
4469   if ((i.tm.opcode_modifier.immext
4470        || i.tm.opcode_modifier.vexsources == VEX3SOURCES)
4471       && i.types[dest].bitfield.imm8)
4472     dest--;
4473
4474   /* add, or, adc, sbb, and, sub, xor, cmp, test, xchg, xadd  */
4475   if (!any_vex_p
4476       && (base_opcode == 0x1
4477           || base_opcode == 0x9
4478           || base_opcode == 0x11
4479           || base_opcode == 0x19
4480           || base_opcode == 0x21
4481           || base_opcode == 0x29
4482           || base_opcode == 0x31
4483           || base_opcode == 0x39
4484           || (i.tm.base_opcode >= 0x84 && i.tm.base_opcode <= 0x87)
4485           || base_opcode == 0xfc1))
4486     return 1;
4487
4488   /* Check for load instruction.  */
4489   return (i.types[dest].bitfield.class != ClassNone
4490           || i.types[dest].bitfield.instance == Accum);
4491 }
4492
4493 /* Output lfence, 0xfaee8, after instruction.  */
4494
4495 static void
4496 insert_lfence_after (void)
4497 {
4498   if (lfence_after_load && load_insn_p ())
4499     {
4500       /* There are also two REP string instructions that require
4501          special treatment. Specifically, the compare string (CMPS)
4502          and scan string (SCAS) instructions set EFLAGS in a manner
4503          that depends on the data being compared/scanned. When used
4504          with a REP prefix, the number of iterations may therefore
4505          vary depending on this data. If the data is a program secret
4506          chosen by the adversary using an LVI method,
4507          then this data-dependent behavior may leak some aspect
4508          of the secret.  */
4509       if (((i.tm.base_opcode | 0x1) == 0xa7
4510            || (i.tm.base_opcode | 0x1) == 0xaf)
4511           && i.prefix[REP_PREFIX])
4512         {
4513             as_warn (_("`%s` changes flags which would affect control flow behavior"),
4514                      i.tm.name);
4515         }
4516       char *p = frag_more (3);
4517       *p++ = 0xf;
4518       *p++ = 0xae;
4519       *p = 0xe8;
4520     }
4521 }
4522
4523 /* Output lfence, 0xfaee8, before instruction.  */
4524
4525 static void
4526 insert_lfence_before (void)
4527 {
4528   char *p;
4529
4530   if (is_any_vex_encoding (&i.tm))
4531     return;
4532
4533   if (i.tm.base_opcode == 0xff
4534       && (i.tm.extension_opcode == 2 || i.tm.extension_opcode == 4))
4535     {
4536       /* Insert lfence before indirect branch if needed.  */
4537
4538       if (lfence_before_indirect_branch == lfence_branch_none)
4539         return;
4540
4541       if (i.operands != 1)
4542         abort ();
4543
4544       if (i.reg_operands == 1)
4545         {
4546           /* Indirect branch via register.  Don't insert lfence with
4547              -mlfence-after-load=yes.  */
4548           if (lfence_after_load
4549               || lfence_before_indirect_branch == lfence_branch_memory)
4550             return;
4551         }
4552       else if (i.mem_operands == 1
4553                && lfence_before_indirect_branch != lfence_branch_register)
4554         {
4555           as_warn (_("indirect `%s` with memory operand should be avoided"),
4556                    i.tm.name);
4557           return;
4558         }
4559       else
4560         return;
4561
4562       if (last_insn.kind != last_insn_other
4563           && last_insn.seg == now_seg)
4564         {
4565           as_warn_where (last_insn.file, last_insn.line,
4566                          _("`%s` skips -mlfence-before-indirect-branch on `%s`"),
4567                          last_insn.name, i.tm.name);
4568           return;
4569         }
4570
4571       p = frag_more (3);
4572       *p++ = 0xf;
4573       *p++ = 0xae;
4574       *p = 0xe8;
4575       return;
4576     }
4577
4578   /* Output or/not/shl and lfence before near ret.  */
4579   if (lfence_before_ret != lfence_before_ret_none
4580       && (i.tm.base_opcode == 0xc2
4581           || i.tm.base_opcode == 0xc3))
4582     {
4583       if (last_insn.kind != last_insn_other
4584           && last_insn.seg == now_seg)
4585         {
4586           as_warn_where (last_insn.file, last_insn.line,
4587                          _("`%s` skips -mlfence-before-ret on `%s`"),
4588                          last_insn.name, i.tm.name);
4589           return;
4590         }
4591
4592       /* Near ret ingore operand size override under CPU64.  */
4593       char prefix = flag_code == CODE_64BIT
4594                     ? 0x48
4595                     : i.prefix[DATA_PREFIX] ? 0x66 : 0x0;
4596
4597       if (lfence_before_ret == lfence_before_ret_not)
4598         {
4599           /* not: 0xf71424, may add prefix
4600              for operand size override or 64-bit code.  */
4601           p = frag_more ((prefix ? 2 : 0) + 6 + 3);
4602           if (prefix)
4603             *p++ = prefix;
4604           *p++ = 0xf7;
4605           *p++ = 0x14;
4606           *p++ = 0x24;
4607           if (prefix)
4608             *p++ = prefix;
4609           *p++ = 0xf7;
4610           *p++ = 0x14;
4611           *p++ = 0x24;
4612         }
4613       else
4614         {
4615           p = frag_more ((prefix ? 1 : 0) + 4 + 3);
4616           if (prefix)
4617             *p++ = prefix;
4618           if (lfence_before_ret == lfence_before_ret_or)
4619             {
4620               /* or: 0x830c2400, may add prefix
4621                  for operand size override or 64-bit code.  */
4622               *p++ = 0x83;
4623               *p++ = 0x0c;
4624             }
4625           else
4626             {
4627               /* shl: 0xc1242400, may add prefix
4628                  for operand size override or 64-bit code.  */
4629               *p++ = 0xc1;
4630               *p++ = 0x24;
4631             }
4632
4633           *p++ = 0x24;
4634           *p++ = 0x0;
4635         }
4636
4637       *p++ = 0xf;
4638       *p++ = 0xae;
4639       *p = 0xe8;
4640     }
4641 }
4642
4643 /* This is the guts of the machine-dependent assembler.  LINE points to a
4644    machine dependent instruction.  This function is supposed to emit
4645    the frags/bytes it assembles to.  */
4646
4647 void
4648 md_assemble (char *line)
4649 {
4650   unsigned int j;
4651   char mnemonic[MAX_MNEM_SIZE], mnem_suffix;
4652   const insn_template *t;
4653
4654   /* Initialize globals.  */
4655   memset (&i, '\0', sizeof (i));
4656   for (j = 0; j < MAX_OPERANDS; j++)
4657     i.reloc[j] = NO_RELOC;
4658   memset (disp_expressions, '\0', sizeof (disp_expressions));
4659   memset (im_expressions, '\0', sizeof (im_expressions));
4660   save_stack_p = save_stack;
4661
4662   /* First parse an instruction mnemonic & call i386_operand for the operands.
4663      We assume that the scrubber has arranged it so that line[0] is the valid
4664      start of a (possibly prefixed) mnemonic.  */
4665
4666   line = parse_insn (line, mnemonic);
4667   if (line == NULL)
4668     return;
4669   mnem_suffix = i.suffix;
4670
4671   line = parse_operands (line, mnemonic);
4672   this_operand = -1;
4673   xfree (i.memop1_string);
4674   i.memop1_string = NULL;
4675   if (line == NULL)
4676     return;
4677
4678   /* Now we've parsed the mnemonic into a set of templates, and have the
4679      operands at hand.  */
4680
4681   /* All Intel opcodes have reversed operands except for "bound", "enter",
4682      "invlpg*", "monitor*", "mwait*", "tpause", "umwait", "pvalidate",
4683      "rmpadjust", and "rmpupdate".  We also don't reverse intersegment "jmp"
4684      and "call" instructions with 2 immediate operands so that the immediate
4685      segment precedes the offset consistently in Intel and AT&T modes.  */
4686   if (intel_syntax
4687       && i.operands > 1
4688       && (strcmp (mnemonic, "bound") != 0)
4689       && (strncmp (mnemonic, "invlpg", 6) != 0)
4690       && (strncmp (mnemonic, "monitor", 7) != 0)
4691       && (strncmp (mnemonic, "mwait", 5) != 0)
4692       && (strcmp (mnemonic, "pvalidate") != 0)
4693       && (strncmp (mnemonic, "rmp", 3) != 0)
4694       && (strcmp (mnemonic, "tpause") != 0)
4695       && (strcmp (mnemonic, "umwait") != 0)
4696       && !(operand_type_check (i.types[0], imm)
4697            && operand_type_check (i.types[1], imm)))
4698     swap_operands ();
4699
4700   /* The order of the immediates should be reversed
4701      for 2 immediates extrq and insertq instructions */
4702   if (i.imm_operands == 2
4703       && (strcmp (mnemonic, "extrq") == 0
4704           || strcmp (mnemonic, "insertq") == 0))
4705       swap_2_operands (0, 1);
4706
4707   if (i.imm_operands)
4708     optimize_imm ();
4709
4710   /* Don't optimize displacement for movabs since it only takes 64bit
4711      displacement.  */
4712   if (i.disp_operands
4713       && i.disp_encoding != disp_encoding_32bit
4714       && (flag_code != CODE_64BIT
4715           || strcmp (mnemonic, "movabs") != 0))
4716     optimize_disp ();
4717
4718   /* Next, we find a template that matches the given insn,
4719      making sure the overlap of the given operands types is consistent
4720      with the template operand types.  */
4721
4722   if (!(t = match_template (mnem_suffix)))
4723     return;
4724
4725   if (sse_check != check_none
4726       && !i.tm.opcode_modifier.noavx
4727       && !i.tm.cpu_flags.bitfield.cpuavx
4728       && !i.tm.cpu_flags.bitfield.cpuavx512f
4729       && (i.tm.cpu_flags.bitfield.cpusse
4730           || i.tm.cpu_flags.bitfield.cpusse2
4731           || i.tm.cpu_flags.bitfield.cpusse3
4732           || i.tm.cpu_flags.bitfield.cpussse3
4733           || i.tm.cpu_flags.bitfield.cpusse4_1
4734           || i.tm.cpu_flags.bitfield.cpusse4_2
4735           || i.tm.cpu_flags.bitfield.cpupclmul
4736           || i.tm.cpu_flags.bitfield.cpuaes
4737           || i.tm.cpu_flags.bitfield.cpusha
4738           || i.tm.cpu_flags.bitfield.cpugfni))
4739     {
4740       (sse_check == check_warning
4741        ? as_warn
4742        : as_bad) (_("SSE instruction `%s' is used"), i.tm.name);
4743     }
4744
4745   if (i.tm.opcode_modifier.fwait)
4746     if (!add_prefix (FWAIT_OPCODE))
4747       return;
4748
4749   /* Check if REP prefix is OK.  */
4750   if (i.rep_prefix && i.tm.opcode_modifier.prefixok != PrefixRep)
4751     {
4752       as_bad (_("invalid instruction `%s' after `%s'"),
4753                 i.tm.name, i.rep_prefix);
4754       return;
4755     }
4756
4757   /* Check for lock without a lockable instruction.  Destination operand
4758      must be memory unless it is xchg (0x86).  */
4759   if (i.prefix[LOCK_PREFIX]
4760       && (i.tm.opcode_modifier.prefixok < PrefixLock
4761           || i.mem_operands == 0
4762           || (i.tm.base_opcode != 0x86
4763               && !(i.flags[i.operands - 1] & Operand_Mem))))
4764     {
4765       as_bad (_("expecting lockable instruction after `lock'"));
4766       return;
4767     }
4768
4769   /* Check for data size prefix on VEX/XOP/EVEX encoded and SIMD insns.  */
4770   if (i.prefix[DATA_PREFIX]
4771       && (is_any_vex_encoding (&i.tm)
4772           || i.tm.operand_types[i.imm_operands].bitfield.class >= RegMMX
4773           || i.tm.operand_types[i.imm_operands + 1].bitfield.class >= RegMMX))
4774     {
4775       as_bad (_("data size prefix invalid with `%s'"), i.tm.name);
4776       return;
4777     }
4778
4779   /* Check if HLE prefix is OK.  */
4780   if (i.hle_prefix && !check_hle ())
4781     return;
4782
4783   /* Check BND prefix.  */
4784   if (i.bnd_prefix && !i.tm.opcode_modifier.bndprefixok)
4785     as_bad (_("expecting valid branch instruction after `bnd'"));
4786
4787   /* Check NOTRACK prefix.  */
4788   if (i.notrack_prefix && i.tm.opcode_modifier.prefixok != PrefixNoTrack)
4789     as_bad (_("expecting indirect branch instruction after `notrack'"));
4790
4791   if (i.tm.cpu_flags.bitfield.cpumpx)
4792     {
4793       if (flag_code == CODE_64BIT && i.prefix[ADDR_PREFIX])
4794         as_bad (_("32-bit address isn't allowed in 64-bit MPX instructions."));
4795       else if (flag_code != CODE_16BIT
4796                ? i.prefix[ADDR_PREFIX]
4797                : i.mem_operands && !i.prefix[ADDR_PREFIX])
4798         as_bad (_("16-bit address isn't allowed in MPX instructions"));
4799     }
4800
4801   /* Insert BND prefix.  */
4802   if (add_bnd_prefix && i.tm.opcode_modifier.bndprefixok)
4803     {
4804       if (!i.prefix[BND_PREFIX])
4805         add_prefix (BND_PREFIX_OPCODE);
4806       else if (i.prefix[BND_PREFIX] != BND_PREFIX_OPCODE)
4807         {
4808           as_warn (_("replacing `rep'/`repe' prefix by `bnd'"));
4809           i.prefix[BND_PREFIX] = BND_PREFIX_OPCODE;
4810         }
4811     }
4812
4813   /* Check string instruction segment overrides.  */
4814   if (i.tm.opcode_modifier.isstring >= IS_STRING_ES_OP0)
4815     {
4816       gas_assert (i.mem_operands);
4817       if (!check_string ())
4818         return;
4819       i.disp_operands = 0;
4820     }
4821
4822   if (optimize && !i.no_optimize && i.tm.opcode_modifier.optimize)
4823     optimize_encoding ();
4824
4825   if (!process_suffix ())
4826     return;
4827
4828   /* Update operand types and check extended states.  */
4829   for (j = 0; j < i.operands; j++)
4830     {
4831       i.types[j] = operand_type_and (i.types[j], i.tm.operand_types[j]);
4832       switch (i.tm.operand_types[j].bitfield.class)
4833         {
4834         default:
4835           break;
4836         case RegMMX:
4837           i.xstate |= xstate_mmx;
4838           break;
4839         case RegMask:
4840           i.xstate |= xstate_mask;
4841           break;
4842         case RegSIMD:
4843           if (i.tm.operand_types[j].bitfield.tmmword)
4844             i.xstate |= xstate_tmm;
4845           else if (i.tm.operand_types[j].bitfield.zmmword)
4846             i.xstate |= xstate_zmm;
4847           else if (i.tm.operand_types[j].bitfield.ymmword)
4848             i.xstate |= xstate_ymm;
4849           else if (i.tm.operand_types[j].bitfield.xmmword)
4850             i.xstate |= xstate_xmm;
4851           break;
4852         }
4853     }
4854
4855   /* Make still unresolved immediate matches conform to size of immediate
4856      given in i.suffix.  */
4857   if (!finalize_imm ())
4858     return;
4859
4860   if (i.types[0].bitfield.imm1)
4861     i.imm_operands = 0; /* kludge for shift insns.  */
4862
4863   /* We only need to check those implicit registers for instructions
4864      with 3 operands or less.  */
4865   if (i.operands <= 3)
4866     for (j = 0; j < i.operands; j++)
4867       if (i.types[j].bitfield.instance != InstanceNone
4868           && !i.types[j].bitfield.xmmword)
4869         i.reg_operands--;
4870
4871   /* For insns with operands there are more diddles to do to the opcode.  */
4872   if (i.operands)
4873     {
4874       if (!process_operands ())
4875         return;
4876     }
4877   else if (!quiet_warnings && i.tm.opcode_modifier.ugh)
4878     {
4879       /* UnixWare fsub no args is alias for fsubp, fadd -> faddp, etc.  */
4880       as_warn (_("translating to `%sp'"), i.tm.name);
4881     }
4882
4883   if (is_any_vex_encoding (&i.tm))
4884     {
4885       if (!cpu_arch_flags.bitfield.cpui286)
4886         {
4887           as_bad (_("instruction `%s' isn't supported outside of protected mode."),
4888                   i.tm.name);
4889           return;
4890         }
4891
4892       /* Check for explicit REX prefix.  */
4893       if (i.prefix[REX_PREFIX] || i.rex_encoding)
4894         {
4895           as_bad (_("REX prefix invalid with `%s'"), i.tm.name);
4896           return;
4897         }
4898
4899       if (i.tm.opcode_modifier.vex)
4900         build_vex_prefix (t);
4901       else
4902         build_evex_prefix ();
4903
4904       /* The individual REX.RXBW bits got consumed.  */
4905       i.rex &= REX_OPCODE;
4906     }
4907
4908   /* Handle conversion of 'int $3' --> special int3 insn.  XOP or FMA4
4909      instructions may define INT_OPCODE as well, so avoid this corner
4910      case for those instructions that use MODRM.  */
4911   if (i.tm.base_opcode == INT_OPCODE
4912       && !i.tm.opcode_modifier.modrm
4913       && i.op[0].imms->X_add_number == 3)
4914     {
4915       i.tm.base_opcode = INT3_OPCODE;
4916       i.imm_operands = 0;
4917     }
4918
4919   if ((i.tm.opcode_modifier.jump == JUMP
4920        || i.tm.opcode_modifier.jump == JUMP_BYTE
4921        || i.tm.opcode_modifier.jump == JUMP_DWORD)
4922       && i.op[0].disps->X_op == O_constant)
4923     {
4924       /* Convert "jmp constant" (and "call constant") to a jump (call) to
4925          the absolute address given by the constant.  Since ix86 jumps and
4926          calls are pc relative, we need to generate a reloc.  */
4927       i.op[0].disps->X_add_symbol = &abs_symbol;
4928       i.op[0].disps->X_op = O_symbol;
4929     }
4930
4931   /* For 8 bit registers we need an empty rex prefix.  Also if the
4932      instruction already has a prefix, we need to convert old
4933      registers to new ones.  */
4934
4935   if ((i.types[0].bitfield.class == Reg && i.types[0].bitfield.byte
4936        && (i.op[0].regs->reg_flags & RegRex64) != 0)
4937       || (i.types[1].bitfield.class == Reg && i.types[1].bitfield.byte
4938           && (i.op[1].regs->reg_flags & RegRex64) != 0)
4939       || (((i.types[0].bitfield.class == Reg && i.types[0].bitfield.byte)
4940            || (i.types[1].bitfield.class == Reg && i.types[1].bitfield.byte))
4941           && i.rex != 0))
4942     {
4943       int x;
4944
4945       i.rex |= REX_OPCODE;
4946       for (x = 0; x < 2; x++)
4947         {
4948           /* Look for 8 bit operand that uses old registers.  */
4949           if (i.types[x].bitfield.class == Reg && i.types[x].bitfield.byte
4950               && (i.op[x].regs->reg_flags & RegRex64) == 0)
4951             {
4952               gas_assert (!(i.op[x].regs->reg_flags & RegRex));
4953               /* In case it is "hi" register, give up.  */
4954               if (i.op[x].regs->reg_num > 3)
4955                 as_bad (_("can't encode register '%s%s' in an "
4956                           "instruction requiring REX prefix."),
4957                         register_prefix, i.op[x].regs->reg_name);
4958
4959               /* Otherwise it is equivalent to the extended register.
4960                  Since the encoding doesn't change this is merely
4961                  cosmetic cleanup for debug output.  */
4962
4963               i.op[x].regs = i.op[x].regs + 8;
4964             }
4965         }
4966     }
4967
4968   if (i.rex == 0 && i.rex_encoding)
4969     {
4970       /* Check if we can add a REX_OPCODE byte.  Look for 8 bit operand
4971          that uses legacy register.  If it is "hi" register, don't add
4972          the REX_OPCODE byte.  */
4973       int x;
4974       for (x = 0; x < 2; x++)
4975         if (i.types[x].bitfield.class == Reg
4976             && i.types[x].bitfield.byte
4977             && (i.op[x].regs->reg_flags & RegRex64) == 0
4978             && i.op[x].regs->reg_num > 3)
4979           {
4980             gas_assert (!(i.op[x].regs->reg_flags & RegRex));
4981             i.rex_encoding = FALSE;
4982             break;
4983           }
4984
4985       if (i.rex_encoding)
4986         i.rex = REX_OPCODE;
4987     }
4988
4989   if (i.rex != 0)
4990     add_prefix (REX_OPCODE | i.rex);
4991
4992   insert_lfence_before ();
4993
4994   /* We are ready to output the insn.  */
4995   output_insn ();
4996
4997   insert_lfence_after ();
4998
4999   last_insn.seg = now_seg;
5000
5001   if (i.tm.opcode_modifier.isprefix)
5002     {
5003       last_insn.kind = last_insn_prefix;
5004       last_insn.name = i.tm.name;
5005       last_insn.file = as_where (&last_insn.line);
5006     }
5007   else
5008     last_insn.kind = last_insn_other;
5009 }
5010
5011 static char *
5012 parse_insn (char *line, char *mnemonic)
5013 {
5014   char *l = line;
5015   char *token_start = l;
5016   char *mnem_p;
5017   int supported;
5018   const insn_template *t;
5019   char *dot_p = NULL;
5020
5021   while (1)
5022     {
5023       mnem_p = mnemonic;
5024       while ((*mnem_p = mnemonic_chars[(unsigned char) *l]) != 0)
5025         {
5026           if (*mnem_p == '.')
5027             dot_p = mnem_p;
5028           mnem_p++;
5029           if (mnem_p >= mnemonic + MAX_MNEM_SIZE)
5030             {
5031               as_bad (_("no such instruction: `%s'"), token_start);
5032               return NULL;
5033             }
5034           l++;
5035         }
5036       if (!is_space_char (*l)
5037           && *l != END_OF_INSN
5038           && (intel_syntax
5039               || (*l != PREFIX_SEPARATOR
5040                   && *l != ',')))
5041         {
5042           as_bad (_("invalid character %s in mnemonic"),
5043                   output_invalid (*l));
5044           return NULL;
5045         }
5046       if (token_start == l)
5047         {
5048           if (!intel_syntax && *l == PREFIX_SEPARATOR)
5049             as_bad (_("expecting prefix; got nothing"));
5050           else
5051             as_bad (_("expecting mnemonic; got nothing"));
5052           return NULL;
5053         }
5054
5055       /* Look up instruction (or prefix) via hash table.  */
5056       current_templates = (const templates *) str_hash_find (op_hash, mnemonic);
5057
5058       if (*l != END_OF_INSN
5059           && (!is_space_char (*l) || l[1] != END_OF_INSN)
5060           && current_templates
5061           && current_templates->start->opcode_modifier.isprefix)
5062         {
5063           if (!cpu_flags_check_cpu64 (current_templates->start->cpu_flags))
5064             {
5065               as_bad ((flag_code != CODE_64BIT
5066                        ? _("`%s' is only supported in 64-bit mode")
5067                        : _("`%s' is not supported in 64-bit mode")),
5068                       current_templates->start->name);
5069               return NULL;
5070             }
5071           /* If we are in 16-bit mode, do not allow addr16 or data16.
5072              Similarly, in 32-bit mode, do not allow addr32 or data32.  */
5073           if ((current_templates->start->opcode_modifier.size == SIZE16
5074                || current_templates->start->opcode_modifier.size == SIZE32)
5075               && flag_code != CODE_64BIT
5076               && ((current_templates->start->opcode_modifier.size == SIZE32)
5077                   ^ (flag_code == CODE_16BIT)))
5078             {
5079               as_bad (_("redundant %s prefix"),
5080                       current_templates->start->name);
5081               return NULL;
5082             }
5083
5084           if (current_templates->start->base_opcode == PSEUDO_PREFIX)
5085             {
5086               /* Handle pseudo prefixes.  */
5087               switch (current_templates->start->extension_opcode)
5088                 {
5089                 case Prefix_Disp8:
5090                   /* {disp8} */
5091                   i.disp_encoding = disp_encoding_8bit;
5092                   break;
5093                 case Prefix_Disp16:
5094                   /* {disp16} */
5095                   i.disp_encoding = disp_encoding_16bit;
5096                   break;
5097                 case Prefix_Disp32:
5098                   /* {disp32} */
5099                   i.disp_encoding = disp_encoding_32bit;
5100                   break;
5101                 case Prefix_Load:
5102                   /* {load} */
5103                   i.dir_encoding = dir_encoding_load;
5104                   break;
5105                 case Prefix_Store:
5106                   /* {store} */
5107                   i.dir_encoding = dir_encoding_store;
5108                   break;
5109                 case Prefix_VEX:
5110                   /* {vex} */
5111                   i.vec_encoding = vex_encoding_vex;
5112                   break;
5113                 case Prefix_VEX3:
5114                   /* {vex3} */
5115                   i.vec_encoding = vex_encoding_vex3;
5116                   break;
5117                 case Prefix_EVEX:
5118                   /* {evex} */
5119                   i.vec_encoding = vex_encoding_evex;
5120                   break;
5121                 case Prefix_REX:
5122                   /* {rex} */
5123                   i.rex_encoding = TRUE;
5124                   break;
5125                 case Prefix_NoOptimize:
5126                   /* {nooptimize} */
5127                   i.no_optimize = TRUE;
5128                   break;
5129                 default:
5130                   abort ();
5131                 }
5132             }
5133           else
5134             {
5135               /* Add prefix, checking for repeated prefixes.  */
5136               switch (add_prefix (current_templates->start->base_opcode))
5137                 {
5138                 case PREFIX_EXIST:
5139                   return NULL;
5140                 case PREFIX_DS:
5141                   if (current_templates->start->cpu_flags.bitfield.cpuibt)
5142                     i.notrack_prefix = current_templates->start->name;
5143                   break;
5144                 case PREFIX_REP:
5145                   if (current_templates->start->cpu_flags.bitfield.cpuhle)
5146                     i.hle_prefix = current_templates->start->name;
5147                   else if (current_templates->start->cpu_flags.bitfield.cpumpx)
5148                     i.bnd_prefix = current_templates->start->name;
5149                   else
5150                     i.rep_prefix = current_templates->start->name;
5151                   break;
5152                 default:
5153                   break;
5154                 }
5155             }
5156           /* Skip past PREFIX_SEPARATOR and reset token_start.  */
5157           token_start = ++l;
5158         }
5159       else
5160         break;
5161     }
5162
5163   if (!current_templates)
5164     {
5165       /* Deprecated functionality (new code should use pseudo-prefixes instead):
5166          Check if we should swap operand or force 32bit displacement in
5167          encoding.  */
5168       if (mnem_p - 2 == dot_p && dot_p[1] == 's')
5169         i.dir_encoding = dir_encoding_swap;
5170       else if (mnem_p - 3 == dot_p
5171                && dot_p[1] == 'd'
5172                && dot_p[2] == '8')
5173         i.disp_encoding = disp_encoding_8bit;
5174       else if (mnem_p - 4 == dot_p
5175                && dot_p[1] == 'd'
5176                && dot_p[2] == '3'
5177                && dot_p[3] == '2')
5178         i.disp_encoding = disp_encoding_32bit;
5179       else
5180         goto check_suffix;
5181       mnem_p = dot_p;
5182       *dot_p = '\0';
5183       current_templates = (const templates *) str_hash_find (op_hash, mnemonic);
5184     }
5185
5186   if (!current_templates)
5187     {
5188     check_suffix:
5189       if (mnem_p > mnemonic)
5190         {
5191           /* See if we can get a match by trimming off a suffix.  */
5192           switch (mnem_p[-1])
5193             {
5194             case WORD_MNEM_SUFFIX:
5195               if (intel_syntax && (intel_float_operand (mnemonic) & 2))
5196                 i.suffix = SHORT_MNEM_SUFFIX;
5197               else
5198                 /* Fall through.  */
5199               case BYTE_MNEM_SUFFIX:
5200               case QWORD_MNEM_SUFFIX:
5201                 i.suffix = mnem_p[-1];
5202               mnem_p[-1] = '\0';
5203               current_templates
5204                 = (const templates *) str_hash_find (op_hash, mnemonic);
5205               break;
5206             case SHORT_MNEM_SUFFIX:
5207             case LONG_MNEM_SUFFIX:
5208               if (!intel_syntax)
5209                 {
5210                   i.suffix = mnem_p[-1];
5211                   mnem_p[-1] = '\0';
5212                   current_templates
5213                     = (const templates *) str_hash_find (op_hash, mnemonic);
5214                 }
5215               break;
5216
5217               /* Intel Syntax.  */
5218             case 'd':
5219               if (intel_syntax)
5220                 {
5221                   if (intel_float_operand (mnemonic) == 1)
5222                     i.suffix = SHORT_MNEM_SUFFIX;
5223                   else
5224                     i.suffix = LONG_MNEM_SUFFIX;
5225                   mnem_p[-1] = '\0';
5226                   current_templates
5227                     = (const templates *) str_hash_find (op_hash, mnemonic);
5228                 }
5229               break;
5230             }
5231         }
5232
5233       if (!current_templates)
5234         {
5235           as_bad (_("no such instruction: `%s'"), token_start);
5236           return NULL;
5237         }
5238     }
5239
5240   if (current_templates->start->opcode_modifier.jump == JUMP
5241       || current_templates->start->opcode_modifier.jump == JUMP_BYTE)
5242     {
5243       /* Check for a branch hint.  We allow ",pt" and ",pn" for
5244          predict taken and predict not taken respectively.
5245          I'm not sure that branch hints actually do anything on loop
5246          and jcxz insns (JumpByte) for current Pentium4 chips.  They
5247          may work in the future and it doesn't hurt to accept them
5248          now.  */
5249       if (l[0] == ',' && l[1] == 'p')
5250         {
5251           if (l[2] == 't')
5252             {
5253               if (!add_prefix (DS_PREFIX_OPCODE))
5254                 return NULL;
5255               l += 3;
5256             }
5257           else if (l[2] == 'n')
5258             {
5259               if (!add_prefix (CS_PREFIX_OPCODE))
5260                 return NULL;
5261               l += 3;
5262             }
5263         }
5264     }
5265   /* Any other comma loses.  */
5266   if (*l == ',')
5267     {
5268       as_bad (_("invalid character %s in mnemonic"),
5269               output_invalid (*l));
5270       return NULL;
5271     }
5272
5273   /* Check if instruction is supported on specified architecture.  */
5274   supported = 0;
5275   for (t = current_templates->start; t < current_templates->end; ++t)
5276     {
5277       supported |= cpu_flags_match (t);
5278       if (supported == CPU_FLAGS_PERFECT_MATCH)
5279         {
5280           if (!cpu_arch_flags.bitfield.cpui386 && (flag_code != CODE_16BIT))
5281             as_warn (_("use .code16 to ensure correct addressing mode"));
5282
5283           return l;
5284         }
5285     }
5286
5287   if (!(supported & CPU_FLAGS_64BIT_MATCH))
5288     as_bad (flag_code == CODE_64BIT
5289             ? _("`%s' is not supported in 64-bit mode")
5290             : _("`%s' is only supported in 64-bit mode"),
5291             current_templates->start->name);
5292   else
5293     as_bad (_("`%s' is not supported on `%s%s'"),
5294             current_templates->start->name,
5295             cpu_arch_name ? cpu_arch_name : default_arch,
5296             cpu_sub_arch_name ? cpu_sub_arch_name : "");
5297
5298   return NULL;
5299 }
5300
5301 static char *
5302 parse_operands (char *l, const char *mnemonic)
5303 {
5304   char *token_start;
5305
5306   /* 1 if operand is pending after ','.  */
5307   unsigned int expecting_operand = 0;
5308
5309   /* Non-zero if operand parens not balanced.  */
5310   unsigned int paren_not_balanced;
5311
5312   while (*l != END_OF_INSN)
5313     {
5314       /* Skip optional white space before operand.  */
5315       if (is_space_char (*l))
5316         ++l;
5317       if (!is_operand_char (*l) && *l != END_OF_INSN && *l != '"')
5318         {
5319           as_bad (_("invalid character %s before operand %d"),
5320                   output_invalid (*l),
5321                   i.operands + 1);
5322           return NULL;
5323         }
5324       token_start = l;  /* After white space.  */
5325       paren_not_balanced = 0;
5326       while (paren_not_balanced || *l != ',')
5327         {
5328           if (*l == END_OF_INSN)
5329             {
5330               if (paren_not_balanced)
5331                 {
5332                   if (!intel_syntax)
5333                     as_bad (_("unbalanced parenthesis in operand %d."),
5334                             i.operands + 1);
5335                   else
5336                     as_bad (_("unbalanced brackets in operand %d."),
5337                             i.operands + 1);
5338                   return NULL;
5339                 }
5340               else
5341                 break;  /* we are done */
5342             }
5343           else if (!is_operand_char (*l) && !is_space_char (*l) && *l != '"')
5344             {
5345               as_bad (_("invalid character %s in operand %d"),
5346                       output_invalid (*l),
5347                       i.operands + 1);
5348               return NULL;
5349             }
5350           if (!intel_syntax)
5351             {
5352               if (*l == '(')
5353                 ++paren_not_balanced;
5354               if (*l == ')')
5355                 --paren_not_balanced;
5356             }
5357           else
5358             {
5359               if (*l == '[')
5360                 ++paren_not_balanced;
5361               if (*l == ']')
5362                 --paren_not_balanced;
5363             }
5364           l++;
5365         }
5366       if (l != token_start)
5367         {                       /* Yes, we've read in another operand.  */
5368           unsigned int operand_ok;
5369           this_operand = i.operands++;
5370           if (i.operands > MAX_OPERANDS)
5371             {
5372               as_bad (_("spurious operands; (%d operands/instruction max)"),
5373                       MAX_OPERANDS);
5374               return NULL;
5375             }
5376           i.types[this_operand].bitfield.unspecified = 1;
5377           /* Now parse operand adding info to 'i' as we go along.  */
5378           END_STRING_AND_SAVE (l);
5379
5380           if (i.mem_operands > 1)
5381             {
5382               as_bad (_("too many memory references for `%s'"),
5383                       mnemonic);
5384               return 0;
5385             }
5386
5387           if (intel_syntax)
5388             operand_ok =
5389               i386_intel_operand (token_start,
5390                                   intel_float_operand (mnemonic));
5391           else
5392             operand_ok = i386_att_operand (token_start);
5393
5394           RESTORE_END_STRING (l);
5395           if (!operand_ok)
5396             return NULL;
5397         }
5398       else
5399         {
5400           if (expecting_operand)
5401             {
5402             expecting_operand_after_comma:
5403               as_bad (_("expecting operand after ','; got nothing"));
5404               return NULL;
5405             }
5406           if (*l == ',')
5407             {
5408               as_bad (_("expecting operand before ','; got nothing"));
5409               return NULL;
5410             }
5411         }
5412
5413       /* Now *l must be either ',' or END_OF_INSN.  */
5414       if (*l == ',')
5415         {
5416           if (*++l == END_OF_INSN)
5417             {
5418               /* Just skip it, if it's \n complain.  */
5419               goto expecting_operand_after_comma;
5420             }
5421           expecting_operand = 1;
5422         }
5423     }
5424   return l;
5425 }
5426
5427 static void
5428 swap_2_operands (int xchg1, int xchg2)
5429 {
5430   union i386_op temp_op;
5431   i386_operand_type temp_type;
5432   unsigned int temp_flags;
5433   enum bfd_reloc_code_real temp_reloc;
5434
5435   temp_type = i.types[xchg2];
5436   i.types[xchg2] = i.types[xchg1];
5437   i.types[xchg1] = temp_type;
5438
5439   temp_flags = i.flags[xchg2];
5440   i.flags[xchg2] = i.flags[xchg1];
5441   i.flags[xchg1] = temp_flags;
5442
5443   temp_op = i.op[xchg2];
5444   i.op[xchg2] = i.op[xchg1];
5445   i.op[xchg1] = temp_op;
5446
5447   temp_reloc = i.reloc[xchg2];
5448   i.reloc[xchg2] = i.reloc[xchg1];
5449   i.reloc[xchg1] = temp_reloc;
5450
5451   if (i.mask)
5452     {
5453       if (i.mask->operand == xchg1)
5454         i.mask->operand = xchg2;
5455       else if (i.mask->operand == xchg2)
5456         i.mask->operand = xchg1;
5457     }
5458   if (i.broadcast)
5459     {
5460       if (i.broadcast->operand == xchg1)
5461         i.broadcast->operand = xchg2;
5462       else if (i.broadcast->operand == xchg2)
5463         i.broadcast->operand = xchg1;
5464     }
5465   if (i.rounding)
5466     {
5467       if (i.rounding->operand == xchg1)
5468         i.rounding->operand = xchg2;
5469       else if (i.rounding->operand == xchg2)
5470         i.rounding->operand = xchg1;
5471     }
5472 }
5473
5474 static void
5475 swap_operands (void)
5476 {
5477   switch (i.operands)
5478     {
5479     case 5:
5480     case 4:
5481       swap_2_operands (1, i.operands - 2);
5482       /* Fall through.  */
5483     case 3:
5484     case 2:
5485       swap_2_operands (0, i.operands - 1);
5486       break;
5487     default:
5488       abort ();
5489     }
5490
5491   if (i.mem_operands == 2)
5492     {
5493       const seg_entry *temp_seg;
5494       temp_seg = i.seg[0];
5495       i.seg[0] = i.seg[1];
5496       i.seg[1] = temp_seg;
5497     }
5498 }
5499
5500 /* Try to ensure constant immediates are represented in the smallest
5501    opcode possible.  */
5502 static void
5503 optimize_imm (void)
5504 {
5505   char guess_suffix = 0;
5506   int op;
5507
5508   if (i.suffix)
5509     guess_suffix = i.suffix;
5510   else if (i.reg_operands)
5511     {
5512       /* Figure out a suffix from the last register operand specified.
5513          We can't do this properly yet, i.e. excluding special register
5514          instances, but the following works for instructions with
5515          immediates.  In any case, we can't set i.suffix yet.  */
5516       for (op = i.operands; --op >= 0;)
5517         if (i.types[op].bitfield.class != Reg)
5518           continue;
5519         else if (i.types[op].bitfield.byte)
5520           {
5521             guess_suffix = BYTE_MNEM_SUFFIX;
5522             break;
5523           }
5524         else if (i.types[op].bitfield.word)
5525           {
5526             guess_suffix = WORD_MNEM_SUFFIX;
5527             break;
5528           }
5529         else if (i.types[op].bitfield.dword)
5530           {
5531             guess_suffix = LONG_MNEM_SUFFIX;
5532             break;
5533           }
5534         else if (i.types[op].bitfield.qword)
5535           {
5536             guess_suffix = QWORD_MNEM_SUFFIX;
5537             break;
5538           }
5539     }
5540   else if ((flag_code == CODE_16BIT) ^ (i.prefix[DATA_PREFIX] != 0))
5541     guess_suffix = WORD_MNEM_SUFFIX;
5542
5543   for (op = i.operands; --op >= 0;)
5544     if (operand_type_check (i.types[op], imm))
5545       {
5546         switch (i.op[op].imms->X_op)
5547           {
5548           case O_constant:
5549             /* If a suffix is given, this operand may be shortened.  */
5550             switch (guess_suffix)
5551               {
5552               case LONG_MNEM_SUFFIX:
5553                 i.types[op].bitfield.imm32 = 1;
5554                 i.types[op].bitfield.imm64 = 1;
5555                 break;
5556               case WORD_MNEM_SUFFIX:
5557                 i.types[op].bitfield.imm16 = 1;
5558                 i.types[op].bitfield.imm32 = 1;
5559                 i.types[op].bitfield.imm32s = 1;
5560                 i.types[op].bitfield.imm64 = 1;
5561                 break;
5562               case BYTE_MNEM_SUFFIX:
5563                 i.types[op].bitfield.imm8 = 1;
5564                 i.types[op].bitfield.imm8s = 1;
5565                 i.types[op].bitfield.imm16 = 1;
5566                 i.types[op].bitfield.imm32 = 1;
5567                 i.types[op].bitfield.imm32s = 1;
5568                 i.types[op].bitfield.imm64 = 1;
5569                 break;
5570               }
5571
5572             /* If this operand is at most 16 bits, convert it
5573                to a signed 16 bit number before trying to see
5574                whether it will fit in an even smaller size.
5575                This allows a 16-bit operand such as $0xffe0 to
5576                be recognised as within Imm8S range.  */
5577             if ((i.types[op].bitfield.imm16)
5578                 && (i.op[op].imms->X_add_number & ~(offsetT) 0xffff) == 0)
5579               {
5580                 i.op[op].imms->X_add_number =
5581                   (((i.op[op].imms->X_add_number & 0xffff) ^ 0x8000) - 0x8000);
5582               }
5583 #ifdef BFD64
5584             /* Store 32-bit immediate in 64-bit for 64-bit BFD.  */
5585             if ((i.types[op].bitfield.imm32)
5586                 && ((i.op[op].imms->X_add_number & ~(((offsetT) 2 << 31) - 1))
5587                     == 0))
5588               {
5589                 i.op[op].imms->X_add_number = ((i.op[op].imms->X_add_number
5590                                                 ^ ((offsetT) 1 << 31))
5591                                                - ((offsetT) 1 << 31));
5592               }
5593 #endif
5594             i.types[op]
5595               = operand_type_or (i.types[op],
5596                                  smallest_imm_type (i.op[op].imms->X_add_number));
5597
5598             /* We must avoid matching of Imm32 templates when 64bit
5599                only immediate is available.  */
5600             if (guess_suffix == QWORD_MNEM_SUFFIX)
5601               i.types[op].bitfield.imm32 = 0;
5602             break;
5603
5604           case O_absent:
5605           case O_register:
5606             abort ();
5607
5608             /* Symbols and expressions.  */
5609           default:
5610             /* Convert symbolic operand to proper sizes for matching, but don't
5611                prevent matching a set of insns that only supports sizes other
5612                than those matching the insn suffix.  */
5613             {
5614               i386_operand_type mask, allowed;
5615               const insn_template *t;
5616
5617               operand_type_set (&mask, 0);
5618               operand_type_set (&allowed, 0);
5619
5620               for (t = current_templates->start;
5621                    t < current_templates->end;
5622                    ++t)
5623                 {
5624                   allowed = operand_type_or (allowed, t->operand_types[op]);
5625                   allowed = operand_type_and (allowed, anyimm);
5626                 }
5627               switch (guess_suffix)
5628                 {
5629                 case QWORD_MNEM_SUFFIX:
5630                   mask.bitfield.imm64 = 1;
5631                   mask.bitfield.imm32s = 1;
5632                   break;
5633                 case LONG_MNEM_SUFFIX:
5634                   mask.bitfield.imm32 = 1;
5635                   break;
5636                 case WORD_MNEM_SUFFIX:
5637                   mask.bitfield.imm16 = 1;
5638                   break;
5639                 case BYTE_MNEM_SUFFIX:
5640                   mask.bitfield.imm8 = 1;
5641                   break;
5642                 default:
5643                   break;
5644                 }
5645               allowed = operand_type_and (mask, allowed);
5646               if (!operand_type_all_zero (&allowed))
5647                 i.types[op] = operand_type_and (i.types[op], mask);
5648             }
5649             break;
5650           }
5651       }
5652 }
5653
5654 /* Try to use the smallest displacement type too.  */
5655 static void
5656 optimize_disp (void)
5657 {
5658   int op;
5659
5660   for (op = i.operands; --op >= 0;)
5661     if (operand_type_check (i.types[op], disp))
5662       {
5663         if (i.op[op].disps->X_op == O_constant)
5664           {
5665             offsetT op_disp = i.op[op].disps->X_add_number;
5666
5667             if (i.types[op].bitfield.disp16
5668                 && (op_disp & ~(offsetT) 0xffff) == 0)
5669               {
5670                 /* If this operand is at most 16 bits, convert
5671                    to a signed 16 bit number and don't use 64bit
5672                    displacement.  */
5673                 op_disp = (((op_disp & 0xffff) ^ 0x8000) - 0x8000);
5674                 i.types[op].bitfield.disp64 = 0;
5675               }
5676 #ifdef BFD64
5677             /* Optimize 64-bit displacement to 32-bit for 64-bit BFD.  */
5678             if (i.types[op].bitfield.disp32
5679                 && (op_disp & ~(((offsetT) 2 << 31) - 1)) == 0)
5680               {
5681                 /* If this operand is at most 32 bits, convert
5682                    to a signed 32 bit number and don't use 64bit
5683                    displacement.  */
5684                 op_disp &= (((offsetT) 2 << 31) - 1);
5685                 op_disp = (op_disp ^ ((offsetT) 1 << 31)) - ((addressT) 1 << 31);
5686                 i.types[op].bitfield.disp64 = 0;
5687               }
5688 #endif
5689             if (!op_disp && i.types[op].bitfield.baseindex)
5690               {
5691                 i.types[op].bitfield.disp8 = 0;
5692                 i.types[op].bitfield.disp16 = 0;
5693                 i.types[op].bitfield.disp32 = 0;
5694                 i.types[op].bitfield.disp32s = 0;
5695                 i.types[op].bitfield.disp64 = 0;
5696                 i.op[op].disps = 0;
5697                 i.disp_operands--;
5698               }
5699             else if (flag_code == CODE_64BIT)
5700               {
5701                 if (fits_in_signed_long (op_disp))
5702                   {
5703                     i.types[op].bitfield.disp64 = 0;
5704                     i.types[op].bitfield.disp32s = 1;
5705                   }
5706                 if (i.prefix[ADDR_PREFIX]
5707                     && fits_in_unsigned_long (op_disp))
5708                   i.types[op].bitfield.disp32 = 1;
5709               }
5710             if ((i.types[op].bitfield.disp32
5711                  || i.types[op].bitfield.disp32s
5712                  || i.types[op].bitfield.disp16)
5713                 && fits_in_disp8 (op_disp))
5714               i.types[op].bitfield.disp8 = 1;
5715           }
5716         else if (i.reloc[op] == BFD_RELOC_386_TLS_DESC_CALL
5717                  || i.reloc[op] == BFD_RELOC_X86_64_TLSDESC_CALL)
5718           {
5719             fix_new_exp (frag_now, frag_more (0) - frag_now->fr_literal, 0,
5720                          i.op[op].disps, 0, i.reloc[op]);
5721             i.types[op].bitfield.disp8 = 0;
5722             i.types[op].bitfield.disp16 = 0;
5723             i.types[op].bitfield.disp32 = 0;
5724             i.types[op].bitfield.disp32s = 0;
5725             i.types[op].bitfield.disp64 = 0;
5726           }
5727         else
5728           /* We only support 64bit displacement on constants.  */
5729           i.types[op].bitfield.disp64 = 0;
5730       }
5731 }
5732
5733 /* Return 1 if there is a match in broadcast bytes between operand
5734    GIVEN and instruction template T.   */
5735
5736 static INLINE int
5737 match_broadcast_size (const insn_template *t, unsigned int given)
5738 {
5739   return ((t->opcode_modifier.broadcast == BYTE_BROADCAST
5740            && i.types[given].bitfield.byte)
5741           || (t->opcode_modifier.broadcast == WORD_BROADCAST
5742               && i.types[given].bitfield.word)
5743           || (t->opcode_modifier.broadcast == DWORD_BROADCAST
5744               && i.types[given].bitfield.dword)
5745           || (t->opcode_modifier.broadcast == QWORD_BROADCAST
5746               && i.types[given].bitfield.qword));
5747 }
5748
5749 /* Check if operands are valid for the instruction.  */
5750
5751 static int
5752 check_VecOperands (const insn_template *t)
5753 {
5754   unsigned int op;
5755   i386_cpu_flags cpu;
5756
5757   /* Templates allowing for ZMMword as well as YMMword and/or XMMword for
5758      any one operand are implicity requiring AVX512VL support if the actual
5759      operand size is YMMword or XMMword.  Since this function runs after
5760      template matching, there's no need to check for YMMword/XMMword in
5761      the template.  */
5762   cpu = cpu_flags_and (t->cpu_flags, avx512);
5763   if (!cpu_flags_all_zero (&cpu)
5764       && !t->cpu_flags.bitfield.cpuavx512vl
5765       && !cpu_arch_flags.bitfield.cpuavx512vl)
5766     {
5767       for (op = 0; op < t->operands; ++op)
5768         {
5769           if (t->operand_types[op].bitfield.zmmword
5770               && (i.types[op].bitfield.ymmword
5771                   || i.types[op].bitfield.xmmword))
5772             {
5773               i.error = unsupported;
5774               return 1;
5775             }
5776         }
5777     }
5778
5779   /* Without VSIB byte, we can't have a vector register for index.  */
5780   if (!t->opcode_modifier.sib
5781       && i.index_reg
5782       && (i.index_reg->reg_type.bitfield.xmmword
5783           || i.index_reg->reg_type.bitfield.ymmword
5784           || i.index_reg->reg_type.bitfield.zmmword))
5785     {
5786       i.error = unsupported_vector_index_register;
5787       return 1;
5788     }
5789
5790   /* Check if default mask is allowed.  */
5791   if (t->opcode_modifier.nodefmask
5792       && (!i.mask || i.mask->mask->reg_num == 0))
5793     {
5794       i.error = no_default_mask;
5795       return 1;
5796     }
5797
5798   /* For VSIB byte, we need a vector register for index, and all vector
5799      registers must be distinct.  */
5800   if (t->opcode_modifier.sib && t->opcode_modifier.sib != SIBMEM)
5801     {
5802       if (!i.index_reg
5803           || !((t->opcode_modifier.sib == VECSIB128
5804                 && i.index_reg->reg_type.bitfield.xmmword)
5805                || (t->opcode_modifier.sib == VECSIB256
5806                    && i.index_reg->reg_type.bitfield.ymmword)
5807                || (t->opcode_modifier.sib == VECSIB512
5808                    && i.index_reg->reg_type.bitfield.zmmword)))
5809       {
5810         i.error = invalid_vsib_address;
5811         return 1;
5812       }
5813
5814       gas_assert (i.reg_operands == 2 || i.mask);
5815       if (i.reg_operands == 2 && !i.mask)
5816         {
5817           gas_assert (i.types[0].bitfield.class == RegSIMD);
5818           gas_assert (i.types[0].bitfield.xmmword
5819                       || i.types[0].bitfield.ymmword);
5820           gas_assert (i.types[2].bitfield.class == RegSIMD);
5821           gas_assert (i.types[2].bitfield.xmmword
5822                       || i.types[2].bitfield.ymmword);
5823           if (operand_check == check_none)
5824             return 0;
5825           if (register_number (i.op[0].regs)
5826               != register_number (i.index_reg)
5827               && register_number (i.op[2].regs)
5828                  != register_number (i.index_reg)
5829               && register_number (i.op[0].regs)
5830                  != register_number (i.op[2].regs))
5831             return 0;
5832           if (operand_check == check_error)
5833             {
5834               i.error = invalid_vector_register_set;
5835               return 1;
5836             }
5837           as_warn (_("mask, index, and destination registers should be distinct"));
5838         }
5839       else if (i.reg_operands == 1 && i.mask)
5840         {
5841           if (i.types[1].bitfield.class == RegSIMD
5842               && (i.types[1].bitfield.xmmword
5843                   || i.types[1].bitfield.ymmword
5844                   || i.types[1].bitfield.zmmword)
5845               && (register_number (i.op[1].regs)
5846                   == register_number (i.index_reg)))
5847             {
5848               if (operand_check == check_error)
5849                 {
5850                   i.error = invalid_vector_register_set;
5851                   return 1;
5852                 }
5853               if (operand_check != check_none)
5854                 as_warn (_("index and destination registers should be distinct"));
5855             }
5856         }
5857     }
5858
5859   /* For AMX instructions with three tmmword operands, all tmmword operand must be
5860      distinct */
5861   if (t->operand_types[0].bitfield.tmmword
5862       && i.reg_operands == 3)
5863     {
5864       if (register_number (i.op[0].regs)
5865           == register_number (i.op[1].regs)
5866           || register_number (i.op[0].regs)
5867              == register_number (i.op[2].regs)
5868           || register_number (i.op[1].regs)
5869              == register_number (i.op[2].regs))
5870         {
5871           i.error = invalid_tmm_register_set;
5872           return 1;
5873         }
5874     }
5875
5876   /* Check if broadcast is supported by the instruction and is applied
5877      to the memory operand.  */
5878   if (i.broadcast)
5879     {
5880       i386_operand_type type, overlap;
5881
5882       /* Check if specified broadcast is supported in this instruction,
5883          and its broadcast bytes match the memory operand.  */
5884       op = i.broadcast->operand;
5885       if (!t->opcode_modifier.broadcast
5886           || !(i.flags[op] & Operand_Mem)
5887           || (!i.types[op].bitfield.unspecified
5888               && !match_broadcast_size (t, op)))
5889         {
5890         bad_broadcast:
5891           i.error = unsupported_broadcast;
5892           return 1;
5893         }
5894
5895       i.broadcast->bytes = ((1 << (t->opcode_modifier.broadcast - 1))
5896                             * i.broadcast->type);
5897       operand_type_set (&type, 0);
5898       switch (i.broadcast->bytes)
5899         {
5900         case 2:
5901           type.bitfield.word = 1;
5902           break;
5903         case 4:
5904           type.bitfield.dword = 1;
5905           break;
5906         case 8:
5907           type.bitfield.qword = 1;
5908           break;
5909         case 16:
5910           type.bitfield.xmmword = 1;
5911           break;
5912         case 32:
5913           type.bitfield.ymmword = 1;
5914           break;
5915         case 64:
5916           type.bitfield.zmmword = 1;
5917           break;
5918         default:
5919           goto bad_broadcast;
5920         }
5921
5922       overlap = operand_type_and (type, t->operand_types[op]);
5923       if (t->operand_types[op].bitfield.class == RegSIMD
5924           && t->operand_types[op].bitfield.byte
5925              + t->operand_types[op].bitfield.word
5926              + t->operand_types[op].bitfield.dword
5927              + t->operand_types[op].bitfield.qword > 1)
5928         {
5929           overlap.bitfield.xmmword = 0;
5930           overlap.bitfield.ymmword = 0;
5931           overlap.bitfield.zmmword = 0;
5932         }
5933       if (operand_type_all_zero (&overlap))
5934           goto bad_broadcast;
5935
5936       if (t->opcode_modifier.checkregsize)
5937         {
5938           unsigned int j;
5939
5940           type.bitfield.baseindex = 1;
5941           for (j = 0; j < i.operands; ++j)
5942             {
5943               if (j != op
5944                   && !operand_type_register_match(i.types[j],
5945                                                   t->operand_types[j],
5946                                                   type,
5947                                                   t->operand_types[op]))
5948                 goto bad_broadcast;
5949             }
5950         }
5951     }
5952   /* If broadcast is supported in this instruction, we need to check if
5953      operand of one-element size isn't specified without broadcast.  */
5954   else if (t->opcode_modifier.broadcast && i.mem_operands)
5955     {
5956       /* Find memory operand.  */
5957       for (op = 0; op < i.operands; op++)
5958         if (i.flags[op] & Operand_Mem)
5959           break;
5960       gas_assert (op < i.operands);
5961       /* Check size of the memory operand.  */
5962       if (match_broadcast_size (t, op))
5963         {
5964           i.error = broadcast_needed;
5965           return 1;
5966         }
5967     }
5968   else
5969     op = MAX_OPERANDS - 1; /* Avoid uninitialized variable warning.  */
5970
5971   /* Check if requested masking is supported.  */
5972   if (i.mask)
5973     {
5974       switch (t->opcode_modifier.masking)
5975         {
5976         case BOTH_MASKING:
5977           break;
5978         case MERGING_MASKING:
5979           if (i.mask->zeroing)
5980             {
5981         case 0:
5982               i.error = unsupported_masking;
5983               return 1;
5984             }
5985           break;
5986         case DYNAMIC_MASKING:
5987           /* Memory destinations allow only merging masking.  */
5988           if (i.mask->zeroing && i.mem_operands)
5989             {
5990               /* Find memory operand.  */
5991               for (op = 0; op < i.operands; op++)
5992                 if (i.flags[op] & Operand_Mem)
5993                   break;
5994               gas_assert (op < i.operands);
5995               if (op == i.operands - 1)
5996                 {
5997                   i.error = unsupported_masking;
5998                   return 1;
5999                 }
6000             }
6001           break;
6002         default:
6003           abort ();
6004         }
6005     }
6006
6007   /* Check if masking is applied to dest operand.  */
6008   if (i.mask && (i.mask->operand != (int) (i.operands - 1)))
6009     {
6010       i.error = mask_not_on_destination;
6011       return 1;
6012     }
6013
6014   /* Check RC/SAE.  */
6015   if (i.rounding)
6016     {
6017       if (!t->opcode_modifier.sae
6018           || (i.rounding->type != saeonly && !t->opcode_modifier.staticrounding))
6019         {
6020           i.error = unsupported_rc_sae;
6021           return 1;
6022         }
6023       /* If the instruction has several immediate operands and one of
6024          them is rounding, the rounding operand should be the last
6025          immediate operand.  */
6026       if (i.imm_operands > 1
6027           && i.rounding->operand != (int) (i.imm_operands - 1))
6028         {
6029           i.error = rc_sae_operand_not_last_imm;
6030           return 1;
6031         }
6032     }
6033
6034   /* Check the special Imm4 cases; must be the first operand.  */
6035   if (t->cpu_flags.bitfield.cpuxop && t->operands == 5)
6036     {
6037       if (i.op[0].imms->X_op != O_constant
6038           || !fits_in_imm4 (i.op[0].imms->X_add_number))
6039         {
6040           i.error = bad_imm4;
6041           return 1;
6042         }
6043
6044       /* Turn off Imm<N> so that update_imm won't complain.  */
6045       operand_type_set (&i.types[0], 0);
6046     }
6047
6048   /* Check vector Disp8 operand.  */
6049   if (t->opcode_modifier.disp8memshift
6050       && i.disp_encoding != disp_encoding_32bit)
6051     {
6052       if (i.broadcast)
6053         i.memshift = t->opcode_modifier.broadcast - 1;
6054       else if (t->opcode_modifier.disp8memshift != DISP8_SHIFT_VL)
6055         i.memshift = t->opcode_modifier.disp8memshift;
6056       else
6057         {
6058           const i386_operand_type *type = NULL;
6059
6060           i.memshift = 0;
6061           for (op = 0; op < i.operands; op++)
6062             if (i.flags[op] & Operand_Mem)
6063               {
6064                 if (t->opcode_modifier.evex == EVEXLIG)
6065                   i.memshift = 2 + (i.suffix == QWORD_MNEM_SUFFIX);
6066                 else if (t->operand_types[op].bitfield.xmmword
6067                          + t->operand_types[op].bitfield.ymmword
6068                          + t->operand_types[op].bitfield.zmmword <= 1)
6069                   type = &t->operand_types[op];
6070                 else if (!i.types[op].bitfield.unspecified)
6071                   type = &i.types[op];
6072               }
6073             else if (i.types[op].bitfield.class == RegSIMD
6074                      && t->opcode_modifier.evex != EVEXLIG)
6075               {
6076                 if (i.types[op].bitfield.zmmword)
6077                   i.memshift = 6;
6078                 else if (i.types[op].bitfield.ymmword && i.memshift < 5)
6079                   i.memshift = 5;
6080                 else if (i.types[op].bitfield.xmmword && i.memshift < 4)
6081                   i.memshift = 4;
6082               }
6083
6084           if (type)
6085             {
6086               if (type->bitfield.zmmword)
6087                 i.memshift = 6;
6088               else if (type->bitfield.ymmword)
6089                 i.memshift = 5;
6090               else if (type->bitfield.xmmword)
6091                 i.memshift = 4;
6092             }
6093
6094           /* For the check in fits_in_disp8().  */
6095           if (i.memshift == 0)
6096             i.memshift = -1;
6097         }
6098
6099       for (op = 0; op < i.operands; op++)
6100         if (operand_type_check (i.types[op], disp)
6101             && i.op[op].disps->X_op == O_constant)
6102           {
6103             if (fits_in_disp8 (i.op[op].disps->X_add_number))
6104               {
6105                 i.types[op].bitfield.disp8 = 1;
6106                 return 0;
6107               }
6108             i.types[op].bitfield.disp8 = 0;
6109           }
6110     }
6111
6112   i.memshift = 0;
6113
6114   return 0;
6115 }
6116
6117 /* Check if encoding requirements are met by the instruction.  */
6118
6119 static int
6120 VEX_check_encoding (const insn_template *t)
6121 {
6122   if (i.vec_encoding == vex_encoding_error)
6123     {
6124       i.error = unsupported;
6125       return 1;
6126     }
6127
6128   if (i.vec_encoding == vex_encoding_evex)
6129     {
6130       /* This instruction must be encoded with EVEX prefix.  */
6131       if (!is_evex_encoding (t))
6132         {
6133           i.error = unsupported;
6134           return 1;
6135         }
6136       return 0;
6137     }
6138
6139   if (!t->opcode_modifier.vex)
6140     {
6141       /* This instruction template doesn't have VEX prefix.  */
6142       if (i.vec_encoding != vex_encoding_default)
6143         {
6144           i.error = unsupported;
6145           return 1;
6146         }
6147       return 0;
6148     }
6149
6150   return 0;
6151 }
6152
6153 static const insn_template *
6154 match_template (char mnem_suffix)
6155 {
6156   /* Points to template once we've found it.  */
6157   const insn_template *t;
6158   i386_operand_type overlap0, overlap1, overlap2, overlap3;
6159   i386_operand_type overlap4;
6160   unsigned int found_reverse_match;
6161   i386_opcode_modifier suffix_check;
6162   i386_operand_type operand_types [MAX_OPERANDS];
6163   int addr_prefix_disp;
6164   unsigned int j, size_match, check_register;
6165   enum i386_error specific_error = 0;
6166
6167 #if MAX_OPERANDS != 5
6168 # error "MAX_OPERANDS must be 5."
6169 #endif
6170
6171   found_reverse_match = 0;
6172   addr_prefix_disp = -1;
6173
6174   /* Prepare for mnemonic suffix check.  */
6175   memset (&suffix_check, 0, sizeof (suffix_check));
6176   switch (mnem_suffix)
6177     {
6178     case BYTE_MNEM_SUFFIX:
6179       suffix_check.no_bsuf = 1;
6180       break;
6181     case WORD_MNEM_SUFFIX:
6182       suffix_check.no_wsuf = 1;
6183       break;
6184     case SHORT_MNEM_SUFFIX:
6185       suffix_check.no_ssuf = 1;
6186       break;
6187     case LONG_MNEM_SUFFIX:
6188       suffix_check.no_lsuf = 1;
6189       break;
6190     case QWORD_MNEM_SUFFIX:
6191       suffix_check.no_qsuf = 1;
6192       break;
6193     default:
6194       /* NB: In Intel syntax, normally we can check for memory operand
6195          size when there is no mnemonic suffix.  But jmp and call have
6196          2 different encodings with Dword memory operand size, one with
6197          No_ldSuf and the other without.  i.suffix is set to
6198          LONG_DOUBLE_MNEM_SUFFIX to skip the one with No_ldSuf.  */
6199       if (i.suffix == LONG_DOUBLE_MNEM_SUFFIX)
6200         suffix_check.no_ldsuf = 1;
6201     }
6202
6203   /* Must have right number of operands.  */
6204   i.error = number_of_operands_mismatch;
6205
6206   for (t = current_templates->start; t < current_templates->end; t++)
6207     {
6208       addr_prefix_disp = -1;
6209       found_reverse_match = 0;
6210
6211       if (i.operands != t->operands)
6212         continue;
6213
6214       /* Check processor support.  */
6215       i.error = unsupported;
6216       if (cpu_flags_match (t) != CPU_FLAGS_PERFECT_MATCH)
6217         continue;
6218
6219       /* Check Pseudo Prefix.  */
6220       i.error = unsupported;
6221       if (t->opcode_modifier.pseudovexprefix
6222           && !(i.vec_encoding == vex_encoding_vex
6223               || i.vec_encoding == vex_encoding_vex3))
6224         continue;
6225
6226       /* Check AT&T mnemonic.   */
6227       i.error = unsupported_with_intel_mnemonic;
6228       if (intel_mnemonic && t->opcode_modifier.attmnemonic)
6229         continue;
6230
6231       /* Check AT&T/Intel syntax.  */
6232       i.error = unsupported_syntax;
6233       if ((intel_syntax && t->opcode_modifier.attsyntax)
6234           || (!intel_syntax && t->opcode_modifier.intelsyntax))
6235         continue;
6236
6237       /* Check Intel64/AMD64 ISA.   */
6238       switch (isa64)
6239         {
6240         default:
6241           /* Default: Don't accept Intel64.  */
6242           if (t->opcode_modifier.isa64 == INTEL64)
6243             continue;
6244           break;
6245         case amd64:
6246           /* -mamd64: Don't accept Intel64 and Intel64 only.  */
6247           if (t->opcode_modifier.isa64 >= INTEL64)
6248             continue;
6249           break;
6250         case intel64:
6251           /* -mintel64: Don't accept AMD64.  */
6252           if (t->opcode_modifier.isa64 == AMD64 && flag_code == CODE_64BIT)
6253             continue;
6254           break;
6255         }
6256
6257       /* Check the suffix.  */
6258       i.error = invalid_instruction_suffix;
6259       if ((t->opcode_modifier.no_bsuf && suffix_check.no_bsuf)
6260           || (t->opcode_modifier.no_wsuf && suffix_check.no_wsuf)
6261           || (t->opcode_modifier.no_lsuf && suffix_check.no_lsuf)
6262           || (t->opcode_modifier.no_ssuf && suffix_check.no_ssuf)
6263           || (t->opcode_modifier.no_qsuf && suffix_check.no_qsuf)
6264           || (t->opcode_modifier.no_ldsuf && suffix_check.no_ldsuf))
6265         continue;
6266
6267       size_match = operand_size_match (t);
6268       if (!size_match)
6269         continue;
6270
6271       /* This is intentionally not
6272
6273          if (i.jumpabsolute != (t->opcode_modifier.jump == JUMP_ABSOLUTE))
6274
6275          as the case of a missing * on the operand is accepted (perhaps with
6276          a warning, issued further down).  */
6277       if (i.jumpabsolute && t->opcode_modifier.jump != JUMP_ABSOLUTE)
6278         {
6279           i.error = operand_type_mismatch;
6280           continue;
6281         }
6282
6283       for (j = 0; j < MAX_OPERANDS; j++)
6284         operand_types[j] = t->operand_types[j];
6285
6286       /* In general, don't allow
6287          - 64-bit operands outside of 64-bit mode,
6288          - 32-bit operands on pre-386.  */
6289       j = i.imm_operands + (t->operands > i.imm_operands + 1);
6290       if (((i.suffix == QWORD_MNEM_SUFFIX
6291             && flag_code != CODE_64BIT
6292             && !(t->base_opcode == 0xfc7
6293                  && t->opcode_modifier.opcodeprefix == PREFIX_NONE
6294                  && t->extension_opcode == 1) /* cmpxchg8b */)
6295            || (i.suffix == LONG_MNEM_SUFFIX
6296                && !cpu_arch_flags.bitfield.cpui386))
6297           && (intel_syntax
6298               ? (t->opcode_modifier.mnemonicsize != IGNORESIZE
6299                  && !intel_float_operand (t->name))
6300               : intel_float_operand (t->name) != 2)
6301           && (t->operands == i.imm_operands
6302               || (operand_types[i.imm_operands].bitfield.class != RegMMX
6303                && operand_types[i.imm_operands].bitfield.class != RegSIMD
6304                && operand_types[i.imm_operands].bitfield.class != RegMask)
6305               || (operand_types[j].bitfield.class != RegMMX
6306                   && operand_types[j].bitfield.class != RegSIMD
6307                   && operand_types[j].bitfield.class != RegMask))
6308           && !t->opcode_modifier.sib)
6309         continue;
6310
6311       /* Do not verify operands when there are none.  */
6312       if (!t->operands)
6313         {
6314           if (VEX_check_encoding (t))
6315             {
6316               specific_error = i.error;
6317               continue;
6318             }
6319
6320           /* We've found a match; break out of loop.  */
6321           break;
6322         }
6323
6324       if (!t->opcode_modifier.jump
6325           || t->opcode_modifier.jump == JUMP_ABSOLUTE)
6326         {
6327           /* There should be only one Disp operand.  */
6328           for (j = 0; j < MAX_OPERANDS; j++)
6329             if (operand_type_check (operand_types[j], disp))
6330               break;
6331           if (j < MAX_OPERANDS)
6332             {
6333               bfd_boolean override = (i.prefix[ADDR_PREFIX] != 0);
6334
6335               addr_prefix_disp = j;
6336
6337               /* Address size prefix will turn Disp64/Disp32S/Disp32/Disp16
6338                  operand into Disp32/Disp32/Disp16/Disp32 operand.  */
6339               switch (flag_code)
6340                 {
6341                 case CODE_16BIT:
6342                   override = !override;
6343                   /* Fall through.  */
6344                 case CODE_32BIT:
6345                   if (operand_types[j].bitfield.disp32
6346                       && operand_types[j].bitfield.disp16)
6347                     {
6348                       operand_types[j].bitfield.disp16 = override;
6349                       operand_types[j].bitfield.disp32 = !override;
6350                     }
6351                   operand_types[j].bitfield.disp32s = 0;
6352                   operand_types[j].bitfield.disp64 = 0;
6353                   break;
6354
6355                 case CODE_64BIT:
6356                   if (operand_types[j].bitfield.disp32s
6357                       || operand_types[j].bitfield.disp64)
6358                     {
6359                       operand_types[j].bitfield.disp64 &= !override;
6360                       operand_types[j].bitfield.disp32s &= !override;
6361                       operand_types[j].bitfield.disp32 = override;
6362                     }
6363                   operand_types[j].bitfield.disp16 = 0;
6364                   break;
6365                 }
6366             }
6367         }
6368
6369       /* Force 0x8b encoding for "mov foo@GOT, %eax".  */
6370       if (i.reloc[0] == BFD_RELOC_386_GOT32
6371           && t->base_opcode == 0xa0
6372           && t->opcode_modifier.opcodespace == SPACE_BASE)
6373         continue;
6374
6375       /* We check register size if needed.  */
6376       if (t->opcode_modifier.checkregsize)
6377         {
6378           check_register = (1 << t->operands) - 1;
6379           if (i.broadcast)
6380             check_register &= ~(1 << i.broadcast->operand);
6381         }
6382       else
6383         check_register = 0;
6384
6385       overlap0 = operand_type_and (i.types[0], operand_types[0]);
6386       switch (t->operands)
6387         {
6388         case 1:
6389           if (!operand_type_match (overlap0, i.types[0]))
6390             continue;
6391           break;
6392         case 2:
6393           /* xchg %eax, %eax is a special case. It is an alias for nop
6394              only in 32bit mode and we can use opcode 0x90.  In 64bit
6395              mode, we can't use 0x90 for xchg %eax, %eax since it should
6396              zero-extend %eax to %rax.  */
6397           if (flag_code == CODE_64BIT
6398               && t->base_opcode == 0x90
6399               && t->opcode_modifier.opcodespace == SPACE_BASE
6400               && i.types[0].bitfield.instance == Accum
6401               && i.types[0].bitfield.dword
6402               && i.types[1].bitfield.instance == Accum
6403               && i.types[1].bitfield.dword)
6404             continue;
6405           /* xrelease mov %eax, <disp> is another special case. It must not
6406              match the accumulator-only encoding of mov.  */
6407           if (flag_code != CODE_64BIT
6408               && i.hle_prefix
6409               && t->base_opcode == 0xa0
6410               && t->opcode_modifier.opcodespace == SPACE_BASE
6411               && i.types[0].bitfield.instance == Accum
6412               && (i.flags[1] & Operand_Mem))
6413             continue;
6414           /* Fall through.  */
6415
6416         case 3:
6417           if (!(size_match & MATCH_STRAIGHT))
6418             goto check_reverse;
6419           /* Reverse direction of operands if swapping is possible in the first
6420              place (operands need to be symmetric) and
6421              - the load form is requested, and the template is a store form,
6422              - the store form is requested, and the template is a load form,
6423              - the non-default (swapped) form is requested.  */
6424           overlap1 = operand_type_and (operand_types[0], operand_types[1]);
6425           if (t->opcode_modifier.d && i.reg_operands == i.operands
6426               && !operand_type_all_zero (&overlap1))
6427             switch (i.dir_encoding)
6428               {
6429               case dir_encoding_load:
6430                 if (operand_type_check (operand_types[i.operands - 1], anymem)
6431                     || t->opcode_modifier.regmem)
6432                   goto check_reverse;
6433                 break;
6434
6435               case dir_encoding_store:
6436                 if (!operand_type_check (operand_types[i.operands - 1], anymem)
6437                     && !t->opcode_modifier.regmem)
6438                   goto check_reverse;
6439                 break;
6440
6441               case dir_encoding_swap:
6442                 goto check_reverse;
6443
6444               case dir_encoding_default:
6445                 break;
6446               }
6447           /* If we want store form, we skip the current load.  */
6448           if ((i.dir_encoding == dir_encoding_store
6449                || i.dir_encoding == dir_encoding_swap)
6450               && i.mem_operands == 0
6451               && t->opcode_modifier.load)
6452             continue;
6453           /* Fall through.  */
6454         case 4:
6455         case 5:
6456           overlap1 = operand_type_and (i.types[1], operand_types[1]);
6457           if (!operand_type_match (overlap0, i.types[0])
6458               || !operand_type_match (overlap1, i.types[1])
6459               || ((check_register & 3) == 3
6460                   && !operand_type_register_match (i.types[0],
6461                                                    operand_types[0],
6462                                                    i.types[1],
6463                                                    operand_types[1])))
6464             {
6465               /* Check if other direction is valid ...  */
6466               if (!t->opcode_modifier.d)
6467                 continue;
6468
6469             check_reverse:
6470               if (!(size_match & MATCH_REVERSE))
6471                 continue;
6472               /* Try reversing direction of operands.  */
6473               overlap0 = operand_type_and (i.types[0], operand_types[i.operands - 1]);
6474               overlap1 = operand_type_and (i.types[i.operands - 1], operand_types[0]);
6475               if (!operand_type_match (overlap0, i.types[0])
6476                   || !operand_type_match (overlap1, i.types[i.operands - 1])
6477                   || (check_register
6478                       && !operand_type_register_match (i.types[0],
6479                                                        operand_types[i.operands - 1],
6480                                                        i.types[i.operands - 1],
6481                                                        operand_types[0])))
6482                 {
6483                   /* Does not match either direction.  */
6484                   continue;
6485                 }
6486               /* found_reverse_match holds which of D or FloatR
6487                  we've found.  */
6488               if (!t->opcode_modifier.d)
6489                 found_reverse_match = 0;
6490               else if (operand_types[0].bitfield.tbyte)
6491                 found_reverse_match = Opcode_FloatD;
6492               else if (operand_types[0].bitfield.xmmword
6493                        || operand_types[i.operands - 1].bitfield.xmmword
6494                        || operand_types[0].bitfield.class == RegMMX
6495                        || operand_types[i.operands - 1].bitfield.class == RegMMX
6496                        || is_any_vex_encoding(t))
6497                 found_reverse_match = (t->base_opcode & 0xee) != 0x6e
6498                                       ? Opcode_SIMD_FloatD : Opcode_SIMD_IntD;
6499               else
6500                 found_reverse_match = Opcode_D;
6501               if (t->opcode_modifier.floatr)
6502                 found_reverse_match |= Opcode_FloatR;
6503             }
6504           else
6505             {
6506               /* Found a forward 2 operand match here.  */
6507               switch (t->operands)
6508                 {
6509                 case 5:
6510                   overlap4 = operand_type_and (i.types[4],
6511                                                operand_types[4]);
6512                   /* Fall through.  */
6513                 case 4:
6514                   overlap3 = operand_type_and (i.types[3],
6515                                                operand_types[3]);
6516                   /* Fall through.  */
6517                 case 3:
6518                   overlap2 = operand_type_and (i.types[2],
6519                                                operand_types[2]);
6520                   break;
6521                 }
6522
6523               switch (t->operands)
6524                 {
6525                 case 5:
6526                   if (!operand_type_match (overlap4, i.types[4])
6527                       || !operand_type_register_match (i.types[3],
6528                                                        operand_types[3],
6529                                                        i.types[4],
6530                                                        operand_types[4]))
6531                     continue;
6532                   /* Fall through.  */
6533                 case 4:
6534                   if (!operand_type_match (overlap3, i.types[3])
6535                       || ((check_register & 0xa) == 0xa
6536                           && !operand_type_register_match (i.types[1],
6537                                                             operand_types[1],
6538                                                             i.types[3],
6539                                                             operand_types[3]))
6540                       || ((check_register & 0xc) == 0xc
6541                           && !operand_type_register_match (i.types[2],
6542                                                             operand_types[2],
6543                                                             i.types[3],
6544                                                             operand_types[3])))
6545                     continue;
6546                   /* Fall through.  */
6547                 case 3:
6548                   /* Here we make use of the fact that there are no
6549                      reverse match 3 operand instructions.  */
6550                   if (!operand_type_match (overlap2, i.types[2])
6551                       || ((check_register & 5) == 5
6552                           && !operand_type_register_match (i.types[0],
6553                                                             operand_types[0],
6554                                                             i.types[2],
6555                                                             operand_types[2]))
6556                       || ((check_register & 6) == 6
6557                           && !operand_type_register_match (i.types[1],
6558                                                             operand_types[1],
6559                                                             i.types[2],
6560                                                             operand_types[2])))
6561                     continue;
6562                   break;
6563                 }
6564             }
6565           /* Found either forward/reverse 2, 3 or 4 operand match here:
6566              slip through to break.  */
6567         }
6568
6569       /* Check if vector operands are valid.  */
6570       if (check_VecOperands (t))
6571         {
6572           specific_error = i.error;
6573           continue;
6574         }
6575
6576       /* Check if VEX/EVEX encoding requirements can be satisfied.  */
6577       if (VEX_check_encoding (t))
6578         {
6579           specific_error = i.error;
6580           continue;
6581         }
6582
6583       /* We've found a match; break out of loop.  */
6584       break;
6585     }
6586
6587   if (t == current_templates->end)
6588     {
6589       /* We found no match.  */
6590       const char *err_msg;
6591       switch (specific_error ? specific_error : i.error)
6592         {
6593         default:
6594           abort ();
6595         case operand_size_mismatch:
6596           err_msg = _("operand size mismatch");
6597           break;
6598         case operand_type_mismatch:
6599           err_msg = _("operand type mismatch");
6600           break;
6601         case register_type_mismatch:
6602           err_msg = _("register type mismatch");
6603           break;
6604         case number_of_operands_mismatch:
6605           err_msg = _("number of operands mismatch");
6606           break;
6607         case invalid_instruction_suffix:
6608           err_msg = _("invalid instruction suffix");
6609           break;
6610         case bad_imm4:
6611           err_msg = _("constant doesn't fit in 4 bits");
6612           break;
6613         case unsupported_with_intel_mnemonic:
6614           err_msg = _("unsupported with Intel mnemonic");
6615           break;
6616         case unsupported_syntax:
6617           err_msg = _("unsupported syntax");
6618           break;
6619         case unsupported:
6620           as_bad (_("unsupported instruction `%s'"),
6621                   current_templates->start->name);
6622           return NULL;
6623         case invalid_sib_address:
6624           err_msg = _("invalid SIB address");
6625           break;
6626         case invalid_vsib_address:
6627           err_msg = _("invalid VSIB address");
6628           break;
6629         case invalid_vector_register_set:
6630           err_msg = _("mask, index, and destination registers must be distinct");
6631           break;
6632         case invalid_tmm_register_set:
6633           err_msg = _("all tmm registers must be distinct");
6634           break;
6635         case unsupported_vector_index_register:
6636           err_msg = _("unsupported vector index register");
6637           break;
6638         case unsupported_broadcast:
6639           err_msg = _("unsupported broadcast");
6640           break;
6641         case broadcast_needed:
6642           err_msg = _("broadcast is needed for operand of such type");
6643           break;
6644         case unsupported_masking:
6645           err_msg = _("unsupported masking");
6646           break;
6647         case mask_not_on_destination:
6648           err_msg = _("mask not on destination operand");
6649           break;
6650         case no_default_mask:
6651           err_msg = _("default mask isn't allowed");
6652           break;
6653         case unsupported_rc_sae:
6654           err_msg = _("unsupported static rounding/sae");
6655           break;
6656         case rc_sae_operand_not_last_imm:
6657           if (intel_syntax)
6658             err_msg = _("RC/SAE operand must precede immediate operands");
6659           else
6660             err_msg = _("RC/SAE operand must follow immediate operands");
6661           break;
6662         case invalid_register_operand:
6663           err_msg = _("invalid register operand");
6664           break;
6665         }
6666       as_bad (_("%s for `%s'"), err_msg,
6667               current_templates->start->name);
6668       return NULL;
6669     }
6670
6671   if (!quiet_warnings)
6672     {
6673       if (!intel_syntax
6674           && (i.jumpabsolute != (t->opcode_modifier.jump == JUMP_ABSOLUTE)))
6675         as_warn (_("indirect %s without `*'"), t->name);
6676
6677       if (t->opcode_modifier.isprefix
6678           && t->opcode_modifier.mnemonicsize == IGNORESIZE)
6679         {
6680           /* Warn them that a data or address size prefix doesn't
6681              affect assembly of the next line of code.  */
6682           as_warn (_("stand-alone `%s' prefix"), t->name);
6683         }
6684     }
6685
6686   /* Copy the template we found.  */
6687   install_template (t);
6688
6689   if (addr_prefix_disp != -1)
6690     i.tm.operand_types[addr_prefix_disp]
6691       = operand_types[addr_prefix_disp];
6692
6693   if (found_reverse_match)
6694     {
6695       /* If we found a reverse match we must alter the opcode direction
6696          bit and clear/flip the regmem modifier one.  found_reverse_match
6697          holds bits to change (different for int & float insns).  */
6698
6699       i.tm.base_opcode ^= found_reverse_match;
6700
6701       i.tm.operand_types[0] = operand_types[i.operands - 1];
6702       i.tm.operand_types[i.operands - 1] = operand_types[0];
6703
6704       /* Certain SIMD insns have their load forms specified in the opcode
6705          table, and hence we need to _set_ RegMem instead of clearing it.
6706          We need to avoid setting the bit though on insns like KMOVW.  */
6707       i.tm.opcode_modifier.regmem
6708         = i.tm.opcode_modifier.modrm && i.tm.opcode_modifier.d
6709           && i.tm.operands > 2U - i.tm.opcode_modifier.sse2avx
6710           && !i.tm.opcode_modifier.regmem;
6711     }
6712
6713   return t;
6714 }
6715
6716 static int
6717 check_string (void)
6718 {
6719   unsigned int es_op = i.tm.opcode_modifier.isstring - IS_STRING_ES_OP0;
6720   unsigned int op = i.tm.operand_types[0].bitfield.baseindex ? es_op : 0;
6721
6722   if (i.seg[op] != NULL && i.seg[op] != &es)
6723     {
6724       as_bad (_("`%s' operand %u must use `%ses' segment"),
6725               i.tm.name,
6726               intel_syntax ? i.tm.operands - es_op : es_op + 1,
6727               register_prefix);
6728       return 0;
6729     }
6730
6731   /* There's only ever one segment override allowed per instruction.
6732      This instruction possibly has a legal segment override on the
6733      second operand, so copy the segment to where non-string
6734      instructions store it, allowing common code.  */
6735   i.seg[op] = i.seg[1];
6736
6737   return 1;
6738 }
6739
6740 static int
6741 process_suffix (void)
6742 {
6743   bfd_boolean is_crc32 = FALSE;
6744
6745   /* If matched instruction specifies an explicit instruction mnemonic
6746      suffix, use it.  */
6747   if (i.tm.opcode_modifier.size == SIZE16)
6748     i.suffix = WORD_MNEM_SUFFIX;
6749   else if (i.tm.opcode_modifier.size == SIZE32)
6750     i.suffix = LONG_MNEM_SUFFIX;
6751   else if (i.tm.opcode_modifier.size == SIZE64)
6752     i.suffix = QWORD_MNEM_SUFFIX;
6753   else if (i.reg_operands
6754            && (i.operands > 1 || i.types[0].bitfield.class == Reg)
6755            && !i.tm.opcode_modifier.addrprefixopreg)
6756     {
6757       unsigned int numop = i.operands;
6758       /* CRC32 */
6759       is_crc32 = (i.tm.base_opcode == 0xf38f0
6760                   && i.tm.opcode_modifier.opcodeprefix == PREFIX_0XF2);
6761
6762       /* movsx/movzx want only their source operand considered here, for the
6763          ambiguity checking below.  The suffix will be replaced afterwards
6764          to represent the destination (register).  */
6765       if (((i.tm.base_opcode | 8) == 0xfbe && i.tm.opcode_modifier.w)
6766           || (i.tm.base_opcode == 0x63
6767               && i.tm.opcode_modifier.opcodespace == SPACE_BASE
6768               && i.tm.cpu_flags.bitfield.cpu64))
6769         --i.operands;
6770
6771       /* crc32 needs REX.W set regardless of suffix / source operand size.  */
6772       if (is_crc32 && i.tm.operand_types[1].bitfield.qword)
6773         i.rex |= REX_W;
6774
6775       /* If there's no instruction mnemonic suffix we try to invent one
6776          based on GPR operands.  */
6777       if (!i.suffix)
6778         {
6779           /* We take i.suffix from the last register operand specified,
6780              Destination register type is more significant than source
6781              register type.  crc32 in SSE4.2 prefers source register
6782              type. */
6783           unsigned int op = is_crc32 ? 1 : i.operands;
6784
6785           while (op--)
6786             if (i.tm.operand_types[op].bitfield.instance == InstanceNone
6787                 || i.tm.operand_types[op].bitfield.instance == Accum)
6788               {
6789                 if (i.types[op].bitfield.class != Reg)
6790                   continue;
6791                 if (i.types[op].bitfield.byte)
6792                   i.suffix = BYTE_MNEM_SUFFIX;
6793                 else if (i.types[op].bitfield.word)
6794                   i.suffix = WORD_MNEM_SUFFIX;
6795                 else if (i.types[op].bitfield.dword)
6796                   i.suffix = LONG_MNEM_SUFFIX;
6797                 else if (i.types[op].bitfield.qword)
6798                   i.suffix = QWORD_MNEM_SUFFIX;
6799                 else
6800                   continue;
6801                 break;
6802               }
6803
6804           /* As an exception, movsx/movzx silently default to a byte source
6805              in AT&T mode.  */
6806           if ((i.tm.base_opcode | 8) == 0xfbe && i.tm.opcode_modifier.w
6807               && !i.suffix && !intel_syntax)
6808             i.suffix = BYTE_MNEM_SUFFIX;
6809         }
6810       else if (i.suffix == BYTE_MNEM_SUFFIX)
6811         {
6812           if (intel_syntax
6813               && i.tm.opcode_modifier.mnemonicsize == IGNORESIZE
6814               && i.tm.opcode_modifier.no_bsuf)
6815             i.suffix = 0;
6816           else if (!check_byte_reg ())
6817             return 0;
6818         }
6819       else if (i.suffix == LONG_MNEM_SUFFIX)
6820         {
6821           if (intel_syntax
6822               && i.tm.opcode_modifier.mnemonicsize == IGNORESIZE
6823               && i.tm.opcode_modifier.no_lsuf
6824               && !i.tm.opcode_modifier.todword
6825               && !i.tm.opcode_modifier.toqword)
6826             i.suffix = 0;
6827           else if (!check_long_reg ())
6828             return 0;
6829         }
6830       else if (i.suffix == QWORD_MNEM_SUFFIX)
6831         {
6832           if (intel_syntax
6833               && i.tm.opcode_modifier.mnemonicsize == IGNORESIZE
6834               && i.tm.opcode_modifier.no_qsuf
6835               && !i.tm.opcode_modifier.todword
6836               && !i.tm.opcode_modifier.toqword)
6837             i.suffix = 0;
6838           else if (!check_qword_reg ())
6839             return 0;
6840         }
6841       else if (i.suffix == WORD_MNEM_SUFFIX)
6842         {
6843           if (intel_syntax
6844               && i.tm.opcode_modifier.mnemonicsize == IGNORESIZE
6845               && i.tm.opcode_modifier.no_wsuf)
6846             i.suffix = 0;
6847           else if (!check_word_reg ())
6848             return 0;
6849         }
6850       else if (intel_syntax
6851                && i.tm.opcode_modifier.mnemonicsize == IGNORESIZE)
6852         /* Do nothing if the instruction is going to ignore the prefix.  */
6853         ;
6854       else
6855         abort ();
6856
6857       /* Undo the movsx/movzx change done above.  */
6858       i.operands = numop;
6859     }
6860   else if (i.tm.opcode_modifier.mnemonicsize == DEFAULTSIZE
6861            && !i.suffix)
6862     {
6863       i.suffix = stackop_size;
6864       if (stackop_size == LONG_MNEM_SUFFIX)
6865         {
6866           /* stackop_size is set to LONG_MNEM_SUFFIX for the
6867              .code16gcc directive to support 16-bit mode with
6868              32-bit address.  For IRET without a suffix, generate
6869              16-bit IRET (opcode 0xcf) to return from an interrupt
6870              handler.  */
6871           if (i.tm.base_opcode == 0xcf)
6872             {
6873               i.suffix = WORD_MNEM_SUFFIX;
6874               as_warn (_("generating 16-bit `iret' for .code16gcc directive"));
6875             }
6876           /* Warn about changed behavior for segment register push/pop.  */
6877           else if ((i.tm.base_opcode | 1) == 0x07)
6878             as_warn (_("generating 32-bit `%s', unlike earlier gas versions"),
6879                      i.tm.name);
6880         }
6881     }
6882   else if (!i.suffix
6883            && (i.tm.opcode_modifier.jump == JUMP_ABSOLUTE
6884                || i.tm.opcode_modifier.jump == JUMP_BYTE
6885                || i.tm.opcode_modifier.jump == JUMP_INTERSEGMENT
6886                || (i.tm.base_opcode == 0x0f01 /* [ls][gi]dt */
6887                    && i.tm.extension_opcode <= 3)))
6888     {
6889       switch (flag_code)
6890         {
6891         case CODE_64BIT:
6892           if (!i.tm.opcode_modifier.no_qsuf)
6893             {
6894               if (i.tm.opcode_modifier.jump == JUMP_BYTE
6895                   || i.tm.opcode_modifier.no_lsuf)
6896                 i.suffix = QWORD_MNEM_SUFFIX;
6897               break;
6898             }
6899           /* Fall through.  */
6900         case CODE_32BIT:
6901           if (!i.tm.opcode_modifier.no_lsuf)
6902             i.suffix = LONG_MNEM_SUFFIX;
6903           break;
6904         case CODE_16BIT:
6905           if (!i.tm.opcode_modifier.no_wsuf)
6906             i.suffix = WORD_MNEM_SUFFIX;
6907           break;
6908         }
6909     }
6910
6911   if (!i.suffix
6912       && (i.tm.opcode_modifier.mnemonicsize != DEFAULTSIZE
6913           /* Also cover lret/retf/iret in 64-bit mode.  */
6914           || (flag_code == CODE_64BIT
6915               && !i.tm.opcode_modifier.no_lsuf
6916               && !i.tm.opcode_modifier.no_qsuf))
6917       && i.tm.opcode_modifier.mnemonicsize != IGNORESIZE
6918       /* Explicit sizing prefixes are assumed to disambiguate insns.  */
6919       && !i.prefix[DATA_PREFIX] && !(i.prefix[REX_PREFIX] & REX_W)
6920       /* Accept FLDENV et al without suffix.  */
6921       && (i.tm.opcode_modifier.no_ssuf || i.tm.opcode_modifier.floatmf))
6922     {
6923       unsigned int suffixes, evex = 0;
6924
6925       suffixes = !i.tm.opcode_modifier.no_bsuf;
6926       if (!i.tm.opcode_modifier.no_wsuf)
6927         suffixes |= 1 << 1;
6928       if (!i.tm.opcode_modifier.no_lsuf)
6929         suffixes |= 1 << 2;
6930       if (!i.tm.opcode_modifier.no_ldsuf)
6931         suffixes |= 1 << 3;
6932       if (!i.tm.opcode_modifier.no_ssuf)
6933         suffixes |= 1 << 4;
6934       if (flag_code == CODE_64BIT && !i.tm.opcode_modifier.no_qsuf)
6935         suffixes |= 1 << 5;
6936
6937       /* For [XYZ]MMWORD operands inspect operand sizes.  While generally
6938          also suitable for AT&T syntax mode, it was requested that this be
6939          restricted to just Intel syntax.  */
6940       if (intel_syntax && is_any_vex_encoding (&i.tm) && !i.broadcast)
6941         {
6942           unsigned int op;
6943
6944           for (op = 0; op < i.tm.operands; ++op)
6945             {
6946               if (is_evex_encoding (&i.tm)
6947                   && !cpu_arch_flags.bitfield.cpuavx512vl)
6948                 {
6949                   if (i.tm.operand_types[op].bitfield.ymmword)
6950                     i.tm.operand_types[op].bitfield.xmmword = 0;
6951                   if (i.tm.operand_types[op].bitfield.zmmword)
6952                     i.tm.operand_types[op].bitfield.ymmword = 0;
6953                   if (!i.tm.opcode_modifier.evex
6954                       || i.tm.opcode_modifier.evex == EVEXDYN)
6955                     i.tm.opcode_modifier.evex = EVEX512;
6956                 }
6957
6958               if (i.tm.operand_types[op].bitfield.xmmword
6959                   + i.tm.operand_types[op].bitfield.ymmword
6960                   + i.tm.operand_types[op].bitfield.zmmword < 2)
6961                 continue;
6962
6963               /* Any properly sized operand disambiguates the insn.  */
6964               if (i.types[op].bitfield.xmmword
6965                   || i.types[op].bitfield.ymmword
6966                   || i.types[op].bitfield.zmmword)
6967                 {
6968                   suffixes &= ~(7 << 6);
6969                   evex = 0;
6970                   break;
6971                 }
6972
6973               if ((i.flags[op] & Operand_Mem)
6974                   && i.tm.operand_types[op].bitfield.unspecified)
6975                 {
6976                   if (i.tm.operand_types[op].bitfield.xmmword)
6977                     suffixes |= 1 << 6;
6978                   if (i.tm.operand_types[op].bitfield.ymmword)
6979                     suffixes |= 1 << 7;
6980                   if (i.tm.operand_types[op].bitfield.zmmword)
6981                     suffixes |= 1 << 8;
6982                   if (is_evex_encoding (&i.tm))
6983                     evex = EVEX512;
6984                 }
6985             }
6986         }
6987
6988       /* Are multiple suffixes / operand sizes allowed?  */
6989       if (suffixes & (suffixes - 1))
6990         {
6991           if (intel_syntax
6992               && (i.tm.opcode_modifier.mnemonicsize != DEFAULTSIZE
6993                   || operand_check == check_error))
6994             {
6995               as_bad (_("ambiguous operand size for `%s'"), i.tm.name);
6996               return 0;
6997             }
6998           if (operand_check == check_error)
6999             {
7000               as_bad (_("no instruction mnemonic suffix given and "
7001                         "no register operands; can't size `%s'"), i.tm.name);
7002               return 0;
7003             }
7004           if (operand_check == check_warning)
7005             as_warn (_("%s; using default for `%s'"),
7006                        intel_syntax
7007                        ? _("ambiguous operand size")
7008                        : _("no instruction mnemonic suffix given and "
7009                            "no register operands"),
7010                        i.tm.name);
7011
7012           if (i.tm.opcode_modifier.floatmf)
7013             i.suffix = SHORT_MNEM_SUFFIX;
7014           else if ((i.tm.base_opcode | 8) == 0xfbe
7015                    || (i.tm.base_opcode == 0x63
7016                        && i.tm.opcode_modifier.opcodespace == SPACE_BASE
7017                        && i.tm.cpu_flags.bitfield.cpu64))
7018             /* handled below */;
7019           else if (evex)
7020             i.tm.opcode_modifier.evex = evex;
7021           else if (flag_code == CODE_16BIT)
7022             i.suffix = WORD_MNEM_SUFFIX;
7023           else if (!i.tm.opcode_modifier.no_lsuf)
7024             i.suffix = LONG_MNEM_SUFFIX;
7025           else
7026             i.suffix = QWORD_MNEM_SUFFIX;
7027         }
7028     }
7029
7030   if ((i.tm.base_opcode | 8) == 0xfbe
7031       || (i.tm.base_opcode == 0x63
7032           && i.tm.opcode_modifier.opcodespace == SPACE_BASE
7033           && i.tm.cpu_flags.bitfield.cpu64))
7034     {
7035       /* In Intel syntax, movsx/movzx must have a "suffix" (checked above).
7036          In AT&T syntax, if there is no suffix (warned about above), the default
7037          will be byte extension.  */
7038       if (i.tm.opcode_modifier.w && i.suffix && i.suffix != BYTE_MNEM_SUFFIX)
7039         i.tm.base_opcode |= 1;
7040
7041       /* For further processing, the suffix should represent the destination
7042          (register).  This is already the case when one was used with
7043          mov[sz][bw]*, but we need to replace it for mov[sz]x, or if there was
7044          no suffix to begin with.  */
7045       if (i.tm.opcode_modifier.w || i.tm.base_opcode == 0x63 || !i.suffix)
7046         {
7047           if (i.types[1].bitfield.word)
7048             i.suffix = WORD_MNEM_SUFFIX;
7049           else if (i.types[1].bitfield.qword)
7050             i.suffix = QWORD_MNEM_SUFFIX;
7051           else
7052             i.suffix = LONG_MNEM_SUFFIX;
7053
7054           i.tm.opcode_modifier.w = 0;
7055         }
7056     }
7057
7058   if (!i.tm.opcode_modifier.modrm && i.reg_operands && i.tm.operands < 3)
7059     i.short_form = (i.tm.operand_types[0].bitfield.class == Reg)
7060                    != (i.tm.operand_types[1].bitfield.class == Reg);
7061
7062   /* Change the opcode based on the operand size given by i.suffix.  */
7063   switch (i.suffix)
7064     {
7065     /* Size floating point instruction.  */
7066     case LONG_MNEM_SUFFIX:
7067       if (i.tm.opcode_modifier.floatmf)
7068         {
7069           i.tm.base_opcode ^= 4;
7070           break;
7071         }
7072     /* fall through */
7073     case WORD_MNEM_SUFFIX:
7074     case QWORD_MNEM_SUFFIX:
7075       /* It's not a byte, select word/dword operation.  */
7076       if (i.tm.opcode_modifier.w)
7077         {
7078           if (i.short_form)
7079             i.tm.base_opcode |= 8;
7080           else
7081             i.tm.base_opcode |= 1;
7082         }
7083     /* fall through */
7084     case SHORT_MNEM_SUFFIX:
7085       /* Now select between word & dword operations via the operand
7086          size prefix, except for instructions that will ignore this
7087          prefix anyway.  */
7088       if (i.suffix != QWORD_MNEM_SUFFIX
7089           && i.tm.opcode_modifier.mnemonicsize != IGNORESIZE
7090           && !i.tm.opcode_modifier.floatmf
7091           && !is_any_vex_encoding (&i.tm)
7092           && ((i.suffix == LONG_MNEM_SUFFIX) == (flag_code == CODE_16BIT)
7093               || (flag_code == CODE_64BIT
7094                   && i.tm.opcode_modifier.jump == JUMP_BYTE)))
7095         {
7096           unsigned int prefix = DATA_PREFIX_OPCODE;
7097
7098           if (i.tm.opcode_modifier.jump == JUMP_BYTE) /* jcxz, loop */
7099             prefix = ADDR_PREFIX_OPCODE;
7100
7101           if (!add_prefix (prefix))
7102             return 0;
7103         }
7104
7105       /* Set mode64 for an operand.  */
7106       if (i.suffix == QWORD_MNEM_SUFFIX
7107           && flag_code == CODE_64BIT
7108           && !i.tm.opcode_modifier.norex64
7109           && !i.tm.opcode_modifier.vexw
7110           /* Special case for xchg %rax,%rax.  It is NOP and doesn't
7111              need rex64. */
7112           && ! (i.operands == 2
7113                 && i.tm.base_opcode == 0x90
7114                 && i.tm.extension_opcode == None
7115                 && i.types[0].bitfield.instance == Accum
7116                 && i.types[0].bitfield.qword
7117                 && i.types[1].bitfield.instance == Accum
7118                 && i.types[1].bitfield.qword))
7119         i.rex |= REX_W;
7120
7121       break;
7122
7123     case 0:
7124       /* Select word/dword/qword operation with explicit data sizing prefix
7125          when there are no suitable register operands.  */
7126       if (i.tm.opcode_modifier.w
7127           && (i.prefix[DATA_PREFIX] || (i.prefix[REX_PREFIX] & REX_W))
7128           && (!i.reg_operands
7129               || (i.reg_operands == 1
7130                       /* ShiftCount */
7131                   && (i.tm.operand_types[0].bitfield.instance == RegC
7132                       /* InOutPortReg */
7133                       || i.tm.operand_types[0].bitfield.instance == RegD
7134                       || i.tm.operand_types[1].bitfield.instance == RegD
7135                       /* CRC32 */
7136                       || is_crc32))))
7137         i.tm.base_opcode |= 1;
7138       break;
7139     }
7140
7141   if (i.tm.opcode_modifier.addrprefixopreg)
7142     {
7143       gas_assert (!i.suffix);
7144       gas_assert (i.reg_operands);
7145
7146       if (i.tm.operand_types[0].bitfield.instance == Accum
7147           || i.operands == 1)
7148         {
7149           /* The address size override prefix changes the size of the
7150              first operand.  */
7151           if (flag_code == CODE_64BIT
7152               && i.op[0].regs->reg_type.bitfield.word)
7153             {
7154               as_bad (_("16-bit addressing unavailable for `%s'"),
7155                       i.tm.name);
7156               return 0;
7157             }
7158
7159           if ((flag_code == CODE_32BIT
7160                ? i.op[0].regs->reg_type.bitfield.word
7161                : i.op[0].regs->reg_type.bitfield.dword)
7162               && !add_prefix (ADDR_PREFIX_OPCODE))
7163             return 0;
7164         }
7165       else
7166         {
7167           /* Check invalid register operand when the address size override
7168              prefix changes the size of register operands.  */
7169           unsigned int op;
7170           enum { need_word, need_dword, need_qword } need;
7171
7172           /* Check the register operand for the address size prefix if
7173              the memory operand has no real registers, like symbol, DISP
7174              or bogus (x32-only) symbol(%rip) when symbol(%eip) is meant.  */
7175           if (i.mem_operands == 1
7176               && i.reg_operands == 1
7177               && i.operands == 2
7178               && i.types[1].bitfield.class == Reg
7179               && (flag_code == CODE_32BIT
7180                   ? i.op[1].regs->reg_type.bitfield.word
7181                   : i.op[1].regs->reg_type.bitfield.dword)
7182               && ((i.base_reg == NULL && i.index_reg == NULL)
7183 #if defined (OBJ_MAYBE_ELF) || defined (OBJ_ELF)
7184                   || (x86_elf_abi == X86_64_X32_ABI
7185                       && i.base_reg
7186                       && i.base_reg->reg_num == RegIP
7187                       && i.base_reg->reg_type.bitfield.qword))
7188 #else
7189                   || 0)
7190 #endif
7191               && !add_prefix (ADDR_PREFIX_OPCODE))
7192             return 0;
7193
7194           if (flag_code == CODE_32BIT)
7195             need = i.prefix[ADDR_PREFIX] ? need_word : need_dword;
7196           else if (i.prefix[ADDR_PREFIX])
7197             need = need_dword;
7198           else
7199             need = flag_code == CODE_64BIT ? need_qword : need_word;
7200
7201           for (op = 0; op < i.operands; op++)
7202             {
7203               if (i.types[op].bitfield.class != Reg)
7204                 continue;
7205
7206               switch (need)
7207                 {
7208                 case need_word:
7209                   if (i.op[op].regs->reg_type.bitfield.word)
7210                     continue;
7211                   break;
7212                 case need_dword:
7213                   if (i.op[op].regs->reg_type.bitfield.dword)
7214                     continue;
7215                   break;
7216                 case need_qword:
7217                   if (i.op[op].regs->reg_type.bitfield.qword)
7218                     continue;
7219                   break;
7220                 }
7221
7222               as_bad (_("invalid register operand size for `%s'"),
7223                       i.tm.name);
7224               return 0;
7225             }
7226         }
7227     }
7228
7229   return 1;
7230 }
7231
7232 static int
7233 check_byte_reg (void)
7234 {
7235   int op;
7236
7237   for (op = i.operands; --op >= 0;)
7238     {
7239       /* Skip non-register operands. */
7240       if (i.types[op].bitfield.class != Reg)
7241         continue;
7242
7243       /* If this is an eight bit register, it's OK.  If it's the 16 or
7244          32 bit version of an eight bit register, we will just use the
7245          low portion, and that's OK too.  */
7246       if (i.types[op].bitfield.byte)
7247         continue;
7248
7249       /* I/O port address operands are OK too.  */
7250       if (i.tm.operand_types[op].bitfield.instance == RegD
7251           && i.tm.operand_types[op].bitfield.word)
7252         continue;
7253
7254       /* crc32 only wants its source operand checked here.  */
7255       if (i.tm.base_opcode == 0xf38f0
7256           && i.tm.opcode_modifier.opcodeprefix == PREFIX_0XF2
7257           && op != 0)
7258         continue;
7259
7260       /* Any other register is bad.  */
7261       as_bad (_("`%s%s' not allowed with `%s%c'"),
7262               register_prefix, i.op[op].regs->reg_name,
7263               i.tm.name, i.suffix);
7264       return 0;
7265     }
7266   return 1;
7267 }
7268
7269 static int
7270 check_long_reg (void)
7271 {
7272   int op;
7273
7274   for (op = i.operands; --op >= 0;)
7275     /* Skip non-register operands. */
7276     if (i.types[op].bitfield.class != Reg)
7277       continue;
7278     /* Reject eight bit registers, except where the template requires
7279        them. (eg. movzb)  */
7280     else if (i.types[op].bitfield.byte
7281              && (i.tm.operand_types[op].bitfield.class == Reg
7282                  || i.tm.operand_types[op].bitfield.instance == Accum)
7283              && (i.tm.operand_types[op].bitfield.word
7284                  || i.tm.operand_types[op].bitfield.dword))
7285       {
7286         as_bad (_("`%s%s' not allowed with `%s%c'"),
7287                 register_prefix,
7288                 i.op[op].regs->reg_name,
7289                 i.tm.name,
7290                 i.suffix);
7291         return 0;
7292       }
7293     /* Error if the e prefix on a general reg is missing.  */
7294     else if (i.types[op].bitfield.word
7295              && (i.tm.operand_types[op].bitfield.class == Reg
7296                  || i.tm.operand_types[op].bitfield.instance == Accum)
7297              && i.tm.operand_types[op].bitfield.dword)
7298       {
7299         as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
7300                 register_prefix, i.op[op].regs->reg_name,
7301                 i.suffix);
7302         return 0;
7303       }
7304     /* Warn if the r prefix on a general reg is present.  */
7305     else if (i.types[op].bitfield.qword
7306              && (i.tm.operand_types[op].bitfield.class == Reg
7307                  || i.tm.operand_types[op].bitfield.instance == Accum)
7308              && i.tm.operand_types[op].bitfield.dword)
7309       {
7310         if (intel_syntax
7311             && i.tm.opcode_modifier.toqword
7312             && i.types[0].bitfield.class != RegSIMD)
7313           {
7314             /* Convert to QWORD.  We want REX byte. */
7315             i.suffix = QWORD_MNEM_SUFFIX;
7316           }
7317         else
7318           {
7319             as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
7320                     register_prefix, i.op[op].regs->reg_name,
7321                     i.suffix);
7322             return 0;
7323           }
7324       }
7325   return 1;
7326 }
7327
7328 static int
7329 check_qword_reg (void)
7330 {
7331   int op;
7332
7333   for (op = i.operands; --op >= 0; )
7334     /* Skip non-register operands. */
7335     if (i.types[op].bitfield.class != Reg)
7336       continue;
7337     /* Reject eight bit registers, except where the template requires
7338        them. (eg. movzb)  */
7339     else if (i.types[op].bitfield.byte
7340              && (i.tm.operand_types[op].bitfield.class == Reg
7341                  || i.tm.operand_types[op].bitfield.instance == Accum)
7342              && (i.tm.operand_types[op].bitfield.word
7343                  || i.tm.operand_types[op].bitfield.dword))
7344       {
7345         as_bad (_("`%s%s' not allowed with `%s%c'"),
7346                 register_prefix,
7347                 i.op[op].regs->reg_name,
7348                 i.tm.name,
7349                 i.suffix);
7350         return 0;
7351       }
7352     /* Warn if the r prefix on a general reg is missing.  */
7353     else if ((i.types[op].bitfield.word
7354               || i.types[op].bitfield.dword)
7355              && (i.tm.operand_types[op].bitfield.class == Reg
7356                  || i.tm.operand_types[op].bitfield.instance == Accum)
7357              && i.tm.operand_types[op].bitfield.qword)
7358       {
7359         /* Prohibit these changes in the 64bit mode, since the
7360            lowering is more complicated.  */
7361         if (intel_syntax
7362             && i.tm.opcode_modifier.todword
7363             && i.types[0].bitfield.class != RegSIMD)
7364           {
7365             /* Convert to DWORD.  We don't want REX byte. */
7366             i.suffix = LONG_MNEM_SUFFIX;
7367           }
7368         else
7369           {
7370             as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
7371                     register_prefix, i.op[op].regs->reg_name,
7372                     i.suffix);
7373             return 0;
7374           }
7375       }
7376   return 1;
7377 }
7378
7379 static int
7380 check_word_reg (void)
7381 {
7382   int op;
7383   for (op = i.operands; --op >= 0;)
7384     /* Skip non-register operands. */
7385     if (i.types[op].bitfield.class != Reg)
7386       continue;
7387     /* Reject eight bit registers, except where the template requires
7388        them. (eg. movzb)  */
7389     else if (i.types[op].bitfield.byte
7390              && (i.tm.operand_types[op].bitfield.class == Reg
7391                  || i.tm.operand_types[op].bitfield.instance == Accum)
7392              && (i.tm.operand_types[op].bitfield.word
7393                  || i.tm.operand_types[op].bitfield.dword))
7394       {
7395         as_bad (_("`%s%s' not allowed with `%s%c'"),
7396                 register_prefix,
7397                 i.op[op].regs->reg_name,
7398                 i.tm.name,
7399                 i.suffix);
7400         return 0;
7401       }
7402     /* Error if the e or r prefix on a general reg is present.  */
7403     else if ((i.types[op].bitfield.dword
7404                  || i.types[op].bitfield.qword)
7405              && (i.tm.operand_types[op].bitfield.class == Reg
7406                  || i.tm.operand_types[op].bitfield.instance == Accum)
7407              && i.tm.operand_types[op].bitfield.word)
7408       {
7409         as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
7410                 register_prefix, i.op[op].regs->reg_name,
7411                 i.suffix);
7412         return 0;
7413       }
7414   return 1;
7415 }
7416
7417 static int
7418 update_imm (unsigned int j)
7419 {
7420   i386_operand_type overlap = i.types[j];
7421   if ((overlap.bitfield.imm8
7422        || overlap.bitfield.imm8s
7423        || overlap.bitfield.imm16
7424        || overlap.bitfield.imm32
7425        || overlap.bitfield.imm32s
7426        || overlap.bitfield.imm64)
7427       && !operand_type_equal (&overlap, &imm8)
7428       && !operand_type_equal (&overlap, &imm8s)
7429       && !operand_type_equal (&overlap, &imm16)
7430       && !operand_type_equal (&overlap, &imm32)
7431       && !operand_type_equal (&overlap, &imm32s)
7432       && !operand_type_equal (&overlap, &imm64))
7433     {
7434       if (i.suffix)
7435         {
7436           i386_operand_type temp;
7437
7438           operand_type_set (&temp, 0);
7439           if (i.suffix == BYTE_MNEM_SUFFIX)
7440             {
7441               temp.bitfield.imm8 = overlap.bitfield.imm8;
7442               temp.bitfield.imm8s = overlap.bitfield.imm8s;
7443             }
7444           else if (i.suffix == WORD_MNEM_SUFFIX)
7445             temp.bitfield.imm16 = overlap.bitfield.imm16;
7446           else if (i.suffix == QWORD_MNEM_SUFFIX)
7447             {
7448               temp.bitfield.imm64 = overlap.bitfield.imm64;
7449               temp.bitfield.imm32s = overlap.bitfield.imm32s;
7450             }
7451           else
7452             temp.bitfield.imm32 = overlap.bitfield.imm32;
7453           overlap = temp;
7454         }
7455       else if (operand_type_equal (&overlap, &imm16_32_32s)
7456                || operand_type_equal (&overlap, &imm16_32)
7457                || operand_type_equal (&overlap, &imm16_32s))
7458         {
7459           if ((flag_code == CODE_16BIT) ^ (i.prefix[DATA_PREFIX] != 0))
7460             overlap = imm16;
7461           else
7462             overlap = imm32s;
7463         }
7464       else if (i.prefix[REX_PREFIX] & REX_W)
7465         overlap = operand_type_and (overlap, imm32s);
7466       else if (i.prefix[DATA_PREFIX])
7467         overlap = operand_type_and (overlap,
7468                                     flag_code != CODE_16BIT ? imm16 : imm32);
7469       if (!operand_type_equal (&overlap, &imm8)
7470           && !operand_type_equal (&overlap, &imm8s)
7471           && !operand_type_equal (&overlap, &imm16)
7472           && !operand_type_equal (&overlap, &imm32)
7473           && !operand_type_equal (&overlap, &imm32s)
7474           && !operand_type_equal (&overlap, &imm64))
7475         {
7476           as_bad (_("no instruction mnemonic suffix given; "
7477                     "can't determine immediate size"));
7478           return 0;
7479         }
7480     }
7481   i.types[j] = overlap;
7482
7483   return 1;
7484 }
7485
7486 static int
7487 finalize_imm (void)
7488 {
7489   unsigned int j, n;
7490
7491   /* Update the first 2 immediate operands.  */
7492   n = i.operands > 2 ? 2 : i.operands;
7493   if (n)
7494     {
7495       for (j = 0; j < n; j++)
7496         if (update_imm (j) == 0)
7497           return 0;
7498
7499       /* The 3rd operand can't be immediate operand.  */
7500       gas_assert (operand_type_check (i.types[2], imm) == 0);
7501     }
7502
7503   return 1;
7504 }
7505
7506 static int
7507 process_operands (void)
7508 {
7509   /* Default segment register this instruction will use for memory
7510      accesses.  0 means unknown.  This is only for optimizing out
7511      unnecessary segment overrides.  */
7512   const seg_entry *default_seg = 0;
7513
7514   if (i.tm.opcode_modifier.sse2avx)
7515     {
7516       /* Legacy encoded insns allow explicit REX prefixes, so these prefixes
7517          need converting.  */
7518       i.rex |= i.prefix[REX_PREFIX] & (REX_W | REX_R | REX_X | REX_B);
7519       i.prefix[REX_PREFIX] = 0;
7520       i.rex_encoding = 0;
7521     }
7522   /* ImmExt should be processed after SSE2AVX.  */
7523   else if (i.tm.opcode_modifier.immext)
7524     process_immext ();
7525
7526   if (i.tm.opcode_modifier.sse2avx && i.tm.opcode_modifier.vexvvvv)
7527     {
7528       unsigned int dupl = i.operands;
7529       unsigned int dest = dupl - 1;
7530       unsigned int j;
7531
7532       /* The destination must be an xmm register.  */
7533       gas_assert (i.reg_operands
7534                   && MAX_OPERANDS > dupl
7535                   && operand_type_equal (&i.types[dest], &regxmm));
7536
7537       if (i.tm.operand_types[0].bitfield.instance == Accum
7538           && i.tm.operand_types[0].bitfield.xmmword)
7539         {
7540           if (i.tm.opcode_modifier.vexsources == VEX3SOURCES)
7541             {
7542               /* Keep xmm0 for instructions with VEX prefix and 3
7543                  sources.  */
7544               i.tm.operand_types[0].bitfield.instance = InstanceNone;
7545               i.tm.operand_types[0].bitfield.class = RegSIMD;
7546               goto duplicate;
7547             }
7548           else
7549             {
7550               /* We remove the first xmm0 and keep the number of
7551                  operands unchanged, which in fact duplicates the
7552                  destination.  */
7553               for (j = 1; j < i.operands; j++)
7554                 {
7555                   i.op[j - 1] = i.op[j];
7556                   i.types[j - 1] = i.types[j];
7557                   i.tm.operand_types[j - 1] = i.tm.operand_types[j];
7558                   i.flags[j - 1] = i.flags[j];
7559                 }
7560             }
7561         }
7562       else if (i.tm.opcode_modifier.implicit1stxmm0)
7563         {
7564           gas_assert ((MAX_OPERANDS - 1) > dupl
7565                       && (i.tm.opcode_modifier.vexsources
7566                           == VEX3SOURCES));
7567
7568           /* Add the implicit xmm0 for instructions with VEX prefix
7569              and 3 sources.  */
7570           for (j = i.operands; j > 0; j--)
7571             {
7572               i.op[j] = i.op[j - 1];
7573               i.types[j] = i.types[j - 1];
7574               i.tm.operand_types[j] = i.tm.operand_types[j - 1];
7575               i.flags[j] = i.flags[j - 1];
7576             }
7577           i.op[0].regs
7578             = (const reg_entry *) str_hash_find (reg_hash, "xmm0");
7579           i.types[0] = regxmm;
7580           i.tm.operand_types[0] = regxmm;
7581
7582           i.operands += 2;
7583           i.reg_operands += 2;
7584           i.tm.operands += 2;
7585
7586           dupl++;
7587           dest++;
7588           i.op[dupl] = i.op[dest];
7589           i.types[dupl] = i.types[dest];
7590           i.tm.operand_types[dupl] = i.tm.operand_types[dest];
7591           i.flags[dupl] = i.flags[dest];
7592         }
7593       else
7594         {
7595         duplicate:
7596           i.operands++;
7597           i.reg_operands++;
7598           i.tm.operands++;
7599
7600           i.op[dupl] = i.op[dest];
7601           i.types[dupl] = i.types[dest];
7602           i.tm.operand_types[dupl] = i.tm.operand_types[dest];
7603           i.flags[dupl] = i.flags[dest];
7604         }
7605
7606        if (i.tm.opcode_modifier.immext)
7607          process_immext ();
7608     }
7609   else if (i.tm.operand_types[0].bitfield.instance == Accum
7610            && i.tm.operand_types[0].bitfield.xmmword)
7611     {
7612       unsigned int j;
7613
7614       for (j = 1; j < i.operands; j++)
7615         {
7616           i.op[j - 1] = i.op[j];
7617           i.types[j - 1] = i.types[j];
7618
7619           /* We need to adjust fields in i.tm since they are used by
7620              build_modrm_byte.  */
7621           i.tm.operand_types [j - 1] = i.tm.operand_types [j];
7622
7623           i.flags[j - 1] = i.flags[j];
7624         }
7625
7626       i.operands--;
7627       i.reg_operands--;
7628       i.tm.operands--;
7629     }
7630   else if (i.tm.opcode_modifier.implicitquadgroup)
7631     {
7632       unsigned int regnum, first_reg_in_group, last_reg_in_group;
7633
7634       /* The second operand must be {x,y,z}mmN, where N is a multiple of 4. */
7635       gas_assert (i.operands >= 2 && i.types[1].bitfield.class == RegSIMD);
7636       regnum = register_number (i.op[1].regs);
7637       first_reg_in_group = regnum & ~3;
7638       last_reg_in_group = first_reg_in_group + 3;
7639       if (regnum != first_reg_in_group)
7640         as_warn (_("source register `%s%s' implicitly denotes"
7641                    " `%s%.3s%u' to `%s%.3s%u' source group in `%s'"),
7642                  register_prefix, i.op[1].regs->reg_name,
7643                  register_prefix, i.op[1].regs->reg_name, first_reg_in_group,
7644                  register_prefix, i.op[1].regs->reg_name, last_reg_in_group,
7645                  i.tm.name);
7646     }
7647   else if (i.tm.opcode_modifier.regkludge)
7648     {
7649       /* The imul $imm, %reg instruction is converted into
7650          imul $imm, %reg, %reg, and the clr %reg instruction
7651          is converted into xor %reg, %reg.  */
7652
7653       unsigned int first_reg_op;
7654
7655       if (operand_type_check (i.types[0], reg))
7656         first_reg_op = 0;
7657       else
7658         first_reg_op = 1;
7659       /* Pretend we saw the extra register operand.  */
7660       gas_assert (i.reg_operands == 1
7661                   && i.op[first_reg_op + 1].regs == 0);
7662       i.op[first_reg_op + 1].regs = i.op[first_reg_op].regs;
7663       i.types[first_reg_op + 1] = i.types[first_reg_op];
7664       i.operands++;
7665       i.reg_operands++;
7666     }
7667
7668   if (i.tm.opcode_modifier.modrm)
7669     {
7670       /* The opcode is completed (modulo i.tm.extension_opcode which
7671          must be put into the modrm byte).  Now, we make the modrm and
7672          index base bytes based on all the info we've collected.  */
7673
7674       default_seg = build_modrm_byte ();
7675     }
7676   else if (i.types[0].bitfield.class == SReg)
7677     {
7678       if (flag_code != CODE_64BIT
7679           ? i.tm.base_opcode == POP_SEG_SHORT
7680             && i.op[0].regs->reg_num == 1
7681           : (i.tm.base_opcode | 1) == POP_SEG386_SHORT
7682             && i.op[0].regs->reg_num < 4)
7683         {
7684           as_bad (_("you can't `%s %s%s'"),
7685                   i.tm.name, register_prefix, i.op[0].regs->reg_name);
7686           return 0;
7687         }
7688       if ( i.op[0].regs->reg_num > 3 && i.opcode_length == 1 )
7689         {
7690           i.tm.base_opcode ^= POP_SEG_SHORT ^ POP_SEG386_SHORT;
7691           i.opcode_length = 2;
7692         }
7693       i.tm.base_opcode |= (i.op[0].regs->reg_num << 3);
7694     }
7695   else if ((i.tm.base_opcode & ~0x3) == MOV_AX_DISP32)
7696     {
7697       default_seg = &ds;
7698     }
7699   else if (i.tm.opcode_modifier.isstring)
7700     {
7701       /* For the string instructions that allow a segment override
7702          on one of their operands, the default segment is ds.  */
7703       default_seg = &ds;
7704     }
7705   else if (i.short_form)
7706     {
7707       /* The register or float register operand is in operand
7708          0 or 1.  */
7709       unsigned int op = i.tm.operand_types[0].bitfield.class != Reg;
7710
7711       /* Register goes in low 3 bits of opcode.  */
7712       i.tm.base_opcode |= i.op[op].regs->reg_num;
7713       if ((i.op[op].regs->reg_flags & RegRex) != 0)
7714         i.rex |= REX_B;
7715       if (!quiet_warnings && i.tm.opcode_modifier.ugh)
7716         {
7717           /* Warn about some common errors, but press on regardless.
7718              The first case can be generated by gcc (<= 2.8.1).  */
7719           if (i.operands == 2)
7720             {
7721               /* Reversed arguments on faddp, fsubp, etc.  */
7722               as_warn (_("translating to `%s %s%s,%s%s'"), i.tm.name,
7723                        register_prefix, i.op[!intel_syntax].regs->reg_name,
7724                        register_prefix, i.op[intel_syntax].regs->reg_name);
7725             }
7726           else
7727             {
7728               /* Extraneous `l' suffix on fp insn.  */
7729               as_warn (_("translating to `%s %s%s'"), i.tm.name,
7730                        register_prefix, i.op[0].regs->reg_name);
7731             }
7732         }
7733     }
7734
7735   if ((i.seg[0] || i.prefix[SEG_PREFIX])
7736       && i.tm.base_opcode == 0x8d /* lea */
7737       && i.tm.opcode_modifier.opcodespace == SPACE_BASE
7738       && !is_any_vex_encoding(&i.tm))
7739     {
7740       if (!quiet_warnings)
7741         as_warn (_("segment override on `%s' is ineffectual"), i.tm.name);
7742       if (optimize)
7743         {
7744           i.seg[0] = NULL;
7745           i.prefix[SEG_PREFIX] = 0;
7746         }
7747     }
7748
7749   /* If a segment was explicitly specified, and the specified segment
7750      is neither the default nor the one already recorded from a prefix,
7751      use an opcode prefix to select it.  If we never figured out what
7752      the default segment is, then default_seg will be zero at this
7753      point, and the specified segment prefix will always be used.  */
7754   if (i.seg[0]
7755       && i.seg[0] != default_seg
7756       && i.seg[0]->seg_prefix != i.prefix[SEG_PREFIX])
7757     {
7758       if (!add_prefix (i.seg[0]->seg_prefix))
7759         return 0;
7760     }
7761   return 1;
7762 }
7763
7764 static INLINE void set_rex_vrex (const reg_entry *r, unsigned int rex_bit,
7765                                  bfd_boolean do_sse2avx)
7766 {
7767   if (r->reg_flags & RegRex)
7768     {
7769       if (i.rex & rex_bit)
7770         as_bad (_("same type of prefix used twice"));
7771       i.rex |= rex_bit;
7772     }
7773   else if (do_sse2avx && (i.rex & rex_bit) && i.vex.register_specifier)
7774     {
7775       gas_assert (i.vex.register_specifier == r);
7776       i.vex.register_specifier += 8;
7777     }
7778
7779   if (r->reg_flags & RegVRex)
7780     i.vrex |= rex_bit;
7781 }
7782
7783 static const seg_entry *
7784 build_modrm_byte (void)
7785 {
7786   const seg_entry *default_seg = 0;
7787   unsigned int source, dest;
7788   int vex_3_sources;
7789
7790   vex_3_sources = i.tm.opcode_modifier.vexsources == VEX3SOURCES;
7791   if (vex_3_sources)
7792     {
7793       unsigned int nds, reg_slot;
7794       expressionS *exp;
7795
7796       dest = i.operands - 1;
7797       nds = dest - 1;
7798
7799       /* There are 2 kinds of instructions:
7800          1. 5 operands: 4 register operands or 3 register operands
7801          plus 1 memory operand plus one Imm4 operand, VexXDS, and
7802          VexW0 or VexW1.  The destination must be either XMM, YMM or
7803          ZMM register.
7804          2. 4 operands: 4 register operands or 3 register operands
7805          plus 1 memory operand, with VexXDS.  */
7806       gas_assert ((i.reg_operands == 4
7807                    || (i.reg_operands == 3 && i.mem_operands == 1))
7808                   && i.tm.opcode_modifier.vexvvvv == VEXXDS
7809                   && i.tm.opcode_modifier.vexw
7810                   && i.tm.operand_types[dest].bitfield.class == RegSIMD);
7811
7812       /* If VexW1 is set, the first non-immediate operand is the source and
7813          the second non-immediate one is encoded in the immediate operand.  */
7814       if (i.tm.opcode_modifier.vexw == VEXW1)
7815         {
7816           source = i.imm_operands;
7817           reg_slot = i.imm_operands + 1;
7818         }
7819       else
7820         {
7821           source = i.imm_operands + 1;
7822           reg_slot = i.imm_operands;
7823         }
7824
7825       if (i.imm_operands == 0)
7826         {
7827           /* When there is no immediate operand, generate an 8bit
7828              immediate operand to encode the first operand.  */
7829           exp = &im_expressions[i.imm_operands++];
7830           i.op[i.operands].imms = exp;
7831           i.types[i.operands] = imm8;
7832           i.operands++;
7833
7834           gas_assert (i.tm.operand_types[reg_slot].bitfield.class == RegSIMD);
7835           exp->X_op = O_constant;
7836           exp->X_add_number = register_number (i.op[reg_slot].regs) << 4;
7837           gas_assert ((i.op[reg_slot].regs->reg_flags & RegVRex) == 0);
7838         }
7839       else
7840         {
7841           gas_assert (i.imm_operands == 1);
7842           gas_assert (fits_in_imm4 (i.op[0].imms->X_add_number));
7843           gas_assert (!i.tm.opcode_modifier.immext);
7844
7845           /* Turn on Imm8 again so that output_imm will generate it.  */
7846           i.types[0].bitfield.imm8 = 1;
7847
7848           gas_assert (i.tm.operand_types[reg_slot].bitfield.class == RegSIMD);
7849           i.op[0].imms->X_add_number
7850               |= register_number (i.op[reg_slot].regs) << 4;
7851           gas_assert ((i.op[reg_slot].regs->reg_flags & RegVRex) == 0);
7852         }
7853
7854       gas_assert (i.tm.operand_types[nds].bitfield.class == RegSIMD);
7855       i.vex.register_specifier = i.op[nds].regs;
7856     }
7857   else
7858     source = dest = 0;
7859
7860   /* i.reg_operands MUST be the number of real register operands;
7861      implicit registers do not count.  If there are 3 register
7862      operands, it must be a instruction with VexNDS.  For a
7863      instruction with VexNDD, the destination register is encoded
7864      in VEX prefix.  If there are 4 register operands, it must be
7865      a instruction with VEX prefix and 3 sources.  */
7866   if (i.mem_operands == 0
7867       && ((i.reg_operands == 2
7868            && i.tm.opcode_modifier.vexvvvv <= VEXXDS)
7869           || (i.reg_operands == 3
7870               && i.tm.opcode_modifier.vexvvvv == VEXXDS)
7871           || (i.reg_operands == 4 && vex_3_sources)))
7872     {
7873       switch (i.operands)
7874         {
7875         case 2:
7876           source = 0;
7877           break;
7878         case 3:
7879           /* When there are 3 operands, one of them may be immediate,
7880              which may be the first or the last operand.  Otherwise,
7881              the first operand must be shift count register (cl) or it
7882              is an instruction with VexNDS. */
7883           gas_assert (i.imm_operands == 1
7884                       || (i.imm_operands == 0
7885                           && (i.tm.opcode_modifier.vexvvvv == VEXXDS
7886                               || (i.types[0].bitfield.instance == RegC
7887                                   && i.types[0].bitfield.byte))));
7888           if (operand_type_check (i.types[0], imm)
7889               || (i.types[0].bitfield.instance == RegC
7890                   && i.types[0].bitfield.byte))
7891             source = 1;
7892           else
7893             source = 0;
7894           break;
7895         case 4:
7896           /* When there are 4 operands, the first two must be 8bit
7897              immediate operands. The source operand will be the 3rd
7898              one.
7899
7900              For instructions with VexNDS, if the first operand
7901              an imm8, the source operand is the 2nd one.  If the last
7902              operand is imm8, the source operand is the first one.  */
7903           gas_assert ((i.imm_operands == 2
7904                        && i.types[0].bitfield.imm8
7905                        && i.types[1].bitfield.imm8)
7906                       || (i.tm.opcode_modifier.vexvvvv == VEXXDS
7907                           && i.imm_operands == 1
7908                           && (i.types[0].bitfield.imm8
7909                               || i.types[i.operands - 1].bitfield.imm8
7910                               || i.rounding)));
7911           if (i.imm_operands == 2)
7912             source = 2;
7913           else
7914             {
7915               if (i.types[0].bitfield.imm8)
7916                 source = 1;
7917               else
7918                 source = 0;
7919             }
7920           break;
7921         case 5:
7922           if (is_evex_encoding (&i.tm))
7923             {
7924               /* For EVEX instructions, when there are 5 operands, the
7925                  first one must be immediate operand.  If the second one
7926                  is immediate operand, the source operand is the 3th
7927                  one.  If the last one is immediate operand, the source
7928                  operand is the 2nd one.  */
7929               gas_assert (i.imm_operands == 2
7930                           && i.tm.opcode_modifier.sae
7931                           && operand_type_check (i.types[0], imm));
7932               if (operand_type_check (i.types[1], imm))
7933                 source = 2;
7934               else if (operand_type_check (i.types[4], imm))
7935                 source = 1;
7936               else
7937                 abort ();
7938             }
7939           break;
7940         default:
7941           abort ();
7942         }
7943
7944       if (!vex_3_sources)
7945         {
7946           dest = source + 1;
7947
7948           /* RC/SAE operand could be between DEST and SRC.  That happens
7949              when one operand is GPR and the other one is XMM/YMM/ZMM
7950              register.  */
7951           if (i.rounding && i.rounding->operand == (int) dest)
7952             dest++;
7953
7954           if (i.tm.opcode_modifier.vexvvvv == VEXXDS)
7955             {
7956               /* For instructions with VexNDS, the register-only source
7957                  operand must be a 32/64bit integer, XMM, YMM, ZMM, or mask
7958                  register.  It is encoded in VEX prefix.  */
7959
7960               i386_operand_type op;
7961               unsigned int vvvv;
7962
7963               /* Swap two source operands if needed.  */
7964               if (i.tm.opcode_modifier.swapsources)
7965                 {
7966                   vvvv = source;
7967                   source = dest;
7968                 }
7969               else
7970                 vvvv = dest;
7971
7972               op = i.tm.operand_types[vvvv];
7973               if ((dest + 1) >= i.operands
7974                   || ((op.bitfield.class != Reg
7975                        || (!op.bitfield.dword && !op.bitfield.qword))
7976                       && op.bitfield.class != RegSIMD
7977                       && !operand_type_equal (&op, &regmask)))
7978                 abort ();
7979               i.vex.register_specifier = i.op[vvvv].regs;
7980               dest++;
7981             }
7982         }
7983
7984       i.rm.mode = 3;
7985       /* One of the register operands will be encoded in the i.rm.reg
7986          field, the other in the combined i.rm.mode and i.rm.regmem
7987          fields.  If no form of this instruction supports a memory
7988          destination operand, then we assume the source operand may
7989          sometimes be a memory operand and so we need to store the
7990          destination in the i.rm.reg field.  */
7991       if (!i.tm.opcode_modifier.regmem
7992           && operand_type_check (i.tm.operand_types[dest], anymem) == 0)
7993         {
7994           i.rm.reg = i.op[dest].regs->reg_num;
7995           i.rm.regmem = i.op[source].regs->reg_num;
7996           set_rex_vrex (i.op[dest].regs, REX_R, i.tm.opcode_modifier.sse2avx);
7997           set_rex_vrex (i.op[source].regs, REX_B, FALSE);
7998         }
7999       else
8000         {
8001           i.rm.reg = i.op[source].regs->reg_num;
8002           i.rm.regmem = i.op[dest].regs->reg_num;
8003           set_rex_vrex (i.op[dest].regs, REX_B, i.tm.opcode_modifier.sse2avx);
8004           set_rex_vrex (i.op[source].regs, REX_R, FALSE);
8005         }
8006       if (flag_code != CODE_64BIT && (i.rex & REX_R))
8007         {
8008           if (i.types[!i.tm.opcode_modifier.regmem].bitfield.class != RegCR)
8009             abort ();
8010           i.rex &= ~REX_R;
8011           add_prefix (LOCK_PREFIX_OPCODE);
8012         }
8013     }
8014   else
8015     {                   /* If it's not 2 reg operands...  */
8016       unsigned int mem;
8017
8018       if (i.mem_operands)
8019         {
8020           unsigned int fake_zero_displacement = 0;
8021           unsigned int op;
8022
8023           for (op = 0; op < i.operands; op++)
8024             if (i.flags[op] & Operand_Mem)
8025               break;
8026           gas_assert (op < i.operands);
8027
8028           if (i.tm.opcode_modifier.sib)
8029             {
8030               /* The index register of VSIB shouldn't be RegIZ.  */
8031               if (i.tm.opcode_modifier.sib != SIBMEM
8032                   && i.index_reg->reg_num == RegIZ)
8033                 abort ();
8034
8035               i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
8036               if (!i.base_reg)
8037                 {
8038                   i.sib.base = NO_BASE_REGISTER;
8039                   i.sib.scale = i.log2_scale_factor;
8040                   i.types[op].bitfield.disp8 = 0;
8041                   i.types[op].bitfield.disp16 = 0;
8042                   i.types[op].bitfield.disp64 = 0;
8043                   if (flag_code != CODE_64BIT || i.prefix[ADDR_PREFIX])
8044                     {
8045                       /* Must be 32 bit */
8046                       i.types[op].bitfield.disp32 = 1;
8047                       i.types[op].bitfield.disp32s = 0;
8048                     }
8049                   else
8050                     {
8051                       i.types[op].bitfield.disp32 = 0;
8052                       i.types[op].bitfield.disp32s = 1;
8053                     }
8054                 }
8055
8056               /* Since the mandatory SIB always has index register, so
8057                  the code logic remains unchanged. The non-mandatory SIB
8058                  without index register is allowed and will be handled
8059                  later.  */
8060               if (i.index_reg)
8061                 {
8062                   if (i.index_reg->reg_num == RegIZ)
8063                     i.sib.index = NO_INDEX_REGISTER;
8064                   else
8065                     i.sib.index = i.index_reg->reg_num;
8066                   set_rex_vrex (i.index_reg, REX_X, FALSE);
8067                 }
8068             }
8069
8070           default_seg = &ds;
8071
8072           if (i.base_reg == 0)
8073             {
8074               i.rm.mode = 0;
8075               if (!i.disp_operands)
8076                 fake_zero_displacement = 1;
8077               if (i.index_reg == 0)
8078                 {
8079                   i386_operand_type newdisp;
8080
8081                   /* Both check for VSIB and mandatory non-vector SIB. */
8082                   gas_assert (!i.tm.opcode_modifier.sib
8083                               || i.tm.opcode_modifier.sib == SIBMEM);
8084                   /* Operand is just <disp>  */
8085                   if (flag_code == CODE_64BIT)
8086                     {
8087                       /* 64bit mode overwrites the 32bit absolute
8088                          addressing by RIP relative addressing and
8089                          absolute addressing is encoded by one of the
8090                          redundant SIB forms.  */
8091                       i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
8092                       i.sib.base = NO_BASE_REGISTER;
8093                       i.sib.index = NO_INDEX_REGISTER;
8094                       newdisp = (!i.prefix[ADDR_PREFIX] ? disp32s : disp32);
8095                     }
8096                   else if ((flag_code == CODE_16BIT)
8097                            ^ (i.prefix[ADDR_PREFIX] != 0))
8098                     {
8099                       i.rm.regmem = NO_BASE_REGISTER_16;
8100                       newdisp = disp16;
8101                     }
8102                   else
8103                     {
8104                       i.rm.regmem = NO_BASE_REGISTER;
8105                       newdisp = disp32;
8106                     }
8107                   i.types[op] = operand_type_and_not (i.types[op], anydisp);
8108                   i.types[op] = operand_type_or (i.types[op], newdisp);
8109                 }
8110               else if (!i.tm.opcode_modifier.sib)
8111                 {
8112                   /* !i.base_reg && i.index_reg  */
8113                   if (i.index_reg->reg_num == RegIZ)
8114                     i.sib.index = NO_INDEX_REGISTER;
8115                   else
8116                     i.sib.index = i.index_reg->reg_num;
8117                   i.sib.base = NO_BASE_REGISTER;
8118                   i.sib.scale = i.log2_scale_factor;
8119                   i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
8120                   i.types[op].bitfield.disp8 = 0;
8121                   i.types[op].bitfield.disp16 = 0;
8122                   i.types[op].bitfield.disp64 = 0;
8123                   if (flag_code != CODE_64BIT || i.prefix[ADDR_PREFIX])
8124                     {
8125                       /* Must be 32 bit */
8126                       i.types[op].bitfield.disp32 = 1;
8127                       i.types[op].bitfield.disp32s = 0;
8128                     }
8129                   else
8130                     {
8131                       i.types[op].bitfield.disp32 = 0;
8132                       i.types[op].bitfield.disp32s = 1;
8133                     }
8134                   if ((i.index_reg->reg_flags & RegRex) != 0)
8135                     i.rex |= REX_X;
8136                 }
8137             }
8138           /* RIP addressing for 64bit mode.  */
8139           else if (i.base_reg->reg_num == RegIP)
8140             {
8141               gas_assert (!i.tm.opcode_modifier.sib);
8142               i.rm.regmem = NO_BASE_REGISTER;
8143               i.types[op].bitfield.disp8 = 0;
8144               i.types[op].bitfield.disp16 = 0;
8145               i.types[op].bitfield.disp32 = 0;
8146               i.types[op].bitfield.disp32s = 1;
8147               i.types[op].bitfield.disp64 = 0;
8148               i.flags[op] |= Operand_PCrel;
8149               if (! i.disp_operands)
8150                 fake_zero_displacement = 1;
8151             }
8152           else if (i.base_reg->reg_type.bitfield.word)
8153             {
8154               gas_assert (!i.tm.opcode_modifier.sib);
8155               switch (i.base_reg->reg_num)
8156                 {
8157                 case 3: /* (%bx)  */
8158                   if (i.index_reg == 0)
8159                     i.rm.regmem = 7;
8160                   else /* (%bx,%si) -> 0, or (%bx,%di) -> 1  */
8161                     i.rm.regmem = i.index_reg->reg_num - 6;
8162                   break;
8163                 case 5: /* (%bp)  */
8164                   default_seg = &ss;
8165                   if (i.index_reg == 0)
8166                     {
8167                       i.rm.regmem = 6;
8168                       if (operand_type_check (i.types[op], disp) == 0)
8169                         {
8170                           /* fake (%bp) into 0(%bp)  */
8171                           if (i.disp_encoding == disp_encoding_16bit)
8172                             i.types[op].bitfield.disp16 = 1;
8173                           else
8174                             i.types[op].bitfield.disp8 = 1;
8175                           fake_zero_displacement = 1;
8176                         }
8177                     }
8178                   else /* (%bp,%si) -> 2, or (%bp,%di) -> 3  */
8179                     i.rm.regmem = i.index_reg->reg_num - 6 + 2;
8180                   break;
8181                 default: /* (%si) -> 4 or (%di) -> 5  */
8182                   i.rm.regmem = i.base_reg->reg_num - 6 + 4;
8183                 }
8184               if (!fake_zero_displacement
8185                   && !i.disp_operands
8186                   && i.disp_encoding)
8187                 {
8188                   fake_zero_displacement = 1;
8189                   if (i.disp_encoding == disp_encoding_8bit)
8190                     i.types[op].bitfield.disp8 = 1;
8191                   else
8192                     i.types[op].bitfield.disp16 = 1;
8193                 }
8194               i.rm.mode = mode_from_disp_size (i.types[op]);
8195             }
8196           else /* i.base_reg and 32/64 bit mode  */
8197             {
8198               if (flag_code == CODE_64BIT
8199                   && operand_type_check (i.types[op], disp))
8200                 {
8201                   i.types[op].bitfield.disp16 = 0;
8202                   i.types[op].bitfield.disp64 = 0;
8203                   if (i.prefix[ADDR_PREFIX] == 0)
8204                     {
8205                       i.types[op].bitfield.disp32 = 0;
8206                       i.types[op].bitfield.disp32s = 1;
8207                     }
8208                   else
8209                     {
8210                       i.types[op].bitfield.disp32 = 1;
8211                       i.types[op].bitfield.disp32s = 0;
8212                     }
8213                 }
8214
8215               if (!i.tm.opcode_modifier.sib)
8216                 i.rm.regmem = i.base_reg->reg_num;
8217               if ((i.base_reg->reg_flags & RegRex) != 0)
8218                 i.rex |= REX_B;
8219               i.sib.base = i.base_reg->reg_num;
8220               /* x86-64 ignores REX prefix bit here to avoid decoder
8221                  complications.  */
8222               if (!(i.base_reg->reg_flags & RegRex)
8223                   && (i.base_reg->reg_num == EBP_REG_NUM
8224                    || i.base_reg->reg_num == ESP_REG_NUM))
8225                   default_seg = &ss;
8226               if (i.base_reg->reg_num == 5 && i.disp_operands == 0)
8227                 {
8228                   fake_zero_displacement = 1;
8229                   if (i.disp_encoding == disp_encoding_32bit)
8230                     i.types[op].bitfield.disp32 = 1;
8231                   else
8232                     i.types[op].bitfield.disp8 = 1;
8233                 }
8234               i.sib.scale = i.log2_scale_factor;
8235               if (i.index_reg == 0)
8236                 {
8237                   /* Only check for VSIB. */
8238                   gas_assert (i.tm.opcode_modifier.sib != VECSIB128
8239                               && i.tm.opcode_modifier.sib != VECSIB256
8240                               && i.tm.opcode_modifier.sib != VECSIB512);
8241
8242                   /* <disp>(%esp) becomes two byte modrm with no index
8243                      register.  We've already stored the code for esp
8244                      in i.rm.regmem ie. ESCAPE_TO_TWO_BYTE_ADDRESSING.
8245                      Any base register besides %esp will not use the
8246                      extra modrm byte.  */
8247                   i.sib.index = NO_INDEX_REGISTER;
8248                 }
8249               else if (!i.tm.opcode_modifier.sib)
8250                 {
8251                   if (i.index_reg->reg_num == RegIZ)
8252                     i.sib.index = NO_INDEX_REGISTER;
8253                   else
8254                     i.sib.index = i.index_reg->reg_num;
8255                   i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
8256                   if ((i.index_reg->reg_flags & RegRex) != 0)
8257                     i.rex |= REX_X;
8258                 }
8259
8260               if (i.disp_operands
8261                   && (i.reloc[op] == BFD_RELOC_386_TLS_DESC_CALL
8262                       || i.reloc[op] == BFD_RELOC_X86_64_TLSDESC_CALL))
8263                 i.rm.mode = 0;
8264               else
8265                 {
8266                   if (!fake_zero_displacement
8267                       && !i.disp_operands
8268                       && i.disp_encoding)
8269                     {
8270                       fake_zero_displacement = 1;
8271                       if (i.disp_encoding == disp_encoding_8bit)
8272                         i.types[op].bitfield.disp8 = 1;
8273                       else
8274                         i.types[op].bitfield.disp32 = 1;
8275                     }
8276                   i.rm.mode = mode_from_disp_size (i.types[op]);
8277                 }
8278             }
8279
8280           if (fake_zero_displacement)
8281             {
8282               /* Fakes a zero displacement assuming that i.types[op]
8283                  holds the correct displacement size.  */
8284               expressionS *exp;
8285
8286               gas_assert (i.op[op].disps == 0);
8287               exp = &disp_expressions[i.disp_operands++];
8288               i.op[op].disps = exp;
8289               exp->X_op = O_constant;
8290               exp->X_add_number = 0;
8291               exp->X_add_symbol = (symbolS *) 0;
8292               exp->X_op_symbol = (symbolS *) 0;
8293             }
8294
8295           mem = op;
8296         }
8297       else
8298         mem = ~0;
8299
8300       if (i.tm.opcode_modifier.vexsources == XOP2SOURCES)
8301         {
8302           if (operand_type_check (i.types[0], imm))
8303             i.vex.register_specifier = NULL;
8304           else
8305             {
8306               /* VEX.vvvv encodes one of the sources when the first
8307                  operand is not an immediate.  */
8308               if (i.tm.opcode_modifier.vexw == VEXW0)
8309                 i.vex.register_specifier = i.op[0].regs;
8310               else
8311                 i.vex.register_specifier = i.op[1].regs;
8312             }
8313
8314           /* Destination is a XMM register encoded in the ModRM.reg
8315              and VEX.R bit.  */
8316           i.rm.reg = i.op[2].regs->reg_num;
8317           if ((i.op[2].regs->reg_flags & RegRex) != 0)
8318             i.rex |= REX_R;
8319
8320           /* ModRM.rm and VEX.B encodes the other source.  */
8321           if (!i.mem_operands)
8322             {
8323               i.rm.mode = 3;
8324
8325               if (i.tm.opcode_modifier.vexw == VEXW0)
8326                 i.rm.regmem = i.op[1].regs->reg_num;
8327               else
8328                 i.rm.regmem = i.op[0].regs->reg_num;
8329
8330               if ((i.op[1].regs->reg_flags & RegRex) != 0)
8331                 i.rex |= REX_B;
8332             }
8333         }
8334       else if (i.tm.opcode_modifier.vexvvvv == VEXLWP)
8335         {
8336           i.vex.register_specifier = i.op[2].regs;
8337           if (!i.mem_operands)
8338             {
8339               i.rm.mode = 3;
8340               i.rm.regmem = i.op[1].regs->reg_num;
8341               if ((i.op[1].regs->reg_flags & RegRex) != 0)
8342                 i.rex |= REX_B;
8343             }
8344         }
8345       /* Fill in i.rm.reg or i.rm.regmem field with register operand
8346          (if any) based on i.tm.extension_opcode.  Again, we must be
8347          careful to make sure that segment/control/debug/test/MMX
8348          registers are coded into the i.rm.reg field.  */
8349       else if (i.reg_operands)
8350         {
8351           unsigned int op;
8352           unsigned int vex_reg = ~0;
8353
8354           for (op = 0; op < i.operands; op++)
8355             if (i.types[op].bitfield.class == Reg
8356                 || i.types[op].bitfield.class == RegBND
8357                 || i.types[op].bitfield.class == RegMask
8358                 || i.types[op].bitfield.class == SReg
8359                 || i.types[op].bitfield.class == RegCR
8360                 || i.types[op].bitfield.class == RegDR
8361                 || i.types[op].bitfield.class == RegTR
8362                 || i.types[op].bitfield.class == RegSIMD
8363                 || i.types[op].bitfield.class == RegMMX)
8364               break;
8365
8366           if (vex_3_sources)
8367             op = dest;
8368           else if (i.tm.opcode_modifier.vexvvvv == VEXXDS)
8369             {
8370               /* For instructions with VexNDS, the register-only
8371                  source operand is encoded in VEX prefix. */
8372               gas_assert (mem != (unsigned int) ~0);
8373
8374               if (op > mem)
8375                 {
8376                   vex_reg = op++;
8377                   gas_assert (op < i.operands);
8378                 }
8379               else
8380                 {
8381                   /* Check register-only source operand when two source
8382                      operands are swapped.  */
8383                   if (!i.tm.operand_types[op].bitfield.baseindex
8384                       && i.tm.operand_types[op + 1].bitfield.baseindex)
8385                     {
8386                       vex_reg = op;
8387                       op += 2;
8388                       gas_assert (mem == (vex_reg + 1)
8389                                   && op < i.operands);
8390                     }
8391                   else
8392                     {
8393                       vex_reg = op + 1;
8394                       gas_assert (vex_reg < i.operands);
8395                     }
8396                 }
8397             }
8398           else if (i.tm.opcode_modifier.vexvvvv == VEXNDD)
8399             {
8400               /* For instructions with VexNDD, the register destination
8401                  is encoded in VEX prefix.  */
8402               if (i.mem_operands == 0)
8403                 {
8404                   /* There is no memory operand.  */
8405                   gas_assert ((op + 2) == i.operands);
8406                   vex_reg = op + 1;
8407                 }
8408               else
8409                 {
8410                   /* There are only 2 non-immediate operands.  */
8411                   gas_assert (op < i.imm_operands + 2
8412                               && i.operands == i.imm_operands + 2);
8413                   vex_reg = i.imm_operands + 1;
8414                 }
8415             }
8416           else
8417             gas_assert (op < i.operands);
8418
8419           if (vex_reg != (unsigned int) ~0)
8420             {
8421               i386_operand_type *type = &i.tm.operand_types[vex_reg];
8422
8423               if ((type->bitfield.class != Reg
8424                    || (!type->bitfield.dword && !type->bitfield.qword))
8425                   && type->bitfield.class != RegSIMD
8426                   && !operand_type_equal (type, &regmask))
8427                 abort ();
8428
8429               i.vex.register_specifier = i.op[vex_reg].regs;
8430             }
8431
8432           /* Don't set OP operand twice.  */
8433           if (vex_reg != op)
8434             {
8435               /* If there is an extension opcode to put here, the
8436                  register number must be put into the regmem field.  */
8437               if (i.tm.extension_opcode != None)
8438                 {
8439                   i.rm.regmem = i.op[op].regs->reg_num;
8440                   set_rex_vrex (i.op[op].regs, REX_B,
8441                                 i.tm.opcode_modifier.sse2avx);
8442                 }
8443               else
8444                 {
8445                   i.rm.reg = i.op[op].regs->reg_num;
8446                   set_rex_vrex (i.op[op].regs, REX_R,
8447                                 i.tm.opcode_modifier.sse2avx);
8448                 }
8449             }
8450
8451           /* Now, if no memory operand has set i.rm.mode = 0, 1, 2 we
8452              must set it to 3 to indicate this is a register operand
8453              in the regmem field.  */
8454           if (!i.mem_operands)
8455             i.rm.mode = 3;
8456         }
8457
8458       /* Fill in i.rm.reg field with extension opcode (if any).  */
8459       if (i.tm.extension_opcode != None)
8460         i.rm.reg = i.tm.extension_opcode;
8461     }
8462   return default_seg;
8463 }
8464
8465 static INLINE void
8466 frag_opcode_byte (unsigned char byte)
8467 {
8468   if (now_seg != absolute_section)
8469     FRAG_APPEND_1_CHAR (byte);
8470   else
8471     ++abs_section_offset;
8472 }
8473
8474 static unsigned int
8475 flip_code16 (unsigned int code16)
8476 {
8477   gas_assert (i.tm.operands == 1);
8478
8479   return !(i.prefix[REX_PREFIX] & REX_W)
8480          && (code16 ? i.tm.operand_types[0].bitfield.disp32
8481                       || i.tm.operand_types[0].bitfield.disp32s
8482                     : i.tm.operand_types[0].bitfield.disp16)
8483          ? CODE16 : 0;
8484 }
8485
8486 static void
8487 output_branch (void)
8488 {
8489   char *p;
8490   int size;
8491   int code16;
8492   int prefix;
8493   relax_substateT subtype;
8494   symbolS *sym;
8495   offsetT off;
8496
8497   if (now_seg == absolute_section)
8498     {
8499       as_bad (_("relaxable branches not supported in absolute section"));
8500       return;
8501     }
8502
8503   code16 = flag_code == CODE_16BIT ? CODE16 : 0;
8504   size = i.disp_encoding == disp_encoding_32bit ? BIG : SMALL;
8505
8506   prefix = 0;
8507   if (i.prefix[DATA_PREFIX] != 0)
8508     {
8509       prefix = 1;
8510       i.prefixes -= 1;
8511       code16 ^= flip_code16(code16);
8512     }
8513   /* Pentium4 branch hints.  */
8514   if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE /* not taken */
8515       || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE /* taken */)
8516     {
8517       prefix++;
8518       i.prefixes--;
8519     }
8520   if (i.prefix[REX_PREFIX] != 0)
8521     {
8522       prefix++;
8523       i.prefixes--;
8524     }
8525
8526   /* BND prefixed jump.  */
8527   if (i.prefix[BND_PREFIX] != 0)
8528     {
8529       prefix++;
8530       i.prefixes--;
8531     }
8532
8533   if (i.prefixes != 0)
8534     as_warn (_("skipping prefixes on `%s'"), i.tm.name);
8535
8536   /* It's always a symbol;  End frag & setup for relax.
8537      Make sure there is enough room in this frag for the largest
8538      instruction we may generate in md_convert_frag.  This is 2
8539      bytes for the opcode and room for the prefix and largest
8540      displacement.  */
8541   frag_grow (prefix + 2 + 4);
8542   /* Prefix and 1 opcode byte go in fr_fix.  */
8543   p = frag_more (prefix + 1);
8544   if (i.prefix[DATA_PREFIX] != 0)
8545     *p++ = DATA_PREFIX_OPCODE;
8546   if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE
8547       || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE)
8548     *p++ = i.prefix[SEG_PREFIX];
8549   if (i.prefix[BND_PREFIX] != 0)
8550     *p++ = BND_PREFIX_OPCODE;
8551   if (i.prefix[REX_PREFIX] != 0)
8552     *p++ = i.prefix[REX_PREFIX];
8553   *p = i.tm.base_opcode;
8554
8555   if ((unsigned char) *p == JUMP_PC_RELATIVE)
8556     subtype = ENCODE_RELAX_STATE (UNCOND_JUMP, size);
8557   else if (cpu_arch_flags.bitfield.cpui386)
8558     subtype = ENCODE_RELAX_STATE (COND_JUMP, size);
8559   else
8560     subtype = ENCODE_RELAX_STATE (COND_JUMP86, size);
8561   subtype |= code16;
8562
8563   sym = i.op[0].disps->X_add_symbol;
8564   off = i.op[0].disps->X_add_number;
8565
8566   if (i.op[0].disps->X_op != O_constant
8567       && i.op[0].disps->X_op != O_symbol)
8568     {
8569       /* Handle complex expressions.  */
8570       sym = make_expr_symbol (i.op[0].disps);
8571       off = 0;
8572     }
8573
8574   /* 1 possible extra opcode + 4 byte displacement go in var part.
8575      Pass reloc in fr_var.  */
8576   frag_var (rs_machine_dependent, 5, i.reloc[0], subtype, sym, off, p);
8577 }
8578
8579 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
8580 /* Return TRUE iff PLT32 relocation should be used for branching to
8581    symbol S.  */
8582
8583 static bfd_boolean
8584 need_plt32_p (symbolS *s)
8585 {
8586   /* PLT32 relocation is ELF only.  */
8587   if (!IS_ELF)
8588     return FALSE;
8589
8590 #ifdef TE_SOLARIS
8591   /* Don't emit PLT32 relocation on Solaris: neither native linker nor
8592      krtld support it.  */
8593   return FALSE;
8594 #endif
8595
8596   /* Since there is no need to prepare for PLT branch on x86-64, we
8597      can generate R_X86_64_PLT32, instead of R_X86_64_PC32, which can
8598      be used as a marker for 32-bit PC-relative branches.  */
8599   if (!object_64bit)
8600     return FALSE;
8601
8602   if (s == NULL)
8603     return FALSE;
8604
8605   /* Weak or undefined symbol need PLT32 relocation.  */
8606   if (S_IS_WEAK (s) || !S_IS_DEFINED (s))
8607     return TRUE;
8608
8609   /* Non-global symbol doesn't need PLT32 relocation.  */
8610   if (! S_IS_EXTERNAL (s))
8611     return FALSE;
8612
8613   /* Other global symbols need PLT32 relocation.  NB: Symbol with
8614      non-default visibilities are treated as normal global symbol
8615      so that PLT32 relocation can be used as a marker for 32-bit
8616      PC-relative branches.  It is useful for linker relaxation.  */
8617   return TRUE;
8618 }
8619 #endif
8620
8621 static void
8622 output_jump (void)
8623 {
8624   char *p;
8625   int size;
8626   fixS *fixP;
8627   bfd_reloc_code_real_type jump_reloc = i.reloc[0];
8628
8629   if (i.tm.opcode_modifier.jump == JUMP_BYTE)
8630     {
8631       /* This is a loop or jecxz type instruction.  */
8632       size = 1;
8633       if (i.prefix[ADDR_PREFIX] != 0)
8634         {
8635           frag_opcode_byte (ADDR_PREFIX_OPCODE);
8636           i.prefixes -= 1;
8637         }
8638       /* Pentium4 branch hints.  */
8639       if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE /* not taken */
8640           || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE /* taken */)
8641         {
8642           frag_opcode_byte (i.prefix[SEG_PREFIX]);
8643           i.prefixes--;
8644         }
8645     }
8646   else
8647     {
8648       int code16;
8649
8650       code16 = 0;
8651       if (flag_code == CODE_16BIT)
8652         code16 = CODE16;
8653
8654       if (i.prefix[DATA_PREFIX] != 0)
8655         {
8656           frag_opcode_byte (DATA_PREFIX_OPCODE);
8657           i.prefixes -= 1;
8658           code16 ^= flip_code16(code16);
8659         }
8660
8661       size = 4;
8662       if (code16)
8663         size = 2;
8664     }
8665
8666   /* BND prefixed jump.  */
8667   if (i.prefix[BND_PREFIX] != 0)
8668     {
8669       frag_opcode_byte (i.prefix[BND_PREFIX]);
8670       i.prefixes -= 1;
8671     }
8672
8673   if (i.prefix[REX_PREFIX] != 0)
8674     {
8675       frag_opcode_byte (i.prefix[REX_PREFIX]);
8676       i.prefixes -= 1;
8677     }
8678
8679   if (i.prefixes != 0)
8680     as_warn (_("skipping prefixes on `%s'"), i.tm.name);
8681
8682   if (now_seg == absolute_section)
8683     {
8684       abs_section_offset += i.opcode_length + size;
8685       return;
8686     }
8687
8688   p = frag_more (i.opcode_length + size);
8689   switch (i.opcode_length)
8690     {
8691     case 2:
8692       *p++ = i.tm.base_opcode >> 8;
8693       /* Fall through.  */
8694     case 1:
8695       *p++ = i.tm.base_opcode;
8696       break;
8697     default:
8698       abort ();
8699     }
8700
8701 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
8702   if (size == 4
8703       && jump_reloc == NO_RELOC
8704       && need_plt32_p (i.op[0].disps->X_add_symbol))
8705     jump_reloc = BFD_RELOC_X86_64_PLT32;
8706 #endif
8707
8708   jump_reloc = reloc (size, 1, 1, jump_reloc);
8709
8710   fixP = fix_new_exp (frag_now, p - frag_now->fr_literal, size,
8711                       i.op[0].disps, 1, jump_reloc);
8712
8713   /* All jumps handled here are signed, but don't use a signed limit
8714      check for 32 and 16 bit jumps as we want to allow wrap around at
8715      4G and 64k respectively.  */
8716   if (size == 1)
8717     fixP->fx_signed = 1;
8718 }
8719
8720 static void
8721 output_interseg_jump (void)
8722 {
8723   char *p;
8724   int size;
8725   int prefix;
8726   int code16;
8727
8728   code16 = 0;
8729   if (flag_code == CODE_16BIT)
8730     code16 = CODE16;
8731
8732   prefix = 0;
8733   if (i.prefix[DATA_PREFIX] != 0)
8734     {
8735       prefix = 1;
8736       i.prefixes -= 1;
8737       code16 ^= CODE16;
8738     }
8739
8740   gas_assert (!i.prefix[REX_PREFIX]);
8741
8742   size = 4;
8743   if (code16)
8744     size = 2;
8745
8746   if (i.prefixes != 0)
8747     as_warn (_("skipping prefixes on `%s'"), i.tm.name);
8748
8749   if (now_seg == absolute_section)
8750     {
8751       abs_section_offset += prefix + 1 + 2 + size;
8752       return;
8753     }
8754
8755   /* 1 opcode; 2 segment; offset  */
8756   p = frag_more (prefix + 1 + 2 + size);
8757
8758   if (i.prefix[DATA_PREFIX] != 0)
8759     *p++ = DATA_PREFIX_OPCODE;
8760
8761   if (i.prefix[REX_PREFIX] != 0)
8762     *p++ = i.prefix[REX_PREFIX];
8763
8764   *p++ = i.tm.base_opcode;
8765   if (i.op[1].imms->X_op == O_constant)
8766     {
8767       offsetT n = i.op[1].imms->X_add_number;
8768
8769       if (size == 2
8770           && !fits_in_unsigned_word (n)
8771           && !fits_in_signed_word (n))
8772         {
8773           as_bad (_("16-bit jump out of range"));
8774           return;
8775         }
8776       md_number_to_chars (p, n, size);
8777     }
8778   else
8779     fix_new_exp (frag_now, p - frag_now->fr_literal, size,
8780                  i.op[1].imms, 0, reloc (size, 0, 0, i.reloc[1]));
8781
8782   p += size;
8783   if (i.op[0].imms->X_op == O_constant)
8784     md_number_to_chars (p, (valueT) i.op[0].imms->X_add_number, 2);
8785   else
8786     fix_new_exp (frag_now, p - frag_now->fr_literal, 2,
8787                  i.op[0].imms, 0, reloc (2, 0, 0, i.reloc[0]));
8788 }
8789
8790 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
8791 void
8792 x86_cleanup (void)
8793 {
8794   char *p;
8795   asection *seg = now_seg;
8796   subsegT subseg = now_subseg;
8797   asection *sec;
8798   unsigned int alignment, align_size_1;
8799   unsigned int isa_1_descsz, feature_2_descsz, descsz;
8800   unsigned int isa_1_descsz_raw, feature_2_descsz_raw;
8801   unsigned int padding;
8802
8803   if (!IS_ELF || !x86_used_note)
8804     return;
8805
8806   x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_X86;
8807
8808   /* The .note.gnu.property section layout:
8809
8810      Field      Length          Contents
8811      ----       ----            ----
8812      n_namsz    4               4
8813      n_descsz   4               The note descriptor size
8814      n_type     4               NT_GNU_PROPERTY_TYPE_0
8815      n_name     4               "GNU"
8816      n_desc     n_descsz        The program property array
8817      ....       ....            ....
8818    */
8819
8820   /* Create the .note.gnu.property section.  */
8821   sec = subseg_new (NOTE_GNU_PROPERTY_SECTION_NAME, 0);
8822   bfd_set_section_flags (sec,
8823                          (SEC_ALLOC
8824                           | SEC_LOAD
8825                           | SEC_DATA
8826                           | SEC_HAS_CONTENTS
8827                           | SEC_READONLY));
8828
8829   if (get_elf_backend_data (stdoutput)->s->elfclass == ELFCLASS64)
8830     {
8831       align_size_1 = 7;
8832       alignment = 3;
8833     }
8834   else
8835     {
8836       align_size_1 = 3;
8837       alignment = 2;
8838     }
8839
8840   bfd_set_section_alignment (sec, alignment);
8841   elf_section_type (sec) = SHT_NOTE;
8842
8843   /* GNU_PROPERTY_X86_ISA_1_USED: 4-byte type + 4-byte data size
8844                                   + 4-byte data  */
8845   isa_1_descsz_raw = 4 + 4 + 4;
8846   /* Align GNU_PROPERTY_X86_ISA_1_USED.  */
8847   isa_1_descsz = (isa_1_descsz_raw + align_size_1) & ~align_size_1;
8848
8849   feature_2_descsz_raw = isa_1_descsz;
8850   /* GNU_PROPERTY_X86_FEATURE_2_USED: 4-byte type + 4-byte data size
8851                                       + 4-byte data  */
8852   feature_2_descsz_raw += 4 + 4 + 4;
8853   /* Align GNU_PROPERTY_X86_FEATURE_2_USED.  */
8854   feature_2_descsz = ((feature_2_descsz_raw + align_size_1)
8855                       & ~align_size_1);
8856
8857   descsz = feature_2_descsz;
8858   /* Section size: n_namsz + n_descsz + n_type + n_name + n_descsz.  */
8859   p = frag_more (4 + 4 + 4 + 4 + descsz);
8860
8861   /* Write n_namsz.  */
8862   md_number_to_chars (p, (valueT) 4, 4);
8863
8864   /* Write n_descsz.  */
8865   md_number_to_chars (p + 4, (valueT) descsz, 4);
8866
8867   /* Write n_type.  */
8868   md_number_to_chars (p + 4 * 2, (valueT) NT_GNU_PROPERTY_TYPE_0, 4);
8869
8870   /* Write n_name.  */
8871   memcpy (p + 4 * 3, "GNU", 4);
8872
8873   /* Write 4-byte type.  */
8874   md_number_to_chars (p + 4 * 4,
8875                       (valueT) GNU_PROPERTY_X86_ISA_1_USED, 4);
8876
8877   /* Write 4-byte data size.  */
8878   md_number_to_chars (p + 4 * 5, (valueT) 4, 4);
8879
8880   /* Write 4-byte data.  */
8881   md_number_to_chars (p + 4 * 6, (valueT) x86_isa_1_used, 4);
8882
8883   /* Zero out paddings.  */
8884   padding = isa_1_descsz - isa_1_descsz_raw;
8885   if (padding)
8886     memset (p + 4 * 7, 0, padding);
8887
8888   /* Write 4-byte type.  */
8889   md_number_to_chars (p + isa_1_descsz + 4 * 4,
8890                       (valueT) GNU_PROPERTY_X86_FEATURE_2_USED, 4);
8891
8892   /* Write 4-byte data size.  */
8893   md_number_to_chars (p + isa_1_descsz + 4 * 5, (valueT) 4, 4);
8894
8895   /* Write 4-byte data.  */
8896   md_number_to_chars (p + isa_1_descsz + 4 * 6,
8897                       (valueT) x86_feature_2_used, 4);
8898
8899   /* Zero out paddings.  */
8900   padding = feature_2_descsz - feature_2_descsz_raw;
8901   if (padding)
8902     memset (p + isa_1_descsz + 4 * 7, 0, padding);
8903
8904   /* We probably can't restore the current segment, for there likely
8905      isn't one yet...  */
8906   if (seg && subseg)
8907     subseg_set (seg, subseg);
8908 }
8909 #endif
8910
8911 static unsigned int
8912 encoding_length (const fragS *start_frag, offsetT start_off,
8913                  const char *frag_now_ptr)
8914 {
8915   unsigned int len = 0;
8916
8917   if (start_frag != frag_now)
8918     {
8919       const fragS *fr = start_frag;
8920
8921       do {
8922         len += fr->fr_fix;
8923         fr = fr->fr_next;
8924       } while (fr && fr != frag_now);
8925     }
8926
8927   return len - start_off + (frag_now_ptr - frag_now->fr_literal);
8928 }
8929
8930 /* Return 1 for test, and, cmp, add, sub, inc and dec which may
8931    be macro-fused with conditional jumps.
8932    NB: If TEST/AND/CMP/ADD/SUB/INC/DEC is of RIP relative address,
8933    or is one of the following format:
8934
8935     cmp m, imm
8936     add m, imm
8937     sub m, imm
8938    test m, imm
8939     and m, imm
8940     inc m
8941     dec m
8942
8943    it is unfusible.  */
8944
8945 static int
8946 maybe_fused_with_jcc_p (enum mf_cmp_kind* mf_cmp_p)
8947 {
8948   /* No RIP address.  */
8949   if (i.base_reg && i.base_reg->reg_num == RegIP)
8950     return 0;
8951
8952   /* No VEX/EVEX encoding.  */
8953   if (is_any_vex_encoding (&i.tm))
8954     return 0;
8955
8956   /* add, sub without add/sub m, imm.  */
8957   if (i.tm.base_opcode <= 5
8958       || (i.tm.base_opcode >= 0x28 && i.tm.base_opcode <= 0x2d)
8959       || ((i.tm.base_opcode | 3) == 0x83
8960           && (i.tm.extension_opcode == 0x5
8961               || i.tm.extension_opcode == 0x0)))
8962     {
8963       *mf_cmp_p = mf_cmp_alu_cmp;
8964       return !(i.mem_operands && i.imm_operands);
8965     }
8966
8967   /* and without and m, imm.  */
8968   if ((i.tm.base_opcode >= 0x20 && i.tm.base_opcode <= 0x25)
8969       || ((i.tm.base_opcode | 3) == 0x83
8970           && i.tm.extension_opcode == 0x4))
8971     {
8972       *mf_cmp_p = mf_cmp_test_and;
8973       return !(i.mem_operands && i.imm_operands);
8974     }
8975
8976   /* test without test m imm.  */
8977   if ((i.tm.base_opcode | 1) == 0x85
8978       || (i.tm.base_opcode | 1) == 0xa9
8979       || ((i.tm.base_opcode | 1) == 0xf7
8980           && i.tm.extension_opcode == 0))
8981     {
8982       *mf_cmp_p = mf_cmp_test_and;
8983       return !(i.mem_operands && i.imm_operands);
8984     }
8985
8986   /* cmp without cmp m, imm.  */
8987   if ((i.tm.base_opcode >= 0x38 && i.tm.base_opcode <= 0x3d)
8988       || ((i.tm.base_opcode | 3) == 0x83
8989           && (i.tm.extension_opcode == 0x7)))
8990     {
8991       *mf_cmp_p = mf_cmp_alu_cmp;
8992       return !(i.mem_operands && i.imm_operands);
8993     }
8994
8995   /* inc, dec without inc/dec m.   */
8996   if ((i.tm.cpu_flags.bitfield.cpuno64
8997        && (i.tm.base_opcode | 0xf) == 0x4f)
8998       || ((i.tm.base_opcode | 1) == 0xff
8999           && i.tm.extension_opcode <= 0x1))
9000     {
9001       *mf_cmp_p = mf_cmp_incdec;
9002       return !i.mem_operands;
9003     }
9004
9005   return 0;
9006 }
9007
9008 /* Return 1 if a FUSED_JCC_PADDING frag should be generated.  */
9009
9010 static int
9011 add_fused_jcc_padding_frag_p (enum mf_cmp_kind* mf_cmp_p)
9012 {
9013   /* NB: Don't work with COND_JUMP86 without i386.  */
9014   if (!align_branch_power
9015       || now_seg == absolute_section
9016       || !cpu_arch_flags.bitfield.cpui386
9017       || !(align_branch & align_branch_fused_bit))
9018     return 0;
9019
9020   if (maybe_fused_with_jcc_p (mf_cmp_p))
9021     {
9022       if (last_insn.kind == last_insn_other
9023           || last_insn.seg != now_seg)
9024         return 1;
9025       if (flag_debug)
9026         as_warn_where (last_insn.file, last_insn.line,
9027                        _("`%s` skips -malign-branch-boundary on `%s`"),
9028                        last_insn.name, i.tm.name);
9029     }
9030
9031   return 0;
9032 }
9033
9034 /* Return 1 if a BRANCH_PREFIX frag should be generated.  */
9035
9036 static int
9037 add_branch_prefix_frag_p (void)
9038 {
9039   /* NB: Don't work with COND_JUMP86 without i386.  Don't add prefix
9040      to PadLock instructions since they include prefixes in opcode.  */
9041   if (!align_branch_power
9042       || !align_branch_prefix_size
9043       || now_seg == absolute_section
9044       || i.tm.cpu_flags.bitfield.cpupadlock
9045       || !cpu_arch_flags.bitfield.cpui386)
9046     return 0;
9047
9048   /* Don't add prefix if it is a prefix or there is no operand in case
9049      that segment prefix is special.  */
9050   if (!i.operands || i.tm.opcode_modifier.isprefix)
9051     return 0;
9052
9053   if (last_insn.kind == last_insn_other
9054       || last_insn.seg != now_seg)
9055     return 1;
9056
9057   if (flag_debug)
9058     as_warn_where (last_insn.file, last_insn.line,
9059                    _("`%s` skips -malign-branch-boundary on `%s`"),
9060                    last_insn.name, i.tm.name);
9061
9062   return 0;
9063 }
9064
9065 /* Return 1 if a BRANCH_PADDING frag should be generated.  */
9066
9067 static int
9068 add_branch_padding_frag_p (enum align_branch_kind *branch_p,
9069                            enum mf_jcc_kind *mf_jcc_p)
9070 {
9071   int add_padding;
9072
9073   /* NB: Don't work with COND_JUMP86 without i386.  */
9074   if (!align_branch_power
9075       || now_seg == absolute_section
9076       || !cpu_arch_flags.bitfield.cpui386)
9077     return 0;
9078
9079   add_padding = 0;
9080
9081   /* Check for jcc and direct jmp.  */
9082   if (i.tm.opcode_modifier.jump == JUMP)
9083     {
9084       if (i.tm.base_opcode == JUMP_PC_RELATIVE)
9085         {
9086           *branch_p = align_branch_jmp;
9087           add_padding = align_branch & align_branch_jmp_bit;
9088         }
9089       else
9090         {
9091           /* Because J<cc> and JN<cc> share same group in macro-fusible table,
9092              igore the lowest bit.  */
9093           *mf_jcc_p = (i.tm.base_opcode & 0x0e) >> 1;
9094           *branch_p = align_branch_jcc;
9095           if ((align_branch & align_branch_jcc_bit))
9096             add_padding = 1;
9097         }
9098     }
9099   else if (is_any_vex_encoding (&i.tm))
9100     return 0;
9101   else if ((i.tm.base_opcode | 1) == 0xc3)
9102     {
9103       /* Near ret.  */
9104       *branch_p = align_branch_ret;
9105       if ((align_branch & align_branch_ret_bit))
9106         add_padding = 1;
9107     }
9108   else
9109     {
9110       /* Check for indirect jmp, direct and indirect calls.  */
9111       if (i.tm.base_opcode == 0xe8)
9112         {
9113           /* Direct call.  */
9114           *branch_p = align_branch_call;
9115           if ((align_branch & align_branch_call_bit))
9116             add_padding = 1;
9117         }
9118       else if (i.tm.base_opcode == 0xff
9119                && (i.tm.extension_opcode == 2
9120                    || i.tm.extension_opcode == 4))
9121         {
9122           /* Indirect call and jmp.  */
9123           *branch_p = align_branch_indirect;
9124           if ((align_branch & align_branch_indirect_bit))
9125             add_padding = 1;
9126         }
9127
9128       if (add_padding
9129           && i.disp_operands
9130           && tls_get_addr
9131           && (i.op[0].disps->X_op == O_symbol
9132               || (i.op[0].disps->X_op == O_subtract
9133                   && i.op[0].disps->X_op_symbol == GOT_symbol)))
9134         {
9135           symbolS *s = i.op[0].disps->X_add_symbol;
9136           /* No padding to call to global or undefined tls_get_addr.  */
9137           if ((S_IS_EXTERNAL (s) || !S_IS_DEFINED (s))
9138               && strcmp (S_GET_NAME (s), tls_get_addr) == 0)
9139             return 0;
9140         }
9141     }
9142
9143   if (add_padding
9144       && last_insn.kind != last_insn_other
9145       && last_insn.seg == now_seg)
9146     {
9147       if (flag_debug)
9148         as_warn_where (last_insn.file, last_insn.line,
9149                        _("`%s` skips -malign-branch-boundary on `%s`"),
9150                        last_insn.name, i.tm.name);
9151       return 0;
9152     }
9153
9154   return add_padding;
9155 }
9156
9157 static void
9158 output_insn (void)
9159 {
9160   fragS *insn_start_frag;
9161   offsetT insn_start_off;
9162   fragS *fragP = NULL;
9163   enum align_branch_kind branch = align_branch_none;
9164   /* The initializer is arbitrary just to avoid uninitialized error.
9165      it's actually either assigned in add_branch_padding_frag_p
9166      or never be used.  */
9167   enum mf_jcc_kind mf_jcc = mf_jcc_jo;
9168
9169 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
9170   if (IS_ELF && x86_used_note && now_seg != absolute_section)
9171     {
9172       if ((i.xstate & xstate_tmm) == xstate_tmm
9173           || i.tm.cpu_flags.bitfield.cpuamx_tile)
9174         x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_TMM;
9175
9176       if (i.tm.cpu_flags.bitfield.cpu8087
9177           || i.tm.cpu_flags.bitfield.cpu287
9178           || i.tm.cpu_flags.bitfield.cpu387
9179           || i.tm.cpu_flags.bitfield.cpu687
9180           || i.tm.cpu_flags.bitfield.cpufisttp)
9181         x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_X87;
9182
9183       if ((i.xstate & xstate_mmx)
9184           || i.tm.base_opcode == 0xf77 /* emms */
9185           || i.tm.base_opcode == 0xf0e /* femms */)
9186         x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_MMX;
9187
9188       if (i.index_reg)
9189         {
9190           if (i.index_reg->reg_type.bitfield.zmmword)
9191             i.xstate |= xstate_zmm;
9192           else if (i.index_reg->reg_type.bitfield.ymmword)
9193             i.xstate |= xstate_ymm;
9194           else if (i.index_reg->reg_type.bitfield.xmmword)
9195             i.xstate |= xstate_xmm;
9196         }
9197
9198       /* vzeroall / vzeroupper */
9199       if (i.tm.base_opcode == 0x77 && i.tm.cpu_flags.bitfield.cpuavx)
9200         i.xstate |= xstate_ymm;
9201
9202       if ((i.xstate & xstate_xmm)
9203           /* ldmxcsr / stmxcsr */
9204           || (i.tm.base_opcode == 0xfae && i.tm.cpu_flags.bitfield.cpusse)
9205           /* vldmxcsr / vstmxcsr */
9206           || (i.tm.base_opcode == 0xae && i.tm.cpu_flags.bitfield.cpuavx)
9207           || i.tm.cpu_flags.bitfield.cpuwidekl
9208           || i.tm.cpu_flags.bitfield.cpukl)
9209         x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XMM;
9210
9211       if ((i.xstate & xstate_ymm) == xstate_ymm)
9212         x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_YMM;
9213       if ((i.xstate & xstate_zmm) == xstate_zmm)
9214         x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_ZMM;
9215       if (i.mask || (i.xstate & xstate_mask) == xstate_mask)
9216         x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_MASK;
9217       if (i.tm.cpu_flags.bitfield.cpufxsr)
9218         x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_FXSR;
9219       if (i.tm.cpu_flags.bitfield.cpuxsave)
9220         x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XSAVE;
9221       if (i.tm.cpu_flags.bitfield.cpuxsaveopt)
9222         x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XSAVEOPT;
9223       if (i.tm.cpu_flags.bitfield.cpuxsavec)
9224         x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XSAVEC;
9225
9226       if (x86_feature_2_used
9227           || i.tm.cpu_flags.bitfield.cpucmov
9228           || i.tm.cpu_flags.bitfield.cpusyscall
9229           || (i.tm.base_opcode == 0xfc7
9230               && i.tm.opcode_modifier.opcodeprefix == PREFIX_NONE
9231               && i.tm.extension_opcode == 1) /* cmpxchg8b */)
9232         x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_BASELINE;
9233       if (i.tm.cpu_flags.bitfield.cpusse3
9234           || i.tm.cpu_flags.bitfield.cpussse3
9235           || i.tm.cpu_flags.bitfield.cpusse4_1
9236           || i.tm.cpu_flags.bitfield.cpusse4_2
9237           || i.tm.cpu_flags.bitfield.cpucx16
9238           || i.tm.cpu_flags.bitfield.cpupopcnt
9239           /* LAHF-SAHF insns in 64-bit mode.  */
9240           || (flag_code == CODE_64BIT
9241               && (i.tm.base_opcode | 1) == 0x9f
9242               && i.tm.opcode_modifier.opcodespace == SPACE_BASE))
9243         x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_V2;
9244       if (i.tm.cpu_flags.bitfield.cpuavx
9245           || i.tm.cpu_flags.bitfield.cpuavx2
9246           /* Any VEX encoded insns execpt for CpuAVX512F, CpuAVX512BW,
9247              CpuAVX512DQ, LPW, TBM and AMX.  */
9248           || (i.tm.opcode_modifier.vex
9249               && !i.tm.cpu_flags.bitfield.cpuavx512f
9250               && !i.tm.cpu_flags.bitfield.cpuavx512bw
9251               && !i.tm.cpu_flags.bitfield.cpuavx512dq
9252               && !i.tm.cpu_flags.bitfield.cpulwp
9253               && !i.tm.cpu_flags.bitfield.cputbm
9254               && !(x86_feature_2_used & GNU_PROPERTY_X86_FEATURE_2_TMM))
9255           || i.tm.cpu_flags.bitfield.cpuf16c
9256           || i.tm.cpu_flags.bitfield.cpufma
9257           || i.tm.cpu_flags.bitfield.cpulzcnt
9258           || i.tm.cpu_flags.bitfield.cpumovbe
9259           || i.tm.cpu_flags.bitfield.cpuxsaves
9260           || (x86_feature_2_used
9261               & (GNU_PROPERTY_X86_FEATURE_2_XSAVE
9262                  | GNU_PROPERTY_X86_FEATURE_2_XSAVEOPT
9263                  | GNU_PROPERTY_X86_FEATURE_2_XSAVEC)) != 0)
9264         x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_V3;
9265       if (i.tm.cpu_flags.bitfield.cpuavx512f
9266           || i.tm.cpu_flags.bitfield.cpuavx512bw
9267           || i.tm.cpu_flags.bitfield.cpuavx512dq
9268           || i.tm.cpu_flags.bitfield.cpuavx512vl
9269           /* Any EVEX encoded insns except for AVX512ER, AVX512PF and
9270              VNNIW.  */
9271           || (i.tm.opcode_modifier.evex
9272               && !i.tm.cpu_flags.bitfield.cpuavx512er
9273               && !i.tm.cpu_flags.bitfield.cpuavx512pf
9274               && !i.tm.cpu_flags.bitfield.cpuavx512_4vnniw))
9275         x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_V4;
9276     }
9277 #endif
9278
9279   /* Tie dwarf2 debug info to the address at the start of the insn.
9280      We can't do this after the insn has been output as the current
9281      frag may have been closed off.  eg. by frag_var.  */
9282   dwarf2_emit_insn (0);
9283
9284   insn_start_frag = frag_now;
9285   insn_start_off = frag_now_fix ();
9286
9287   if (add_branch_padding_frag_p (&branch, &mf_jcc))
9288     {
9289       char *p;
9290       /* Branch can be 8 bytes.  Leave some room for prefixes.  */
9291       unsigned int max_branch_padding_size = 14;
9292
9293       /* Align section to boundary.  */
9294       record_alignment (now_seg, align_branch_power);
9295
9296       /* Make room for padding.  */
9297       frag_grow (max_branch_padding_size);
9298
9299       /* Start of the padding.  */
9300       p = frag_more (0);
9301
9302       fragP = frag_now;
9303
9304       frag_var (rs_machine_dependent, max_branch_padding_size, 0,
9305                 ENCODE_RELAX_STATE (BRANCH_PADDING, 0),
9306                 NULL, 0, p);
9307
9308       fragP->tc_frag_data.mf_type = mf_jcc;
9309       fragP->tc_frag_data.branch_type = branch;
9310       fragP->tc_frag_data.max_bytes = max_branch_padding_size;
9311     }
9312
9313   /* Output jumps.  */
9314   if (i.tm.opcode_modifier.jump == JUMP)
9315     output_branch ();
9316   else if (i.tm.opcode_modifier.jump == JUMP_BYTE
9317            || i.tm.opcode_modifier.jump == JUMP_DWORD)
9318     output_jump ();
9319   else if (i.tm.opcode_modifier.jump == JUMP_INTERSEGMENT)
9320     output_interseg_jump ();
9321   else
9322     {
9323       /* Output normal instructions here.  */
9324       char *p;
9325       unsigned char *q;
9326       unsigned int j;
9327       enum mf_cmp_kind mf_cmp;
9328
9329       if (avoid_fence
9330           && (i.tm.base_opcode == 0xfaee8
9331               || i.tm.base_opcode == 0xfaef0
9332               || i.tm.base_opcode == 0xfaef8))
9333         {
9334           /* Encode lfence, mfence, and sfence as
9335              f0 83 04 24 00   lock addl $0x0, (%{re}sp).  */
9336           if (now_seg != absolute_section)
9337             {
9338               offsetT val = 0x240483f0ULL;
9339
9340               p = frag_more (5);
9341               md_number_to_chars (p, val, 5);
9342             }
9343           else
9344             abs_section_offset += 5;
9345           return;
9346         }
9347
9348       /* Some processors fail on LOCK prefix. This options makes
9349          assembler ignore LOCK prefix and serves as a workaround.  */
9350       if (omit_lock_prefix)
9351         {
9352           if (i.tm.base_opcode == LOCK_PREFIX_OPCODE
9353               && i.tm.opcode_modifier.isprefix)
9354             return;
9355           i.prefix[LOCK_PREFIX] = 0;
9356         }
9357
9358       if (branch)
9359         /* Skip if this is a branch.  */
9360         ;
9361       else if (add_fused_jcc_padding_frag_p (&mf_cmp))
9362         {
9363           /* Make room for padding.  */
9364           frag_grow (MAX_FUSED_JCC_PADDING_SIZE);
9365           p = frag_more (0);
9366
9367           fragP = frag_now;
9368
9369           frag_var (rs_machine_dependent, MAX_FUSED_JCC_PADDING_SIZE, 0,
9370                     ENCODE_RELAX_STATE (FUSED_JCC_PADDING, 0),
9371                     NULL, 0, p);
9372
9373           fragP->tc_frag_data.mf_type = mf_cmp;
9374           fragP->tc_frag_data.branch_type = align_branch_fused;
9375           fragP->tc_frag_data.max_bytes = MAX_FUSED_JCC_PADDING_SIZE;
9376         }
9377       else if (add_branch_prefix_frag_p ())
9378         {
9379           unsigned int max_prefix_size = align_branch_prefix_size;
9380
9381           /* Make room for padding.  */
9382           frag_grow (max_prefix_size);
9383           p = frag_more (0);
9384
9385           fragP = frag_now;
9386
9387           frag_var (rs_machine_dependent, max_prefix_size, 0,
9388                     ENCODE_RELAX_STATE (BRANCH_PREFIX, 0),
9389                     NULL, 0, p);
9390
9391           fragP->tc_frag_data.max_bytes = max_prefix_size;
9392         }
9393
9394       /* Since the VEX/EVEX prefix contains the implicit prefix, we
9395          don't need the explicit prefix.  */
9396       if (!i.tm.opcode_modifier.vex && !i.tm.opcode_modifier.evex)
9397         {
9398           switch (i.tm.opcode_modifier.opcodeprefix)
9399             {
9400             case PREFIX_0X66:
9401               add_prefix (0x66);
9402               break;
9403             case PREFIX_0XF2:
9404               add_prefix (0xf2);
9405               break;
9406             case PREFIX_0XF3:
9407               if (!i.tm.cpu_flags.bitfield.cpupadlock
9408                   || (i.prefix[REP_PREFIX] != 0xf3))
9409                 add_prefix (0xf3);
9410               break;
9411             case PREFIX_NONE:
9412               switch (i.opcode_length)
9413                 {
9414                 case 3:
9415                 case 2:
9416                   break;
9417                 case 1:
9418                   /* Check for pseudo prefixes.  */
9419                   if (!i.tm.opcode_modifier.isprefix || i.tm.base_opcode)
9420                     break;
9421                   as_bad_where (insn_start_frag->fr_file,
9422                                 insn_start_frag->fr_line,
9423                                 _("pseudo prefix without instruction"));
9424                   return;
9425                 default:
9426                   abort ();
9427                 }
9428               break;
9429             default:
9430               abort ();
9431             }
9432
9433 #if defined (OBJ_MAYBE_ELF) || defined (OBJ_ELF)
9434           /* For x32, add a dummy REX_OPCODE prefix for mov/add with
9435              R_X86_64_GOTTPOFF relocation so that linker can safely
9436              perform IE->LE optimization.  A dummy REX_OPCODE prefix
9437              is also needed for lea with R_X86_64_GOTPC32_TLSDESC
9438              relocation for GDesc -> IE/LE optimization.  */
9439           if (x86_elf_abi == X86_64_X32_ABI
9440               && i.operands == 2
9441               && (i.reloc[0] == BFD_RELOC_X86_64_GOTTPOFF
9442                   || i.reloc[0] == BFD_RELOC_X86_64_GOTPC32_TLSDESC)
9443               && i.prefix[REX_PREFIX] == 0)
9444             add_prefix (REX_OPCODE);
9445 #endif
9446
9447           /* The prefix bytes.  */
9448           for (j = ARRAY_SIZE (i.prefix), q = i.prefix; j > 0; j--, q++)
9449             if (*q)
9450               frag_opcode_byte (*q);
9451         }
9452       else
9453         {
9454           for (j = 0, q = i.prefix; j < ARRAY_SIZE (i.prefix); j++, q++)
9455             if (*q)
9456               switch (j)
9457                 {
9458                 case SEG_PREFIX:
9459                 case ADDR_PREFIX:
9460                   frag_opcode_byte (*q);
9461                   break;
9462                 default:
9463                   /* There should be no other prefixes for instructions
9464                      with VEX prefix.  */
9465                   abort ();
9466                 }
9467
9468           /* For EVEX instructions i.vrex should become 0 after
9469              build_evex_prefix.  For VEX instructions upper 16 registers
9470              aren't available, so VREX should be 0.  */
9471           if (i.vrex)
9472             abort ();
9473           /* Now the VEX prefix.  */
9474           if (now_seg != absolute_section)
9475             {
9476               p = frag_more (i.vex.length);
9477               for (j = 0; j < i.vex.length; j++)
9478                 p[j] = i.vex.bytes[j];
9479             }
9480           else
9481             abs_section_offset += i.vex.length;
9482         }
9483
9484       /* Now the opcode; be careful about word order here!  */
9485       if (now_seg == absolute_section)
9486         abs_section_offset += i.opcode_length;
9487       else if (i.opcode_length == 1)
9488         {
9489           FRAG_APPEND_1_CHAR (i.tm.base_opcode);
9490         }
9491       else
9492         {
9493           switch (i.opcode_length)
9494             {
9495             case 4:
9496               p = frag_more (4);
9497               *p++ = (i.tm.base_opcode >> 24) & 0xff;
9498               *p++ = (i.tm.base_opcode >> 16) & 0xff;
9499               break;
9500             case 3:
9501               p = frag_more (3);
9502               *p++ = (i.tm.base_opcode >> 16) & 0xff;
9503               break;
9504             case 2:
9505               p = frag_more (2);
9506               break;
9507             default:
9508               abort ();
9509               break;
9510             }
9511
9512           /* Put out high byte first: can't use md_number_to_chars!  */
9513           *p++ = (i.tm.base_opcode >> 8) & 0xff;
9514           *p = i.tm.base_opcode & 0xff;
9515         }
9516
9517       /* Now the modrm byte and sib byte (if present).  */
9518       if (i.tm.opcode_modifier.modrm)
9519         {
9520           frag_opcode_byte ((i.rm.regmem << 0)
9521                              | (i.rm.reg << 3)
9522                              | (i.rm.mode << 6));
9523           /* If i.rm.regmem == ESP (4)
9524              && i.rm.mode != (Register mode)
9525              && not 16 bit
9526              ==> need second modrm byte.  */
9527           if (i.rm.regmem == ESCAPE_TO_TWO_BYTE_ADDRESSING
9528               && i.rm.mode != 3
9529               && !(i.base_reg && i.base_reg->reg_type.bitfield.word))
9530             frag_opcode_byte ((i.sib.base << 0)
9531                               | (i.sib.index << 3)
9532                               | (i.sib.scale << 6));
9533         }
9534
9535       if (i.disp_operands)
9536         output_disp (insn_start_frag, insn_start_off);
9537
9538       if (i.imm_operands)
9539         output_imm (insn_start_frag, insn_start_off);
9540
9541       /*
9542        * frag_now_fix () returning plain abs_section_offset when we're in the
9543        * absolute section, and abs_section_offset not getting updated as data
9544        * gets added to the frag breaks the logic below.
9545        */
9546       if (now_seg != absolute_section)
9547         {
9548           j = encoding_length (insn_start_frag, insn_start_off, frag_more (0));
9549           if (j > 15)
9550             as_warn (_("instruction length of %u bytes exceeds the limit of 15"),
9551                      j);
9552           else if (fragP)
9553             {
9554               /* NB: Don't add prefix with GOTPC relocation since
9555                  output_disp() above depends on the fixed encoding
9556                  length.  Can't add prefix with TLS relocation since
9557                  it breaks TLS linker optimization.  */
9558               unsigned int max = i.has_gotpc_tls_reloc ? 0 : 15 - j;
9559               /* Prefix count on the current instruction.  */
9560               unsigned int count = i.vex.length;
9561               unsigned int k;
9562               for (k = 0; k < ARRAY_SIZE (i.prefix); k++)
9563                 /* REX byte is encoded in VEX/EVEX prefix.  */
9564                 if (i.prefix[k] && (k != REX_PREFIX || !i.vex.length))
9565                   count++;
9566
9567               /* Count prefixes for extended opcode maps.  */
9568               if (!i.vex.length)
9569                 switch (i.opcode_length)
9570                   {
9571                   case 3:
9572                     if (((i.tm.base_opcode >> 16) & 0xff) == 0xf)
9573                       {
9574                         count++;
9575                         switch ((i.tm.base_opcode >> 8) & 0xff)
9576                           {
9577                           case 0x38:
9578                           case 0x3a:
9579                             count++;
9580                             break;
9581                           default:
9582                             break;
9583                           }
9584                       }
9585                     break;
9586                   case 2:
9587                     if (((i.tm.base_opcode >> 8) & 0xff) == 0xf)
9588                       count++;
9589                     break;
9590                   case 1:
9591                     break;
9592                   default:
9593                     abort ();
9594                   }
9595
9596               if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype)
9597                   == BRANCH_PREFIX)
9598                 {
9599                   /* Set the maximum prefix size in BRANCH_PREFIX
9600                      frag.  */
9601                   if (fragP->tc_frag_data.max_bytes > max)
9602                     fragP->tc_frag_data.max_bytes = max;
9603                   if (fragP->tc_frag_data.max_bytes > count)
9604                     fragP->tc_frag_data.max_bytes -= count;
9605                   else
9606                     fragP->tc_frag_data.max_bytes = 0;
9607                 }
9608               else
9609                 {
9610                   /* Remember the maximum prefix size in FUSED_JCC_PADDING
9611                      frag.  */
9612                   unsigned int max_prefix_size;
9613                   if (align_branch_prefix_size > max)
9614                     max_prefix_size = max;
9615                   else
9616                     max_prefix_size = align_branch_prefix_size;
9617                   if (max_prefix_size > count)
9618                     fragP->tc_frag_data.max_prefix_length
9619                       = max_prefix_size - count;
9620                 }
9621
9622               /* Use existing segment prefix if possible.  Use CS
9623                  segment prefix in 64-bit mode.  In 32-bit mode, use SS
9624                  segment prefix with ESP/EBP base register and use DS
9625                  segment prefix without ESP/EBP base register.  */
9626               if (i.prefix[SEG_PREFIX])
9627                 fragP->tc_frag_data.default_prefix = i.prefix[SEG_PREFIX];
9628               else if (flag_code == CODE_64BIT)
9629                 fragP->tc_frag_data.default_prefix = CS_PREFIX_OPCODE;
9630               else if (i.base_reg
9631                        && (i.base_reg->reg_num == 4
9632                            || i.base_reg->reg_num == 5))
9633                 fragP->tc_frag_data.default_prefix = SS_PREFIX_OPCODE;
9634               else
9635                 fragP->tc_frag_data.default_prefix = DS_PREFIX_OPCODE;
9636             }
9637         }
9638     }
9639
9640   /* NB: Don't work with COND_JUMP86 without i386.  */
9641   if (align_branch_power
9642       && now_seg != absolute_section
9643       && cpu_arch_flags.bitfield.cpui386)
9644     {
9645       /* Terminate each frag so that we can add prefix and check for
9646          fused jcc.  */
9647       frag_wane (frag_now);
9648       frag_new (0);
9649     }
9650
9651 #ifdef DEBUG386
9652   if (flag_debug)
9653     {
9654       pi ("" /*line*/, &i);
9655     }
9656 #endif /* DEBUG386  */
9657 }
9658
9659 /* Return the size of the displacement operand N.  */
9660
9661 static int
9662 disp_size (unsigned int n)
9663 {
9664   int size = 4;
9665
9666   if (i.types[n].bitfield.disp64)
9667     size = 8;
9668   else if (i.types[n].bitfield.disp8)
9669     size = 1;
9670   else if (i.types[n].bitfield.disp16)
9671     size = 2;
9672   return size;
9673 }
9674
9675 /* Return the size of the immediate operand N.  */
9676
9677 static int
9678 imm_size (unsigned int n)
9679 {
9680   int size = 4;
9681   if (i.types[n].bitfield.imm64)
9682     size = 8;
9683   else if (i.types[n].bitfield.imm8 || i.types[n].bitfield.imm8s)
9684     size = 1;
9685   else if (i.types[n].bitfield.imm16)
9686     size = 2;
9687   return size;
9688 }
9689
9690 static void
9691 output_disp (fragS *insn_start_frag, offsetT insn_start_off)
9692 {
9693   char *p;
9694   unsigned int n;
9695
9696   for (n = 0; n < i.operands; n++)
9697     {
9698       if (operand_type_check (i.types[n], disp))
9699         {
9700           int size = disp_size (n);
9701
9702           if (now_seg == absolute_section)
9703             abs_section_offset += size;
9704           else if (i.op[n].disps->X_op == O_constant)
9705             {
9706               offsetT val = i.op[n].disps->X_add_number;
9707
9708               val = offset_in_range (val >> (size == 1 ? i.memshift : 0),
9709                                      size);
9710               p = frag_more (size);
9711               md_number_to_chars (p, val, size);
9712             }
9713           else
9714             {
9715               enum bfd_reloc_code_real reloc_type;
9716               int sign = i.types[n].bitfield.disp32s;
9717               int pcrel = (i.flags[n] & Operand_PCrel) != 0;
9718               fixS *fixP;
9719
9720               /* We can't have 8 bit displacement here.  */
9721               gas_assert (!i.types[n].bitfield.disp8);
9722
9723               /* The PC relative address is computed relative
9724                  to the instruction boundary, so in case immediate
9725                  fields follows, we need to adjust the value.  */
9726               if (pcrel && i.imm_operands)
9727                 {
9728                   unsigned int n1;
9729                   int sz = 0;
9730
9731                   for (n1 = 0; n1 < i.operands; n1++)
9732                     if (operand_type_check (i.types[n1], imm))
9733                       {
9734                         /* Only one immediate is allowed for PC
9735                            relative address.  */
9736                         gas_assert (sz == 0);
9737                         sz = imm_size (n1);
9738                         i.op[n].disps->X_add_number -= sz;
9739                       }
9740                   /* We should find the immediate.  */
9741                   gas_assert (sz != 0);
9742                 }
9743
9744               p = frag_more (size);
9745               reloc_type = reloc (size, pcrel, sign, i.reloc[n]);
9746               if (GOT_symbol
9747                   && GOT_symbol == i.op[n].disps->X_add_symbol
9748                   && (((reloc_type == BFD_RELOC_32
9749                         || reloc_type == BFD_RELOC_X86_64_32S
9750                         || (reloc_type == BFD_RELOC_64
9751                             && object_64bit))
9752                        && (i.op[n].disps->X_op == O_symbol
9753                            || (i.op[n].disps->X_op == O_add
9754                                && ((symbol_get_value_expression
9755                                     (i.op[n].disps->X_op_symbol)->X_op)
9756                                    == O_subtract))))
9757                       || reloc_type == BFD_RELOC_32_PCREL))
9758                 {
9759                   if (!object_64bit)
9760                     {
9761                       reloc_type = BFD_RELOC_386_GOTPC;
9762                       i.has_gotpc_tls_reloc = TRUE;
9763                       i.op[n].imms->X_add_number +=
9764                         encoding_length (insn_start_frag, insn_start_off, p);
9765                     }
9766                   else if (reloc_type == BFD_RELOC_64)
9767                     reloc_type = BFD_RELOC_X86_64_GOTPC64;
9768                   else
9769                     /* Don't do the adjustment for x86-64, as there
9770                        the pcrel addressing is relative to the _next_
9771                        insn, and that is taken care of in other code.  */
9772                     reloc_type = BFD_RELOC_X86_64_GOTPC32;
9773                 }
9774               else if (align_branch_power)
9775                 {
9776                   switch (reloc_type)
9777                     {
9778                     case BFD_RELOC_386_TLS_GD:
9779                     case BFD_RELOC_386_TLS_LDM:
9780                     case BFD_RELOC_386_TLS_IE:
9781                     case BFD_RELOC_386_TLS_IE_32:
9782                     case BFD_RELOC_386_TLS_GOTIE:
9783                     case BFD_RELOC_386_TLS_GOTDESC:
9784                     case BFD_RELOC_386_TLS_DESC_CALL:
9785                     case BFD_RELOC_X86_64_TLSGD:
9786                     case BFD_RELOC_X86_64_TLSLD:
9787                     case BFD_RELOC_X86_64_GOTTPOFF:
9788                     case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
9789                     case BFD_RELOC_X86_64_TLSDESC_CALL:
9790                       i.has_gotpc_tls_reloc = TRUE;
9791                     default:
9792                       break;
9793                     }
9794                 }
9795               fixP = fix_new_exp (frag_now, p - frag_now->fr_literal,
9796                                   size, i.op[n].disps, pcrel,
9797                                   reloc_type);
9798               /* Check for "call/jmp *mem", "mov mem, %reg",
9799                  "test %reg, mem" and "binop mem, %reg" where binop
9800                  is one of adc, add, and, cmp, or, sbb, sub, xor
9801                  instructions without data prefix.  Always generate
9802                  R_386_GOT32X for "sym*GOT" operand in 32-bit mode.  */
9803               if (i.prefix[DATA_PREFIX] == 0
9804                   && (generate_relax_relocations
9805                       || (!object_64bit
9806                           && i.rm.mode == 0
9807                           && i.rm.regmem == 5))
9808                   && (i.rm.mode == 2
9809                       || (i.rm.mode == 0 && i.rm.regmem == 5))
9810                   && !is_any_vex_encoding(&i.tm)
9811                   && ((i.operands == 1
9812                        && i.tm.base_opcode == 0xff
9813                        && (i.rm.reg == 2 || i.rm.reg == 4))
9814                       || (i.operands == 2
9815                           && (i.tm.base_opcode == 0x8b
9816                               || i.tm.base_opcode == 0x85
9817                               || (i.tm.base_opcode & ~0x38) == 0x03))))
9818                 {
9819                   if (object_64bit)
9820                     {
9821                       fixP->fx_tcbit = i.rex != 0;
9822                       if (i.base_reg
9823                           && (i.base_reg->reg_num == RegIP))
9824                       fixP->fx_tcbit2 = 1;
9825                     }
9826                   else
9827                     fixP->fx_tcbit2 = 1;
9828                 }
9829             }
9830         }
9831     }
9832 }
9833
9834 static void
9835 output_imm (fragS *insn_start_frag, offsetT insn_start_off)
9836 {
9837   char *p;
9838   unsigned int n;
9839
9840   for (n = 0; n < i.operands; n++)
9841     {
9842       /* Skip SAE/RC Imm operand in EVEX.  They are already handled.  */
9843       if (i.rounding && (int) n == i.rounding->operand)
9844         continue;
9845
9846       if (operand_type_check (i.types[n], imm))
9847         {
9848           int size = imm_size (n);
9849
9850           if (now_seg == absolute_section)
9851             abs_section_offset += size;
9852           else if (i.op[n].imms->X_op == O_constant)
9853             {
9854               offsetT val;
9855
9856               val = offset_in_range (i.op[n].imms->X_add_number,
9857                                      size);
9858               p = frag_more (size);
9859               md_number_to_chars (p, val, size);
9860             }
9861           else
9862             {
9863               /* Not absolute_section.
9864                  Need a 32-bit fixup (don't support 8bit
9865                  non-absolute imms).  Try to support other
9866                  sizes ...  */
9867               enum bfd_reloc_code_real reloc_type;
9868               int sign;
9869
9870               if (i.types[n].bitfield.imm32s
9871                   && (i.suffix == QWORD_MNEM_SUFFIX
9872                       || (!i.suffix && i.tm.opcode_modifier.no_lsuf)))
9873                 sign = 1;
9874               else
9875                 sign = 0;
9876
9877               p = frag_more (size);
9878               reloc_type = reloc (size, 0, sign, i.reloc[n]);
9879
9880               /*   This is tough to explain.  We end up with this one if we
9881                * have operands that look like
9882                * "_GLOBAL_OFFSET_TABLE_+[.-.L284]".  The goal here is to
9883                * obtain the absolute address of the GOT, and it is strongly
9884                * preferable from a performance point of view to avoid using
9885                * a runtime relocation for this.  The actual sequence of
9886                * instructions often look something like:
9887                *
9888                *        call    .L66
9889                * .L66:
9890                *        popl    %ebx
9891                *        addl    $_GLOBAL_OFFSET_TABLE_+[.-.L66],%ebx
9892                *
9893                *   The call and pop essentially return the absolute address
9894                * of the label .L66 and store it in %ebx.  The linker itself
9895                * will ultimately change the first operand of the addl so
9896                * that %ebx points to the GOT, but to keep things simple, the
9897                * .o file must have this operand set so that it generates not
9898                * the absolute address of .L66, but the absolute address of
9899                * itself.  This allows the linker itself simply treat a GOTPC
9900                * relocation as asking for a pcrel offset to the GOT to be
9901                * added in, and the addend of the relocation is stored in the
9902                * operand field for the instruction itself.
9903                *
9904                *   Our job here is to fix the operand so that it would add
9905                * the correct offset so that %ebx would point to itself.  The
9906                * thing that is tricky is that .-.L66 will point to the
9907                * beginning of the instruction, so we need to further modify
9908                * the operand so that it will point to itself.  There are
9909                * other cases where you have something like:
9910                *
9911                *        .long   $_GLOBAL_OFFSET_TABLE_+[.-.L66]
9912                *
9913                * and here no correction would be required.  Internally in
9914                * the assembler we treat operands of this form as not being
9915                * pcrel since the '.' is explicitly mentioned, and I wonder
9916                * whether it would simplify matters to do it this way.  Who
9917                * knows.  In earlier versions of the PIC patches, the
9918                * pcrel_adjust field was used to store the correction, but
9919                * since the expression is not pcrel, I felt it would be
9920                * confusing to do it this way.  */
9921
9922               if ((reloc_type == BFD_RELOC_32
9923                    || reloc_type == BFD_RELOC_X86_64_32S
9924                    || reloc_type == BFD_RELOC_64)
9925                   && GOT_symbol
9926                   && GOT_symbol == i.op[n].imms->X_add_symbol
9927                   && (i.op[n].imms->X_op == O_symbol
9928                       || (i.op[n].imms->X_op == O_add
9929                           && ((symbol_get_value_expression
9930                                (i.op[n].imms->X_op_symbol)->X_op)
9931                               == O_subtract))))
9932                 {
9933                   if (!object_64bit)
9934                     reloc_type = BFD_RELOC_386_GOTPC;
9935                   else if (size == 4)
9936                     reloc_type = BFD_RELOC_X86_64_GOTPC32;
9937                   else if (size == 8)
9938                     reloc_type = BFD_RELOC_X86_64_GOTPC64;
9939                   i.has_gotpc_tls_reloc = TRUE;
9940                   i.op[n].imms->X_add_number +=
9941                     encoding_length (insn_start_frag, insn_start_off, p);
9942                 }
9943               fix_new_exp (frag_now, p - frag_now->fr_literal, size,
9944                            i.op[n].imms, 0, reloc_type);
9945             }
9946         }
9947     }
9948 }
9949 \f
9950 /* x86_cons_fix_new is called via the expression parsing code when a
9951    reloc is needed.  We use this hook to get the correct .got reloc.  */
9952 static int cons_sign = -1;
9953
9954 void
9955 x86_cons_fix_new (fragS *frag, unsigned int off, unsigned int len,
9956                   expressionS *exp, bfd_reloc_code_real_type r)
9957 {
9958   r = reloc (len, 0, cons_sign, r);
9959
9960 #ifdef TE_PE
9961   if (exp->X_op == O_secrel)
9962     {
9963       exp->X_op = O_symbol;
9964       r = BFD_RELOC_32_SECREL;
9965     }
9966 #endif
9967
9968   fix_new_exp (frag, off, len, exp, 0, r);
9969 }
9970
9971 /* Export the ABI address size for use by TC_ADDRESS_BYTES for the
9972    purpose of the `.dc.a' internal pseudo-op.  */
9973
9974 int
9975 x86_address_bytes (void)
9976 {
9977   if ((stdoutput->arch_info->mach & bfd_mach_x64_32))
9978     return 4;
9979   return stdoutput->arch_info->bits_per_address / 8;
9980 }
9981
9982 #if !(defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) || defined (OBJ_MACH_O)) \
9983     || defined (LEX_AT)
9984 # define lex_got(reloc, adjust, types) NULL
9985 #else
9986 /* Parse operands of the form
9987    <symbol>@GOTOFF+<nnn>
9988    and similar .plt or .got references.
9989
9990    If we find one, set up the correct relocation in RELOC and copy the
9991    input string, minus the `@GOTOFF' into a malloc'd buffer for
9992    parsing by the calling routine.  Return this buffer, and if ADJUST
9993    is non-null set it to the length of the string we removed from the
9994    input line.  Otherwise return NULL.  */
9995 static char *
9996 lex_got (enum bfd_reloc_code_real *rel,
9997          int *adjust,
9998          i386_operand_type *types)
9999 {
10000   /* Some of the relocations depend on the size of what field is to
10001      be relocated.  But in our callers i386_immediate and i386_displacement
10002      we don't yet know the operand size (this will be set by insn
10003      matching).  Hence we record the word32 relocation here,
10004      and adjust the reloc according to the real size in reloc().  */
10005   static const struct {
10006     const char *str;
10007     int len;
10008     const enum bfd_reloc_code_real rel[2];
10009     const i386_operand_type types64;
10010     bfd_boolean need_GOT_symbol;
10011   } gotrel[] = {
10012 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
10013     { STRING_COMMA_LEN ("SIZE"),      { BFD_RELOC_SIZE32,
10014                                         BFD_RELOC_SIZE32 },
10015       OPERAND_TYPE_IMM32_64, FALSE },
10016 #endif
10017     { STRING_COMMA_LEN ("PLTOFF"),   { _dummy_first_bfd_reloc_code_real,
10018                                        BFD_RELOC_X86_64_PLTOFF64 },
10019       OPERAND_TYPE_IMM64, TRUE },
10020     { STRING_COMMA_LEN ("PLT"),      { BFD_RELOC_386_PLT32,
10021                                        BFD_RELOC_X86_64_PLT32    },
10022       OPERAND_TYPE_IMM32_32S_DISP32, FALSE },
10023     { STRING_COMMA_LEN ("GOTPLT"),   { _dummy_first_bfd_reloc_code_real,
10024                                        BFD_RELOC_X86_64_GOTPLT64 },
10025       OPERAND_TYPE_IMM64_DISP64, TRUE },
10026     { STRING_COMMA_LEN ("GOTOFF"),   { BFD_RELOC_386_GOTOFF,
10027                                        BFD_RELOC_X86_64_GOTOFF64 },
10028       OPERAND_TYPE_IMM64_DISP64, TRUE },
10029     { STRING_COMMA_LEN ("GOTPCREL"), { _dummy_first_bfd_reloc_code_real,
10030                                        BFD_RELOC_X86_64_GOTPCREL },
10031       OPERAND_TYPE_IMM32_32S_DISP32, TRUE },
10032     { STRING_COMMA_LEN ("TLSGD"),    { BFD_RELOC_386_TLS_GD,
10033                                        BFD_RELOC_X86_64_TLSGD    },
10034       OPERAND_TYPE_IMM32_32S_DISP32, TRUE },
10035     { STRING_COMMA_LEN ("TLSLDM"),   { BFD_RELOC_386_TLS_LDM,
10036                                        _dummy_first_bfd_reloc_code_real },
10037       OPERAND_TYPE_NONE, TRUE },
10038     { STRING_COMMA_LEN ("TLSLD"),    { _dummy_first_bfd_reloc_code_real,
10039                                        BFD_RELOC_X86_64_TLSLD    },
10040       OPERAND_TYPE_IMM32_32S_DISP32, TRUE },
10041     { STRING_COMMA_LEN ("GOTTPOFF"), { BFD_RELOC_386_TLS_IE_32,
10042                                        BFD_RELOC_X86_64_GOTTPOFF },
10043       OPERAND_TYPE_IMM32_32S_DISP32, TRUE },
10044     { STRING_COMMA_LEN ("TPOFF"),    { BFD_RELOC_386_TLS_LE_32,
10045                                        BFD_RELOC_X86_64_TPOFF32  },
10046       OPERAND_TYPE_IMM32_32S_64_DISP32_64, TRUE },
10047     { STRING_COMMA_LEN ("NTPOFF"),   { BFD_RELOC_386_TLS_LE,
10048                                        _dummy_first_bfd_reloc_code_real },
10049       OPERAND_TYPE_NONE, TRUE },
10050     { STRING_COMMA_LEN ("DTPOFF"),   { BFD_RELOC_386_TLS_LDO_32,
10051                                        BFD_RELOC_X86_64_DTPOFF32 },
10052       OPERAND_TYPE_IMM32_32S_64_DISP32_64, TRUE },
10053     { STRING_COMMA_LEN ("GOTNTPOFF"),{ BFD_RELOC_386_TLS_GOTIE,
10054                                        _dummy_first_bfd_reloc_code_real },
10055       OPERAND_TYPE_NONE, TRUE },
10056     { STRING_COMMA_LEN ("INDNTPOFF"),{ BFD_RELOC_386_TLS_IE,
10057                                        _dummy_first_bfd_reloc_code_real },
10058       OPERAND_TYPE_NONE, TRUE },
10059     { STRING_COMMA_LEN ("GOT"),      { BFD_RELOC_386_GOT32,
10060                                        BFD_RELOC_X86_64_GOT32    },
10061       OPERAND_TYPE_IMM32_32S_64_DISP32, TRUE },
10062     { STRING_COMMA_LEN ("TLSDESC"),  { BFD_RELOC_386_TLS_GOTDESC,
10063                                        BFD_RELOC_X86_64_GOTPC32_TLSDESC },
10064       OPERAND_TYPE_IMM32_32S_DISP32, TRUE },
10065     { STRING_COMMA_LEN ("TLSCALL"),  { BFD_RELOC_386_TLS_DESC_CALL,
10066                                        BFD_RELOC_X86_64_TLSDESC_CALL },
10067       OPERAND_TYPE_IMM32_32S_DISP32, TRUE },
10068   };
10069   char *cp;
10070   unsigned int j;
10071
10072 #if defined (OBJ_MAYBE_ELF)
10073   if (!IS_ELF)
10074     return NULL;
10075 #endif
10076
10077   for (cp = input_line_pointer; *cp != '@'; cp++)
10078     if (is_end_of_line[(unsigned char) *cp] || *cp == ',')
10079       return NULL;
10080
10081   for (j = 0; j < ARRAY_SIZE (gotrel); j++)
10082     {
10083       int len = gotrel[j].len;
10084       if (strncasecmp (cp + 1, gotrel[j].str, len) == 0)
10085         {
10086           if (gotrel[j].rel[object_64bit] != 0)
10087             {
10088               int first, second;
10089               char *tmpbuf, *past_reloc;
10090
10091               *rel = gotrel[j].rel[object_64bit];
10092
10093               if (types)
10094                 {
10095                   if (flag_code != CODE_64BIT)
10096                     {
10097                       types->bitfield.imm32 = 1;
10098                       types->bitfield.disp32 = 1;
10099                     }
10100                   else
10101                     *types = gotrel[j].types64;
10102                 }
10103
10104               if (gotrel[j].need_GOT_symbol && GOT_symbol == NULL)
10105                 GOT_symbol = symbol_find_or_make (GLOBAL_OFFSET_TABLE_NAME);
10106
10107               /* The length of the first part of our input line.  */
10108               first = cp - input_line_pointer;
10109
10110               /* The second part goes from after the reloc token until
10111                  (and including) an end_of_line char or comma.  */
10112               past_reloc = cp + 1 + len;
10113               cp = past_reloc;
10114               while (!is_end_of_line[(unsigned char) *cp] && *cp != ',')
10115                 ++cp;
10116               second = cp + 1 - past_reloc;
10117
10118               /* Allocate and copy string.  The trailing NUL shouldn't
10119                  be necessary, but be safe.  */
10120               tmpbuf = XNEWVEC (char, first + second + 2);
10121               memcpy (tmpbuf, input_line_pointer, first);
10122               if (second != 0 && *past_reloc != ' ')
10123                 /* Replace the relocation token with ' ', so that
10124                    errors like foo@GOTOFF1 will be detected.  */
10125                 tmpbuf[first++] = ' ';
10126               else
10127                 /* Increment length by 1 if the relocation token is
10128                    removed.  */
10129                 len++;
10130               if (adjust)
10131                 *adjust = len;
10132               memcpy (tmpbuf + first, past_reloc, second);
10133               tmpbuf[first + second] = '\0';
10134               return tmpbuf;
10135             }
10136
10137           as_bad (_("@%s reloc is not supported with %d-bit output format"),
10138                   gotrel[j].str, 1 << (5 + object_64bit));
10139           return NULL;
10140         }
10141     }
10142
10143   /* Might be a symbol version string.  Don't as_bad here.  */
10144   return NULL;
10145 }
10146 #endif
10147
10148 #ifdef TE_PE
10149 #ifdef lex_got
10150 #undef lex_got
10151 #endif
10152 /* Parse operands of the form
10153    <symbol>@SECREL32+<nnn>
10154
10155    If we find one, set up the correct relocation in RELOC and copy the
10156    input string, minus the `@SECREL32' into a malloc'd buffer for
10157    parsing by the calling routine.  Return this buffer, and if ADJUST
10158    is non-null set it to the length of the string we removed from the
10159    input line.  Otherwise return NULL.
10160
10161    This function is copied from the ELF version above adjusted for PE targets.  */
10162
10163 static char *
10164 lex_got (enum bfd_reloc_code_real *rel ATTRIBUTE_UNUSED,
10165          int *adjust ATTRIBUTE_UNUSED,
10166          i386_operand_type *types)
10167 {
10168   static const struct
10169   {
10170     const char *str;
10171     int len;
10172     const enum bfd_reloc_code_real rel[2];
10173     const i386_operand_type types64;
10174   }
10175   gotrel[] =
10176   {
10177     { STRING_COMMA_LEN ("SECREL32"),    { BFD_RELOC_32_SECREL,
10178                                           BFD_RELOC_32_SECREL },
10179       OPERAND_TYPE_IMM32_32S_64_DISP32_64 },
10180   };
10181
10182   char *cp;
10183   unsigned j;
10184
10185   for (cp = input_line_pointer; *cp != '@'; cp++)
10186     if (is_end_of_line[(unsigned char) *cp] || *cp == ',')
10187       return NULL;
10188
10189   for (j = 0; j < ARRAY_SIZE (gotrel); j++)
10190     {
10191       int len = gotrel[j].len;
10192
10193       if (strncasecmp (cp + 1, gotrel[j].str, len) == 0)
10194         {
10195           if (gotrel[j].rel[object_64bit] != 0)
10196             {
10197               int first, second;
10198               char *tmpbuf, *past_reloc;
10199
10200               *rel = gotrel[j].rel[object_64bit];
10201               if (adjust)
10202                 *adjust = len;
10203
10204               if (types)
10205                 {
10206                   if (flag_code != CODE_64BIT)
10207                     {
10208                       types->bitfield.imm32 = 1;
10209                       types->bitfield.disp32 = 1;
10210                     }
10211                   else
10212                     *types = gotrel[j].types64;
10213                 }
10214
10215               /* The length of the first part of our input line.  */
10216               first = cp - input_line_pointer;
10217
10218               /* The second part goes from after the reloc token until
10219                  (and including) an end_of_line char or comma.  */
10220               past_reloc = cp + 1 + len;
10221               cp = past_reloc;
10222               while (!is_end_of_line[(unsigned char) *cp] && *cp != ',')
10223                 ++cp;
10224               second = cp + 1 - past_reloc;
10225
10226               /* Allocate and copy string.  The trailing NUL shouldn't
10227                  be necessary, but be safe.  */
10228               tmpbuf = XNEWVEC (char, first + second + 2);
10229               memcpy (tmpbuf, input_line_pointer, first);
10230               if (second != 0 && *past_reloc != ' ')
10231                 /* Replace the relocation token with ' ', so that
10232                    errors like foo@SECLREL321 will be detected.  */
10233                 tmpbuf[first++] = ' ';
10234               memcpy (tmpbuf + first, past_reloc, second);
10235               tmpbuf[first + second] = '\0';
10236               return tmpbuf;
10237             }
10238
10239           as_bad (_("@%s reloc is not supported with %d-bit output format"),
10240                   gotrel[j].str, 1 << (5 + object_64bit));
10241           return NULL;
10242         }
10243     }
10244
10245   /* Might be a symbol version string.  Don't as_bad here.  */
10246   return NULL;
10247 }
10248
10249 #endif /* TE_PE */
10250
10251 bfd_reloc_code_real_type
10252 x86_cons (expressionS *exp, int size)
10253 {
10254   bfd_reloc_code_real_type got_reloc = NO_RELOC;
10255
10256   intel_syntax = -intel_syntax;
10257
10258   exp->X_md = 0;
10259   if (size == 4 || (object_64bit && size == 8))
10260     {
10261       /* Handle @GOTOFF and the like in an expression.  */
10262       char *save;
10263       char *gotfree_input_line;
10264       int adjust = 0;
10265
10266       save = input_line_pointer;
10267       gotfree_input_line = lex_got (&got_reloc, &adjust, NULL);
10268       if (gotfree_input_line)
10269         input_line_pointer = gotfree_input_line;
10270
10271       expression (exp);
10272
10273       if (gotfree_input_line)
10274         {
10275           /* expression () has merrily parsed up to the end of line,
10276              or a comma - in the wrong buffer.  Transfer how far
10277              input_line_pointer has moved to the right buffer.  */
10278           input_line_pointer = (save
10279                                 + (input_line_pointer - gotfree_input_line)
10280                                 + adjust);
10281           free (gotfree_input_line);
10282           if (exp->X_op == O_constant
10283               || exp->X_op == O_absent
10284               || exp->X_op == O_illegal
10285               || exp->X_op == O_register
10286               || exp->X_op == O_big)
10287             {
10288               char c = *input_line_pointer;
10289               *input_line_pointer = 0;
10290               as_bad (_("missing or invalid expression `%s'"), save);
10291               *input_line_pointer = c;
10292             }
10293           else if ((got_reloc == BFD_RELOC_386_PLT32
10294                     || got_reloc == BFD_RELOC_X86_64_PLT32)
10295                    && exp->X_op != O_symbol)
10296             {
10297               char c = *input_line_pointer;
10298               *input_line_pointer = 0;
10299               as_bad (_("invalid PLT expression `%s'"), save);
10300               *input_line_pointer = c;
10301             }
10302         }
10303     }
10304   else
10305     expression (exp);
10306
10307   intel_syntax = -intel_syntax;
10308
10309   if (intel_syntax)
10310     i386_intel_simplify (exp);
10311
10312   return got_reloc;
10313 }
10314
10315 static void
10316 signed_cons (int size)
10317 {
10318   if (flag_code == CODE_64BIT)
10319     cons_sign = 1;
10320   cons (size);
10321   cons_sign = -1;
10322 }
10323
10324 #ifdef TE_PE
10325 static void
10326 pe_directive_secrel (int dummy ATTRIBUTE_UNUSED)
10327 {
10328   expressionS exp;
10329
10330   do
10331     {
10332       expression (&exp);
10333       if (exp.X_op == O_symbol)
10334         exp.X_op = O_secrel;
10335
10336       emit_expr (&exp, 4);
10337     }
10338   while (*input_line_pointer++ == ',');
10339
10340   input_line_pointer--;
10341   demand_empty_rest_of_line ();
10342 }
10343 #endif
10344
10345 /* Handle Vector operations.  */
10346
10347 static char *
10348 check_VecOperations (char *op_string, char *op_end)
10349 {
10350   const reg_entry *mask;
10351   const char *saved;
10352   char *end_op;
10353
10354   while (*op_string
10355          && (op_end == NULL || op_string < op_end))
10356     {
10357       saved = op_string;
10358       if (*op_string == '{')
10359         {
10360           op_string++;
10361
10362           /* Check broadcasts.  */
10363           if (strncmp (op_string, "1to", 3) == 0)
10364             {
10365               int bcst_type;
10366
10367               if (i.broadcast)
10368                 goto duplicated_vec_op;
10369
10370               op_string += 3;
10371               if (*op_string == '8')
10372                 bcst_type = 8;
10373               else if (*op_string == '4')
10374                 bcst_type = 4;
10375               else if (*op_string == '2')
10376                 bcst_type = 2;
10377               else if (*op_string == '1'
10378                        && *(op_string+1) == '6')
10379                 {
10380                   bcst_type = 16;
10381                   op_string++;
10382                 }
10383               else
10384                 {
10385                   as_bad (_("Unsupported broadcast: `%s'"), saved);
10386                   return NULL;
10387                 }
10388               op_string++;
10389
10390               broadcast_op.type = bcst_type;
10391               broadcast_op.operand = this_operand;
10392               broadcast_op.bytes = 0;
10393               i.broadcast = &broadcast_op;
10394             }
10395           /* Check masking operation.  */
10396           else if ((mask = parse_register (op_string, &end_op)) != NULL)
10397             {
10398               if (mask == &bad_reg)
10399                 return NULL;
10400
10401               /* k0 can't be used for write mask.  */
10402               if (mask->reg_type.bitfield.class != RegMask || !mask->reg_num)
10403                 {
10404                   as_bad (_("`%s%s' can't be used for write mask"),
10405                           register_prefix, mask->reg_name);
10406                   return NULL;
10407                 }
10408
10409               if (!i.mask)
10410                 {
10411                   mask_op.mask = mask;
10412                   mask_op.zeroing = 0;
10413                   mask_op.operand = this_operand;
10414                   i.mask = &mask_op;
10415                 }
10416               else
10417                 {
10418                   if (i.mask->mask)
10419                     goto duplicated_vec_op;
10420
10421                   i.mask->mask = mask;
10422
10423                   /* Only "{z}" is allowed here.  No need to check
10424                      zeroing mask explicitly.  */
10425                   if (i.mask->operand != this_operand)
10426                     {
10427                       as_bad (_("invalid write mask `%s'"), saved);
10428                       return NULL;
10429                     }
10430                 }
10431
10432               op_string = end_op;
10433             }
10434           /* Check zeroing-flag for masking operation.  */
10435           else if (*op_string == 'z')
10436             {
10437               if (!i.mask)
10438                 {
10439                   mask_op.mask = NULL;
10440                   mask_op.zeroing = 1;
10441                   mask_op.operand = this_operand;
10442                   i.mask = &mask_op;
10443                 }
10444               else
10445                 {
10446                   if (i.mask->zeroing)
10447                     {
10448                     duplicated_vec_op:
10449                       as_bad (_("duplicated `%s'"), saved);
10450                       return NULL;
10451                     }
10452
10453                   i.mask->zeroing = 1;
10454
10455                   /* Only "{%k}" is allowed here.  No need to check mask
10456                      register explicitly.  */
10457                   if (i.mask->operand != this_operand)
10458                     {
10459                       as_bad (_("invalid zeroing-masking `%s'"),
10460                               saved);
10461                       return NULL;
10462                     }
10463                 }
10464
10465               op_string++;
10466             }
10467           else
10468             goto unknown_vec_op;
10469
10470           if (*op_string != '}')
10471             {
10472               as_bad (_("missing `}' in `%s'"), saved);
10473               return NULL;
10474             }
10475           op_string++;
10476
10477           /* Strip whitespace since the addition of pseudo prefixes
10478              changed how the scrubber treats '{'.  */
10479           if (is_space_char (*op_string))
10480             ++op_string;
10481
10482           continue;
10483         }
10484     unknown_vec_op:
10485       /* We don't know this one.  */
10486       as_bad (_("unknown vector operation: `%s'"), saved);
10487       return NULL;
10488     }
10489
10490   if (i.mask && i.mask->zeroing && !i.mask->mask)
10491     {
10492       as_bad (_("zeroing-masking only allowed with write mask"));
10493       return NULL;
10494     }
10495
10496   return op_string;
10497 }
10498
10499 static int
10500 i386_immediate (char *imm_start)
10501 {
10502   char *save_input_line_pointer;
10503   char *gotfree_input_line;
10504   segT exp_seg = 0;
10505   expressionS *exp;
10506   i386_operand_type types;
10507
10508   operand_type_set (&types, ~0);
10509
10510   if (i.imm_operands == MAX_IMMEDIATE_OPERANDS)
10511     {
10512       as_bad (_("at most %d immediate operands are allowed"),
10513               MAX_IMMEDIATE_OPERANDS);
10514       return 0;
10515     }
10516
10517   exp = &im_expressions[i.imm_operands++];
10518   i.op[this_operand].imms = exp;
10519
10520   if (is_space_char (*imm_start))
10521     ++imm_start;
10522
10523   save_input_line_pointer = input_line_pointer;
10524   input_line_pointer = imm_start;
10525
10526   gotfree_input_line = lex_got (&i.reloc[this_operand], NULL, &types);
10527   if (gotfree_input_line)
10528     input_line_pointer = gotfree_input_line;
10529
10530   exp_seg = expression (exp);
10531
10532   SKIP_WHITESPACE ();
10533
10534   /* Handle vector operations.  */
10535   if (*input_line_pointer == '{')
10536     {
10537       input_line_pointer = check_VecOperations (input_line_pointer,
10538                                                 NULL);
10539       if (input_line_pointer == NULL)
10540         return 0;
10541     }
10542
10543   if (*input_line_pointer)
10544     as_bad (_("junk `%s' after expression"), input_line_pointer);
10545
10546   input_line_pointer = save_input_line_pointer;
10547   if (gotfree_input_line)
10548     {
10549       free (gotfree_input_line);
10550
10551       if (exp->X_op == O_constant || exp->X_op == O_register)
10552         exp->X_op = O_illegal;
10553     }
10554
10555   return i386_finalize_immediate (exp_seg, exp, types, imm_start);
10556 }
10557
10558 static int
10559 i386_finalize_immediate (segT exp_seg ATTRIBUTE_UNUSED, expressionS *exp,
10560                          i386_operand_type types, const char *imm_start)
10561 {
10562   if (exp->X_op == O_absent || exp->X_op == O_illegal || exp->X_op == O_big)
10563     {
10564       if (imm_start)
10565         as_bad (_("missing or invalid immediate expression `%s'"),
10566                 imm_start);
10567       return 0;
10568     }
10569   else if (exp->X_op == O_constant)
10570     {
10571       /* Size it properly later.  */
10572       i.types[this_operand].bitfield.imm64 = 1;
10573       /* If not 64bit, sign extend val.  */
10574       if (flag_code != CODE_64BIT
10575           && (exp->X_add_number & ~(((addressT) 2 << 31) - 1)) == 0)
10576         exp->X_add_number
10577           = (exp->X_add_number ^ ((addressT) 1 << 31)) - ((addressT) 1 << 31);
10578     }
10579 #if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
10580   else if (OUTPUT_FLAVOR == bfd_target_aout_flavour
10581            && exp_seg != absolute_section
10582            && exp_seg != text_section
10583            && exp_seg != data_section
10584            && exp_seg != bss_section
10585            && exp_seg != undefined_section
10586            && !bfd_is_com_section (exp_seg))
10587     {
10588       as_bad (_("unimplemented segment %s in operand"), exp_seg->name);
10589       return 0;
10590     }
10591 #endif
10592   else if (!intel_syntax && exp_seg == reg_section)
10593     {
10594       if (imm_start)
10595         as_bad (_("illegal immediate register operand %s"), imm_start);
10596       return 0;
10597     }
10598   else
10599     {
10600       /* This is an address.  The size of the address will be
10601          determined later, depending on destination register,
10602          suffix, or the default for the section.  */
10603       i.types[this_operand].bitfield.imm8 = 1;
10604       i.types[this_operand].bitfield.imm16 = 1;
10605       i.types[this_operand].bitfield.imm32 = 1;
10606       i.types[this_operand].bitfield.imm32s = 1;
10607       i.types[this_operand].bitfield.imm64 = 1;
10608       i.types[this_operand] = operand_type_and (i.types[this_operand],
10609                                                 types);
10610     }
10611
10612   return 1;
10613 }
10614
10615 static char *
10616 i386_scale (char *scale)
10617 {
10618   offsetT val;
10619   char *save = input_line_pointer;
10620
10621   input_line_pointer = scale;
10622   val = get_absolute_expression ();
10623
10624   switch (val)
10625     {
10626     case 1:
10627       i.log2_scale_factor = 0;
10628       break;
10629     case 2:
10630       i.log2_scale_factor = 1;
10631       break;
10632     case 4:
10633       i.log2_scale_factor = 2;
10634       break;
10635     case 8:
10636       i.log2_scale_factor = 3;
10637       break;
10638     default:
10639       {
10640         char sep = *input_line_pointer;
10641
10642         *input_line_pointer = '\0';
10643         as_bad (_("expecting scale factor of 1, 2, 4, or 8: got `%s'"),
10644                 scale);
10645         *input_line_pointer = sep;
10646         input_line_pointer = save;
10647         return NULL;
10648       }
10649     }
10650   if (i.log2_scale_factor != 0 && i.index_reg == 0)
10651     {
10652       as_warn (_("scale factor of %d without an index register"),
10653                1 << i.log2_scale_factor);
10654       i.log2_scale_factor = 0;
10655     }
10656   scale = input_line_pointer;
10657   input_line_pointer = save;
10658   return scale;
10659 }
10660
10661 static int
10662 i386_displacement (char *disp_start, char *disp_end)
10663 {
10664   expressionS *exp;
10665   segT exp_seg = 0;
10666   char *save_input_line_pointer;
10667   char *gotfree_input_line;
10668   int override;
10669   i386_operand_type bigdisp, types = anydisp;
10670   int ret;
10671
10672   if (i.disp_operands == MAX_MEMORY_OPERANDS)
10673     {
10674       as_bad (_("at most %d displacement operands are allowed"),
10675               MAX_MEMORY_OPERANDS);
10676       return 0;
10677     }
10678
10679   operand_type_set (&bigdisp, 0);
10680   if (i.jumpabsolute
10681       || i.types[this_operand].bitfield.baseindex
10682       || (current_templates->start->opcode_modifier.jump != JUMP
10683           && current_templates->start->opcode_modifier.jump != JUMP_DWORD))
10684     {
10685       i386_addressing_mode ();
10686       override = (i.prefix[ADDR_PREFIX] != 0);
10687       if (flag_code == CODE_64BIT)
10688         {
10689           if (!override)
10690             {
10691               bigdisp.bitfield.disp32s = 1;
10692               bigdisp.bitfield.disp64 = 1;
10693             }
10694           else
10695             bigdisp.bitfield.disp32 = 1;
10696         }
10697       else if ((flag_code == CODE_16BIT) ^ override)
10698           bigdisp.bitfield.disp16 = 1;
10699       else
10700           bigdisp.bitfield.disp32 = 1;
10701     }
10702   else
10703     {
10704       /* For PC-relative branches, the width of the displacement may be
10705          dependent upon data size, but is never dependent upon address size.
10706          Also make sure to not unintentionally match against a non-PC-relative
10707          branch template.  */
10708       static templates aux_templates;
10709       const insn_template *t = current_templates->start;
10710       bfd_boolean has_intel64 = FALSE;
10711
10712       aux_templates.start = t;
10713       while (++t < current_templates->end)
10714         {
10715           if (t->opcode_modifier.jump
10716               != current_templates->start->opcode_modifier.jump)
10717             break;
10718           if ((t->opcode_modifier.isa64 >= INTEL64))
10719             has_intel64 = TRUE;
10720         }
10721       if (t < current_templates->end)
10722         {
10723           aux_templates.end = t;
10724           current_templates = &aux_templates;
10725         }
10726
10727       override = (i.prefix[DATA_PREFIX] != 0);
10728       if (flag_code == CODE_64BIT)
10729         {
10730           if ((override || i.suffix == WORD_MNEM_SUFFIX)
10731               && (!intel64 || !has_intel64))
10732             bigdisp.bitfield.disp16 = 1;
10733           else
10734             bigdisp.bitfield.disp32s = 1;
10735         }
10736       else
10737         {
10738           if (!override)
10739             override = (i.suffix == (flag_code != CODE_16BIT
10740                                      ? WORD_MNEM_SUFFIX
10741                                      : LONG_MNEM_SUFFIX));
10742           bigdisp.bitfield.disp32 = 1;
10743           if ((flag_code == CODE_16BIT) ^ override)
10744             {
10745               bigdisp.bitfield.disp32 = 0;
10746               bigdisp.bitfield.disp16 = 1;
10747             }
10748         }
10749     }
10750   i.types[this_operand] = operand_type_or (i.types[this_operand],
10751                                            bigdisp);
10752
10753   exp = &disp_expressions[i.disp_operands];
10754   i.op[this_operand].disps = exp;
10755   i.disp_operands++;
10756   save_input_line_pointer = input_line_pointer;
10757   input_line_pointer = disp_start;
10758   END_STRING_AND_SAVE (disp_end);
10759
10760 #ifndef GCC_ASM_O_HACK
10761 #define GCC_ASM_O_HACK 0
10762 #endif
10763 #if GCC_ASM_O_HACK
10764   END_STRING_AND_SAVE (disp_end + 1);
10765   if (i.types[this_operand].bitfield.baseIndex
10766       && displacement_string_end[-1] == '+')
10767     {
10768       /* This hack is to avoid a warning when using the "o"
10769          constraint within gcc asm statements.
10770          For instance:
10771
10772          #define _set_tssldt_desc(n,addr,limit,type) \
10773          __asm__ __volatile__ ( \
10774          "movw %w2,%0\n\t" \
10775          "movw %w1,2+%0\n\t" \
10776          "rorl $16,%1\n\t" \
10777          "movb %b1,4+%0\n\t" \
10778          "movb %4,5+%0\n\t" \
10779          "movb $0,6+%0\n\t" \
10780          "movb %h1,7+%0\n\t" \
10781          "rorl $16,%1" \
10782          : "=o"(*(n)) : "q" (addr), "ri"(limit), "i"(type))
10783
10784          This works great except that the output assembler ends
10785          up looking a bit weird if it turns out that there is
10786          no offset.  You end up producing code that looks like:
10787
10788          #APP
10789          movw $235,(%eax)
10790          movw %dx,2+(%eax)
10791          rorl $16,%edx
10792          movb %dl,4+(%eax)
10793          movb $137,5+(%eax)
10794          movb $0,6+(%eax)
10795          movb %dh,7+(%eax)
10796          rorl $16,%edx
10797          #NO_APP
10798
10799          So here we provide the missing zero.  */
10800
10801       *displacement_string_end = '0';
10802     }
10803 #endif
10804   gotfree_input_line = lex_got (&i.reloc[this_operand], NULL, &types);
10805   if (gotfree_input_line)
10806     input_line_pointer = gotfree_input_line;
10807
10808   exp_seg = expression (exp);
10809
10810   SKIP_WHITESPACE ();
10811   if (*input_line_pointer)
10812     as_bad (_("junk `%s' after expression"), input_line_pointer);
10813 #if GCC_ASM_O_HACK
10814   RESTORE_END_STRING (disp_end + 1);
10815 #endif
10816   input_line_pointer = save_input_line_pointer;
10817   if (gotfree_input_line)
10818     {
10819       free (gotfree_input_line);
10820
10821       if (exp->X_op == O_constant || exp->X_op == O_register)
10822         exp->X_op = O_illegal;
10823     }
10824
10825   ret = i386_finalize_displacement (exp_seg, exp, types, disp_start);
10826
10827   RESTORE_END_STRING (disp_end);
10828
10829   return ret;
10830 }
10831
10832 static int
10833 i386_finalize_displacement (segT exp_seg ATTRIBUTE_UNUSED, expressionS *exp,
10834                             i386_operand_type types, const char *disp_start)
10835 {
10836   i386_operand_type bigdisp;
10837   int ret = 1;
10838
10839   /* We do this to make sure that the section symbol is in
10840      the symbol table.  We will ultimately change the relocation
10841      to be relative to the beginning of the section.  */
10842   if (i.reloc[this_operand] == BFD_RELOC_386_GOTOFF
10843       || i.reloc[this_operand] == BFD_RELOC_X86_64_GOTPCREL
10844       || i.reloc[this_operand] == BFD_RELOC_X86_64_GOTOFF64)
10845     {
10846       if (exp->X_op != O_symbol)
10847         goto inv_disp;
10848
10849       if (S_IS_LOCAL (exp->X_add_symbol)
10850           && S_GET_SEGMENT (exp->X_add_symbol) != undefined_section
10851           && S_GET_SEGMENT (exp->X_add_symbol) != expr_section)
10852         section_symbol (S_GET_SEGMENT (exp->X_add_symbol));
10853       exp->X_op = O_subtract;
10854       exp->X_op_symbol = GOT_symbol;
10855       if (i.reloc[this_operand] == BFD_RELOC_X86_64_GOTPCREL)
10856         i.reloc[this_operand] = BFD_RELOC_32_PCREL;
10857       else if (i.reloc[this_operand] == BFD_RELOC_X86_64_GOTOFF64)
10858         i.reloc[this_operand] = BFD_RELOC_64;
10859       else
10860         i.reloc[this_operand] = BFD_RELOC_32;
10861     }
10862
10863   else if (exp->X_op == O_absent
10864            || exp->X_op == O_illegal
10865            || exp->X_op == O_big)
10866     {
10867     inv_disp:
10868       as_bad (_("missing or invalid displacement expression `%s'"),
10869               disp_start);
10870       ret = 0;
10871     }
10872
10873   else if (flag_code == CODE_64BIT
10874            && !i.prefix[ADDR_PREFIX]
10875            && exp->X_op == O_constant)
10876     {
10877       /* Since displacement is signed extended to 64bit, don't allow
10878          disp32 and turn off disp32s if they are out of range.  */
10879       i.types[this_operand].bitfield.disp32 = 0;
10880       if (!fits_in_signed_long (exp->X_add_number))
10881         {
10882           i.types[this_operand].bitfield.disp32s = 0;
10883           if (i.types[this_operand].bitfield.baseindex)
10884             {
10885               as_bad (_("0x%lx out range of signed 32bit displacement"),
10886                       (long) exp->X_add_number);
10887               ret = 0;
10888             }
10889         }
10890     }
10891
10892 #if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
10893   else if (exp->X_op != O_constant
10894            && OUTPUT_FLAVOR == bfd_target_aout_flavour
10895            && exp_seg != absolute_section
10896            && exp_seg != text_section
10897            && exp_seg != data_section
10898            && exp_seg != bss_section
10899            && exp_seg != undefined_section
10900            && !bfd_is_com_section (exp_seg))
10901     {
10902       as_bad (_("unimplemented segment %s in operand"), exp_seg->name);
10903       ret = 0;
10904     }
10905 #endif
10906
10907   if (current_templates->start->opcode_modifier.jump == JUMP_BYTE
10908       /* Constants get taken care of by optimize_disp().  */
10909       && exp->X_op != O_constant)
10910     i.types[this_operand].bitfield.disp8 = 1;
10911
10912   /* Check if this is a displacement only operand.  */
10913   bigdisp = i.types[this_operand];
10914   bigdisp.bitfield.disp8 = 0;
10915   bigdisp.bitfield.disp16 = 0;
10916   bigdisp.bitfield.disp32 = 0;
10917   bigdisp.bitfield.disp32s = 0;
10918   bigdisp.bitfield.disp64 = 0;
10919   if (operand_type_all_zero (&bigdisp))
10920     i.types[this_operand] = operand_type_and (i.types[this_operand],
10921                                               types);
10922
10923   return ret;
10924 }
10925
10926 /* Return the active addressing mode, taking address override and
10927    registers forming the address into consideration.  Update the
10928    address override prefix if necessary.  */
10929
10930 static enum flag_code
10931 i386_addressing_mode (void)
10932 {
10933   enum flag_code addr_mode;
10934
10935   if (i.prefix[ADDR_PREFIX])
10936     addr_mode = flag_code == CODE_32BIT ? CODE_16BIT : CODE_32BIT;
10937   else if (flag_code == CODE_16BIT
10938            && current_templates->start->cpu_flags.bitfield.cpumpx
10939            /* Avoid replacing the "16-bit addressing not allowed" diagnostic
10940               from md_assemble() by "is not a valid base/index expression"
10941               when there is a base and/or index.  */
10942            && !i.types[this_operand].bitfield.baseindex)
10943     {
10944       /* MPX insn memory operands with neither base nor index must be forced
10945          to use 32-bit addressing in 16-bit mode.  */
10946       addr_mode = CODE_32BIT;
10947       i.prefix[ADDR_PREFIX] = ADDR_PREFIX_OPCODE;
10948       ++i.prefixes;
10949       gas_assert (!i.types[this_operand].bitfield.disp16);
10950       gas_assert (!i.types[this_operand].bitfield.disp32);
10951     }
10952   else
10953     {
10954       addr_mode = flag_code;
10955
10956 #if INFER_ADDR_PREFIX
10957       if (i.mem_operands == 0)
10958         {
10959           /* Infer address prefix from the first memory operand.  */
10960           const reg_entry *addr_reg = i.base_reg;
10961
10962           if (addr_reg == NULL)
10963             addr_reg = i.index_reg;
10964
10965           if (addr_reg)
10966             {
10967               if (addr_reg->reg_type.bitfield.dword)
10968                 addr_mode = CODE_32BIT;
10969               else if (flag_code != CODE_64BIT
10970                        && addr_reg->reg_type.bitfield.word)
10971                 addr_mode = CODE_16BIT;
10972
10973               if (addr_mode != flag_code)
10974                 {
10975                   i.prefix[ADDR_PREFIX] = ADDR_PREFIX_OPCODE;
10976                   i.prefixes += 1;
10977                   /* Change the size of any displacement too.  At most one
10978                      of Disp16 or Disp32 is set.
10979                      FIXME.  There doesn't seem to be any real need for
10980                      separate Disp16 and Disp32 flags.  The same goes for
10981                      Imm16 and Imm32.  Removing them would probably clean
10982                      up the code quite a lot.  */
10983                   if (flag_code != CODE_64BIT
10984                       && (i.types[this_operand].bitfield.disp16
10985                           || i.types[this_operand].bitfield.disp32))
10986                     i.types[this_operand]
10987                       = operand_type_xor (i.types[this_operand], disp16_32);
10988                 }
10989             }
10990         }
10991 #endif
10992     }
10993
10994   return addr_mode;
10995 }
10996
10997 /* Make sure the memory operand we've been dealt is valid.
10998    Return 1 on success, 0 on a failure.  */
10999
11000 static int
11001 i386_index_check (const char *operand_string)
11002 {
11003   const char *kind = "base/index";
11004   enum flag_code addr_mode = i386_addressing_mode ();
11005   const insn_template *t = current_templates->start;
11006
11007   if (t->opcode_modifier.isstring
11008       && !t->cpu_flags.bitfield.cpupadlock
11009       && (current_templates->end[-1].opcode_modifier.isstring
11010           || i.mem_operands))
11011     {
11012       /* Memory operands of string insns are special in that they only allow
11013          a single register (rDI, rSI, or rBX) as their memory address.  */
11014       const reg_entry *expected_reg;
11015       static const char *di_si[][2] =
11016         {
11017           { "esi", "edi" },
11018           { "si", "di" },
11019           { "rsi", "rdi" }
11020         };
11021       static const char *bx[] = { "ebx", "bx", "rbx" };
11022
11023       kind = "string address";
11024
11025       if (t->opcode_modifier.prefixok == PrefixRep)
11026         {
11027           int es_op = current_templates->end[-1].opcode_modifier.isstring
11028                       - IS_STRING_ES_OP0;
11029           int op = 0;
11030
11031           if (!current_templates->end[-1].operand_types[0].bitfield.baseindex
11032               || ((!i.mem_operands != !intel_syntax)
11033                   && current_templates->end[-1].operand_types[1]
11034                      .bitfield.baseindex))
11035             op = 1;
11036           expected_reg
11037             = (const reg_entry *) str_hash_find (reg_hash,
11038                                                  di_si[addr_mode][op == es_op]);
11039         }
11040       else
11041         expected_reg
11042           = (const reg_entry *)str_hash_find (reg_hash, bx[addr_mode]);
11043
11044       if (i.base_reg != expected_reg
11045           || i.index_reg
11046           || operand_type_check (i.types[this_operand], disp))
11047         {
11048           /* The second memory operand must have the same size as
11049              the first one.  */
11050           if (i.mem_operands
11051               && i.base_reg
11052               && !((addr_mode == CODE_64BIT
11053                     && i.base_reg->reg_type.bitfield.qword)
11054                    || (addr_mode == CODE_32BIT
11055                        ? i.base_reg->reg_type.bitfield.dword
11056                        : i.base_reg->reg_type.bitfield.word)))
11057             goto bad_address;
11058
11059           as_warn (_("`%s' is not valid here (expected `%c%s%s%c')"),
11060                    operand_string,
11061                    intel_syntax ? '[' : '(',
11062                    register_prefix,
11063                    expected_reg->reg_name,
11064                    intel_syntax ? ']' : ')');
11065           return 1;
11066         }
11067       else
11068         return 1;
11069
11070     bad_address:
11071       as_bad (_("`%s' is not a valid %s expression"),
11072               operand_string, kind);
11073       return 0;
11074     }
11075   else
11076     {
11077       if (addr_mode != CODE_16BIT)
11078         {
11079           /* 32-bit/64-bit checks.  */
11080           if (i.disp_encoding == disp_encoding_16bit)
11081             {
11082             bad_disp:
11083               as_bad (_("invalid `%s' prefix"),
11084                       addr_mode == CODE_16BIT ? "{disp32}" : "{disp16}");
11085               return 0;
11086             }
11087
11088           if ((i.base_reg
11089                && ((addr_mode == CODE_64BIT
11090                     ? !i.base_reg->reg_type.bitfield.qword
11091                     : !i.base_reg->reg_type.bitfield.dword)
11092                    || (i.index_reg && i.base_reg->reg_num == RegIP)
11093                    || i.base_reg->reg_num == RegIZ))
11094               || (i.index_reg
11095                   && !i.index_reg->reg_type.bitfield.xmmword
11096                   && !i.index_reg->reg_type.bitfield.ymmword
11097                   && !i.index_reg->reg_type.bitfield.zmmword
11098                   && ((addr_mode == CODE_64BIT
11099                        ? !i.index_reg->reg_type.bitfield.qword
11100                        : !i.index_reg->reg_type.bitfield.dword)
11101                       || !i.index_reg->reg_type.bitfield.baseindex)))
11102             goto bad_address;
11103
11104           /* bndmk, bndldx, bndstx and mandatory non-vector SIB have special restrictions. */
11105           if ((t->opcode_modifier.opcodeprefix == PREFIX_0XF3
11106                && t->base_opcode == 0x0f1b)
11107               || (t->opcode_modifier.opcodeprefix == PREFIX_NONE
11108                   && (t->base_opcode & ~1) == 0x0f1a)
11109               || t->opcode_modifier.sib == SIBMEM)
11110             {
11111               /* They cannot use RIP-relative addressing. */
11112               if (i.base_reg && i.base_reg->reg_num == RegIP)
11113                 {
11114                   as_bad (_("`%s' cannot be used here"), operand_string);
11115                   return 0;
11116                 }
11117
11118               /* bndldx and bndstx ignore their scale factor. */
11119               if (t->opcode_modifier.opcodeprefix == PREFIX_NONE
11120                   && (t->base_opcode & ~1) == 0x0f1a
11121                   && i.log2_scale_factor)
11122                 as_warn (_("register scaling is being ignored here"));
11123             }
11124         }
11125       else
11126         {
11127           /* 16-bit checks.  */
11128           if (i.disp_encoding == disp_encoding_32bit)
11129             goto bad_disp;
11130
11131           if ((i.base_reg
11132                && (!i.base_reg->reg_type.bitfield.word
11133                    || !i.base_reg->reg_type.bitfield.baseindex))
11134               || (i.index_reg
11135                   && (!i.index_reg->reg_type.bitfield.word
11136                       || !i.index_reg->reg_type.bitfield.baseindex
11137                       || !(i.base_reg
11138                            && i.base_reg->reg_num < 6
11139                            && i.index_reg->reg_num >= 6
11140                            && i.log2_scale_factor == 0))))
11141             goto bad_address;
11142         }
11143     }
11144   return 1;
11145 }
11146
11147 /* Handle vector immediates.  */
11148
11149 static int
11150 RC_SAE_immediate (const char *imm_start)
11151 {
11152   unsigned int match_found, j;
11153   const char *pstr = imm_start;
11154   expressionS *exp;
11155
11156   if (*pstr != '{')
11157     return 0;
11158
11159   pstr++;
11160   match_found = 0;
11161   for (j = 0; j < ARRAY_SIZE (RC_NamesTable); j++)
11162     {
11163       if (!strncmp (pstr, RC_NamesTable[j].name, RC_NamesTable[j].len))
11164         {
11165           if (!i.rounding)
11166             {
11167               rc_op.type = RC_NamesTable[j].type;
11168               rc_op.operand = this_operand;
11169               i.rounding = &rc_op;
11170             }
11171           else
11172             {
11173               as_bad (_("duplicated `%s'"), imm_start);
11174               return 0;
11175             }
11176           pstr += RC_NamesTable[j].len;
11177           match_found = 1;
11178           break;
11179         }
11180     }
11181   if (!match_found)
11182     return 0;
11183
11184   if (*pstr++ != '}')
11185     {
11186       as_bad (_("Missing '}': '%s'"), imm_start);
11187       return 0;
11188     }
11189   /* RC/SAE immediate string should contain nothing more.  */;
11190   if (*pstr != 0)
11191     {
11192       as_bad (_("Junk after '}': '%s'"), imm_start);
11193       return 0;
11194     }
11195
11196   exp = &im_expressions[i.imm_operands++];
11197   i.op[this_operand].imms = exp;
11198
11199   exp->X_op = O_constant;
11200   exp->X_add_number = 0;
11201   exp->X_add_symbol = (symbolS *) 0;
11202   exp->X_op_symbol = (symbolS *) 0;
11203
11204   i.types[this_operand].bitfield.imm8 = 1;
11205   return 1;
11206 }
11207
11208 /* Only string instructions can have a second memory operand, so
11209    reduce current_templates to just those if it contains any.  */
11210 static int
11211 maybe_adjust_templates (void)
11212 {
11213   const insn_template *t;
11214
11215   gas_assert (i.mem_operands == 1);
11216
11217   for (t = current_templates->start; t < current_templates->end; ++t)
11218     if (t->opcode_modifier.isstring)
11219       break;
11220
11221   if (t < current_templates->end)
11222     {
11223       static templates aux_templates;
11224       bfd_boolean recheck;
11225
11226       aux_templates.start = t;
11227       for (; t < current_templates->end; ++t)
11228         if (!t->opcode_modifier.isstring)
11229           break;
11230       aux_templates.end = t;
11231
11232       /* Determine whether to re-check the first memory operand.  */
11233       recheck = (aux_templates.start != current_templates->start
11234                  || t != current_templates->end);
11235
11236       current_templates = &aux_templates;
11237
11238       if (recheck)
11239         {
11240           i.mem_operands = 0;
11241           if (i.memop1_string != NULL
11242               && i386_index_check (i.memop1_string) == 0)
11243             return 0;
11244           i.mem_operands = 1;
11245         }
11246     }
11247
11248   return 1;
11249 }
11250
11251 /* Parse OPERAND_STRING into the i386_insn structure I.  Returns zero
11252    on error.  */
11253
11254 static int
11255 i386_att_operand (char *operand_string)
11256 {
11257   const reg_entry *r;
11258   char *end_op;
11259   char *op_string = operand_string;
11260
11261   if (is_space_char (*op_string))
11262     ++op_string;
11263
11264   /* We check for an absolute prefix (differentiating,
11265      for example, 'jmp pc_relative_label' from 'jmp *absolute_label'.  */
11266   if (*op_string == ABSOLUTE_PREFIX)
11267     {
11268       ++op_string;
11269       if (is_space_char (*op_string))
11270         ++op_string;
11271       i.jumpabsolute = TRUE;
11272     }
11273
11274   /* Check if operand is a register.  */
11275   if ((r = parse_register (op_string, &end_op)) != NULL)
11276     {
11277       i386_operand_type temp;
11278
11279       if (r == &bad_reg)
11280         return 0;
11281
11282       /* Check for a segment override by searching for ':' after a
11283          segment register.  */
11284       op_string = end_op;
11285       if (is_space_char (*op_string))
11286         ++op_string;
11287       if (*op_string == ':' && r->reg_type.bitfield.class == SReg)
11288         {
11289           switch (r->reg_num)
11290             {
11291             case 0:
11292               i.seg[i.mem_operands] = &es;
11293               break;
11294             case 1:
11295               i.seg[i.mem_operands] = &cs;
11296               break;
11297             case 2:
11298               i.seg[i.mem_operands] = &ss;
11299               break;
11300             case 3:
11301               i.seg[i.mem_operands] = &ds;
11302               break;
11303             case 4:
11304               i.seg[i.mem_operands] = &fs;
11305               break;
11306             case 5:
11307               i.seg[i.mem_operands] = &gs;
11308               break;
11309             }
11310
11311           /* Skip the ':' and whitespace.  */
11312           ++op_string;
11313           if (is_space_char (*op_string))
11314             ++op_string;
11315
11316           if (!is_digit_char (*op_string)
11317               && !is_identifier_char (*op_string)
11318               && *op_string != '('
11319               && *op_string != ABSOLUTE_PREFIX)
11320             {
11321               as_bad (_("bad memory operand `%s'"), op_string);
11322               return 0;
11323             }
11324           /* Handle case of %es:*foo.  */
11325           if (*op_string == ABSOLUTE_PREFIX)
11326             {
11327               ++op_string;
11328               if (is_space_char (*op_string))
11329                 ++op_string;
11330               i.jumpabsolute = TRUE;
11331             }
11332           goto do_memory_reference;
11333         }
11334
11335       /* Handle vector operations.  */
11336       if (*op_string == '{')
11337         {
11338           op_string = check_VecOperations (op_string, NULL);
11339           if (op_string == NULL)
11340             return 0;
11341         }
11342
11343       if (*op_string)
11344         {
11345           as_bad (_("junk `%s' after register"), op_string);
11346           return 0;
11347         }
11348       temp = r->reg_type;
11349       temp.bitfield.baseindex = 0;
11350       i.types[this_operand] = operand_type_or (i.types[this_operand],
11351                                                temp);
11352       i.types[this_operand].bitfield.unspecified = 0;
11353       i.op[this_operand].regs = r;
11354       i.reg_operands++;
11355     }
11356   else if (*op_string == REGISTER_PREFIX)
11357     {
11358       as_bad (_("bad register name `%s'"), op_string);
11359       return 0;
11360     }
11361   else if (*op_string == IMMEDIATE_PREFIX)
11362     {
11363       ++op_string;
11364       if (i.jumpabsolute)
11365         {
11366           as_bad (_("immediate operand illegal with absolute jump"));
11367           return 0;
11368         }
11369       if (!i386_immediate (op_string))
11370         return 0;
11371     }
11372   else if (RC_SAE_immediate (operand_string))
11373     {
11374       /* If it is a RC or SAE immediate, do nothing.  */
11375       ;
11376     }
11377   else if (is_digit_char (*op_string)
11378            || is_identifier_char (*op_string)
11379            || *op_string == '"'
11380            || *op_string == '(')
11381     {
11382       /* This is a memory reference of some sort.  */
11383       char *base_string;
11384
11385       /* Start and end of displacement string expression (if found).  */
11386       char *displacement_string_start;
11387       char *displacement_string_end;
11388       char *vop_start;
11389
11390     do_memory_reference:
11391       if (i.mem_operands == 1 && !maybe_adjust_templates ())
11392         return 0;
11393       if ((i.mem_operands == 1
11394            && !current_templates->start->opcode_modifier.isstring)
11395           || i.mem_operands == 2)
11396         {
11397           as_bad (_("too many memory references for `%s'"),
11398                   current_templates->start->name);
11399           return 0;
11400         }
11401
11402       /* Check for base index form.  We detect the base index form by
11403          looking for an ')' at the end of the operand, searching
11404          for the '(' matching it, and finding a REGISTER_PREFIX or ','
11405          after the '('.  */
11406       base_string = op_string + strlen (op_string);
11407
11408       /* Handle vector operations.  */
11409       vop_start = strchr (op_string, '{');
11410       if (vop_start && vop_start < base_string)
11411         {
11412           if (check_VecOperations (vop_start, base_string) == NULL)
11413             return 0;
11414           base_string = vop_start;
11415         }
11416
11417       --base_string;
11418       if (is_space_char (*base_string))
11419         --base_string;
11420
11421       /* If we only have a displacement, set-up for it to be parsed later.  */
11422       displacement_string_start = op_string;
11423       displacement_string_end = base_string + 1;
11424
11425       if (*base_string == ')')
11426         {
11427           char *temp_string;
11428           unsigned int parens_balanced = 1;
11429           /* We've already checked that the number of left & right ()'s are
11430              equal, so this loop will not be infinite.  */
11431           do
11432             {
11433               base_string--;
11434               if (*base_string == ')')
11435                 parens_balanced++;
11436               if (*base_string == '(')
11437                 parens_balanced--;
11438             }
11439           while (parens_balanced);
11440
11441           temp_string = base_string;
11442
11443           /* Skip past '(' and whitespace.  */
11444           ++base_string;
11445           if (is_space_char (*base_string))
11446             ++base_string;
11447
11448           if (*base_string == ','
11449               || ((i.base_reg = parse_register (base_string, &end_op))
11450                   != NULL))
11451             {
11452               displacement_string_end = temp_string;
11453
11454               i.types[this_operand].bitfield.baseindex = 1;
11455
11456               if (i.base_reg)
11457                 {
11458                   if (i.base_reg == &bad_reg)
11459                     return 0;
11460                   base_string = end_op;
11461                   if (is_space_char (*base_string))
11462                     ++base_string;
11463                 }
11464
11465               /* There may be an index reg or scale factor here.  */
11466               if (*base_string == ',')
11467                 {
11468                   ++base_string;
11469                   if (is_space_char (*base_string))
11470                     ++base_string;
11471
11472                   if ((i.index_reg = parse_register (base_string, &end_op))
11473                       != NULL)
11474                     {
11475                       if (i.index_reg == &bad_reg)
11476                         return 0;
11477                       base_string = end_op;
11478                       if (is_space_char (*base_string))
11479                         ++base_string;
11480                       if (*base_string == ',')
11481                         {
11482                           ++base_string;
11483                           if (is_space_char (*base_string))
11484                             ++base_string;
11485                         }
11486                       else if (*base_string != ')')
11487                         {
11488                           as_bad (_("expecting `,' or `)' "
11489                                     "after index register in `%s'"),
11490                                   operand_string);
11491                           return 0;
11492                         }
11493                     }
11494                   else if (*base_string == REGISTER_PREFIX)
11495                     {
11496                       end_op = strchr (base_string, ',');
11497                       if (end_op)
11498                         *end_op = '\0';
11499                       as_bad (_("bad register name `%s'"), base_string);
11500                       return 0;
11501                     }
11502
11503                   /* Check for scale factor.  */
11504                   if (*base_string != ')')
11505                     {
11506                       char *end_scale = i386_scale (base_string);
11507
11508                       if (!end_scale)
11509                         return 0;
11510
11511                       base_string = end_scale;
11512                       if (is_space_char (*base_string))
11513                         ++base_string;
11514                       if (*base_string != ')')
11515                         {
11516                           as_bad (_("expecting `)' "
11517                                     "after scale factor in `%s'"),
11518                                   operand_string);
11519                           return 0;
11520                         }
11521                     }
11522                   else if (!i.index_reg)
11523                     {
11524                       as_bad (_("expecting index register or scale factor "
11525                                 "after `,'; got '%c'"),
11526                               *base_string);
11527                       return 0;
11528                     }
11529                 }
11530               else if (*base_string != ')')
11531                 {
11532                   as_bad (_("expecting `,' or `)' "
11533                             "after base register in `%s'"),
11534                           operand_string);
11535                   return 0;
11536                 }
11537             }
11538           else if (*base_string == REGISTER_PREFIX)
11539             {
11540               end_op = strchr (base_string, ',');
11541               if (end_op)
11542                 *end_op = '\0';
11543               as_bad (_("bad register name `%s'"), base_string);
11544               return 0;
11545             }
11546         }
11547
11548       /* If there's an expression beginning the operand, parse it,
11549          assuming displacement_string_start and
11550          displacement_string_end are meaningful.  */
11551       if (displacement_string_start != displacement_string_end)
11552         {
11553           if (!i386_displacement (displacement_string_start,
11554                                   displacement_string_end))
11555             return 0;
11556         }
11557
11558       /* Special case for (%dx) while doing input/output op.  */
11559       if (i.base_reg
11560           && i.base_reg->reg_type.bitfield.instance == RegD
11561           && i.base_reg->reg_type.bitfield.word
11562           && i.index_reg == 0
11563           && i.log2_scale_factor == 0
11564           && i.seg[i.mem_operands] == 0
11565           && !operand_type_check (i.types[this_operand], disp))
11566         {
11567           i.types[this_operand] = i.base_reg->reg_type;
11568           return 1;
11569         }
11570
11571       if (i386_index_check (operand_string) == 0)
11572         return 0;
11573       i.flags[this_operand] |= Operand_Mem;
11574       if (i.mem_operands == 0)
11575         i.memop1_string = xstrdup (operand_string);
11576       i.mem_operands++;
11577     }
11578   else
11579     {
11580       /* It's not a memory operand; argh!  */
11581       as_bad (_("invalid char %s beginning operand %d `%s'"),
11582               output_invalid (*op_string),
11583               this_operand + 1,
11584               op_string);
11585       return 0;
11586     }
11587   return 1;                     /* Normal return.  */
11588 }
11589 \f
11590 /* Calculate the maximum variable size (i.e., excluding fr_fix)
11591    that an rs_machine_dependent frag may reach.  */
11592
11593 unsigned int
11594 i386_frag_max_var (fragS *frag)
11595 {
11596   /* The only relaxable frags are for jumps.
11597      Unconditional jumps can grow by 4 bytes and others by 5 bytes.  */
11598   gas_assert (frag->fr_type == rs_machine_dependent);
11599   return TYPE_FROM_RELAX_STATE (frag->fr_subtype) == UNCOND_JUMP ? 4 : 5;
11600 }
11601
11602 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
11603 static int
11604 elf_symbol_resolved_in_segment_p (symbolS *fr_symbol, offsetT fr_var)
11605 {
11606   /* STT_GNU_IFUNC symbol must go through PLT.  */
11607   if ((symbol_get_bfdsym (fr_symbol)->flags
11608        & BSF_GNU_INDIRECT_FUNCTION) != 0)
11609     return 0;
11610
11611   if (!S_IS_EXTERNAL (fr_symbol))
11612     /* Symbol may be weak or local.  */
11613     return !S_IS_WEAK (fr_symbol);
11614
11615   /* Global symbols with non-default visibility can't be preempted. */
11616   if (ELF_ST_VISIBILITY (S_GET_OTHER (fr_symbol)) != STV_DEFAULT)
11617     return 1;
11618
11619   if (fr_var != NO_RELOC)
11620     switch ((enum bfd_reloc_code_real) fr_var)
11621       {
11622       case BFD_RELOC_386_PLT32:
11623       case BFD_RELOC_X86_64_PLT32:
11624         /* Symbol with PLT relocation may be preempted. */
11625         return 0;
11626       default:
11627         abort ();
11628       }
11629
11630   /* Global symbols with default visibility in a shared library may be
11631      preempted by another definition.  */
11632   return !shared;
11633 }
11634 #endif
11635
11636 /* Table 3-2. Macro-Fusible Instructions in Haswell Microarchitecture
11637    Note also work for Skylake and Cascadelake.
11638 ---------------------------------------------------------------------
11639 |   JCC   | ADD/SUB/CMP | INC/DEC | TEST/AND |
11640 | ------  | ----------- | ------- | -------- |
11641 |   Jo    |      N      |    N    |     Y    |
11642 |   Jno   |      N      |    N    |     Y    |
11643 |  Jc/Jb  |      Y      |    N    |     Y    |
11644 | Jae/Jnb |      Y      |    N    |     Y    |
11645 |  Je/Jz  |      Y      |    Y    |     Y    |
11646 | Jne/Jnz |      Y      |    Y    |     Y    |
11647 | Jna/Jbe |      Y      |    N    |     Y    |
11648 | Ja/Jnbe |      Y      |    N    |     Y    |
11649 |   Js    |      N      |    N    |     Y    |
11650 |   Jns   |      N      |    N    |     Y    |
11651 |  Jp/Jpe |      N      |    N    |     Y    |
11652 | Jnp/Jpo |      N      |    N    |     Y    |
11653 | Jl/Jnge |      Y      |    Y    |     Y    |
11654 | Jge/Jnl |      Y      |    Y    |     Y    |
11655 | Jle/Jng |      Y      |    Y    |     Y    |
11656 | Jg/Jnle |      Y      |    Y    |     Y    |
11657 ---------------------------------------------------------------------  */
11658 static int
11659 i386_macro_fusible_p (enum mf_cmp_kind mf_cmp, enum mf_jcc_kind mf_jcc)
11660 {
11661   if (mf_cmp == mf_cmp_alu_cmp)
11662     return ((mf_jcc >= mf_jcc_jc && mf_jcc <= mf_jcc_jna)
11663             || mf_jcc == mf_jcc_jl || mf_jcc == mf_jcc_jle);
11664   if (mf_cmp == mf_cmp_incdec)
11665     return (mf_jcc == mf_jcc_je || mf_jcc == mf_jcc_jl
11666             || mf_jcc == mf_jcc_jle);
11667   if (mf_cmp == mf_cmp_test_and)
11668     return 1;
11669   return 0;
11670 }
11671
11672 /* Return the next non-empty frag.  */
11673
11674 static fragS *
11675 i386_next_non_empty_frag (fragS *fragP)
11676 {
11677   /* There may be a frag with a ".fill 0" when there is no room in
11678      the current frag for frag_grow in output_insn.  */
11679   for (fragP = fragP->fr_next;
11680        (fragP != NULL
11681         && fragP->fr_type == rs_fill
11682         && fragP->fr_fix == 0);
11683        fragP = fragP->fr_next)
11684     ;
11685   return fragP;
11686 }
11687
11688 /* Return the next jcc frag after BRANCH_PADDING.  */
11689
11690 static fragS *
11691 i386_next_fusible_jcc_frag (fragS *maybe_cmp_fragP, fragS *pad_fragP)
11692 {
11693   fragS *branch_fragP;
11694   if (!pad_fragP)
11695     return NULL;
11696
11697   if (pad_fragP->fr_type == rs_machine_dependent
11698       && (TYPE_FROM_RELAX_STATE (pad_fragP->fr_subtype)
11699           == BRANCH_PADDING))
11700     {
11701       branch_fragP = i386_next_non_empty_frag (pad_fragP);
11702       if (branch_fragP->fr_type != rs_machine_dependent)
11703         return NULL;
11704       if (TYPE_FROM_RELAX_STATE (branch_fragP->fr_subtype) == COND_JUMP
11705           && i386_macro_fusible_p (maybe_cmp_fragP->tc_frag_data.mf_type,
11706                                    pad_fragP->tc_frag_data.mf_type))
11707         return branch_fragP;
11708     }
11709
11710   return NULL;
11711 }
11712
11713 /* Classify BRANCH_PADDING, BRANCH_PREFIX and FUSED_JCC_PADDING frags.  */
11714
11715 static void
11716 i386_classify_machine_dependent_frag (fragS *fragP)
11717 {
11718   fragS *cmp_fragP;
11719   fragS *pad_fragP;
11720   fragS *branch_fragP;
11721   fragS *next_fragP;
11722   unsigned int max_prefix_length;
11723
11724   if (fragP->tc_frag_data.classified)
11725     return;
11726
11727   /* First scan for BRANCH_PADDING and FUSED_JCC_PADDING.  Convert
11728      FUSED_JCC_PADDING and merge BRANCH_PADDING.  */
11729   for (next_fragP = fragP;
11730        next_fragP != NULL;
11731        next_fragP = next_fragP->fr_next)
11732     {
11733       next_fragP->tc_frag_data.classified = 1;
11734       if (next_fragP->fr_type == rs_machine_dependent)
11735         switch (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype))
11736           {
11737           case BRANCH_PADDING:
11738             /* The BRANCH_PADDING frag must be followed by a branch
11739                frag.  */
11740             branch_fragP = i386_next_non_empty_frag (next_fragP);
11741             next_fragP->tc_frag_data.u.branch_fragP = branch_fragP;
11742             break;
11743           case FUSED_JCC_PADDING:
11744             /* Check if this is a fused jcc:
11745                FUSED_JCC_PADDING
11746                CMP like instruction
11747                BRANCH_PADDING
11748                COND_JUMP
11749                */
11750             cmp_fragP = i386_next_non_empty_frag (next_fragP);
11751             pad_fragP = i386_next_non_empty_frag (cmp_fragP);
11752             branch_fragP = i386_next_fusible_jcc_frag (next_fragP, pad_fragP);
11753             if (branch_fragP)
11754               {
11755                 /* The BRANCH_PADDING frag is merged with the
11756                    FUSED_JCC_PADDING frag.  */
11757                 next_fragP->tc_frag_data.u.branch_fragP = branch_fragP;
11758                 /* CMP like instruction size.  */
11759                 next_fragP->tc_frag_data.cmp_size = cmp_fragP->fr_fix;
11760                 frag_wane (pad_fragP);
11761                 /* Skip to branch_fragP.  */
11762                 next_fragP = branch_fragP;
11763               }
11764             else if (next_fragP->tc_frag_data.max_prefix_length)
11765               {
11766                 /* Turn FUSED_JCC_PADDING into BRANCH_PREFIX if it isn't
11767                    a fused jcc.  */
11768                 next_fragP->fr_subtype
11769                   = ENCODE_RELAX_STATE (BRANCH_PREFIX, 0);
11770                 next_fragP->tc_frag_data.max_bytes
11771                   = next_fragP->tc_frag_data.max_prefix_length;
11772                 /* This will be updated in the BRANCH_PREFIX scan.  */
11773                 next_fragP->tc_frag_data.max_prefix_length = 0;
11774               }
11775             else
11776               frag_wane (next_fragP);
11777             break;
11778           }
11779     }
11780
11781   /* Stop if there is no BRANCH_PREFIX.  */
11782   if (!align_branch_prefix_size)
11783     return;
11784
11785   /* Scan for BRANCH_PREFIX.  */
11786   for (; fragP != NULL; fragP = fragP->fr_next)
11787     {
11788       if (fragP->fr_type != rs_machine_dependent
11789           || (TYPE_FROM_RELAX_STATE (fragP->fr_subtype)
11790               != BRANCH_PREFIX))
11791         continue;
11792
11793       /* Count all BRANCH_PREFIX frags before BRANCH_PADDING and
11794          COND_JUMP_PREFIX.  */
11795       max_prefix_length = 0;
11796       for (next_fragP = fragP;
11797            next_fragP != NULL;
11798            next_fragP = next_fragP->fr_next)
11799         {
11800           if (next_fragP->fr_type == rs_fill)
11801             /* Skip rs_fill frags.  */
11802             continue;
11803           else if (next_fragP->fr_type != rs_machine_dependent)
11804             /* Stop for all other frags.  */
11805             break;
11806
11807           /* rs_machine_dependent frags.  */
11808           if (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
11809               == BRANCH_PREFIX)
11810             {
11811               /* Count BRANCH_PREFIX frags.  */
11812               if (max_prefix_length >= MAX_FUSED_JCC_PADDING_SIZE)
11813                 {
11814                   max_prefix_length = MAX_FUSED_JCC_PADDING_SIZE;
11815                   frag_wane (next_fragP);
11816                 }
11817               else
11818                 max_prefix_length
11819                   += next_fragP->tc_frag_data.max_bytes;
11820             }
11821           else if ((TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
11822                     == BRANCH_PADDING)
11823                    || (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
11824                        == FUSED_JCC_PADDING))
11825             {
11826               /* Stop at BRANCH_PADDING and FUSED_JCC_PADDING.  */
11827               fragP->tc_frag_data.u.padding_fragP = next_fragP;
11828               break;
11829             }
11830           else
11831             /* Stop for other rs_machine_dependent frags.  */
11832             break;
11833         }
11834
11835       fragP->tc_frag_data.max_prefix_length = max_prefix_length;
11836
11837       /* Skip to the next frag.  */
11838       fragP = next_fragP;
11839     }
11840 }
11841
11842 /* Compute padding size for
11843
11844         FUSED_JCC_PADDING
11845         CMP like instruction
11846         BRANCH_PADDING
11847         COND_JUMP/UNCOND_JUMP
11848
11849    or
11850
11851         BRANCH_PADDING
11852         COND_JUMP/UNCOND_JUMP
11853  */
11854
11855 static int
11856 i386_branch_padding_size (fragS *fragP, offsetT address)
11857 {
11858   unsigned int offset, size, padding_size;
11859   fragS *branch_fragP = fragP->tc_frag_data.u.branch_fragP;
11860
11861   /* The start address of the BRANCH_PADDING or FUSED_JCC_PADDING frag.  */
11862   if (!address)
11863     address = fragP->fr_address;
11864   address += fragP->fr_fix;
11865
11866   /* CMP like instrunction size.  */
11867   size = fragP->tc_frag_data.cmp_size;
11868
11869   /* The base size of the branch frag.  */
11870   size += branch_fragP->fr_fix;
11871
11872   /* Add opcode and displacement bytes for the rs_machine_dependent
11873      branch frag.  */
11874   if (branch_fragP->fr_type == rs_machine_dependent)
11875     size += md_relax_table[branch_fragP->fr_subtype].rlx_length;
11876
11877   /* Check if branch is within boundary and doesn't end at the last
11878      byte.  */
11879   offset = address & ((1U << align_branch_power) - 1);
11880   if ((offset + size) >= (1U << align_branch_power))
11881     /* Padding needed to avoid crossing boundary.  */
11882     padding_size = (1U << align_branch_power) - offset;
11883   else
11884     /* No padding needed.  */
11885     padding_size = 0;
11886
11887   /* The return value may be saved in tc_frag_data.length which is
11888      unsigned byte.  */
11889   if (!fits_in_unsigned_byte (padding_size))
11890     abort ();
11891
11892   return padding_size;
11893 }
11894
11895 /* i386_generic_table_relax_frag()
11896
11897    Handle BRANCH_PADDING, BRANCH_PREFIX and FUSED_JCC_PADDING frags to
11898    grow/shrink padding to align branch frags.  Hand others to
11899    relax_frag().  */
11900
11901 long
11902 i386_generic_table_relax_frag (segT segment, fragS *fragP, long stretch)
11903 {
11904   if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PADDING
11905       || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == FUSED_JCC_PADDING)
11906     {
11907       long padding_size = i386_branch_padding_size (fragP, 0);
11908       long grow = padding_size - fragP->tc_frag_data.length;
11909
11910       /* When the BRANCH_PREFIX frag is used, the computed address
11911          must match the actual address and there should be no padding.  */
11912       if (fragP->tc_frag_data.padding_address
11913           && (fragP->tc_frag_data.padding_address != fragP->fr_address
11914               || padding_size))
11915         abort ();
11916
11917       /* Update the padding size.  */
11918       if (grow)
11919         fragP->tc_frag_data.length = padding_size;
11920
11921       return grow;
11922     }
11923   else if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PREFIX)
11924     {
11925       fragS *padding_fragP, *next_fragP;
11926       long padding_size, left_size, last_size;
11927
11928       padding_fragP = fragP->tc_frag_data.u.padding_fragP;
11929       if (!padding_fragP)
11930         /* Use the padding set by the leading BRANCH_PREFIX frag.  */
11931         return (fragP->tc_frag_data.length
11932                 - fragP->tc_frag_data.last_length);
11933
11934       /* Compute the relative address of the padding frag in the very
11935         first time where the BRANCH_PREFIX frag sizes are zero.  */
11936       if (!fragP->tc_frag_data.padding_address)
11937         fragP->tc_frag_data.padding_address
11938           = padding_fragP->fr_address - (fragP->fr_address - stretch);
11939
11940       /* First update the last length from the previous interation.  */
11941       left_size = fragP->tc_frag_data.prefix_length;
11942       for (next_fragP = fragP;
11943            next_fragP != padding_fragP;
11944            next_fragP = next_fragP->fr_next)
11945         if (next_fragP->fr_type == rs_machine_dependent
11946             && (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
11947                 == BRANCH_PREFIX))
11948           {
11949             if (left_size)
11950               {
11951                 int max = next_fragP->tc_frag_data.max_bytes;
11952                 if (max)
11953                   {
11954                     int size;
11955                     if (max > left_size)
11956                       size = left_size;
11957                     else
11958                       size = max;
11959                     left_size -= size;
11960                     next_fragP->tc_frag_data.last_length = size;
11961                   }
11962               }
11963             else
11964               next_fragP->tc_frag_data.last_length = 0;
11965           }
11966
11967       /* Check the padding size for the padding frag.  */
11968       padding_size = i386_branch_padding_size
11969         (padding_fragP, (fragP->fr_address
11970                          + fragP->tc_frag_data.padding_address));
11971
11972       last_size = fragP->tc_frag_data.prefix_length;
11973       /* Check if there is change from the last interation.  */
11974       if (padding_size == last_size)
11975         {
11976           /* Update the expected address of the padding frag.  */
11977           padding_fragP->tc_frag_data.padding_address
11978             = (fragP->fr_address + padding_size
11979                + fragP->tc_frag_data.padding_address);
11980           return 0;
11981         }
11982
11983       if (padding_size > fragP->tc_frag_data.max_prefix_length)
11984         {
11985           /* No padding if there is no sufficient room.  Clear the
11986              expected address of the padding frag.  */
11987           padding_fragP->tc_frag_data.padding_address = 0;
11988           padding_size = 0;
11989         }
11990       else
11991         /* Store the expected address of the padding frag.  */
11992         padding_fragP->tc_frag_data.padding_address
11993           = (fragP->fr_address + padding_size
11994              + fragP->tc_frag_data.padding_address);
11995
11996       fragP->tc_frag_data.prefix_length = padding_size;
11997
11998       /* Update the length for the current interation.  */
11999       left_size = padding_size;
12000       for (next_fragP = fragP;
12001            next_fragP != padding_fragP;
12002            next_fragP = next_fragP->fr_next)
12003         if (next_fragP->fr_type == rs_machine_dependent
12004             && (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
12005                 == BRANCH_PREFIX))
12006           {
12007             if (left_size)
12008               {
12009                 int max = next_fragP->tc_frag_data.max_bytes;
12010                 if (max)
12011                   {
12012                     int size;
12013                     if (max > left_size)
12014                       size = left_size;
12015                     else
12016                       size = max;
12017                     left_size -= size;
12018                     next_fragP->tc_frag_data.length = size;
12019                   }
12020               }
12021             else
12022               next_fragP->tc_frag_data.length = 0;
12023           }
12024
12025       return (fragP->tc_frag_data.length
12026               - fragP->tc_frag_data.last_length);
12027     }
12028   return relax_frag (segment, fragP, stretch);
12029 }
12030
12031 /* md_estimate_size_before_relax()
12032
12033    Called just before relax() for rs_machine_dependent frags.  The x86
12034    assembler uses these frags to handle variable size jump
12035    instructions.
12036
12037    Any symbol that is now undefined will not become defined.
12038    Return the correct fr_subtype in the frag.
12039    Return the initial "guess for variable size of frag" to caller.
12040    The guess is actually the growth beyond the fixed part.  Whatever
12041    we do to grow the fixed or variable part contributes to our
12042    returned value.  */
12043
12044 int
12045 md_estimate_size_before_relax (fragS *fragP, segT segment)
12046 {
12047   if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PADDING
12048       || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PREFIX
12049       || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == FUSED_JCC_PADDING)
12050     {
12051       i386_classify_machine_dependent_frag (fragP);
12052       return fragP->tc_frag_data.length;
12053     }
12054
12055   /* We've already got fragP->fr_subtype right;  all we have to do is
12056      check for un-relaxable symbols.  On an ELF system, we can't relax
12057      an externally visible symbol, because it may be overridden by a
12058      shared library.  */
12059   if (S_GET_SEGMENT (fragP->fr_symbol) != segment
12060 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12061       || (IS_ELF
12062           && !elf_symbol_resolved_in_segment_p (fragP->fr_symbol,
12063                                                 fragP->fr_var))
12064 #endif
12065 #if defined (OBJ_COFF) && defined (TE_PE)
12066       || (OUTPUT_FLAVOR == bfd_target_coff_flavour
12067           && S_IS_WEAK (fragP->fr_symbol))
12068 #endif
12069       )
12070     {
12071       /* Symbol is undefined in this segment, or we need to keep a
12072          reloc so that weak symbols can be overridden.  */
12073       int size = (fragP->fr_subtype & CODE16) ? 2 : 4;
12074       enum bfd_reloc_code_real reloc_type;
12075       unsigned char *opcode;
12076       int old_fr_fix;
12077
12078       if (fragP->fr_var != NO_RELOC)
12079         reloc_type = (enum bfd_reloc_code_real) fragP->fr_var;
12080       else if (size == 2)
12081         reloc_type = BFD_RELOC_16_PCREL;
12082 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12083       else if (need_plt32_p (fragP->fr_symbol))
12084         reloc_type = BFD_RELOC_X86_64_PLT32;
12085 #endif
12086       else
12087         reloc_type = BFD_RELOC_32_PCREL;
12088
12089       old_fr_fix = fragP->fr_fix;
12090       opcode = (unsigned char *) fragP->fr_opcode;
12091
12092       switch (TYPE_FROM_RELAX_STATE (fragP->fr_subtype))
12093         {
12094         case UNCOND_JUMP:
12095           /* Make jmp (0xeb) a (d)word displacement jump.  */
12096           opcode[0] = 0xe9;
12097           fragP->fr_fix += size;
12098           fix_new (fragP, old_fr_fix, size,
12099                    fragP->fr_symbol,
12100                    fragP->fr_offset, 1,
12101                    reloc_type);
12102           break;
12103
12104         case COND_JUMP86:
12105           if (size == 2
12106               && (!no_cond_jump_promotion || fragP->fr_var != NO_RELOC))
12107             {
12108               /* Negate the condition, and branch past an
12109                  unconditional jump.  */
12110               opcode[0] ^= 1;
12111               opcode[1] = 3;
12112               /* Insert an unconditional jump.  */
12113               opcode[2] = 0xe9;
12114               /* We added two extra opcode bytes, and have a two byte
12115                  offset.  */
12116               fragP->fr_fix += 2 + 2;
12117               fix_new (fragP, old_fr_fix + 2, 2,
12118                        fragP->fr_symbol,
12119                        fragP->fr_offset, 1,
12120                        reloc_type);
12121               break;
12122             }
12123           /* Fall through.  */
12124
12125         case COND_JUMP:
12126           if (no_cond_jump_promotion && fragP->fr_var == NO_RELOC)
12127             {
12128               fixS *fixP;
12129
12130               fragP->fr_fix += 1;
12131               fixP = fix_new (fragP, old_fr_fix, 1,
12132                               fragP->fr_symbol,
12133                               fragP->fr_offset, 1,
12134                               BFD_RELOC_8_PCREL);
12135               fixP->fx_signed = 1;
12136               break;
12137             }
12138
12139           /* This changes the byte-displacement jump 0x7N
12140              to the (d)word-displacement jump 0x0f,0x8N.  */
12141           opcode[1] = opcode[0] + 0x10;
12142           opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
12143           /* We've added an opcode byte.  */
12144           fragP->fr_fix += 1 + size;
12145           fix_new (fragP, old_fr_fix + 1, size,
12146                    fragP->fr_symbol,
12147                    fragP->fr_offset, 1,
12148                    reloc_type);
12149           break;
12150
12151         default:
12152           BAD_CASE (fragP->fr_subtype);
12153           break;
12154         }
12155       frag_wane (fragP);
12156       return fragP->fr_fix - old_fr_fix;
12157     }
12158
12159   /* Guess size depending on current relax state.  Initially the relax
12160      state will correspond to a short jump and we return 1, because
12161      the variable part of the frag (the branch offset) is one byte
12162      long.  However, we can relax a section more than once and in that
12163      case we must either set fr_subtype back to the unrelaxed state,
12164      or return the value for the appropriate branch.  */
12165   return md_relax_table[fragP->fr_subtype].rlx_length;
12166 }
12167
12168 /* Called after relax() is finished.
12169
12170    In:  Address of frag.
12171         fr_type == rs_machine_dependent.
12172         fr_subtype is what the address relaxed to.
12173
12174    Out: Any fixSs and constants are set up.
12175         Caller will turn frag into a ".space 0".  */
12176
12177 void
12178 md_convert_frag (bfd *abfd ATTRIBUTE_UNUSED, segT sec ATTRIBUTE_UNUSED,
12179                  fragS *fragP)
12180 {
12181   unsigned char *opcode;
12182   unsigned char *where_to_put_displacement = NULL;
12183   offsetT target_address;
12184   offsetT opcode_address;
12185   unsigned int extension = 0;
12186   offsetT displacement_from_opcode_start;
12187
12188   if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PADDING
12189       || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == FUSED_JCC_PADDING
12190       || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PREFIX)
12191     {
12192       /* Generate nop padding.  */
12193       unsigned int size = fragP->tc_frag_data.length;
12194       if (size)
12195         {
12196           if (size > fragP->tc_frag_data.max_bytes)
12197             abort ();
12198
12199           if (flag_debug)
12200             {
12201               const char *msg;
12202               const char *branch = "branch";
12203               const char *prefix = "";
12204               fragS *padding_fragP;
12205               if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype)
12206                   == BRANCH_PREFIX)
12207                 {
12208                   padding_fragP = fragP->tc_frag_data.u.padding_fragP;
12209                   switch (fragP->tc_frag_data.default_prefix)
12210                     {
12211                     default:
12212                       abort ();
12213                       break;
12214                     case CS_PREFIX_OPCODE:
12215                       prefix = " cs";
12216                       break;
12217                     case DS_PREFIX_OPCODE:
12218                       prefix = " ds";
12219                       break;
12220                     case ES_PREFIX_OPCODE:
12221                       prefix = " es";
12222                       break;
12223                     case FS_PREFIX_OPCODE:
12224                       prefix = " fs";
12225                       break;
12226                     case GS_PREFIX_OPCODE:
12227                       prefix = " gs";
12228                       break;
12229                     case SS_PREFIX_OPCODE:
12230                       prefix = " ss";
12231                       break;
12232                     }
12233                   if (padding_fragP)
12234                     msg = _("%s:%u: add %d%s at 0x%llx to align "
12235                             "%s within %d-byte boundary\n");
12236                   else
12237                     msg = _("%s:%u: add additional %d%s at 0x%llx to "
12238                             "align %s within %d-byte boundary\n");
12239                 }
12240               else
12241                 {
12242                   padding_fragP = fragP;
12243                   msg = _("%s:%u: add %d%s-byte nop at 0x%llx to align "
12244                           "%s within %d-byte boundary\n");
12245                 }
12246
12247               if (padding_fragP)
12248                 switch (padding_fragP->tc_frag_data.branch_type)
12249                   {
12250                   case align_branch_jcc:
12251                     branch = "jcc";
12252                     break;
12253                   case align_branch_fused:
12254                     branch = "fused jcc";
12255                     break;
12256                   case align_branch_jmp:
12257                     branch = "jmp";
12258                     break;
12259                   case align_branch_call:
12260                     branch = "call";
12261                     break;
12262                   case align_branch_indirect:
12263                     branch = "indiret branch";
12264                     break;
12265                   case align_branch_ret:
12266                     branch = "ret";
12267                     break;
12268                   default:
12269                     break;
12270                   }
12271
12272               fprintf (stdout, msg,
12273                        fragP->fr_file, fragP->fr_line, size, prefix,
12274                        (long long) fragP->fr_address, branch,
12275                        1 << align_branch_power);
12276             }
12277           if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PREFIX)
12278             memset (fragP->fr_opcode,
12279                     fragP->tc_frag_data.default_prefix, size);
12280           else
12281             i386_generate_nops (fragP, (char *) fragP->fr_opcode,
12282                                 size, 0);
12283           fragP->fr_fix += size;
12284         }
12285       return;
12286     }
12287
12288   opcode = (unsigned char *) fragP->fr_opcode;
12289
12290   /* Address we want to reach in file space.  */
12291   target_address = S_GET_VALUE (fragP->fr_symbol) + fragP->fr_offset;
12292
12293   /* Address opcode resides at in file space.  */
12294   opcode_address = fragP->fr_address + fragP->fr_fix;
12295
12296   /* Displacement from opcode start to fill into instruction.  */
12297   displacement_from_opcode_start = target_address - opcode_address;
12298
12299   if ((fragP->fr_subtype & BIG) == 0)
12300     {
12301       /* Don't have to change opcode.  */
12302       extension = 1;            /* 1 opcode + 1 displacement  */
12303       where_to_put_displacement = &opcode[1];
12304     }
12305   else
12306     {
12307       if (no_cond_jump_promotion
12308           && TYPE_FROM_RELAX_STATE (fragP->fr_subtype) != UNCOND_JUMP)
12309         as_warn_where (fragP->fr_file, fragP->fr_line,
12310                        _("long jump required"));
12311
12312       switch (fragP->fr_subtype)
12313         {
12314         case ENCODE_RELAX_STATE (UNCOND_JUMP, BIG):
12315           extension = 4;                /* 1 opcode + 4 displacement  */
12316           opcode[0] = 0xe9;
12317           where_to_put_displacement = &opcode[1];
12318           break;
12319
12320         case ENCODE_RELAX_STATE (UNCOND_JUMP, BIG16):
12321           extension = 2;                /* 1 opcode + 2 displacement  */
12322           opcode[0] = 0xe9;
12323           where_to_put_displacement = &opcode[1];
12324           break;
12325
12326         case ENCODE_RELAX_STATE (COND_JUMP, BIG):
12327         case ENCODE_RELAX_STATE (COND_JUMP86, BIG):
12328           extension = 5;                /* 2 opcode + 4 displacement  */
12329           opcode[1] = opcode[0] + 0x10;
12330           opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
12331           where_to_put_displacement = &opcode[2];
12332           break;
12333
12334         case ENCODE_RELAX_STATE (COND_JUMP, BIG16):
12335           extension = 3;                /* 2 opcode + 2 displacement  */
12336           opcode[1] = opcode[0] + 0x10;
12337           opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
12338           where_to_put_displacement = &opcode[2];
12339           break;
12340
12341         case ENCODE_RELAX_STATE (COND_JUMP86, BIG16):
12342           extension = 4;
12343           opcode[0] ^= 1;
12344           opcode[1] = 3;
12345           opcode[2] = 0xe9;
12346           where_to_put_displacement = &opcode[3];
12347           break;
12348
12349         default:
12350           BAD_CASE (fragP->fr_subtype);
12351           break;
12352         }
12353     }
12354
12355   /* If size if less then four we are sure that the operand fits,
12356      but if it's 4, then it could be that the displacement is larger
12357      then -/+ 2GB.  */
12358   if (DISP_SIZE_FROM_RELAX_STATE (fragP->fr_subtype) == 4
12359       && object_64bit
12360       && ((addressT) (displacement_from_opcode_start - extension
12361                       + ((addressT) 1 << 31))
12362           > (((addressT) 2 << 31) - 1)))
12363     {
12364       as_bad_where (fragP->fr_file, fragP->fr_line,
12365                     _("jump target out of range"));
12366       /* Make us emit 0.  */
12367       displacement_from_opcode_start = extension;
12368     }
12369   /* Now put displacement after opcode.  */
12370   md_number_to_chars ((char *) where_to_put_displacement,
12371                       (valueT) (displacement_from_opcode_start - extension),
12372                       DISP_SIZE_FROM_RELAX_STATE (fragP->fr_subtype));
12373   fragP->fr_fix += extension;
12374 }
12375 \f
12376 /* Apply a fixup (fixP) to segment data, once it has been determined
12377    by our caller that we have all the info we need to fix it up.
12378
12379    Parameter valP is the pointer to the value of the bits.
12380
12381    On the 386, immediates, displacements, and data pointers are all in
12382    the same (little-endian) format, so we don't need to care about which
12383    we are handling.  */
12384
12385 void
12386 md_apply_fix (fixS *fixP, valueT *valP, segT seg ATTRIBUTE_UNUSED)
12387 {
12388   char *p = fixP->fx_where + fixP->fx_frag->fr_literal;
12389   valueT value = *valP;
12390
12391 #if !defined (TE_Mach)
12392   if (fixP->fx_pcrel)
12393     {
12394       switch (fixP->fx_r_type)
12395         {
12396         default:
12397           break;
12398
12399         case BFD_RELOC_64:
12400           fixP->fx_r_type = BFD_RELOC_64_PCREL;
12401           break;
12402         case BFD_RELOC_32:
12403         case BFD_RELOC_X86_64_32S:
12404           fixP->fx_r_type = BFD_RELOC_32_PCREL;
12405           break;
12406         case BFD_RELOC_16:
12407           fixP->fx_r_type = BFD_RELOC_16_PCREL;
12408           break;
12409         case BFD_RELOC_8:
12410           fixP->fx_r_type = BFD_RELOC_8_PCREL;
12411           break;
12412         }
12413     }
12414
12415   if (fixP->fx_addsy != NULL
12416       && (fixP->fx_r_type == BFD_RELOC_32_PCREL
12417           || fixP->fx_r_type == BFD_RELOC_64_PCREL
12418           || fixP->fx_r_type == BFD_RELOC_16_PCREL
12419           || fixP->fx_r_type == BFD_RELOC_8_PCREL)
12420       && !use_rela_relocations)
12421     {
12422       /* This is a hack.  There should be a better way to handle this.
12423          This covers for the fact that bfd_install_relocation will
12424          subtract the current location (for partial_inplace, PC relative
12425          relocations); see more below.  */
12426 #ifndef OBJ_AOUT
12427       if (IS_ELF
12428 #ifdef TE_PE
12429           || OUTPUT_FLAVOR == bfd_target_coff_flavour
12430 #endif
12431           )
12432         value += fixP->fx_where + fixP->fx_frag->fr_address;
12433 #endif
12434 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12435       if (IS_ELF)
12436         {
12437           segT sym_seg = S_GET_SEGMENT (fixP->fx_addsy);
12438
12439           if ((sym_seg == seg
12440                || (symbol_section_p (fixP->fx_addsy)
12441                    && sym_seg != absolute_section))
12442               && !generic_force_reloc (fixP))
12443             {
12444               /* Yes, we add the values in twice.  This is because
12445                  bfd_install_relocation subtracts them out again.  I think
12446                  bfd_install_relocation is broken, but I don't dare change
12447                  it.  FIXME.  */
12448               value += fixP->fx_where + fixP->fx_frag->fr_address;
12449             }
12450         }
12451 #endif
12452 #if defined (OBJ_COFF) && defined (TE_PE)
12453       /* For some reason, the PE format does not store a
12454          section address offset for a PC relative symbol.  */
12455       if (S_GET_SEGMENT (fixP->fx_addsy) != seg
12456           || S_IS_WEAK (fixP->fx_addsy))
12457         value += md_pcrel_from (fixP);
12458 #endif
12459     }
12460 #if defined (OBJ_COFF) && defined (TE_PE)
12461   if (fixP->fx_addsy != NULL
12462       && S_IS_WEAK (fixP->fx_addsy)
12463       /* PR 16858: Do not modify weak function references.  */
12464       && ! fixP->fx_pcrel)
12465     {
12466 #if !defined (TE_PEP)
12467       /* For x86 PE weak function symbols are neither PC-relative
12468          nor do they set S_IS_FUNCTION.  So the only reliable way
12469          to detect them is to check the flags of their containing
12470          section.  */
12471       if (S_GET_SEGMENT (fixP->fx_addsy) != NULL
12472           && S_GET_SEGMENT (fixP->fx_addsy)->flags & SEC_CODE)
12473         ;
12474       else
12475 #endif
12476       value -= S_GET_VALUE (fixP->fx_addsy);
12477     }
12478 #endif
12479
12480   /* Fix a few things - the dynamic linker expects certain values here,
12481      and we must not disappoint it.  */
12482 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12483   if (IS_ELF && fixP->fx_addsy)
12484     switch (fixP->fx_r_type)
12485       {
12486       case BFD_RELOC_386_PLT32:
12487       case BFD_RELOC_X86_64_PLT32:
12488         /* Make the jump instruction point to the address of the operand.
12489            At runtime we merely add the offset to the actual PLT entry.
12490            NB: Subtract the offset size only for jump instructions.  */
12491         if (fixP->fx_pcrel)
12492           value = -4;
12493         break;
12494
12495       case BFD_RELOC_386_TLS_GD:
12496       case BFD_RELOC_386_TLS_LDM:
12497       case BFD_RELOC_386_TLS_IE_32:
12498       case BFD_RELOC_386_TLS_IE:
12499       case BFD_RELOC_386_TLS_GOTIE:
12500       case BFD_RELOC_386_TLS_GOTDESC:
12501       case BFD_RELOC_X86_64_TLSGD:
12502       case BFD_RELOC_X86_64_TLSLD:
12503       case BFD_RELOC_X86_64_GOTTPOFF:
12504       case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
12505         value = 0; /* Fully resolved at runtime.  No addend.  */
12506         /* Fallthrough */
12507       case BFD_RELOC_386_TLS_LE:
12508       case BFD_RELOC_386_TLS_LDO_32:
12509       case BFD_RELOC_386_TLS_LE_32:
12510       case BFD_RELOC_X86_64_DTPOFF32:
12511       case BFD_RELOC_X86_64_DTPOFF64:
12512       case BFD_RELOC_X86_64_TPOFF32:
12513       case BFD_RELOC_X86_64_TPOFF64:
12514         S_SET_THREAD_LOCAL (fixP->fx_addsy);
12515         break;
12516
12517       case BFD_RELOC_386_TLS_DESC_CALL:
12518       case BFD_RELOC_X86_64_TLSDESC_CALL:
12519         value = 0; /* Fully resolved at runtime.  No addend.  */
12520         S_SET_THREAD_LOCAL (fixP->fx_addsy);
12521         fixP->fx_done = 0;
12522         return;
12523
12524       case BFD_RELOC_VTABLE_INHERIT:
12525       case BFD_RELOC_VTABLE_ENTRY:
12526         fixP->fx_done = 0;
12527         return;
12528
12529       default:
12530         break;
12531       }
12532 #endif /* defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)  */
12533   *valP = value;
12534 #endif /* !defined (TE_Mach)  */
12535
12536   /* Are we finished with this relocation now?  */
12537   if (fixP->fx_addsy == NULL)
12538     fixP->fx_done = 1;
12539 #if defined (OBJ_COFF) && defined (TE_PE)
12540   else if (fixP->fx_addsy != NULL && S_IS_WEAK (fixP->fx_addsy))
12541     {
12542       fixP->fx_done = 0;
12543       /* Remember value for tc_gen_reloc.  */
12544       fixP->fx_addnumber = value;
12545       /* Clear out the frag for now.  */
12546       value = 0;
12547     }
12548 #endif
12549   else if (use_rela_relocations)
12550     {
12551       fixP->fx_no_overflow = 1;
12552       /* Remember value for tc_gen_reloc.  */
12553       fixP->fx_addnumber = value;
12554       value = 0;
12555     }
12556
12557   md_number_to_chars (p, value, fixP->fx_size);
12558 }
12559 \f
12560 const char *
12561 md_atof (int type, char *litP, int *sizeP)
12562 {
12563   /* This outputs the LITTLENUMs in REVERSE order;
12564      in accord with the bigendian 386.  */
12565   return ieee_md_atof (type, litP, sizeP, FALSE);
12566 }
12567 \f
12568 static char output_invalid_buf[sizeof (unsigned char) * 2 + 6];
12569
12570 static char *
12571 output_invalid (int c)
12572 {
12573   if (ISPRINT (c))
12574     snprintf (output_invalid_buf, sizeof (output_invalid_buf),
12575               "'%c'", c);
12576   else
12577     snprintf (output_invalid_buf, sizeof (output_invalid_buf),
12578               "(0x%x)", (unsigned char) c);
12579   return output_invalid_buf;
12580 }
12581
12582 /* Verify that @r can be used in the current context.  */
12583
12584 static bfd_boolean check_register (const reg_entry *r)
12585 {
12586   if (allow_pseudo_reg)
12587     return TRUE;
12588
12589   if (operand_type_all_zero (&r->reg_type))
12590     return FALSE;
12591
12592   if ((r->reg_type.bitfield.dword
12593        || (r->reg_type.bitfield.class == SReg && r->reg_num > 3)
12594        || r->reg_type.bitfield.class == RegCR
12595        || r->reg_type.bitfield.class == RegDR)
12596       && !cpu_arch_flags.bitfield.cpui386)
12597     return FALSE;
12598
12599   if (r->reg_type.bitfield.class == RegTR
12600       && (flag_code == CODE_64BIT
12601           || !cpu_arch_flags.bitfield.cpui386
12602           || cpu_arch_isa_flags.bitfield.cpui586
12603           || cpu_arch_isa_flags.bitfield.cpui686))
12604     return FALSE;
12605
12606   if (r->reg_type.bitfield.class == RegMMX && !cpu_arch_flags.bitfield.cpummx)
12607     return FALSE;
12608
12609   if (!cpu_arch_flags.bitfield.cpuavx512f)
12610     {
12611       if (r->reg_type.bitfield.zmmword
12612           || r->reg_type.bitfield.class == RegMask)
12613         return FALSE;
12614
12615       if (!cpu_arch_flags.bitfield.cpuavx)
12616         {
12617           if (r->reg_type.bitfield.ymmword)
12618             return FALSE;
12619
12620           if (!cpu_arch_flags.bitfield.cpusse && r->reg_type.bitfield.xmmword)
12621             return FALSE;
12622         }
12623     }
12624
12625   if (r->reg_type.bitfield.tmmword
12626       && (!cpu_arch_flags.bitfield.cpuamx_tile
12627           || flag_code != CODE_64BIT))
12628     return FALSE;
12629
12630   if (r->reg_type.bitfield.class == RegBND && !cpu_arch_flags.bitfield.cpumpx)
12631     return FALSE;
12632
12633   /* Don't allow fake index register unless allow_index_reg isn't 0. */
12634   if (!allow_index_reg && r->reg_num == RegIZ)
12635     return FALSE;
12636
12637   /* Upper 16 vector registers are only available with VREX in 64bit
12638      mode, and require EVEX encoding.  */
12639   if (r->reg_flags & RegVRex)
12640     {
12641       if (!cpu_arch_flags.bitfield.cpuavx512f
12642           || flag_code != CODE_64BIT)
12643         return FALSE;
12644
12645       if (i.vec_encoding == vex_encoding_default)
12646         i.vec_encoding = vex_encoding_evex;
12647       else if (i.vec_encoding != vex_encoding_evex)
12648         i.vec_encoding = vex_encoding_error;
12649     }
12650
12651   if (((r->reg_flags & (RegRex64 | RegRex)) || r->reg_type.bitfield.qword)
12652       && (!cpu_arch_flags.bitfield.cpulm || r->reg_type.bitfield.class != RegCR)
12653       && flag_code != CODE_64BIT)
12654     return FALSE;
12655
12656   if (r->reg_type.bitfield.class == SReg && r->reg_num == RegFlat
12657       && !intel_syntax)
12658     return FALSE;
12659
12660   return TRUE;
12661 }
12662
12663 /* REG_STRING starts *before* REGISTER_PREFIX.  */
12664
12665 static const reg_entry *
12666 parse_real_register (char *reg_string, char **end_op)
12667 {
12668   char *s = reg_string;
12669   char *p;
12670   char reg_name_given[MAX_REG_NAME_SIZE + 1];
12671   const reg_entry *r;
12672
12673   /* Skip possible REGISTER_PREFIX and possible whitespace.  */
12674   if (*s == REGISTER_PREFIX)
12675     ++s;
12676
12677   if (is_space_char (*s))
12678     ++s;
12679
12680   p = reg_name_given;
12681   while ((*p++ = register_chars[(unsigned char) *s]) != '\0')
12682     {
12683       if (p >= reg_name_given + MAX_REG_NAME_SIZE)
12684         return (const reg_entry *) NULL;
12685       s++;
12686     }
12687
12688   /* For naked regs, make sure that we are not dealing with an identifier.
12689      This prevents confusing an identifier like `eax_var' with register
12690      `eax'.  */
12691   if (allow_naked_reg && identifier_chars[(unsigned char) *s])
12692     return (const reg_entry *) NULL;
12693
12694   *end_op = s;
12695
12696   r = (const reg_entry *) str_hash_find (reg_hash, reg_name_given);
12697
12698   /* Handle floating point regs, allowing spaces in the (i) part.  */
12699   if (r == i386_regtab /* %st is first entry of table  */)
12700     {
12701       if (!cpu_arch_flags.bitfield.cpu8087
12702           && !cpu_arch_flags.bitfield.cpu287
12703           && !cpu_arch_flags.bitfield.cpu387
12704           && !allow_pseudo_reg)
12705         return (const reg_entry *) NULL;
12706
12707       if (is_space_char (*s))
12708         ++s;
12709       if (*s == '(')
12710         {
12711           ++s;
12712           if (is_space_char (*s))
12713             ++s;
12714           if (*s >= '0' && *s <= '7')
12715             {
12716               int fpr = *s - '0';
12717               ++s;
12718               if (is_space_char (*s))
12719                 ++s;
12720               if (*s == ')')
12721                 {
12722                   *end_op = s + 1;
12723                   r = (const reg_entry *) str_hash_find (reg_hash, "st(0)");
12724                   know (r);
12725                   return r + fpr;
12726                 }
12727             }
12728           /* We have "%st(" then garbage.  */
12729           return (const reg_entry *) NULL;
12730         }
12731     }
12732
12733   return r && check_register (r) ? r : NULL;
12734 }
12735
12736 /* REG_STRING starts *before* REGISTER_PREFIX.  */
12737
12738 static const reg_entry *
12739 parse_register (char *reg_string, char **end_op)
12740 {
12741   const reg_entry *r;
12742
12743   if (*reg_string == REGISTER_PREFIX || allow_naked_reg)
12744     r = parse_real_register (reg_string, end_op);
12745   else
12746     r = NULL;
12747   if (!r)
12748     {
12749       char *save = input_line_pointer;
12750       char c;
12751       symbolS *symbolP;
12752
12753       input_line_pointer = reg_string;
12754       c = get_symbol_name (&reg_string);
12755       symbolP = symbol_find (reg_string);
12756       if (symbolP && S_GET_SEGMENT (symbolP) == reg_section)
12757         {
12758           const expressionS *e = symbol_get_value_expression (symbolP);
12759
12760           know (e->X_op == O_register);
12761           know (e->X_add_number >= 0
12762                 && (valueT) e->X_add_number < i386_regtab_size);
12763           r = i386_regtab + e->X_add_number;
12764           if (!check_register (r))
12765             {
12766               as_bad (_("register '%s%s' cannot be used here"),
12767                       register_prefix, r->reg_name);
12768               r = &bad_reg;
12769             }
12770           *end_op = input_line_pointer;
12771         }
12772       *input_line_pointer = c;
12773       input_line_pointer = save;
12774     }
12775   return r;
12776 }
12777
12778 int
12779 i386_parse_name (char *name, expressionS *e, char *nextcharP)
12780 {
12781   const reg_entry *r;
12782   char *end = input_line_pointer;
12783
12784   *end = *nextcharP;
12785   r = parse_register (name, &input_line_pointer);
12786   if (r && end <= input_line_pointer)
12787     {
12788       *nextcharP = *input_line_pointer;
12789       *input_line_pointer = 0;
12790       if (r != &bad_reg)
12791         {
12792           e->X_op = O_register;
12793           e->X_add_number = r - i386_regtab;
12794         }
12795       else
12796           e->X_op = O_illegal;
12797       return 1;
12798     }
12799   input_line_pointer = end;
12800   *end = 0;
12801   return intel_syntax ? i386_intel_parse_name (name, e) : 0;
12802 }
12803
12804 void
12805 md_operand (expressionS *e)
12806 {
12807   char *end;
12808   const reg_entry *r;
12809
12810   switch (*input_line_pointer)
12811     {
12812     case REGISTER_PREFIX:
12813       r = parse_real_register (input_line_pointer, &end);
12814       if (r)
12815         {
12816           e->X_op = O_register;
12817           e->X_add_number = r - i386_regtab;
12818           input_line_pointer = end;
12819         }
12820       break;
12821
12822     case '[':
12823       gas_assert (intel_syntax);
12824       end = input_line_pointer++;
12825       expression (e);
12826       if (*input_line_pointer == ']')
12827         {
12828           ++input_line_pointer;
12829           e->X_op_symbol = make_expr_symbol (e);
12830           e->X_add_symbol = NULL;
12831           e->X_add_number = 0;
12832           e->X_op = O_index;
12833         }
12834       else
12835         {
12836           e->X_op = O_absent;
12837           input_line_pointer = end;
12838         }
12839       break;
12840     }
12841 }
12842
12843 \f
12844 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12845 const char *md_shortopts = "kVQ:sqnO::";
12846 #else
12847 const char *md_shortopts = "qnO::";
12848 #endif
12849
12850 #define OPTION_32 (OPTION_MD_BASE + 0)
12851 #define OPTION_64 (OPTION_MD_BASE + 1)
12852 #define OPTION_DIVIDE (OPTION_MD_BASE + 2)
12853 #define OPTION_MARCH (OPTION_MD_BASE + 3)
12854 #define OPTION_MTUNE (OPTION_MD_BASE + 4)
12855 #define OPTION_MMNEMONIC (OPTION_MD_BASE + 5)
12856 #define OPTION_MSYNTAX (OPTION_MD_BASE + 6)
12857 #define OPTION_MINDEX_REG (OPTION_MD_BASE + 7)
12858 #define OPTION_MNAKED_REG (OPTION_MD_BASE + 8)
12859 #define OPTION_MRELAX_RELOCATIONS (OPTION_MD_BASE + 9)
12860 #define OPTION_MSSE2AVX (OPTION_MD_BASE + 10)
12861 #define OPTION_MSSE_CHECK (OPTION_MD_BASE + 11)
12862 #define OPTION_MOPERAND_CHECK (OPTION_MD_BASE + 12)
12863 #define OPTION_MAVXSCALAR (OPTION_MD_BASE + 13)
12864 #define OPTION_X32 (OPTION_MD_BASE + 14)
12865 #define OPTION_MADD_BND_PREFIX (OPTION_MD_BASE + 15)
12866 #define OPTION_MEVEXLIG (OPTION_MD_BASE + 16)
12867 #define OPTION_MEVEXWIG (OPTION_MD_BASE + 17)
12868 #define OPTION_MBIG_OBJ (OPTION_MD_BASE + 18)
12869 #define OPTION_MOMIT_LOCK_PREFIX (OPTION_MD_BASE + 19)
12870 #define OPTION_MEVEXRCIG (OPTION_MD_BASE + 20)
12871 #define OPTION_MSHARED (OPTION_MD_BASE + 21)
12872 #define OPTION_MAMD64 (OPTION_MD_BASE + 22)
12873 #define OPTION_MINTEL64 (OPTION_MD_BASE + 23)
12874 #define OPTION_MFENCE_AS_LOCK_ADD (OPTION_MD_BASE + 24)
12875 #define OPTION_X86_USED_NOTE (OPTION_MD_BASE + 25)
12876 #define OPTION_MVEXWIG (OPTION_MD_BASE + 26)
12877 #define OPTION_MALIGN_BRANCH_BOUNDARY (OPTION_MD_BASE + 27)
12878 #define OPTION_MALIGN_BRANCH_PREFIX_SIZE (OPTION_MD_BASE + 28)
12879 #define OPTION_MALIGN_BRANCH (OPTION_MD_BASE + 29)
12880 #define OPTION_MBRANCHES_WITH_32B_BOUNDARIES (OPTION_MD_BASE + 30)
12881 #define OPTION_MLFENCE_AFTER_LOAD (OPTION_MD_BASE + 31)
12882 #define OPTION_MLFENCE_BEFORE_INDIRECT_BRANCH (OPTION_MD_BASE + 32)
12883 #define OPTION_MLFENCE_BEFORE_RET (OPTION_MD_BASE + 33)
12884
12885 struct option md_longopts[] =
12886 {
12887   {"32", no_argument, NULL, OPTION_32},
12888 #if (defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
12889      || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
12890   {"64", no_argument, NULL, OPTION_64},
12891 #endif
12892 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12893   {"x32", no_argument, NULL, OPTION_X32},
12894   {"mshared", no_argument, NULL, OPTION_MSHARED},
12895   {"mx86-used-note", required_argument, NULL, OPTION_X86_USED_NOTE},
12896 #endif
12897   {"divide", no_argument, NULL, OPTION_DIVIDE},
12898   {"march", required_argument, NULL, OPTION_MARCH},
12899   {"mtune", required_argument, NULL, OPTION_MTUNE},
12900   {"mmnemonic", required_argument, NULL, OPTION_MMNEMONIC},
12901   {"msyntax", required_argument, NULL, OPTION_MSYNTAX},
12902   {"mindex-reg", no_argument, NULL, OPTION_MINDEX_REG},
12903   {"mnaked-reg", no_argument, NULL, OPTION_MNAKED_REG},
12904   {"msse2avx", no_argument, NULL, OPTION_MSSE2AVX},
12905   {"msse-check", required_argument, NULL, OPTION_MSSE_CHECK},
12906   {"moperand-check", required_argument, NULL, OPTION_MOPERAND_CHECK},
12907   {"mavxscalar", required_argument, NULL, OPTION_MAVXSCALAR},
12908   {"mvexwig", required_argument, NULL, OPTION_MVEXWIG},
12909   {"madd-bnd-prefix", no_argument, NULL, OPTION_MADD_BND_PREFIX},
12910   {"mevexlig", required_argument, NULL, OPTION_MEVEXLIG},
12911   {"mevexwig", required_argument, NULL, OPTION_MEVEXWIG},
12912 # if defined (TE_PE) || defined (TE_PEP)
12913   {"mbig-obj", no_argument, NULL, OPTION_MBIG_OBJ},
12914 #endif
12915   {"momit-lock-prefix", required_argument, NULL, OPTION_MOMIT_LOCK_PREFIX},
12916   {"mfence-as-lock-add", required_argument, NULL, OPTION_MFENCE_AS_LOCK_ADD},
12917   {"mrelax-relocations", required_argument, NULL, OPTION_MRELAX_RELOCATIONS},
12918   {"mevexrcig", required_argument, NULL, OPTION_MEVEXRCIG},
12919   {"malign-branch-boundary", required_argument, NULL, OPTION_MALIGN_BRANCH_BOUNDARY},
12920   {"malign-branch-prefix-size", required_argument, NULL, OPTION_MALIGN_BRANCH_PREFIX_SIZE},
12921   {"malign-branch", required_argument, NULL, OPTION_MALIGN_BRANCH},
12922   {"mbranches-within-32B-boundaries", no_argument, NULL, OPTION_MBRANCHES_WITH_32B_BOUNDARIES},
12923   {"mlfence-after-load", required_argument, NULL, OPTION_MLFENCE_AFTER_LOAD},
12924   {"mlfence-before-indirect-branch", required_argument, NULL,
12925    OPTION_MLFENCE_BEFORE_INDIRECT_BRANCH},
12926   {"mlfence-before-ret", required_argument, NULL, OPTION_MLFENCE_BEFORE_RET},
12927   {"mamd64", no_argument, NULL, OPTION_MAMD64},
12928   {"mintel64", no_argument, NULL, OPTION_MINTEL64},
12929   {NULL, no_argument, NULL, 0}
12930 };
12931 size_t md_longopts_size = sizeof (md_longopts);
12932
12933 int
12934 md_parse_option (int c, const char *arg)
12935 {
12936   unsigned int j;
12937   char *arch, *next, *saved, *type;
12938
12939   switch (c)
12940     {
12941     case 'n':
12942       optimize_align_code = 0;
12943       break;
12944
12945     case 'q':
12946       quiet_warnings = 1;
12947       break;
12948
12949 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12950       /* -Qy, -Qn: SVR4 arguments controlling whether a .comment section
12951          should be emitted or not.  FIXME: Not implemented.  */
12952     case 'Q':
12953       if ((arg[0] != 'y' && arg[0] != 'n') || arg[1])
12954         return 0;
12955       break;
12956
12957       /* -V: SVR4 argument to print version ID.  */
12958     case 'V':
12959       print_version_id ();
12960       break;
12961
12962       /* -k: Ignore for FreeBSD compatibility.  */
12963     case 'k':
12964       break;
12965
12966     case 's':
12967       /* -s: On i386 Solaris, this tells the native assembler to use
12968          .stab instead of .stab.excl.  We always use .stab anyhow.  */
12969       break;
12970
12971     case OPTION_MSHARED:
12972       shared = 1;
12973       break;
12974
12975     case OPTION_X86_USED_NOTE:
12976       if (strcasecmp (arg, "yes") == 0)
12977         x86_used_note = 1;
12978       else if (strcasecmp (arg, "no") == 0)
12979         x86_used_note = 0;
12980       else
12981         as_fatal (_("invalid -mx86-used-note= option: `%s'"), arg);
12982       break;
12983
12984
12985 #endif
12986 #if (defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
12987      || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
12988     case OPTION_64:
12989       {
12990         const char **list, **l;
12991
12992         list = bfd_target_list ();
12993         for (l = list; *l != NULL; l++)
12994           if (startswith (*l, "elf64-x86-64")
12995               || strcmp (*l, "coff-x86-64") == 0
12996               || strcmp (*l, "pe-x86-64") == 0
12997               || strcmp (*l, "pei-x86-64") == 0
12998               || strcmp (*l, "mach-o-x86-64") == 0)
12999             {
13000               default_arch = "x86_64";
13001               break;
13002             }
13003         if (*l == NULL)
13004           as_fatal (_("no compiled in support for x86_64"));
13005         free (list);
13006       }
13007       break;
13008 #endif
13009
13010 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13011     case OPTION_X32:
13012       if (IS_ELF)
13013         {
13014           const char **list, **l;
13015
13016           list = bfd_target_list ();
13017           for (l = list; *l != NULL; l++)
13018             if (startswith (*l, "elf32-x86-64"))
13019               {
13020                 default_arch = "x86_64:32";
13021                 break;
13022               }
13023           if (*l == NULL)
13024             as_fatal (_("no compiled in support for 32bit x86_64"));
13025           free (list);
13026         }
13027       else
13028         as_fatal (_("32bit x86_64 is only supported for ELF"));
13029       break;
13030 #endif
13031
13032     case OPTION_32:
13033       default_arch = "i386";
13034       break;
13035
13036     case OPTION_DIVIDE:
13037 #ifdef SVR4_COMMENT_CHARS
13038       {
13039         char *n, *t;
13040         const char *s;
13041
13042         n = XNEWVEC (char, strlen (i386_comment_chars) + 1);
13043         t = n;
13044         for (s = i386_comment_chars; *s != '\0'; s++)
13045           if (*s != '/')
13046             *t++ = *s;
13047         *t = '\0';
13048         i386_comment_chars = n;
13049       }
13050 #endif
13051       break;
13052
13053     case OPTION_MARCH:
13054       saved = xstrdup (arg);
13055       arch = saved;
13056       /* Allow -march=+nosse.  */
13057       if (*arch == '+')
13058         arch++;
13059       do
13060         {
13061           if (*arch == '.')
13062             as_fatal (_("invalid -march= option: `%s'"), arg);
13063           next = strchr (arch, '+');
13064           if (next)
13065             *next++ = '\0';
13066           for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
13067             {
13068               if (strcmp (arch, cpu_arch [j].name) == 0)
13069                 {
13070                   /* Processor.  */
13071                   if (! cpu_arch[j].flags.bitfield.cpui386)
13072                     continue;
13073
13074                   cpu_arch_name = cpu_arch[j].name;
13075                   cpu_sub_arch_name = NULL;
13076                   cpu_arch_flags = cpu_arch[j].flags;
13077                   cpu_arch_isa = cpu_arch[j].type;
13078                   cpu_arch_isa_flags = cpu_arch[j].flags;
13079                   if (!cpu_arch_tune_set)
13080                     {
13081                       cpu_arch_tune = cpu_arch_isa;
13082                       cpu_arch_tune_flags = cpu_arch_isa_flags;
13083                     }
13084                   break;
13085                 }
13086               else if (*cpu_arch [j].name == '.'
13087                        && strcmp (arch, cpu_arch [j].name + 1) == 0)
13088                 {
13089                   /* ISA extension.  */
13090                   i386_cpu_flags flags;
13091
13092                   flags = cpu_flags_or (cpu_arch_flags,
13093                                         cpu_arch[j].flags);
13094
13095                   if (!cpu_flags_equal (&flags, &cpu_arch_flags))
13096                     {
13097                       if (cpu_sub_arch_name)
13098                         {
13099                           char *name = cpu_sub_arch_name;
13100                           cpu_sub_arch_name = concat (name,
13101                                                       cpu_arch[j].name,
13102                                                       (const char *) NULL);
13103                           free (name);
13104                         }
13105                       else
13106                         cpu_sub_arch_name = xstrdup (cpu_arch[j].name);
13107                       cpu_arch_flags = flags;
13108                       cpu_arch_isa_flags = flags;
13109                     }
13110                   else
13111                     cpu_arch_isa_flags
13112                       = cpu_flags_or (cpu_arch_isa_flags,
13113                                       cpu_arch[j].flags);
13114                   break;
13115                 }
13116             }
13117
13118           if (j >= ARRAY_SIZE (cpu_arch))
13119             {
13120               /* Disable an ISA extension.  */
13121               for (j = 0; j < ARRAY_SIZE (cpu_noarch); j++)
13122                 if (strcmp (arch, cpu_noarch [j].name) == 0)
13123                   {
13124                     i386_cpu_flags flags;
13125
13126                     flags = cpu_flags_and_not (cpu_arch_flags,
13127                                                cpu_noarch[j].flags);
13128                     if (!cpu_flags_equal (&flags, &cpu_arch_flags))
13129                       {
13130                         if (cpu_sub_arch_name)
13131                           {
13132                             char *name = cpu_sub_arch_name;
13133                             cpu_sub_arch_name = concat (arch,
13134                                                         (const char *) NULL);
13135                             free (name);
13136                           }
13137                         else
13138                           cpu_sub_arch_name = xstrdup (arch);
13139                         cpu_arch_flags = flags;
13140                         cpu_arch_isa_flags = flags;
13141                       }
13142                     break;
13143                   }
13144
13145               if (j >= ARRAY_SIZE (cpu_noarch))
13146                 j = ARRAY_SIZE (cpu_arch);
13147             }
13148
13149           if (j >= ARRAY_SIZE (cpu_arch))
13150             as_fatal (_("invalid -march= option: `%s'"), arg);
13151
13152           arch = next;
13153         }
13154       while (next != NULL);
13155       free (saved);
13156       break;
13157
13158     case OPTION_MTUNE:
13159       if (*arg == '.')
13160         as_fatal (_("invalid -mtune= option: `%s'"), arg);
13161       for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
13162         {
13163           if (strcmp (arg, cpu_arch [j].name) == 0)
13164             {
13165               cpu_arch_tune_set = 1;
13166               cpu_arch_tune = cpu_arch [j].type;
13167               cpu_arch_tune_flags = cpu_arch[j].flags;
13168               break;
13169             }
13170         }
13171       if (j >= ARRAY_SIZE (cpu_arch))
13172         as_fatal (_("invalid -mtune= option: `%s'"), arg);
13173       break;
13174
13175     case OPTION_MMNEMONIC:
13176       if (strcasecmp (arg, "att") == 0)
13177         intel_mnemonic = 0;
13178       else if (strcasecmp (arg, "intel") == 0)
13179         intel_mnemonic = 1;
13180       else
13181         as_fatal (_("invalid -mmnemonic= option: `%s'"), arg);
13182       break;
13183
13184     case OPTION_MSYNTAX:
13185       if (strcasecmp (arg, "att") == 0)
13186         intel_syntax = 0;
13187       else if (strcasecmp (arg, "intel") == 0)
13188         intel_syntax = 1;
13189       else
13190         as_fatal (_("invalid -msyntax= option: `%s'"), arg);
13191       break;
13192
13193     case OPTION_MINDEX_REG:
13194       allow_index_reg = 1;
13195       break;
13196
13197     case OPTION_MNAKED_REG:
13198       allow_naked_reg = 1;
13199       break;
13200
13201     case OPTION_MSSE2AVX:
13202       sse2avx = 1;
13203       break;
13204
13205     case OPTION_MSSE_CHECK:
13206       if (strcasecmp (arg, "error") == 0)
13207         sse_check = check_error;
13208       else if (strcasecmp (arg, "warning") == 0)
13209         sse_check = check_warning;
13210       else if (strcasecmp (arg, "none") == 0)
13211         sse_check = check_none;
13212       else
13213         as_fatal (_("invalid -msse-check= option: `%s'"), arg);
13214       break;
13215
13216     case OPTION_MOPERAND_CHECK:
13217       if (strcasecmp (arg, "error") == 0)
13218         operand_check = check_error;
13219       else if (strcasecmp (arg, "warning") == 0)
13220         operand_check = check_warning;
13221       else if (strcasecmp (arg, "none") == 0)
13222         operand_check = check_none;
13223       else
13224         as_fatal (_("invalid -moperand-check= option: `%s'"), arg);
13225       break;
13226
13227     case OPTION_MAVXSCALAR:
13228       if (strcasecmp (arg, "128") == 0)
13229         avxscalar = vex128;
13230       else if (strcasecmp (arg, "256") == 0)
13231         avxscalar = vex256;
13232       else
13233         as_fatal (_("invalid -mavxscalar= option: `%s'"), arg);
13234       break;
13235
13236     case OPTION_MVEXWIG:
13237       if (strcmp (arg, "0") == 0)
13238         vexwig = vexw0;
13239       else if (strcmp (arg, "1") == 0)
13240         vexwig = vexw1;
13241       else
13242         as_fatal (_("invalid -mvexwig= option: `%s'"), arg);
13243       break;
13244
13245     case OPTION_MADD_BND_PREFIX:
13246       add_bnd_prefix = 1;
13247       break;
13248
13249     case OPTION_MEVEXLIG:
13250       if (strcmp (arg, "128") == 0)
13251         evexlig = evexl128;
13252       else if (strcmp (arg, "256") == 0)
13253         evexlig = evexl256;
13254       else  if (strcmp (arg, "512") == 0)
13255         evexlig = evexl512;
13256       else
13257         as_fatal (_("invalid -mevexlig= option: `%s'"), arg);
13258       break;
13259
13260     case OPTION_MEVEXRCIG:
13261       if (strcmp (arg, "rne") == 0)
13262         evexrcig = rne;
13263       else if (strcmp (arg, "rd") == 0)
13264         evexrcig = rd;
13265       else if (strcmp (arg, "ru") == 0)
13266         evexrcig = ru;
13267       else if (strcmp (arg, "rz") == 0)
13268         evexrcig = rz;
13269       else
13270         as_fatal (_("invalid -mevexrcig= option: `%s'"), arg);
13271       break;
13272
13273     case OPTION_MEVEXWIG:
13274       if (strcmp (arg, "0") == 0)
13275         evexwig = evexw0;
13276       else if (strcmp (arg, "1") == 0)
13277         evexwig = evexw1;
13278       else
13279         as_fatal (_("invalid -mevexwig= option: `%s'"), arg);
13280       break;
13281
13282 # if defined (TE_PE) || defined (TE_PEP)
13283     case OPTION_MBIG_OBJ:
13284       use_big_obj = 1;
13285       break;
13286 #endif
13287
13288     case OPTION_MOMIT_LOCK_PREFIX:
13289       if (strcasecmp (arg, "yes") == 0)
13290         omit_lock_prefix = 1;
13291       else if (strcasecmp (arg, "no") == 0)
13292         omit_lock_prefix = 0;
13293       else
13294         as_fatal (_("invalid -momit-lock-prefix= option: `%s'"), arg);
13295       break;
13296
13297     case OPTION_MFENCE_AS_LOCK_ADD:
13298       if (strcasecmp (arg, "yes") == 0)
13299         avoid_fence = 1;
13300       else if (strcasecmp (arg, "no") == 0)
13301         avoid_fence = 0;
13302       else
13303         as_fatal (_("invalid -mfence-as-lock-add= option: `%s'"), arg);
13304       break;
13305
13306     case OPTION_MLFENCE_AFTER_LOAD:
13307       if (strcasecmp (arg, "yes") == 0)
13308         lfence_after_load = 1;
13309       else if (strcasecmp (arg, "no") == 0)
13310         lfence_after_load = 0;
13311       else
13312         as_fatal (_("invalid -mlfence-after-load= option: `%s'"), arg);
13313       break;
13314
13315     case OPTION_MLFENCE_BEFORE_INDIRECT_BRANCH:
13316       if (strcasecmp (arg, "all") == 0)
13317         {
13318           lfence_before_indirect_branch = lfence_branch_all;
13319           if (lfence_before_ret == lfence_before_ret_none)
13320             lfence_before_ret = lfence_before_ret_shl;
13321         }
13322       else if (strcasecmp (arg, "memory") == 0)
13323         lfence_before_indirect_branch = lfence_branch_memory;
13324       else if (strcasecmp (arg, "register") == 0)
13325         lfence_before_indirect_branch = lfence_branch_register;
13326       else if (strcasecmp (arg, "none") == 0)
13327         lfence_before_indirect_branch = lfence_branch_none;
13328       else
13329         as_fatal (_("invalid -mlfence-before-indirect-branch= option: `%s'"),
13330                   arg);
13331       break;
13332
13333     case OPTION_MLFENCE_BEFORE_RET:
13334       if (strcasecmp (arg, "or") == 0)
13335         lfence_before_ret = lfence_before_ret_or;
13336       else if (strcasecmp (arg, "not") == 0)
13337         lfence_before_ret = lfence_before_ret_not;
13338       else if (strcasecmp (arg, "shl") == 0 || strcasecmp (arg, "yes") == 0)
13339         lfence_before_ret = lfence_before_ret_shl;
13340       else if (strcasecmp (arg, "none") == 0)
13341         lfence_before_ret = lfence_before_ret_none;
13342       else
13343         as_fatal (_("invalid -mlfence-before-ret= option: `%s'"),
13344                   arg);
13345       break;
13346
13347     case OPTION_MRELAX_RELOCATIONS:
13348       if (strcasecmp (arg, "yes") == 0)
13349         generate_relax_relocations = 1;
13350       else if (strcasecmp (arg, "no") == 0)
13351         generate_relax_relocations = 0;
13352       else
13353         as_fatal (_("invalid -mrelax-relocations= option: `%s'"), arg);
13354       break;
13355
13356     case OPTION_MALIGN_BRANCH_BOUNDARY:
13357       {
13358         char *end;
13359         long int align = strtoul (arg, &end, 0);
13360         if (*end == '\0')
13361           {
13362             if (align == 0)
13363               {
13364                 align_branch_power = 0;
13365                 break;
13366               }
13367             else if (align >= 16)
13368               {
13369                 int align_power;
13370                 for (align_power = 0;
13371                      (align & 1) == 0;
13372                      align >>= 1, align_power++)
13373                   continue;
13374                 /* Limit alignment power to 31.  */
13375                 if (align == 1 && align_power < 32)
13376                   {
13377                     align_branch_power = align_power;
13378                     break;
13379                   }
13380               }
13381           }
13382         as_fatal (_("invalid -malign-branch-boundary= value: %s"), arg);
13383       }
13384       break;
13385
13386     case OPTION_MALIGN_BRANCH_PREFIX_SIZE:
13387       {
13388         char *end;
13389         int align = strtoul (arg, &end, 0);
13390         /* Some processors only support 5 prefixes.  */
13391         if (*end == '\0' && align >= 0 && align < 6)
13392           {
13393             align_branch_prefix_size = align;
13394             break;
13395           }
13396         as_fatal (_("invalid -malign-branch-prefix-size= value: %s"),
13397                   arg);
13398       }
13399       break;
13400
13401     case OPTION_MALIGN_BRANCH:
13402       align_branch = 0;
13403       saved = xstrdup (arg);
13404       type = saved;
13405       do
13406         {
13407           next = strchr (type, '+');
13408           if (next)
13409             *next++ = '\0';
13410           if (strcasecmp (type, "jcc") == 0)
13411             align_branch |= align_branch_jcc_bit;
13412           else if (strcasecmp (type, "fused") == 0)
13413             align_branch |= align_branch_fused_bit;
13414           else if (strcasecmp (type, "jmp") == 0)
13415             align_branch |= align_branch_jmp_bit;
13416           else if (strcasecmp (type, "call") == 0)
13417             align_branch |= align_branch_call_bit;
13418           else if (strcasecmp (type, "ret") == 0)
13419             align_branch |= align_branch_ret_bit;
13420           else if (strcasecmp (type, "indirect") == 0)
13421             align_branch |= align_branch_indirect_bit;
13422           else
13423             as_fatal (_("invalid -malign-branch= option: `%s'"), arg);
13424           type = next;
13425         }
13426       while (next != NULL);
13427       free (saved);
13428       break;
13429
13430     case OPTION_MBRANCHES_WITH_32B_BOUNDARIES:
13431       align_branch_power = 5;
13432       align_branch_prefix_size = 5;
13433       align_branch = (align_branch_jcc_bit
13434                       | align_branch_fused_bit
13435                       | align_branch_jmp_bit);
13436       break;
13437
13438     case OPTION_MAMD64:
13439       isa64 = amd64;
13440       break;
13441
13442     case OPTION_MINTEL64:
13443       isa64 = intel64;
13444       break;
13445
13446     case 'O':
13447       if (arg == NULL)
13448         {
13449           optimize = 1;
13450           /* Turn off -Os.  */
13451           optimize_for_space = 0;
13452         }
13453       else if (*arg == 's')
13454         {
13455           optimize_for_space = 1;
13456           /* Turn on all encoding optimizations.  */
13457           optimize = INT_MAX;
13458         }
13459       else
13460         {
13461           optimize = atoi (arg);
13462           /* Turn off -Os.  */
13463           optimize_for_space = 0;
13464         }
13465       break;
13466
13467     default:
13468       return 0;
13469     }
13470   return 1;
13471 }
13472
13473 #define MESSAGE_TEMPLATE \
13474 "                                                                                "
13475
13476 static char *
13477 output_message (FILE *stream, char *p, char *message, char *start,
13478                 int *left_p, const char *name, int len)
13479 {
13480   int size = sizeof (MESSAGE_TEMPLATE);
13481   int left = *left_p;
13482
13483   /* Reserve 2 spaces for ", " or ",\0" */
13484   left -= len + 2;
13485
13486   /* Check if there is any room.  */
13487   if (left >= 0)
13488     {
13489       if (p != start)
13490         {
13491           *p++ = ',';
13492           *p++ = ' ';
13493         }
13494       p = mempcpy (p, name, len);
13495     }
13496   else
13497     {
13498       /* Output the current message now and start a new one.  */
13499       *p++ = ',';
13500       *p = '\0';
13501       fprintf (stream, "%s\n", message);
13502       p = start;
13503       left = size - (start - message) - len - 2;
13504
13505       gas_assert (left >= 0);
13506
13507       p = mempcpy (p, name, len);
13508     }
13509
13510   *left_p = left;
13511   return p;
13512 }
13513
13514 static void
13515 show_arch (FILE *stream, int ext, int check)
13516 {
13517   static char message[] = MESSAGE_TEMPLATE;
13518   char *start = message + 27;
13519   char *p;
13520   int size = sizeof (MESSAGE_TEMPLATE);
13521   int left;
13522   const char *name;
13523   int len;
13524   unsigned int j;
13525
13526   p = start;
13527   left = size - (start - message);
13528   for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
13529     {
13530       /* Should it be skipped?  */
13531       if (cpu_arch [j].skip)
13532         continue;
13533
13534       name = cpu_arch [j].name;
13535       len = cpu_arch [j].len;
13536       if (*name == '.')
13537         {
13538           /* It is an extension.  Skip if we aren't asked to show it.  */
13539           if (ext)
13540             {
13541               name++;
13542               len--;
13543             }
13544           else
13545             continue;
13546         }
13547       else if (ext)
13548         {
13549           /* It is an processor.  Skip if we show only extension.  */
13550           continue;
13551         }
13552       else if (check && ! cpu_arch[j].flags.bitfield.cpui386)
13553         {
13554           /* It is an impossible processor - skip.  */
13555           continue;
13556         }
13557
13558       p = output_message (stream, p, message, start, &left, name, len);
13559     }
13560
13561   /* Display disabled extensions.  */
13562   if (ext)
13563     for (j = 0; j < ARRAY_SIZE (cpu_noarch); j++)
13564       {
13565         name = cpu_noarch [j].name;
13566         len = cpu_noarch [j].len;
13567         p = output_message (stream, p, message, start, &left, name,
13568                             len);
13569       }
13570
13571   *p = '\0';
13572   fprintf (stream, "%s\n", message);
13573 }
13574
13575 void
13576 md_show_usage (FILE *stream)
13577 {
13578 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13579   fprintf (stream, _("\
13580   -Qy, -Qn                ignored\n\
13581   -V                      print assembler version number\n\
13582   -k                      ignored\n"));
13583 #endif
13584   fprintf (stream, _("\
13585   -n                      Do not optimize code alignment\n\
13586   -q                      quieten some warnings\n"));
13587 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13588   fprintf (stream, _("\
13589   -s                      ignored\n"));
13590 #endif
13591 #if defined BFD64 && (defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
13592                       || defined (TE_PE) || defined (TE_PEP))
13593   fprintf (stream, _("\
13594   --32/--64/--x32         generate 32bit/64bit/x32 code\n"));
13595 #endif
13596 #ifdef SVR4_COMMENT_CHARS
13597   fprintf (stream, _("\
13598   --divide                do not treat `/' as a comment character\n"));
13599 #else
13600   fprintf (stream, _("\
13601   --divide                ignored\n"));
13602 #endif
13603   fprintf (stream, _("\
13604   -march=CPU[,+EXTENSION...]\n\
13605                           generate code for CPU and EXTENSION, CPU is one of:\n"));
13606   show_arch (stream, 0, 1);
13607   fprintf (stream, _("\
13608                           EXTENSION is combination of:\n"));
13609   show_arch (stream, 1, 0);
13610   fprintf (stream, _("\
13611   -mtune=CPU              optimize for CPU, CPU is one of:\n"));
13612   show_arch (stream, 0, 0);
13613   fprintf (stream, _("\
13614   -msse2avx               encode SSE instructions with VEX prefix\n"));
13615   fprintf (stream, _("\
13616   -msse-check=[none|error|warning] (default: warning)\n\
13617                           check SSE instructions\n"));
13618   fprintf (stream, _("\
13619   -moperand-check=[none|error|warning] (default: warning)\n\
13620                           check operand combinations for validity\n"));
13621   fprintf (stream, _("\
13622   -mavxscalar=[128|256] (default: 128)\n\
13623                           encode scalar AVX instructions with specific vector\n\
13624                            length\n"));
13625   fprintf (stream, _("\
13626   -mvexwig=[0|1] (default: 0)\n\
13627                           encode VEX instructions with specific VEX.W value\n\
13628                            for VEX.W bit ignored instructions\n"));
13629   fprintf (stream, _("\
13630   -mevexlig=[128|256|512] (default: 128)\n\
13631                           encode scalar EVEX instructions with specific vector\n\
13632                            length\n"));
13633   fprintf (stream, _("\
13634   -mevexwig=[0|1] (default: 0)\n\
13635                           encode EVEX instructions with specific EVEX.W value\n\
13636                            for EVEX.W bit ignored instructions\n"));
13637   fprintf (stream, _("\
13638   -mevexrcig=[rne|rd|ru|rz] (default: rne)\n\
13639                           encode EVEX instructions with specific EVEX.RC value\n\
13640                            for SAE-only ignored instructions\n"));
13641   fprintf (stream, _("\
13642   -mmnemonic=[att|intel] "));
13643   if (SYSV386_COMPAT)
13644     fprintf (stream, _("(default: att)\n"));
13645   else
13646     fprintf (stream, _("(default: intel)\n"));
13647   fprintf (stream, _("\
13648                           use AT&T/Intel mnemonic\n"));
13649   fprintf (stream, _("\
13650   -msyntax=[att|intel] (default: att)\n\
13651                           use AT&T/Intel syntax\n"));
13652   fprintf (stream, _("\
13653   -mindex-reg             support pseudo index registers\n"));
13654   fprintf (stream, _("\
13655   -mnaked-reg             don't require `%%' prefix for registers\n"));
13656   fprintf (stream, _("\
13657   -madd-bnd-prefix        add BND prefix for all valid branches\n"));
13658 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13659   fprintf (stream, _("\
13660   -mshared                disable branch optimization for shared code\n"));
13661   fprintf (stream, _("\
13662   -mx86-used-note=[no|yes] "));
13663   if (DEFAULT_X86_USED_NOTE)
13664     fprintf (stream, _("(default: yes)\n"));
13665   else
13666     fprintf (stream, _("(default: no)\n"));
13667   fprintf (stream, _("\
13668                           generate x86 used ISA and feature properties\n"));
13669 #endif
13670 #if defined (TE_PE) || defined (TE_PEP)
13671   fprintf (stream, _("\
13672   -mbig-obj               generate big object files\n"));
13673 #endif
13674   fprintf (stream, _("\
13675   -momit-lock-prefix=[no|yes] (default: no)\n\
13676                           strip all lock prefixes\n"));
13677   fprintf (stream, _("\
13678   -mfence-as-lock-add=[no|yes] (default: no)\n\
13679                           encode lfence, mfence and sfence as\n\
13680                            lock addl $0x0, (%%{re}sp)\n"));
13681   fprintf (stream, _("\
13682   -mrelax-relocations=[no|yes] "));
13683   if (DEFAULT_GENERATE_X86_RELAX_RELOCATIONS)
13684     fprintf (stream, _("(default: yes)\n"));
13685   else
13686     fprintf (stream, _("(default: no)\n"));
13687   fprintf (stream, _("\
13688                           generate relax relocations\n"));
13689   fprintf (stream, _("\
13690   -malign-branch-boundary=NUM (default: 0)\n\
13691                           align branches within NUM byte boundary\n"));
13692   fprintf (stream, _("\
13693   -malign-branch=TYPE[+TYPE...] (default: jcc+fused+jmp)\n\
13694                           TYPE is combination of jcc, fused, jmp, call, ret,\n\
13695                            indirect\n\
13696                           specify types of branches to align\n"));
13697   fprintf (stream, _("\
13698   -malign-branch-prefix-size=NUM (default: 5)\n\
13699                           align branches with NUM prefixes per instruction\n"));
13700   fprintf (stream, _("\
13701   -mbranches-within-32B-boundaries\n\
13702                           align branches within 32 byte boundary\n"));
13703   fprintf (stream, _("\
13704   -mlfence-after-load=[no|yes] (default: no)\n\
13705                           generate lfence after load\n"));
13706   fprintf (stream, _("\
13707   -mlfence-before-indirect-branch=[none|all|register|memory] (default: none)\n\
13708                           generate lfence before indirect near branch\n"));
13709   fprintf (stream, _("\
13710   -mlfence-before-ret=[none|or|not|shl|yes] (default: none)\n\
13711                           generate lfence before ret\n"));
13712   fprintf (stream, _("\
13713   -mamd64                 accept only AMD64 ISA [default]\n"));
13714   fprintf (stream, _("\
13715   -mintel64               accept only Intel64 ISA\n"));
13716 }
13717
13718 #if ((defined (OBJ_MAYBE_COFF) && defined (OBJ_MAYBE_AOUT)) \
13719      || defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
13720      || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
13721
13722 /* Pick the target format to use.  */
13723
13724 const char *
13725 i386_target_format (void)
13726 {
13727   if (!strncmp (default_arch, "x86_64", 6))
13728     {
13729       update_code_flag (CODE_64BIT, 1);
13730       if (default_arch[6] == '\0')
13731         x86_elf_abi = X86_64_ABI;
13732       else
13733         x86_elf_abi = X86_64_X32_ABI;
13734     }
13735   else if (!strcmp (default_arch, "i386"))
13736     update_code_flag (CODE_32BIT, 1);
13737   else if (!strcmp (default_arch, "iamcu"))
13738     {
13739       update_code_flag (CODE_32BIT, 1);
13740       if (cpu_arch_isa == PROCESSOR_UNKNOWN)
13741         {
13742           static const i386_cpu_flags iamcu_flags = CPU_IAMCU_FLAGS;
13743           cpu_arch_name = "iamcu";
13744           cpu_sub_arch_name = NULL;
13745           cpu_arch_flags = iamcu_flags;
13746           cpu_arch_isa = PROCESSOR_IAMCU;
13747           cpu_arch_isa_flags = iamcu_flags;
13748           if (!cpu_arch_tune_set)
13749             {
13750               cpu_arch_tune = cpu_arch_isa;
13751               cpu_arch_tune_flags = cpu_arch_isa_flags;
13752             }
13753         }
13754       else if (cpu_arch_isa != PROCESSOR_IAMCU)
13755         as_fatal (_("Intel MCU doesn't support `%s' architecture"),
13756                   cpu_arch_name);
13757     }
13758   else
13759     as_fatal (_("unknown architecture"));
13760
13761   if (cpu_flags_all_zero (&cpu_arch_isa_flags))
13762     cpu_arch_isa_flags = cpu_arch[flag_code == CODE_64BIT].flags;
13763   if (cpu_flags_all_zero (&cpu_arch_tune_flags))
13764     cpu_arch_tune_flags = cpu_arch[flag_code == CODE_64BIT].flags;
13765
13766   switch (OUTPUT_FLAVOR)
13767     {
13768 #if defined (OBJ_MAYBE_AOUT) || defined (OBJ_AOUT)
13769     case bfd_target_aout_flavour:
13770       return AOUT_TARGET_FORMAT;
13771 #endif
13772 #if defined (OBJ_MAYBE_COFF) || defined (OBJ_COFF)
13773 # if defined (TE_PE) || defined (TE_PEP)
13774     case bfd_target_coff_flavour:
13775       if (flag_code == CODE_64BIT)
13776         return use_big_obj ? "pe-bigobj-x86-64" : "pe-x86-64";
13777       else
13778         return use_big_obj ? "pe-bigobj-i386" : "pe-i386";
13779 # elif defined (TE_GO32)
13780     case bfd_target_coff_flavour:
13781       return "coff-go32";
13782 # else
13783     case bfd_target_coff_flavour:
13784       return "coff-i386";
13785 # endif
13786 #endif
13787 #if defined (OBJ_MAYBE_ELF) || defined (OBJ_ELF)
13788     case bfd_target_elf_flavour:
13789       {
13790         const char *format;
13791
13792         switch (x86_elf_abi)
13793           {
13794           default:
13795             format = ELF_TARGET_FORMAT;
13796 #ifndef TE_SOLARIS
13797             tls_get_addr = "___tls_get_addr";
13798 #endif
13799             break;
13800           case X86_64_ABI:
13801             use_rela_relocations = 1;
13802             object_64bit = 1;
13803 #ifndef TE_SOLARIS
13804             tls_get_addr = "__tls_get_addr";
13805 #endif
13806             format = ELF_TARGET_FORMAT64;
13807             break;
13808           case X86_64_X32_ABI:
13809             use_rela_relocations = 1;
13810             object_64bit = 1;
13811 #ifndef TE_SOLARIS
13812             tls_get_addr = "__tls_get_addr";
13813 #endif
13814             disallow_64bit_reloc = 1;
13815             format = ELF_TARGET_FORMAT32;
13816             break;
13817           }
13818         if (cpu_arch_isa == PROCESSOR_L1OM)
13819           {
13820             if (x86_elf_abi != X86_64_ABI)
13821               as_fatal (_("Intel L1OM is 64bit only"));
13822             return ELF_TARGET_L1OM_FORMAT;
13823           }
13824         else if (cpu_arch_isa == PROCESSOR_K1OM)
13825           {
13826             if (x86_elf_abi != X86_64_ABI)
13827               as_fatal (_("Intel K1OM is 64bit only"));
13828             return ELF_TARGET_K1OM_FORMAT;
13829           }
13830         else if (cpu_arch_isa == PROCESSOR_IAMCU)
13831           {
13832             if (x86_elf_abi != I386_ABI)
13833               as_fatal (_("Intel MCU is 32bit only"));
13834             return ELF_TARGET_IAMCU_FORMAT;
13835           }
13836         else
13837           return format;
13838       }
13839 #endif
13840 #if defined (OBJ_MACH_O)
13841     case bfd_target_mach_o_flavour:
13842       if (flag_code == CODE_64BIT)
13843         {
13844           use_rela_relocations = 1;
13845           object_64bit = 1;
13846           return "mach-o-x86-64";
13847         }
13848       else
13849         return "mach-o-i386";
13850 #endif
13851     default:
13852       abort ();
13853       return NULL;
13854     }
13855 }
13856
13857 #endif /* OBJ_MAYBE_ more than one  */
13858 \f
13859 symbolS *
13860 md_undefined_symbol (char *name)
13861 {
13862   if (name[0] == GLOBAL_OFFSET_TABLE_NAME[0]
13863       && name[1] == GLOBAL_OFFSET_TABLE_NAME[1]
13864       && name[2] == GLOBAL_OFFSET_TABLE_NAME[2]
13865       && strcmp (name, GLOBAL_OFFSET_TABLE_NAME) == 0)
13866     {
13867       if (!GOT_symbol)
13868         {
13869           if (symbol_find (name))
13870             as_bad (_("GOT already in symbol table"));
13871           GOT_symbol = symbol_new (name, undefined_section,
13872                                    &zero_address_frag, 0);
13873         };
13874       return GOT_symbol;
13875     }
13876   return 0;
13877 }
13878
13879 /* Round up a section size to the appropriate boundary.  */
13880
13881 valueT
13882 md_section_align (segT segment ATTRIBUTE_UNUSED, valueT size)
13883 {
13884 #if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
13885   if (OUTPUT_FLAVOR == bfd_target_aout_flavour)
13886     {
13887       /* For a.out, force the section size to be aligned.  If we don't do
13888          this, BFD will align it for us, but it will not write out the
13889          final bytes of the section.  This may be a bug in BFD, but it is
13890          easier to fix it here since that is how the other a.out targets
13891          work.  */
13892       int align;
13893
13894       align = bfd_section_alignment (segment);
13895       size = ((size + (1 << align) - 1) & (-((valueT) 1 << align)));
13896     }
13897 #endif
13898
13899   return size;
13900 }
13901
13902 /* On the i386, PC-relative offsets are relative to the start of the
13903    next instruction.  That is, the address of the offset, plus its
13904    size, since the offset is always the last part of the insn.  */
13905
13906 long
13907 md_pcrel_from (fixS *fixP)
13908 {
13909   return fixP->fx_size + fixP->fx_where + fixP->fx_frag->fr_address;
13910 }
13911
13912 #ifndef I386COFF
13913
13914 static void
13915 s_bss (int ignore ATTRIBUTE_UNUSED)
13916 {
13917   int temp;
13918
13919 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13920   if (IS_ELF)
13921     obj_elf_section_change_hook ();
13922 #endif
13923   temp = get_absolute_expression ();
13924   subseg_set (bss_section, (subsegT) temp);
13925   demand_empty_rest_of_line ();
13926 }
13927
13928 #endif
13929
13930 /* Remember constant directive.  */
13931
13932 void
13933 i386_cons_align (int ignore ATTRIBUTE_UNUSED)
13934 {
13935   if (last_insn.kind != last_insn_directive
13936       && (bfd_section_flags (now_seg) & SEC_CODE))
13937     {
13938       last_insn.seg = now_seg;
13939       last_insn.kind = last_insn_directive;
13940       last_insn.name = "constant directive";
13941       last_insn.file = as_where (&last_insn.line);
13942       if (lfence_before_ret != lfence_before_ret_none)
13943         {
13944           if (lfence_before_indirect_branch != lfence_branch_none)
13945             as_warn (_("constant directive skips -mlfence-before-ret "
13946                        "and -mlfence-before-indirect-branch"));
13947           else
13948             as_warn (_("constant directive skips -mlfence-before-ret"));
13949         }
13950       else if (lfence_before_indirect_branch != lfence_branch_none)
13951         as_warn (_("constant directive skips -mlfence-before-indirect-branch"));
13952     }
13953 }
13954
13955 void
13956 i386_validate_fix (fixS *fixp)
13957 {
13958   if (fixp->fx_subsy)
13959     {
13960       if (fixp->fx_subsy == GOT_symbol)
13961         {
13962           if (fixp->fx_r_type == BFD_RELOC_32_PCREL)
13963             {
13964               if (!object_64bit)
13965                 abort ();
13966 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13967               if (fixp->fx_tcbit2)
13968                 fixp->fx_r_type = (fixp->fx_tcbit
13969                                    ? BFD_RELOC_X86_64_REX_GOTPCRELX
13970                                    : BFD_RELOC_X86_64_GOTPCRELX);
13971               else
13972 #endif
13973                 fixp->fx_r_type = BFD_RELOC_X86_64_GOTPCREL;
13974             }
13975           else
13976             {
13977               if (!object_64bit)
13978                 fixp->fx_r_type = BFD_RELOC_386_GOTOFF;
13979               else
13980                 fixp->fx_r_type = BFD_RELOC_X86_64_GOTOFF64;
13981             }
13982           fixp->fx_subsy = 0;
13983         }
13984     }
13985 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13986   else
13987     {
13988       /* NB: Commit 292676c1 resolved PLT32 reloc aganst local symbol
13989          to section.  Since PLT32 relocation must be against symbols,
13990          turn such PLT32 relocation into PC32 relocation.  */
13991       if (fixp->fx_addsy
13992           && (fixp->fx_r_type == BFD_RELOC_386_PLT32
13993               || fixp->fx_r_type == BFD_RELOC_X86_64_PLT32)
13994           && symbol_section_p (fixp->fx_addsy))
13995         fixp->fx_r_type = BFD_RELOC_32_PCREL;
13996       if (!object_64bit)
13997         {
13998           if (fixp->fx_r_type == BFD_RELOC_386_GOT32
13999               && fixp->fx_tcbit2)
14000             fixp->fx_r_type = BFD_RELOC_386_GOT32X;
14001         }
14002     }
14003 #endif
14004 }
14005
14006 arelent *
14007 tc_gen_reloc (asection *section ATTRIBUTE_UNUSED, fixS *fixp)
14008 {
14009   arelent *rel;
14010   bfd_reloc_code_real_type code;
14011
14012   switch (fixp->fx_r_type)
14013     {
14014 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
14015     case BFD_RELOC_SIZE32:
14016     case BFD_RELOC_SIZE64:
14017       if (S_IS_DEFINED (fixp->fx_addsy)
14018           && !S_IS_EXTERNAL (fixp->fx_addsy))
14019         {
14020           /* Resolve size relocation against local symbol to size of
14021              the symbol plus addend.  */
14022           valueT value = S_GET_SIZE (fixp->fx_addsy) + fixp->fx_offset;
14023           if (fixp->fx_r_type == BFD_RELOC_SIZE32
14024               && !fits_in_unsigned_long (value))
14025             as_bad_where (fixp->fx_file, fixp->fx_line,
14026                           _("symbol size computation overflow"));
14027           fixp->fx_addsy = NULL;
14028           fixp->fx_subsy = NULL;
14029           md_apply_fix (fixp, (valueT *) &value, NULL);
14030           return NULL;
14031         }
14032 #endif
14033       /* Fall through.  */
14034
14035     case BFD_RELOC_X86_64_PLT32:
14036     case BFD_RELOC_X86_64_GOT32:
14037     case BFD_RELOC_X86_64_GOTPCREL:
14038     case BFD_RELOC_X86_64_GOTPCRELX:
14039     case BFD_RELOC_X86_64_REX_GOTPCRELX:
14040     case BFD_RELOC_386_PLT32:
14041     case BFD_RELOC_386_GOT32:
14042     case BFD_RELOC_386_GOT32X:
14043     case BFD_RELOC_386_GOTOFF:
14044     case BFD_RELOC_386_GOTPC:
14045     case BFD_RELOC_386_TLS_GD:
14046     case BFD_RELOC_386_TLS_LDM:
14047     case BFD_RELOC_386_TLS_LDO_32:
14048     case BFD_RELOC_386_TLS_IE_32:
14049     case BFD_RELOC_386_TLS_IE:
14050     case BFD_RELOC_386_TLS_GOTIE:
14051     case BFD_RELOC_386_TLS_LE_32:
14052     case BFD_RELOC_386_TLS_LE:
14053     case BFD_RELOC_386_TLS_GOTDESC:
14054     case BFD_RELOC_386_TLS_DESC_CALL:
14055     case BFD_RELOC_X86_64_TLSGD:
14056     case BFD_RELOC_X86_64_TLSLD:
14057     case BFD_RELOC_X86_64_DTPOFF32:
14058     case BFD_RELOC_X86_64_DTPOFF64:
14059     case BFD_RELOC_X86_64_GOTTPOFF:
14060     case BFD_RELOC_X86_64_TPOFF32:
14061     case BFD_RELOC_X86_64_TPOFF64:
14062     case BFD_RELOC_X86_64_GOTOFF64:
14063     case BFD_RELOC_X86_64_GOTPC32:
14064     case BFD_RELOC_X86_64_GOT64:
14065     case BFD_RELOC_X86_64_GOTPCREL64:
14066     case BFD_RELOC_X86_64_GOTPC64:
14067     case BFD_RELOC_X86_64_GOTPLT64:
14068     case BFD_RELOC_X86_64_PLTOFF64:
14069     case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
14070     case BFD_RELOC_X86_64_TLSDESC_CALL:
14071     case BFD_RELOC_RVA:
14072     case BFD_RELOC_VTABLE_ENTRY:
14073     case BFD_RELOC_VTABLE_INHERIT:
14074 #ifdef TE_PE
14075     case BFD_RELOC_32_SECREL:
14076 #endif
14077       code = fixp->fx_r_type;
14078       break;
14079     case BFD_RELOC_X86_64_32S:
14080       if (!fixp->fx_pcrel)
14081         {
14082           /* Don't turn BFD_RELOC_X86_64_32S into BFD_RELOC_32.  */
14083           code = fixp->fx_r_type;
14084           break;
14085         }
14086       /* Fall through.  */
14087     default:
14088       if (fixp->fx_pcrel)
14089         {
14090           switch (fixp->fx_size)
14091             {
14092             default:
14093               as_bad_where (fixp->fx_file, fixp->fx_line,
14094                             _("can not do %d byte pc-relative relocation"),
14095                             fixp->fx_size);
14096               code = BFD_RELOC_32_PCREL;
14097               break;
14098             case 1: code = BFD_RELOC_8_PCREL;  break;
14099             case 2: code = BFD_RELOC_16_PCREL; break;
14100             case 4: code = BFD_RELOC_32_PCREL; break;
14101 #ifdef BFD64
14102             case 8: code = BFD_RELOC_64_PCREL; break;
14103 #endif
14104             }
14105         }
14106       else
14107         {
14108           switch (fixp->fx_size)
14109             {
14110             default:
14111               as_bad_where (fixp->fx_file, fixp->fx_line,
14112                             _("can not do %d byte relocation"),
14113                             fixp->fx_size);
14114               code = BFD_RELOC_32;
14115               break;
14116             case 1: code = BFD_RELOC_8;  break;
14117             case 2: code = BFD_RELOC_16; break;
14118             case 4: code = BFD_RELOC_32; break;
14119 #ifdef BFD64
14120             case 8: code = BFD_RELOC_64; break;
14121 #endif
14122             }
14123         }
14124       break;
14125     }
14126
14127   if ((code == BFD_RELOC_32
14128        || code == BFD_RELOC_32_PCREL
14129        || code == BFD_RELOC_X86_64_32S)
14130       && GOT_symbol
14131       && fixp->fx_addsy == GOT_symbol)
14132     {
14133       if (!object_64bit)
14134         code = BFD_RELOC_386_GOTPC;
14135       else
14136         code = BFD_RELOC_X86_64_GOTPC32;
14137     }
14138   if ((code == BFD_RELOC_64 || code == BFD_RELOC_64_PCREL)
14139       && GOT_symbol
14140       && fixp->fx_addsy == GOT_symbol)
14141     {
14142       code = BFD_RELOC_X86_64_GOTPC64;
14143     }
14144
14145   rel = XNEW (arelent);
14146   rel->sym_ptr_ptr = XNEW (asymbol *);
14147   *rel->sym_ptr_ptr = symbol_get_bfdsym (fixp->fx_addsy);
14148
14149   rel->address = fixp->fx_frag->fr_address + fixp->fx_where;
14150
14151   if (!use_rela_relocations)
14152     {
14153       /* HACK: Since i386 ELF uses Rel instead of Rela, encode the
14154          vtable entry to be used in the relocation's section offset.  */
14155       if (fixp->fx_r_type == BFD_RELOC_VTABLE_ENTRY)
14156         rel->address = fixp->fx_offset;
14157 #if defined (OBJ_COFF) && defined (TE_PE)
14158       else if (fixp->fx_addsy && S_IS_WEAK (fixp->fx_addsy))
14159         rel->addend = fixp->fx_addnumber - (S_GET_VALUE (fixp->fx_addsy) * 2);
14160       else
14161 #endif
14162       rel->addend = 0;
14163     }
14164   /* Use the rela in 64bit mode.  */
14165   else
14166     {
14167       if (disallow_64bit_reloc)
14168         switch (code)
14169           {
14170           case BFD_RELOC_X86_64_DTPOFF64:
14171           case BFD_RELOC_X86_64_TPOFF64:
14172           case BFD_RELOC_64_PCREL:
14173           case BFD_RELOC_X86_64_GOTOFF64:
14174           case BFD_RELOC_X86_64_GOT64:
14175           case BFD_RELOC_X86_64_GOTPCREL64:
14176           case BFD_RELOC_X86_64_GOTPC64:
14177           case BFD_RELOC_X86_64_GOTPLT64:
14178           case BFD_RELOC_X86_64_PLTOFF64:
14179             as_bad_where (fixp->fx_file, fixp->fx_line,
14180                           _("cannot represent relocation type %s in x32 mode"),
14181                           bfd_get_reloc_code_name (code));
14182             break;
14183           default:
14184             break;
14185           }
14186
14187       if (!fixp->fx_pcrel)
14188         rel->addend = fixp->fx_offset;
14189       else
14190         switch (code)
14191           {
14192           case BFD_RELOC_X86_64_PLT32:
14193           case BFD_RELOC_X86_64_GOT32:
14194           case BFD_RELOC_X86_64_GOTPCREL:
14195           case BFD_RELOC_X86_64_GOTPCRELX:
14196           case BFD_RELOC_X86_64_REX_GOTPCRELX:
14197           case BFD_RELOC_X86_64_TLSGD:
14198           case BFD_RELOC_X86_64_TLSLD:
14199           case BFD_RELOC_X86_64_GOTTPOFF:
14200           case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
14201           case BFD_RELOC_X86_64_TLSDESC_CALL:
14202             rel->addend = fixp->fx_offset - fixp->fx_size;
14203             break;
14204           default:
14205             rel->addend = (section->vma
14206                            - fixp->fx_size
14207                            + fixp->fx_addnumber
14208                            + md_pcrel_from (fixp));
14209             break;
14210           }
14211     }
14212
14213   rel->howto = bfd_reloc_type_lookup (stdoutput, code);
14214   if (rel->howto == NULL)
14215     {
14216       as_bad_where (fixp->fx_file, fixp->fx_line,
14217                     _("cannot represent relocation type %s"),
14218                     bfd_get_reloc_code_name (code));
14219       /* Set howto to a garbage value so that we can keep going.  */
14220       rel->howto = bfd_reloc_type_lookup (stdoutput, BFD_RELOC_32);
14221       gas_assert (rel->howto != NULL);
14222     }
14223
14224   return rel;
14225 }
14226
14227 #include "tc-i386-intel.c"
14228
14229 void
14230 tc_x86_parse_to_dw2regnum (expressionS *exp)
14231 {
14232   int saved_naked_reg;
14233   char saved_register_dot;
14234
14235   saved_naked_reg = allow_naked_reg;
14236   allow_naked_reg = 1;
14237   saved_register_dot = register_chars['.'];
14238   register_chars['.'] = '.';
14239   allow_pseudo_reg = 1;
14240   expression_and_evaluate (exp);
14241   allow_pseudo_reg = 0;
14242   register_chars['.'] = saved_register_dot;
14243   allow_naked_reg = saved_naked_reg;
14244
14245   if (exp->X_op == O_register && exp->X_add_number >= 0)
14246     {
14247       if ((addressT) exp->X_add_number < i386_regtab_size)
14248         {
14249           exp->X_op = O_constant;
14250           exp->X_add_number = i386_regtab[exp->X_add_number]
14251                               .dw2_regnum[flag_code >> 1];
14252         }
14253       else
14254         exp->X_op = O_illegal;
14255     }
14256 }
14257
14258 void
14259 tc_x86_frame_initial_instructions (void)
14260 {
14261   static unsigned int sp_regno[2];
14262
14263   if (!sp_regno[flag_code >> 1])
14264     {
14265       char *saved_input = input_line_pointer;
14266       char sp[][4] = {"esp", "rsp"};
14267       expressionS exp;
14268
14269       input_line_pointer = sp[flag_code >> 1];
14270       tc_x86_parse_to_dw2regnum (&exp);
14271       gas_assert (exp.X_op == O_constant);
14272       sp_regno[flag_code >> 1] = exp.X_add_number;
14273       input_line_pointer = saved_input;
14274     }
14275
14276   cfi_add_CFA_def_cfa (sp_regno[flag_code >> 1], -x86_cie_data_alignment);
14277   cfi_add_CFA_offset (x86_dwarf2_return_column, x86_cie_data_alignment);
14278 }
14279
14280 int
14281 x86_dwarf2_addr_size (void)
14282 {
14283 #if defined (OBJ_MAYBE_ELF) || defined (OBJ_ELF)
14284   if (x86_elf_abi == X86_64_X32_ABI)
14285     return 4;
14286 #endif
14287   return bfd_arch_bits_per_address (stdoutput) / 8;
14288 }
14289
14290 int
14291 i386_elf_section_type (const char *str, size_t len)
14292 {
14293   if (flag_code == CODE_64BIT
14294       && len == sizeof ("unwind") - 1
14295       && strncmp (str, "unwind", 6) == 0)
14296     return SHT_X86_64_UNWIND;
14297
14298   return -1;
14299 }
14300
14301 #ifdef TE_SOLARIS
14302 void
14303 i386_solaris_fix_up_eh_frame (segT sec)
14304 {
14305   if (flag_code == CODE_64BIT)
14306     elf_section_type (sec) = SHT_X86_64_UNWIND;
14307 }
14308 #endif
14309
14310 #ifdef TE_PE
14311 void
14312 tc_pe_dwarf2_emit_offset (symbolS *symbol, unsigned int size)
14313 {
14314   expressionS exp;
14315
14316   exp.X_op = O_secrel;
14317   exp.X_add_symbol = symbol;
14318   exp.X_add_number = 0;
14319   emit_expr (&exp, size);
14320 }
14321 #endif
14322
14323 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
14324 /* For ELF on x86-64, add support for SHF_X86_64_LARGE.  */
14325
14326 bfd_vma
14327 x86_64_section_letter (int letter, const char **ptr_msg)
14328 {
14329   if (flag_code == CODE_64BIT)
14330     {
14331       if (letter == 'l')
14332         return SHF_X86_64_LARGE;
14333
14334       *ptr_msg = _("bad .section directive: want a,l,w,x,M,S,G,T in string");
14335     }
14336   else
14337     *ptr_msg = _("bad .section directive: want a,w,x,M,S,G,T in string");
14338   return -1;
14339 }
14340
14341 bfd_vma
14342 x86_64_section_word (char *str, size_t len)
14343 {
14344   if (len == 5 && flag_code == CODE_64BIT && startswith (str, "large"))
14345     return SHF_X86_64_LARGE;
14346
14347   return -1;
14348 }
14349
14350 static void
14351 handle_large_common (int small ATTRIBUTE_UNUSED)
14352 {
14353   if (flag_code != CODE_64BIT)
14354     {
14355       s_comm_internal (0, elf_common_parse);
14356       as_warn (_(".largecomm supported only in 64bit mode, producing .comm"));
14357     }
14358   else
14359     {
14360       static segT lbss_section;
14361       asection *saved_com_section_ptr = elf_com_section_ptr;
14362       asection *saved_bss_section = bss_section;
14363
14364       if (lbss_section == NULL)
14365         {
14366           flagword applicable;
14367           segT seg = now_seg;
14368           subsegT subseg = now_subseg;
14369
14370           /* The .lbss section is for local .largecomm symbols.  */
14371           lbss_section = subseg_new (".lbss", 0);
14372           applicable = bfd_applicable_section_flags (stdoutput);
14373           bfd_set_section_flags (lbss_section, applicable & SEC_ALLOC);
14374           seg_info (lbss_section)->bss = 1;
14375
14376           subseg_set (seg, subseg);
14377         }
14378
14379       elf_com_section_ptr = &_bfd_elf_large_com_section;
14380       bss_section = lbss_section;
14381
14382       s_comm_internal (0, elf_common_parse);
14383
14384       elf_com_section_ptr = saved_com_section_ptr;
14385       bss_section = saved_bss_section;
14386     }
14387 }
14388 #endif /* OBJ_ELF || OBJ_MAYBE_ELF */