gas/config/tc-i386.c

   1 /* tc-i386.c -- Assemble code for the Intel 80386
   2    Copyright (C) 1989-2016 Free Software Foundation, Inc.
   3
   4    This file is part of GAS, the GNU Assembler.
   5
   6    GAS is free software; you can redistribute it and/or modify
   7    it under the terms of the GNU General Public License as published by
   8    the Free Software Foundation; either version 3, or (at your option)
   9    any later version.
  10
  11    GAS is distributed in the hope that it will be useful,
  12    but WITHOUT ANY WARRANTY; without even the implied warranty of
  13    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
  14    GNU General Public License for more details.
  15
  16    You should have received a copy of the GNU General Public License
  17    along with GAS; see the file COPYING.  If not, write to the Free
  18    Software Foundation, 51 Franklin Street - Fifth Floor, Boston, MA
  19    02110-1301, USA.  */
  20
  21 /* Intel 80386 machine specific gas.
  22    Written by Eliot Dresselhaus (eliot@mgm.mit.edu).
  23    x86_64 support by Jan Hubicka (jh@suse.cz)
  24    VIA PadLock support by Michal Ludvig (mludvig@suse.cz)
  25    Bugs & suggestions are completely welcome.  This is free software.
  26    Please help us make it better.  */
  27
  28 #include "as.h"
  29 #include "safe-ctype.h"
  30 #include "subsegs.h"
  31 #include "dwarf2dbg.h"
  32 #include "dw2gencfi.h"
  33 #include "elf/x86-64.h"
  34 #include "opcodes/i386-init.h"
  35
  36 #ifndef REGISTER_WARNINGS
  37 #define REGISTER_WARNINGS 1
  38 #endif
  39
  40 #ifndef INFER_ADDR_PREFIX
  41 #define INFER_ADDR_PREFIX 1
  42 #endif
  43
  44 #ifndef DEFAULT_ARCH
  45 #define DEFAULT_ARCH "i386"
  46 #endif
  47
  48 #ifndef INLINE
  49 #if __GNUC__ >= 2
  50 #define INLINE __inline__
  51 #else
  52 #define INLINE
  53 #endif
  54 #endif
  55
  56 /* Prefixes will be emitted in the order defined below.
  57    WAIT_PREFIX must be the first prefix since FWAIT is really is an
  58    instruction, and so must come before any prefixes.
  59    The preferred prefix order is SEG_PREFIX, ADDR_PREFIX, DATA_PREFIX,
  60    REP_PREFIX/HLE_PREFIX, LOCK_PREFIX.  */
  61 #define WAIT_PREFIX     0
  62 #define SEG_PREFIX      1
  63 #define ADDR_PREFIX     2
  64 #define DATA_PREFIX     3
  65 #define REP_PREFIX      4
  66 #define HLE_PREFIX      REP_PREFIX
  67 #define BND_PREFIX      REP_PREFIX
  68 #define LOCK_PREFIX     5
  69 #define REX_PREFIX      6       /* must come last.  */
  70 #define MAX_PREFIXES    7       /* max prefixes per opcode */
  71
  72 /* we define the syntax here (modulo base,index,scale syntax) */
  73 #define REGISTER_PREFIX '%'
  74 #define IMMEDIATE_PREFIX '$'
  75 #define ABSOLUTE_PREFIX '*'
  76
  77 /* these are the instruction mnemonic suffixes in AT&T syntax or
  78    memory operand size in Intel syntax.  */
  79 #define WORD_MNEM_SUFFIX  'w'
  80 #define BYTE_MNEM_SUFFIX  'b'
  81 #define SHORT_MNEM_SUFFIX 's'
  82 #define LONG_MNEM_SUFFIX  'l'
  83 #define QWORD_MNEM_SUFFIX  'q'
  84 #define XMMWORD_MNEM_SUFFIX  'x'
  85 #define YMMWORD_MNEM_SUFFIX 'y'
  86 #define ZMMWORD_MNEM_SUFFIX 'z'
  87 /* Intel Syntax.  Use a non-ascii letter since since it never appears
  88    in instructions.  */
  89 #define LONG_DOUBLE_MNEM_SUFFIX '\1'
  90
  91 #define END_OF_INSN '\0'
  92
  93 /*
  94   'templates' is for grouping together 'template' structures for opcodes
  95   of the same name.  This is only used for storing the insns in the grand
  96   ole hash table of insns.
  97   The templates themselves start at START and range up to (but not including)
  98   END.
  99   */
 100 typedef struct
 101 {
 102   const insn_template *start;
 103   const insn_template *end;
 104 }
 105 templates;
 106
 107 /* 386 operand encoding bytes:  see 386 book for details of this.  */
 108 typedef struct
 109 {
 110   unsigned int regmem;  /* codes register or memory operand */
 111   unsigned int reg;     /* codes register operand (or extended opcode) */
 112   unsigned int mode;    /* how to interpret regmem & reg */
 113 }
 114 modrm_byte;
 115
 116 /* x86-64 extension prefix.  */
 117 typedef int rex_byte;
 118
 119 /* 386 opcode byte to code indirect addressing.  */
 120 typedef struct
 121 {
 122   unsigned base;
 123   unsigned index;
 124   unsigned scale;
 125 }
 126 sib_byte;
 127
 128 /* x86 arch names, types and features */
 129 typedef struct
 130 {
 131   const char *name;             /* arch name */
 132   unsigned int len;             /* arch string length */
 133   enum processor_type type;     /* arch type */
 134   i386_cpu_flags flags;         /* cpu feature flags */
 135   unsigned int skip;            /* show_arch should skip this. */
 136   unsigned int negated;         /* turn off indicated flags.  */
 137 }
 138 arch_entry;
 139
 140 static void update_code_flag (int, int);
 141 static void set_code_flag (int);
 142 static void set_16bit_gcc_code_flag (int);
 143 static void set_intel_syntax (int);
 144 static void set_intel_mnemonic (int);
 145 static void set_allow_index_reg (int);
 146 static void set_check (int);
 147 static void set_cpu_arch (int);
 148 #ifdef TE_PE
 149 static void pe_directive_secrel (int);
 150 #endif
 151 static void signed_cons (int);
 152 static char *output_invalid (int c);
 153 static int i386_finalize_immediate (segT, expressionS *, i386_operand_type,
 154                                     const char *);
 155 static int i386_finalize_displacement (segT, expressionS *, i386_operand_type,
 156                                        const char *);
 157 static int i386_att_operand (char *);
 158 static int i386_intel_operand (char *, int);
 159 static int i386_intel_simplify (expressionS *);
 160 static int i386_intel_parse_name (const char *, expressionS *);
 161 static const reg_entry *parse_register (char *, char **);
 162 static char *parse_insn (char *, char *);
 163 static char *parse_operands (char *, const char *);
 164 static void swap_operands (void);
 165 static void swap_2_operands (int, int);
 166 static void optimize_imm (void);
 167 static void optimize_disp (void);
 168 static const insn_template *match_template (void);
 169 static int check_string (void);
 170 static int process_suffix (void);
 171 static int check_byte_reg (void);
 172 static int check_long_reg (void);
 173 static int check_qword_reg (void);
 174 static int check_word_reg (void);
 175 static int finalize_imm (void);
 176 static int process_operands (void);
 177 static const seg_entry *build_modrm_byte (void);
 178 static void output_insn (void);
 179 static void output_imm (fragS *, offsetT);
 180 static void output_disp (fragS *, offsetT);
 181 #ifndef I386COFF
 182 static void s_bss (int);
 183 #endif
 184 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
 185 static void handle_large_common (int small ATTRIBUTE_UNUSED);
 186 #endif
 187
 188 static const char *default_arch = DEFAULT_ARCH;
 189
 190 /* This struct describes rounding control and SAE in the instruction.  */
 191 struct RC_Operation
 192 {
 193   enum rc_type
 194     {
 195       rne = 0,
 196       rd,
 197       ru,
 198       rz,
 199       saeonly
 200     } type;
 201   int operand;
 202 };
 203
 204 static struct RC_Operation rc_op;
 205
 206 /* The struct describes masking, applied to OPERAND in the instruction.
 207    MASK is a pointer to the corresponding mask register.  ZEROING tells
 208    whether merging or zeroing mask is used.  */
 209 struct Mask_Operation
 210 {
 211   const reg_entry *mask;
 212   unsigned int zeroing;
 213   /* The operand where this operation is associated.  */
 214   int operand;
 215 };
 216
 217 static struct Mask_Operation mask_op;
 218
 219 /* The struct describes broadcasting, applied to OPERAND.  FACTOR is
 220    broadcast factor.  */
 221 struct Broadcast_Operation
 222 {
 223   /* Type of broadcast: no broadcast, {1to8}, or {1to16}.  */
 224   int type;
 225
 226   /* Index of broadcasted operand.  */
 227   int operand;
 228 };
 229
 230 static struct Broadcast_Operation broadcast_op;
 231
 232 /* VEX prefix.  */
 233 typedef struct
 234 {
 235   /* VEX prefix is either 2 byte or 3 byte.  EVEX is 4 byte.  */
 236   unsigned char bytes[4];
 237   unsigned int length;
 238   /* Destination or source register specifier.  */
 239   const reg_entry *register_specifier;
 240 } vex_prefix;
 241
 242 /* 'md_assemble ()' gathers together information and puts it into a
 243    i386_insn.  */
 244
 245 union i386_op
 246   {
 247     expressionS *disps;
 248     expressionS *imms;
 249     const reg_entry *regs;
 250   };
 251
 252 enum i386_error
 253   {
 254     operand_size_mismatch,
 255     operand_type_mismatch,
 256     register_type_mismatch,
 257     number_of_operands_mismatch,
 258     invalid_instruction_suffix,
 259     bad_imm4,
 260     old_gcc_only,
 261     unsupported_with_intel_mnemonic,
 262     unsupported_syntax,
 263     unsupported,
 264     invalid_vsib_address,
 265     invalid_vector_register_set,
 266     unsupported_vector_index_register,
 267     unsupported_broadcast,
 268     broadcast_not_on_src_operand,
 269     broadcast_needed,
 270     unsupported_masking,
 271     mask_not_on_destination,
 272     no_default_mask,
 273     unsupported_rc_sae,
 274     rc_sae_operand_not_last_imm,
 275     invalid_register_operand,
 276     try_vector_disp8
 277   };
 278
 279 struct _i386_insn
 280   {
 281     /* TM holds the template for the insn were currently assembling.  */
 282     insn_template tm;
 283
 284     /* SUFFIX holds the instruction size suffix for byte, word, dword
 285        or qword, if given.  */
 286     char suffix;
 287
 288     /* OPERANDS gives the number of given operands.  */
 289     unsigned int operands;
 290
 291     /* REG_OPERANDS, DISP_OPERANDS, MEM_OPERANDS, IMM_OPERANDS give the number
 292        of given register, displacement, memory operands and immediate
 293        operands.  */
 294     unsigned int reg_operands, disp_operands, mem_operands, imm_operands;
 295
 296     /* TYPES [i] is the type (see above #defines) which tells us how to
 297        use OP[i] for the corresponding operand.  */
 298     i386_operand_type types[MAX_OPERANDS];
 299
 300     /* Displacement expression, immediate expression, or register for each
 301        operand.  */
 302     union i386_op op[MAX_OPERANDS];
 303
 304     /* Flags for operands.  */
 305     unsigned int flags[MAX_OPERANDS];
 306 #define Operand_PCrel 1
 307
 308     /* Relocation type for operand */
 309     enum bfd_reloc_code_real reloc[MAX_OPERANDS];
 310
 311     /* BASE_REG, INDEX_REG, and LOG2_SCALE_FACTOR are used to encode
 312        the base index byte below.  */
 313     const reg_entry *base_reg;
 314     const reg_entry *index_reg;
 315     unsigned int log2_scale_factor;
 316
 317     /* SEG gives the seg_entries of this insn.  They are zero unless
 318        explicit segment overrides are given.  */
 319     const seg_entry *seg[2];
 320
 321     /* PREFIX holds all the given prefix opcodes (usually null).
 322        PREFIXES is the number of prefix opcodes.  */
 323     unsigned int prefixes;
 324     unsigned char prefix[MAX_PREFIXES];
 325
 326     /* RM and SIB are the modrm byte and the sib byte where the
 327        addressing modes of this insn are encoded.  */
 328     modrm_byte rm;
 329     rex_byte rex;
 330     rex_byte vrex;
 331     sib_byte sib;
 332     vex_prefix vex;
 333
 334     /* Masking attributes.  */
 335     struct Mask_Operation *mask;
 336
 337     /* Rounding control and SAE attributes.  */
 338     struct RC_Operation *rounding;
 339
 340     /* Broadcasting attributes.  */
 341     struct Broadcast_Operation *broadcast;
 342
 343     /* Compressed disp8*N attribute.  */
 344     unsigned int memshift;
 345
 346     /* Swap operand in encoding.  */
 347     unsigned int swap_operand;
 348
 349     /* Prefer 8bit or 32bit displacement in encoding.  */
 350     enum
 351       {
 352         disp_encoding_default = 0,
 353         disp_encoding_8bit,
 354         disp_encoding_32bit
 355       } disp_encoding;
 356
 357     /* REP prefix.  */
 358     const char *rep_prefix;
 359
 360     /* HLE prefix.  */
 361     const char *hle_prefix;
 362
 363     /* Have BND prefix.  */
 364     const char *bnd_prefix;
 365
 366     /* Need VREX to support upper 16 registers.  */
 367     int need_vrex;
 368
 369     /* Error message.  */
 370     enum i386_error error;
 371   };
 372
 373 typedef struct _i386_insn i386_insn;
 374
 375 /* Link RC type with corresponding string, that'll be looked for in
 376    asm.  */
 377 struct RC_name
 378 {
 379   enum rc_type type;
 380   const char *name;
 381   unsigned int len;
 382 };
 383
 384 static const struct RC_name RC_NamesTable[] =
 385 {
 386   {  rne, STRING_COMMA_LEN ("rn-sae") },
 387   {  rd,  STRING_COMMA_LEN ("rd-sae") },
 388   {  ru,  STRING_COMMA_LEN ("ru-sae") },
 389   {  rz,  STRING_COMMA_LEN ("rz-sae") },
 390   {  saeonly,  STRING_COMMA_LEN ("sae") },
 391 };
 392
 393 /* List of chars besides those in app.c:symbol_chars that can start an
 394    operand.  Used to prevent the scrubber eating vital white-space.  */
 395 const char extra_symbol_chars[] = "*%-([{"
 396 #ifdef LEX_AT
 397         "@"
 398 #endif
 399 #ifdef LEX_QM
 400         "?"
 401 #endif
 402         ;
 403
 404 #if (defined (TE_I386AIX)                               \
 405      || ((defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)) \
 406          && !defined (TE_GNU)                           \
 407          && !defined (TE_LINUX)                         \
 408          && !defined (TE_NACL)                          \
 409          && !defined (TE_NETWARE)                       \
 410          && !defined (TE_FreeBSD)                       \
 411          && !defined (TE_DragonFly)                     \
 412          && !defined (TE_NetBSD)))
 413 /* This array holds the chars that always start a comment.  If the
 414    pre-processor is disabled, these aren't very useful.  The option
 415    --divide will remove '/' from this list.  */
 416 const char *i386_comment_chars = "#/";
 417 #define SVR4_COMMENT_CHARS 1
 418 #define PREFIX_SEPARATOR '\\'
 419
 420 #else
 421 const char *i386_comment_chars = "#";
 422 #define PREFIX_SEPARATOR '/'
 423 #endif
 424
 425 /* This array holds the chars that only start a comment at the beginning of
 426    a line.  If the line seems to have the form '# 123 filename'
 427    .line and .file directives will appear in the pre-processed output.
 428    Note that input_file.c hand checks for '#' at the beginning of the
 429    first line of the input file.  This is because the compiler outputs
 430    #NO_APP at the beginning of its output.
 431    Also note that comments started like this one will always work if
 432    '/' isn't otherwise defined.  */
 433 const char line_comment_chars[] = "#/";
 434
 435 const char line_separator_chars[] = ";";
 436
 437 /* Chars that can be used to separate mant from exp in floating point
 438    nums.  */
 439 const char EXP_CHARS[] = "eE";
 440
 441 /* Chars that mean this number is a floating point constant
 442    As in 0f12.456
 443    or    0d1.2345e12.  */
 444 const char FLT_CHARS[] = "fFdDxX";
 445
 446 /* Tables for lexical analysis.  */
 447 static char mnemonic_chars[256];
 448 static char register_chars[256];
 449 static char operand_chars[256];
 450 static char identifier_chars[256];
 451 static char digit_chars[256];
 452
 453 /* Lexical macros.  */
 454 #define is_mnemonic_char(x) (mnemonic_chars[(unsigned char) x])
 455 #define is_operand_char(x) (operand_chars[(unsigned char) x])
 456 #define is_register_char(x) (register_chars[(unsigned char) x])
 457 #define is_space_char(x) ((x) == ' ')
 458 #define is_identifier_char(x) (identifier_chars[(unsigned char) x])
 459 #define is_digit_char(x) (digit_chars[(unsigned char) x])
 460
 461 /* All non-digit non-letter characters that may occur in an operand.  */
 462 static char operand_special_chars[] = "%$-+(,)*._~/<>|&^!:[@]";
 463
 464 /* md_assemble() always leaves the strings it's passed unaltered.  To
 465    effect this we maintain a stack of saved characters that we've smashed
 466    with '\0's (indicating end of strings for various sub-fields of the
 467    assembler instruction).  */
 468 static char save_stack[32];
 469 static char *save_stack_p;
 470 #define END_STRING_AND_SAVE(s) \
 471         do { *save_stack_p++ = *(s); *(s) = '\0'; } while (0)
 472 #define RESTORE_END_STRING(s) \
 473         do { *(s) = *--save_stack_p; } while (0)
 474
 475 /* The instruction we're assembling.  */
 476 static i386_insn i;
 477
 478 /* Possible templates for current insn.  */
 479 static const templates *current_templates;
 480
 481 /* Per instruction expressionS buffers: max displacements & immediates.  */
 482 static expressionS disp_expressions[MAX_MEMORY_OPERANDS];
 483 static expressionS im_expressions[MAX_IMMEDIATE_OPERANDS];
 484
 485 /* Current operand we are working on.  */
 486 static int this_operand = -1;
 487
 488 /* We support four different modes.  FLAG_CODE variable is used to distinguish
 489    these.  */
 490
 491 enum flag_code {
 492         CODE_32BIT,
 493         CODE_16BIT,
 494         CODE_64BIT };
 495
 496 static enum flag_code flag_code;
 497 static unsigned int object_64bit;
 498 static unsigned int disallow_64bit_reloc;
 499 static int use_rela_relocations = 0;
 500
 501 #if ((defined (OBJ_MAYBE_COFF) && defined (OBJ_MAYBE_AOUT)) \
 502      || defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
 503      || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
 504
 505 /* The ELF ABI to use.  */
 506 enum x86_elf_abi
 507 {
 508   I386_ABI,
 509   X86_64_ABI,
 510   X86_64_X32_ABI
 511 };
 512
 513 static enum x86_elf_abi x86_elf_abi = I386_ABI;
 514 #endif
 515
 516 #if defined (TE_PE) || defined (TE_PEP)
 517 /* Use big object file format.  */
 518 static int use_big_obj = 0;
 519 #endif
 520
 521 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
 522 /* 1 if generating code for a shared library.  */
 523 static int shared = 0;
 524 #endif
 525
 526 /* 1 for intel syntax,
 527    0 if att syntax.  */
 528 static int intel_syntax = 0;
 529
 530 /* 1 for intel mnemonic,
 531    0 if att mnemonic.  */
 532 static int intel_mnemonic = !SYSV386_COMPAT;
 533
 534 /* 1 if support old (<= 2.8.1) versions of gcc.  */
 535 static int old_gcc = OLDGCC_COMPAT;
 536
 537 /* 1 if pseudo registers are permitted.  */
 538 static int allow_pseudo_reg = 0;
 539
 540 /* 1 if register prefix % not required.  */
 541 static int allow_naked_reg = 0;
 542
 543 /* 1 if the assembler should add BND prefix for all control-tranferring
 544    instructions supporting it, even if this prefix wasn't specified
 545    explicitly.  */
 546 static int add_bnd_prefix = 0;
 547
 548 /* 1 if pseudo index register, eiz/riz, is allowed .  */
 549 static int allow_index_reg = 0;
 550
 551 /* 1 if the assembler should ignore LOCK prefix, even if it was
 552    specified explicitly.  */
 553 static int omit_lock_prefix = 0;
 554
 555 /* 1 if the assembler should encode lfence, mfence, and sfence as
 556    "lock addl $0, (%{re}sp)".  */
 557 static int avoid_fence = 0;
 558
 559 /* 1 if the assembler should generate relax relocations.  */
 560
 561 static int generate_relax_relocations
 562   = DEFAULT_GENERATE_X86_RELAX_RELOCATIONS;
 563
 564 static enum check_kind
 565   {
 566     check_none = 0,
 567     check_warning,
 568     check_error
 569   }
 570 sse_check, operand_check = check_warning;
 571
 572 /* Register prefix used for error message.  */
 573 static const char *register_prefix = "%";
 574
 575 /* Used in 16 bit gcc mode to add an l suffix to call, ret, enter,
 576    leave, push, and pop instructions so that gcc has the same stack
 577    frame as in 32 bit mode.  */
 578 static char stackop_size = '\0';
 579
 580 /* Non-zero to optimize code alignment.  */
 581 int optimize_align_code = 1;
 582
 583 /* Non-zero to quieten some warnings.  */
 584 static int quiet_warnings = 0;
 585
 586 /* CPU name.  */
 587 static const char *cpu_arch_name = NULL;
 588 static char *cpu_sub_arch_name = NULL;
 589
 590 /* CPU feature flags.  */
 591 static i386_cpu_flags cpu_arch_flags = CPU_UNKNOWN_FLAGS;
 592
 593 /* If we have selected a cpu we are generating instructions for.  */
 594 static int cpu_arch_tune_set = 0;
 595
 596 /* Cpu we are generating instructions for.  */
 597 enum processor_type cpu_arch_tune = PROCESSOR_UNKNOWN;
 598
 599 /* CPU feature flags of cpu we are generating instructions for.  */
 600 static i386_cpu_flags cpu_arch_tune_flags;
 601
 602 /* CPU instruction set architecture used.  */
 603 enum processor_type cpu_arch_isa = PROCESSOR_UNKNOWN;
 604
 605 /* CPU feature flags of instruction set architecture used.  */
 606 i386_cpu_flags cpu_arch_isa_flags;
 607
 608 /* If set, conditional jumps are not automatically promoted to handle
 609    larger than a byte offset.  */
 610 static unsigned int no_cond_jump_promotion = 0;
 611
 612 /* Encode SSE instructions with VEX prefix.  */
 613 static unsigned int sse2avx;
 614
 615 /* Encode scalar AVX instructions with specific vector length.  */
 616 static enum
 617   {
 618     vex128 = 0,
 619     vex256
 620   } avxscalar;
 621
 622 /* Encode scalar EVEX LIG instructions with specific vector length.  */
 623 static enum
 624   {
 625     evexl128 = 0,
 626     evexl256,
 627     evexl512
 628   } evexlig;
 629
 630 /* Encode EVEX WIG instructions with specific evex.w.  */
 631 static enum
 632   {
 633     evexw0 = 0,
 634     evexw1
 635   } evexwig;
 636
 637 /* Value to encode in EVEX RC bits, for SAE-only instructions.  */
 638 static enum rc_type evexrcig = rne;
 639
 640 /* Pre-defined "_GLOBAL_OFFSET_TABLE_".  */
 641 static symbolS *GOT_symbol;
 642
 643 /* The dwarf2 return column, adjusted for 32 or 64 bit.  */
 644 unsigned int x86_dwarf2_return_column;
 645
 646 /* The dwarf2 data alignment, adjusted for 32 or 64 bit.  */
 647 int x86_cie_data_alignment;
 648
 649 /* Interface to relax_segment.
 650    There are 3 major relax states for 386 jump insns because the
 651    different types of jumps add different sizes to frags when we're
 652    figuring out what sort of jump to choose to reach a given label.  */
 653
 654 /* Types.  */
 655 #define UNCOND_JUMP 0
 656 #define COND_JUMP 1
 657 #define COND_JUMP86 2
 658
 659 /* Sizes.  */
 660 #define CODE16  1
 661 #define SMALL   0
 662 #define SMALL16 (SMALL | CODE16)
 663 #define BIG     2
 664 #define BIG16   (BIG | CODE16)
 665
 666 #ifndef INLINE
 667 #ifdef __GNUC__
 668 #define INLINE __inline__
 669 #else
 670 #define INLINE
 671 #endif
 672 #endif
 673
 674 #define ENCODE_RELAX_STATE(type, size) \
 675   ((relax_substateT) (((type) << 2) | (size)))
 676 #define TYPE_FROM_RELAX_STATE(s) \
 677   ((s) >> 2)
 678 #define DISP_SIZE_FROM_RELAX_STATE(s) \
 679     ((((s) & 3) == BIG ? 4 : (((s) & 3) == BIG16 ? 2 : 1)))
 680
 681 /* This table is used by relax_frag to promote short jumps to long
 682    ones where necessary.  SMALL (short) jumps may be promoted to BIG
 683    (32 bit long) ones, and SMALL16 jumps to BIG16 (16 bit long).  We
 684    don't allow a short jump in a 32 bit code segment to be promoted to
 685    a 16 bit offset jump because it's slower (requires data size
 686    prefix), and doesn't work, unless the destination is in the bottom
 687    64k of the code segment (The top 16 bits of eip are zeroed).  */
 688
 689 const relax_typeS md_relax_table[] =
 690 {
 691   /* The fields are:
 692      1) most positive reach of this state,
 693      2) most negative reach of this state,
 694      3) how many bytes this mode will have in the variable part of the frag
 695      4) which index into the table to try if we can't fit into this one.  */
 696
 697   /* UNCOND_JUMP states.  */
 698   {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (UNCOND_JUMP, BIG)},
 699   {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (UNCOND_JUMP, BIG16)},
 700   /* dword jmp adds 4 bytes to frag:
 701      0 extra opcode bytes, 4 displacement bytes.  */
 702   {0, 0, 4, 0},
 703   /* word jmp adds 2 byte2 to frag:
 704      0 extra opcode bytes, 2 displacement bytes.  */
 705   {0, 0, 2, 0},
 706
 707   /* COND_JUMP states.  */
 708   {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP, BIG)},
 709   {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP, BIG16)},
 710   /* dword conditionals adds 5 bytes to frag:
 711      1 extra opcode byte, 4 displacement bytes.  */
 712   {0, 0, 5, 0},
 713   /* word conditionals add 3 bytes to frag:
 714      1 extra opcode byte, 2 displacement bytes.  */
 715   {0, 0, 3, 0},
 716
 717   /* COND_JUMP86 states.  */
 718   {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP86, BIG)},
 719   {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP86, BIG16)},
 720   /* dword conditionals adds 5 bytes to frag:
 721      1 extra opcode byte, 4 displacement bytes.  */
 722   {0, 0, 5, 0},
 723   /* word conditionals add 4 bytes to frag:
 724      1 displacement byte and a 3 byte long branch insn.  */
 725   {0, 0, 4, 0}
 726 };
 727
 728 static const arch_entry cpu_arch[] =
 729 {
 730   /* Do not replace the first two entries - i386_target_format()
 731      relies on them being there in this order.  */
 732   { STRING_COMMA_LEN ("generic32"), PROCESSOR_GENERIC32,
 733     CPU_GENERIC32_FLAGS, 0, 0 },
 734   { STRING_COMMA_LEN ("generic64"), PROCESSOR_GENERIC64,
 735     CPU_GENERIC64_FLAGS, 0, 0 },
 736   { STRING_COMMA_LEN ("i8086"), PROCESSOR_UNKNOWN,
 737     CPU_NONE_FLAGS, 0, 0 },
 738   { STRING_COMMA_LEN ("i186"), PROCESSOR_UNKNOWN,
 739     CPU_I186_FLAGS, 0, 0 },
 740   { STRING_COMMA_LEN ("i286"), PROCESSOR_UNKNOWN,
 741     CPU_I286_FLAGS, 0, 0 },
 742   { STRING_COMMA_LEN ("i386"), PROCESSOR_I386,
 743     CPU_I386_FLAGS, 0, 0 },
 744   { STRING_COMMA_LEN ("i486"), PROCESSOR_I486,
 745     CPU_I486_FLAGS, 0, 0 },
 746   { STRING_COMMA_LEN ("i586"), PROCESSOR_PENTIUM,
 747     CPU_I586_FLAGS, 0, 0 },
 748   { STRING_COMMA_LEN ("i686"), PROCESSOR_PENTIUMPRO,
 749     CPU_I686_FLAGS, 0, 0 },
 750   { STRING_COMMA_LEN ("pentium"), PROCESSOR_PENTIUM,
 751     CPU_I586_FLAGS, 0, 0 },
 752   { STRING_COMMA_LEN ("pentiumpro"), PROCESSOR_PENTIUMPRO,
 753     CPU_PENTIUMPRO_FLAGS, 0, 0 },
 754   { STRING_COMMA_LEN ("pentiumii"), PROCESSOR_PENTIUMPRO,
 755     CPU_P2_FLAGS, 0, 0 },
 756   { STRING_COMMA_LEN ("pentiumiii"),PROCESSOR_PENTIUMPRO,
 757     CPU_P3_FLAGS, 0, 0 },
 758   { STRING_COMMA_LEN ("pentium4"), PROCESSOR_PENTIUM4,
 759     CPU_P4_FLAGS, 0, 0 },
 760   { STRING_COMMA_LEN ("prescott"), PROCESSOR_NOCONA,
 761     CPU_CORE_FLAGS, 0, 0 },
 762   { STRING_COMMA_LEN ("nocona"), PROCESSOR_NOCONA,
 763     CPU_NOCONA_FLAGS, 0, 0 },
 764   { STRING_COMMA_LEN ("yonah"), PROCESSOR_CORE,
 765     CPU_CORE_FLAGS, 1, 0 },
 766   { STRING_COMMA_LEN ("core"), PROCESSOR_CORE,
 767     CPU_CORE_FLAGS, 0, 0 },
 768   { STRING_COMMA_LEN ("merom"), PROCESSOR_CORE2,
 769     CPU_CORE2_FLAGS, 1, 0 },
 770   { STRING_COMMA_LEN ("core2"), PROCESSOR_CORE2,
 771     CPU_CORE2_FLAGS, 0, 0 },
 772   { STRING_COMMA_LEN ("corei7"), PROCESSOR_COREI7,
 773     CPU_COREI7_FLAGS, 0, 0 },
 774   { STRING_COMMA_LEN ("l1om"), PROCESSOR_L1OM,
 775     CPU_L1OM_FLAGS, 0, 0 },
 776   { STRING_COMMA_LEN ("k1om"), PROCESSOR_K1OM,
 777     CPU_K1OM_FLAGS, 0, 0 },
 778   { STRING_COMMA_LEN ("iamcu"), PROCESSOR_IAMCU,
 779     CPU_IAMCU_FLAGS, 0, 0 },
 780   { STRING_COMMA_LEN ("k6"), PROCESSOR_K6,
 781     CPU_K6_FLAGS, 0, 0 },
 782   { STRING_COMMA_LEN ("k6_2"), PROCESSOR_K6,
 783     CPU_K6_2_FLAGS, 0, 0 },
 784   { STRING_COMMA_LEN ("athlon"), PROCESSOR_ATHLON,
 785     CPU_ATHLON_FLAGS, 0, 0 },
 786   { STRING_COMMA_LEN ("sledgehammer"), PROCESSOR_K8,
 787     CPU_K8_FLAGS, 1, 0 },
 788   { STRING_COMMA_LEN ("opteron"), PROCESSOR_K8,
 789     CPU_K8_FLAGS, 0, 0 },
 790   { STRING_COMMA_LEN ("k8"), PROCESSOR_K8,
 791     CPU_K8_FLAGS, 0, 0 },
 792   { STRING_COMMA_LEN ("amdfam10"), PROCESSOR_AMDFAM10,
 793     CPU_AMDFAM10_FLAGS, 0, 0 },
 794   { STRING_COMMA_LEN ("bdver1"), PROCESSOR_BD,
 795     CPU_BDVER1_FLAGS, 0, 0 },
 796   { STRING_COMMA_LEN ("bdver2"), PROCESSOR_BD,
 797     CPU_BDVER2_FLAGS, 0, 0 },
 798   { STRING_COMMA_LEN ("bdver3"), PROCESSOR_BD,
 799     CPU_BDVER3_FLAGS, 0, 0 },
 800   { STRING_COMMA_LEN ("bdver4"), PROCESSOR_BD,
 801     CPU_BDVER4_FLAGS, 0, 0 },
 802   { STRING_COMMA_LEN ("znver1"), PROCESSOR_ZNVER,
 803     CPU_ZNVER1_FLAGS, 0, 0 },
 804   { STRING_COMMA_LEN ("btver1"), PROCESSOR_BT,
 805     CPU_BTVER1_FLAGS, 0, 0 },
 806   { STRING_COMMA_LEN ("btver2"), PROCESSOR_BT,
 807     CPU_BTVER2_FLAGS, 0, 0 },
 808   { STRING_COMMA_LEN (".8087"), PROCESSOR_UNKNOWN,
 809     CPU_8087_FLAGS, 0, 0 },
 810   { STRING_COMMA_LEN (".287"), PROCESSOR_UNKNOWN,
 811     CPU_287_FLAGS, 0, 0 },
 812   { STRING_COMMA_LEN (".387"), PROCESSOR_UNKNOWN,
 813     CPU_387_FLAGS, 0, 0 },
 814   { STRING_COMMA_LEN (".no87"), PROCESSOR_UNKNOWN,
 815     CPU_ANY87_FLAGS, 0, 1 },
 816   { STRING_COMMA_LEN (".mmx"), PROCESSOR_UNKNOWN,
 817     CPU_MMX_FLAGS, 0, 0 },
 818   { STRING_COMMA_LEN (".nommx"), PROCESSOR_UNKNOWN,
 819     CPU_3DNOWA_FLAGS, 0, 1 },
 820   { STRING_COMMA_LEN (".sse"), PROCESSOR_UNKNOWN,
 821     CPU_SSE_FLAGS, 0, 0 },
 822   { STRING_COMMA_LEN (".sse2"), PROCESSOR_UNKNOWN,
 823     CPU_SSE2_FLAGS, 0, 0 },
 824   { STRING_COMMA_LEN (".sse3"), PROCESSOR_UNKNOWN,
 825     CPU_SSE3_FLAGS, 0, 0 },
 826   { STRING_COMMA_LEN (".ssse3"), PROCESSOR_UNKNOWN,
 827     CPU_SSSE3_FLAGS, 0, 0 },
 828   { STRING_COMMA_LEN (".sse4.1"), PROCESSOR_UNKNOWN,
 829     CPU_SSE4_1_FLAGS, 0, 0 },
 830   { STRING_COMMA_LEN (".sse4.2"), PROCESSOR_UNKNOWN,
 831     CPU_SSE4_2_FLAGS, 0, 0 },
 832   { STRING_COMMA_LEN (".sse4"), PROCESSOR_UNKNOWN,
 833     CPU_SSE4_2_FLAGS, 0, 0 },
 834   { STRING_COMMA_LEN (".nosse"), PROCESSOR_UNKNOWN,
 835     CPU_ANY_SSE_FLAGS, 0, 1 },
 836   { STRING_COMMA_LEN (".avx"), PROCESSOR_UNKNOWN,
 837     CPU_AVX_FLAGS, 0, 0 },
 838   { STRING_COMMA_LEN (".avx2"), PROCESSOR_UNKNOWN,
 839     CPU_AVX2_FLAGS, 0, 0 },
 840   { STRING_COMMA_LEN (".avx512f"), PROCESSOR_UNKNOWN,
 841     CPU_AVX512F_FLAGS, 0, 0 },
 842   { STRING_COMMA_LEN (".avx512cd"), PROCESSOR_UNKNOWN,
 843     CPU_AVX512CD_FLAGS, 0, 0 },
 844   { STRING_COMMA_LEN (".avx512er"), PROCESSOR_UNKNOWN,
 845     CPU_AVX512ER_FLAGS, 0, 0 },
 846   { STRING_COMMA_LEN (".avx512pf"), PROCESSOR_UNKNOWN,
 847     CPU_AVX512PF_FLAGS, 0, 0 },
 848   { STRING_COMMA_LEN (".avx512dq"), PROCESSOR_UNKNOWN,
 849     CPU_AVX512DQ_FLAGS, 0, 0 },
 850   { STRING_COMMA_LEN (".avx512bw"), PROCESSOR_UNKNOWN,
 851     CPU_AVX512BW_FLAGS, 0, 0 },
 852   { STRING_COMMA_LEN (".avx512vl"), PROCESSOR_UNKNOWN,
 853     CPU_AVX512VL_FLAGS, 0, 0 },
 854   { STRING_COMMA_LEN (".noavx"), PROCESSOR_UNKNOWN,
 855     CPU_ANY_AVX_FLAGS, 0, 1 },
 856   { STRING_COMMA_LEN (".vmx"), PROCESSOR_UNKNOWN,
 857     CPU_VMX_FLAGS, 0, 0 },
 858   { STRING_COMMA_LEN (".vmfunc"), PROCESSOR_UNKNOWN,
 859     CPU_VMFUNC_FLAGS, 0, 0 },
 860   { STRING_COMMA_LEN (".smx"), PROCESSOR_UNKNOWN,
 861     CPU_SMX_FLAGS, 0, 0 },
 862   { STRING_COMMA_LEN (".xsave"), PROCESSOR_UNKNOWN,
 863     CPU_XSAVE_FLAGS, 0, 0 },
 864   { STRING_COMMA_LEN (".xsaveopt"), PROCESSOR_UNKNOWN,
 865     CPU_XSAVEOPT_FLAGS, 0, 0 },
 866   { STRING_COMMA_LEN (".xsavec"), PROCESSOR_UNKNOWN,
 867     CPU_XSAVEC_FLAGS, 0, 0 },
 868   { STRING_COMMA_LEN (".xsaves"), PROCESSOR_UNKNOWN,
 869     CPU_XSAVES_FLAGS, 0, 0 },
 870   { STRING_COMMA_LEN (".aes"), PROCESSOR_UNKNOWN,
 871     CPU_AES_FLAGS, 0, 0 },
 872   { STRING_COMMA_LEN (".pclmul"), PROCESSOR_UNKNOWN,
 873     CPU_PCLMUL_FLAGS, 0, 0 },
 874   { STRING_COMMA_LEN (".clmul"), PROCESSOR_UNKNOWN,
 875     CPU_PCLMUL_FLAGS, 1, 0 },
 876   { STRING_COMMA_LEN (".fsgsbase"), PROCESSOR_UNKNOWN,
 877     CPU_FSGSBASE_FLAGS, 0, 0 },
 878   { STRING_COMMA_LEN (".rdrnd"), PROCESSOR_UNKNOWN,
 879     CPU_RDRND_FLAGS, 0, 0 },
 880   { STRING_COMMA_LEN (".f16c"), PROCESSOR_UNKNOWN,
 881     CPU_F16C_FLAGS, 0, 0 },
 882   { STRING_COMMA_LEN (".bmi2"), PROCESSOR_UNKNOWN,
 883     CPU_BMI2_FLAGS, 0, 0 },
 884   { STRING_COMMA_LEN (".fma"), PROCESSOR_UNKNOWN,
 885     CPU_FMA_FLAGS, 0, 0 },
 886   { STRING_COMMA_LEN (".fma4"), PROCESSOR_UNKNOWN,
 887     CPU_FMA4_FLAGS, 0, 0 },
 888   { STRING_COMMA_LEN (".xop"), PROCESSOR_UNKNOWN,
 889     CPU_XOP_FLAGS, 0, 0 },
 890   { STRING_COMMA_LEN (".lwp"), PROCESSOR_UNKNOWN,
 891     CPU_LWP_FLAGS, 0, 0 },
 892   { STRING_COMMA_LEN (".movbe"), PROCESSOR_UNKNOWN,
 893     CPU_MOVBE_FLAGS, 0, 0 },
 894   { STRING_COMMA_LEN (".cx16"), PROCESSOR_UNKNOWN,
 895     CPU_CX16_FLAGS, 0, 0 },
 896   { STRING_COMMA_LEN (".ept"), PROCESSOR_UNKNOWN,
 897     CPU_EPT_FLAGS, 0, 0 },
 898   { STRING_COMMA_LEN (".lzcnt"), PROCESSOR_UNKNOWN,
 899     CPU_LZCNT_FLAGS, 0, 0 },
 900   { STRING_COMMA_LEN (".hle"), PROCESSOR_UNKNOWN,
 901     CPU_HLE_FLAGS, 0, 0 },
 902   { STRING_COMMA_LEN (".rtm"), PROCESSOR_UNKNOWN,
 903     CPU_RTM_FLAGS, 0, 0 },
 904   { STRING_COMMA_LEN (".invpcid"), PROCESSOR_UNKNOWN,
 905     CPU_INVPCID_FLAGS, 0, 0 },
 906   { STRING_COMMA_LEN (".clflush"), PROCESSOR_UNKNOWN,
 907     CPU_CLFLUSH_FLAGS, 0, 0 },
 908   { STRING_COMMA_LEN (".nop"), PROCESSOR_UNKNOWN,
 909     CPU_NOP_FLAGS, 0, 0 },
 910   { STRING_COMMA_LEN (".syscall"), PROCESSOR_UNKNOWN,
 911     CPU_SYSCALL_FLAGS, 0, 0 },
 912   { STRING_COMMA_LEN (".rdtscp"), PROCESSOR_UNKNOWN,
 913     CPU_RDTSCP_FLAGS, 0, 0 },
 914   { STRING_COMMA_LEN (".3dnow"), PROCESSOR_UNKNOWN,
 915     CPU_3DNOW_FLAGS, 0, 0 },
 916   { STRING_COMMA_LEN (".3dnowa"), PROCESSOR_UNKNOWN,
 917     CPU_3DNOWA_FLAGS, 0, 0 },
 918   { STRING_COMMA_LEN (".padlock"), PROCESSOR_UNKNOWN,
 919     CPU_PADLOCK_FLAGS, 0, 0 },
 920   { STRING_COMMA_LEN (".pacifica"), PROCESSOR_UNKNOWN,
 921     CPU_SVME_FLAGS, 1, 0 },
 922   { STRING_COMMA_LEN (".svme"), PROCESSOR_UNKNOWN,
 923     CPU_SVME_FLAGS, 0, 0 },
 924   { STRING_COMMA_LEN (".sse4a"), PROCESSOR_UNKNOWN,
 925     CPU_SSE4A_FLAGS, 0, 0 },
 926   { STRING_COMMA_LEN (".abm"), PROCESSOR_UNKNOWN,
 927     CPU_ABM_FLAGS, 0, 0 },
 928   { STRING_COMMA_LEN (".bmi"), PROCESSOR_UNKNOWN,
 929     CPU_BMI_FLAGS, 0, 0 },
 930   { STRING_COMMA_LEN (".tbm"), PROCESSOR_UNKNOWN,
 931     CPU_TBM_FLAGS, 0, 0 },
 932   { STRING_COMMA_LEN (".adx"), PROCESSOR_UNKNOWN,
 933     CPU_ADX_FLAGS, 0, 0 },
 934   { STRING_COMMA_LEN (".rdseed"), PROCESSOR_UNKNOWN,
 935     CPU_RDSEED_FLAGS, 0, 0 },
 936   { STRING_COMMA_LEN (".prfchw"), PROCESSOR_UNKNOWN,
 937     CPU_PRFCHW_FLAGS, 0, 0 },
 938   { STRING_COMMA_LEN (".smap"), PROCESSOR_UNKNOWN,
 939     CPU_SMAP_FLAGS, 0, 0 },
 940   { STRING_COMMA_LEN (".mpx"), PROCESSOR_UNKNOWN,
 941     CPU_MPX_FLAGS, 0, 0 },
 942   { STRING_COMMA_LEN (".sha"), PROCESSOR_UNKNOWN,
 943     CPU_SHA_FLAGS, 0, 0 },
 944   { STRING_COMMA_LEN (".clflushopt"), PROCESSOR_UNKNOWN,
 945     CPU_CLFLUSHOPT_FLAGS, 0, 0 },
 946   { STRING_COMMA_LEN (".prefetchwt1"), PROCESSOR_UNKNOWN,
 947     CPU_PREFETCHWT1_FLAGS, 0, 0 },
 948   { STRING_COMMA_LEN (".se1"), PROCESSOR_UNKNOWN,
 949     CPU_SE1_FLAGS, 0, 0 },
 950   { STRING_COMMA_LEN (".clwb"), PROCESSOR_UNKNOWN,
 951     CPU_CLWB_FLAGS, 0, 0 },
 952   { STRING_COMMA_LEN (".pcommit"), PROCESSOR_UNKNOWN,
 953     CPU_PCOMMIT_FLAGS, 0, 0 },
 954   { STRING_COMMA_LEN (".avx512ifma"), PROCESSOR_UNKNOWN,
 955     CPU_AVX512IFMA_FLAGS, 0, 0 },
 956   { STRING_COMMA_LEN (".avx512vbmi"), PROCESSOR_UNKNOWN,
 957     CPU_AVX512VBMI_FLAGS, 0, 0 },
 958   { STRING_COMMA_LEN (".clzero"), PROCESSOR_UNKNOWN,
 959     CPU_CLZERO_FLAGS, 0, 0 },
 960   { STRING_COMMA_LEN (".mwaitx"), PROCESSOR_UNKNOWN,
 961     CPU_MWAITX_FLAGS, 0, 0 },
 962   { STRING_COMMA_LEN (".ospke"), PROCESSOR_UNKNOWN,
 963     CPU_OSPKE_FLAGS, 0, 0 },
 964 };
 965
 966 #ifdef I386COFF
 967 /* Like s_lcomm_internal in gas/read.c but the alignment string
 968    is allowed to be optional.  */
 969
 970 static symbolS *
 971 pe_lcomm_internal (int needs_align, symbolS *symbolP, addressT size)
 972 {
 973   addressT align = 0;
 974
 975   SKIP_WHITESPACE ();
 976
 977   if (needs_align
 978       && *input_line_pointer == ',')
 979     {
 980       align = parse_align (needs_align - 1);
 981
 982       if (align == (addressT) -1)
 983         return NULL;
 984     }
 985   else
 986     {
 987       if (size >= 8)
 988         align = 3;
 989       else if (size >= 4)
 990         align = 2;
 991       else if (size >= 2)
 992         align = 1;
 993       else
 994         align = 0;
 995     }
 996
 997   bss_alloc (symbolP, size, align);
 998   return symbolP;
 999 }
1000
1001 static void
1002 pe_lcomm (int needs_align)
1003 {
1004   s_comm_internal (needs_align * 2, pe_lcomm_internal);
1005 }
1006 #endif
1007
1008 const pseudo_typeS md_pseudo_table[] =
1009 {
1010 #if !defined(OBJ_AOUT) && !defined(USE_ALIGN_PTWO)
1011   {"align", s_align_bytes, 0},
1012 #else
1013   {"align", s_align_ptwo, 0},
1014 #endif
1015   {"arch", set_cpu_arch, 0},
1016 #ifndef I386COFF
1017   {"bss", s_bss, 0},
1018 #else
1019   {"lcomm", pe_lcomm, 1},
1020 #endif
1021   {"ffloat", float_cons, 'f'},
1022   {"dfloat", float_cons, 'd'},
1023   {"tfloat", float_cons, 'x'},
1024   {"value", cons, 2},
1025   {"slong", signed_cons, 4},
1026   {"noopt", s_ignore, 0},
1027   {"optim", s_ignore, 0},
1028   {"code16gcc", set_16bit_gcc_code_flag, CODE_16BIT},
1029   {"code16", set_code_flag, CODE_16BIT},
1030   {"code32", set_code_flag, CODE_32BIT},
1031   {"code64", set_code_flag, CODE_64BIT},
1032   {"intel_syntax", set_intel_syntax, 1},
1033   {"att_syntax", set_intel_syntax, 0},
1034   {"intel_mnemonic", set_intel_mnemonic, 1},
1035   {"att_mnemonic", set_intel_mnemonic, 0},
1036   {"allow_index_reg", set_allow_index_reg, 1},
1037   {"disallow_index_reg", set_allow_index_reg, 0},
1038   {"sse_check", set_check, 0},
1039   {"operand_check", set_check, 1},
1040 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
1041   {"largecomm", handle_large_common, 0},
1042 #else
1043   {"file", (void (*) (int)) dwarf2_directive_file, 0},
1044   {"loc", dwarf2_directive_loc, 0},
1045   {"loc_mark_labels", dwarf2_directive_loc_mark_labels, 0},
1046 #endif
1047 #ifdef TE_PE
1048   {"secrel32", pe_directive_secrel, 0},
1049 #endif
1050   {0, 0, 0}
1051 };
1052
1053 /* For interface with expression ().  */
1054 extern char *input_line_pointer;
1055
1056 /* Hash table for instruction mnemonic lookup.  */
1057 static struct hash_control *op_hash;
1058
1059 /* Hash table for register lookup.  */
1060 static struct hash_control *reg_hash;
1061 \f
1062 void
1063 i386_align_code (fragS *fragP, int count)
1064 {
1065   /* Various efficient no-op patterns for aligning code labels.
1066      Note: Don't try to assemble the instructions in the comments.
1067      0L and 0w are not legal.  */
1068   static const unsigned char f32_1[] =
1069     {0x90};                                     /* nop                  */
1070   static const unsigned char f32_2[] =
1071     {0x66,0x90};                                /* xchg %ax,%ax */
1072   static const unsigned char f32_3[] =
1073     {0x8d,0x76,0x00};                           /* leal 0(%esi),%esi    */
1074   static const unsigned char f32_4[] =
1075     {0x8d,0x74,0x26,0x00};                      /* leal 0(%esi,1),%esi  */
1076   static const unsigned char f32_5[] =
1077     {0x90,                                      /* nop                  */
1078      0x8d,0x74,0x26,0x00};                      /* leal 0(%esi,1),%esi  */
1079   static const unsigned char f32_6[] =
1080     {0x8d,0xb6,0x00,0x00,0x00,0x00};            /* leal 0L(%esi),%esi   */
1081   static const unsigned char f32_7[] =
1082     {0x8d,0xb4,0x26,0x00,0x00,0x00,0x00};       /* leal 0L(%esi,1),%esi */
1083   static const unsigned char f32_8[] =
1084     {0x90,                                      /* nop                  */
1085      0x8d,0xb4,0x26,0x00,0x00,0x00,0x00};       /* leal 0L(%esi,1),%esi */
1086   static const unsigned char f32_9[] =
1087     {0x89,0xf6,                                 /* movl %esi,%esi       */
1088      0x8d,0xbc,0x27,0x00,0x00,0x00,0x00};       /* leal 0L(%edi,1),%edi */
1089   static const unsigned char f32_10[] =
1090     {0x8d,0x76,0x00,                            /* leal 0(%esi),%esi    */
1091      0x8d,0xbc,0x27,0x00,0x00,0x00,0x00};       /* leal 0L(%edi,1),%edi */
1092   static const unsigned char f32_11[] =
1093     {0x8d,0x74,0x26,0x00,                       /* leal 0(%esi,1),%esi  */
1094      0x8d,0xbc,0x27,0x00,0x00,0x00,0x00};       /* leal 0L(%edi,1),%edi */
1095   static const unsigned char f32_12[] =
1096     {0x8d,0xb6,0x00,0x00,0x00,0x00,             /* leal 0L(%esi),%esi   */
1097      0x8d,0xbf,0x00,0x00,0x00,0x00};            /* leal 0L(%edi),%edi   */
1098   static const unsigned char f32_13[] =
1099     {0x8d,0xb6,0x00,0x00,0x00,0x00,             /* leal 0L(%esi),%esi   */
1100      0x8d,0xbc,0x27,0x00,0x00,0x00,0x00};       /* leal 0L(%edi,1),%edi */
1101   static const unsigned char f32_14[] =
1102     {0x8d,0xb4,0x26,0x00,0x00,0x00,0x00,        /* leal 0L(%esi,1),%esi */
1103      0x8d,0xbc,0x27,0x00,0x00,0x00,0x00};       /* leal 0L(%edi,1),%edi */
1104   static const unsigned char f16_3[] =
1105     {0x8d,0x74,0x00};                           /* lea 0(%esi),%esi     */
1106   static const unsigned char f16_4[] =
1107     {0x8d,0xb4,0x00,0x00};                      /* lea 0w(%si),%si      */
1108   static const unsigned char f16_5[] =
1109     {0x90,                                      /* nop                  */
1110      0x8d,0xb4,0x00,0x00};                      /* lea 0w(%si),%si      */
1111   static const unsigned char f16_6[] =
1112     {0x89,0xf6,                                 /* mov %si,%si          */
1113      0x8d,0xbd,0x00,0x00};                      /* lea 0w(%di),%di      */
1114   static const unsigned char f16_7[] =
1115     {0x8d,0x74,0x00,                            /* lea 0(%si),%si       */
1116      0x8d,0xbd,0x00,0x00};                      /* lea 0w(%di),%di      */
1117   static const unsigned char f16_8[] =
1118     {0x8d,0xb4,0x00,0x00,                       /* lea 0w(%si),%si      */
1119      0x8d,0xbd,0x00,0x00};                      /* lea 0w(%di),%di      */
1120   static const unsigned char jump_31[] =
1121     {0xeb,0x1d,0x90,0x90,0x90,0x90,0x90,        /* jmp .+31; lotsa nops */
1122      0x90,0x90,0x90,0x90,0x90,0x90,0x90,0x90,
1123      0x90,0x90,0x90,0x90,0x90,0x90,0x90,0x90,
1124      0x90,0x90,0x90,0x90,0x90,0x90,0x90,0x90};
1125   static const unsigned char *const f32_patt[] = {
1126     f32_1, f32_2, f32_3, f32_4, f32_5, f32_6, f32_7, f32_8,
1127     f32_9, f32_10, f32_11, f32_12, f32_13, f32_14
1128   };
1129   static const unsigned char *const f16_patt[] = {
1130     f32_1, f32_2, f16_3, f16_4, f16_5, f16_6, f16_7, f16_8
1131   };
1132   /* nopl (%[re]ax) */
1133   static const unsigned char alt_3[] =
1134     {0x0f,0x1f,0x00};
1135   /* nopl 0(%[re]ax) */
1136   static const unsigned char alt_4[] =
1137     {0x0f,0x1f,0x40,0x00};
1138   /* nopl 0(%[re]ax,%[re]ax,1) */
1139   static const unsigned char alt_5[] =
1140     {0x0f,0x1f,0x44,0x00,0x00};
1141   /* nopw 0(%[re]ax,%[re]ax,1) */
1142   static const unsigned char alt_6[] =
1143     {0x66,0x0f,0x1f,0x44,0x00,0x00};
1144   /* nopl 0L(%[re]ax) */
1145   static const unsigned char alt_7[] =
1146     {0x0f,0x1f,0x80,0x00,0x00,0x00,0x00};
1147   /* nopl 0L(%[re]ax,%[re]ax,1) */
1148   static const unsigned char alt_8[] =
1149     {0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1150   /* nopw 0L(%[re]ax,%[re]ax,1) */
1151   static const unsigned char alt_9[] =
1152     {0x66,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1153   /* nopw %cs:0L(%[re]ax,%[re]ax,1) */
1154   static const unsigned char alt_10[] =
1155     {0x66,0x2e,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1156   static const unsigned char *const alt_patt[] = {
1157     f32_1, f32_2, alt_3, alt_4, alt_5, alt_6, alt_7, alt_8,
1158     alt_9, alt_10
1159   };
1160
1161   /* Only align for at least a positive non-zero boundary. */
1162   if (count <= 0 || count > MAX_MEM_FOR_RS_ALIGN_CODE)
1163     return;
1164
1165   /* We need to decide which NOP sequence to use for 32bit and
1166      64bit. When -mtune= is used:
1167
1168      1. For PROCESSOR_I386, PROCESSOR_I486, PROCESSOR_PENTIUM and
1169      PROCESSOR_GENERIC32, f32_patt will be used.
1170      2. For the rest, alt_patt will be used.
1171
1172      When -mtune= isn't used, alt_patt will be used if
1173      cpu_arch_isa_flags has CpuNop.  Otherwise, f32_patt will
1174      be used.
1175
1176      When -march= or .arch is used, we can't use anything beyond
1177      cpu_arch_isa_flags.   */
1178
1179   if (flag_code == CODE_16BIT)
1180     {
1181       if (count > 8)
1182         {
1183           memcpy (fragP->fr_literal + fragP->fr_fix,
1184                   jump_31, count);
1185           /* Adjust jump offset.  */
1186           fragP->fr_literal[fragP->fr_fix + 1] = count - 2;
1187         }
1188       else
1189         memcpy (fragP->fr_literal + fragP->fr_fix,
1190                 f16_patt[count - 1], count);
1191     }
1192   else
1193     {
1194       const unsigned char *const *patt = NULL;
1195
1196       if (fragP->tc_frag_data.isa == PROCESSOR_UNKNOWN)
1197         {
1198           /* PROCESSOR_UNKNOWN means that all ISAs may be used.  */
1199           switch (cpu_arch_tune)
1200             {
1201             case PROCESSOR_UNKNOWN:
1202               /* We use cpu_arch_isa_flags to check if we SHOULD
1203                  optimize with nops.  */
1204               if (fragP->tc_frag_data.isa_flags.bitfield.cpunop)
1205                 patt = alt_patt;
1206               else
1207                 patt = f32_patt;
1208               break;
1209             case PROCESSOR_PENTIUM4:
1210             case PROCESSOR_NOCONA:
1211             case PROCESSOR_CORE:
1212             case PROCESSOR_CORE2:
1213             case PROCESSOR_COREI7:
1214             case PROCESSOR_L1OM:
1215             case PROCESSOR_K1OM:
1216             case PROCESSOR_GENERIC64:
1217             case PROCESSOR_K6:
1218             case PROCESSOR_ATHLON:
1219             case PROCESSOR_K8:
1220             case PROCESSOR_AMDFAM10:
1221             case PROCESSOR_BD:
1222             case PROCESSOR_ZNVER:
1223             case PROCESSOR_BT:
1224               patt = alt_patt;
1225               break;
1226             case PROCESSOR_I386:
1227             case PROCESSOR_I486:
1228             case PROCESSOR_PENTIUM:
1229             case PROCESSOR_PENTIUMPRO:
1230             case PROCESSOR_IAMCU:
1231             case PROCESSOR_GENERIC32:
1232               patt = f32_patt;
1233               break;
1234             }
1235         }
1236       else
1237         {
1238           switch (fragP->tc_frag_data.tune)
1239             {
1240             case PROCESSOR_UNKNOWN:
1241               /* When cpu_arch_isa is set, cpu_arch_tune shouldn't be
1242                  PROCESSOR_UNKNOWN.  */
1243               abort ();
1244               break;
1245
1246             case PROCESSOR_I386:
1247             case PROCESSOR_I486:
1248             case PROCESSOR_PENTIUM:
1249             case PROCESSOR_IAMCU:
1250             case PROCESSOR_K6:
1251             case PROCESSOR_ATHLON:
1252             case PROCESSOR_K8:
1253             case PROCESSOR_AMDFAM10:
1254             case PROCESSOR_BD:
1255             case PROCESSOR_ZNVER:
1256             case PROCESSOR_BT:
1257             case PROCESSOR_GENERIC32:
1258               /* We use cpu_arch_isa_flags to check if we CAN optimize
1259                  with nops.  */
1260               if (fragP->tc_frag_data.isa_flags.bitfield.cpunop)
1261                 patt = alt_patt;
1262               else
1263                 patt = f32_patt;
1264               break;
1265             case PROCESSOR_PENTIUMPRO:
1266             case PROCESSOR_PENTIUM4:
1267             case PROCESSOR_NOCONA:
1268             case PROCESSOR_CORE:
1269             case PROCESSOR_CORE2:
1270             case PROCESSOR_COREI7:
1271             case PROCESSOR_L1OM:
1272             case PROCESSOR_K1OM:
1273               if (fragP->tc_frag_data.isa_flags.bitfield.cpunop)
1274                 patt = alt_patt;
1275               else
1276                 patt = f32_patt;
1277               break;
1278             case PROCESSOR_GENERIC64:
1279               patt = alt_patt;
1280               break;
1281             }
1282         }
1283
1284       if (patt == f32_patt)
1285         {
1286           /* If the padding is less than 15 bytes, we use the normal
1287              ones.  Otherwise, we use a jump instruction and adjust
1288              its offset.   */
1289           int limit;
1290
1291           /* For 64bit, the limit is 3 bytes.  */
1292           if (flag_code == CODE_64BIT
1293               && fragP->tc_frag_data.isa_flags.bitfield.cpulm)
1294             limit = 3;
1295           else
1296             limit = 15;
1297           if (count < limit)
1298             memcpy (fragP->fr_literal + fragP->fr_fix,
1299                     patt[count - 1], count);
1300           else
1301             {
1302               memcpy (fragP->fr_literal + fragP->fr_fix,
1303                       jump_31, count);
1304               /* Adjust jump offset.  */
1305               fragP->fr_literal[fragP->fr_fix + 1] = count - 2;
1306             }
1307         }
1308       else
1309         {
1310           /* Maximum length of an instruction is 10 byte.  If the
1311              padding is greater than 10 bytes and we don't use jump,
1312              we have to break it into smaller pieces.  */
1313           int padding = count;
1314           while (padding > 10)
1315             {
1316               padding -= 10;
1317               memcpy (fragP->fr_literal + fragP->fr_fix + padding,
1318                       patt [9], 10);
1319             }
1320
1321           if (padding)
1322             memcpy (fragP->fr_literal + fragP->fr_fix,
1323                     patt [padding - 1], padding);
1324         }
1325     }
1326   fragP->fr_var = count;
1327 }
1328
1329 static INLINE int
1330 operand_type_all_zero (const union i386_operand_type *x)
1331 {
1332   switch (ARRAY_SIZE(x->array))
1333     {
1334     case 3:
1335       if (x->array[2])
1336         return 0;
1337     case 2:
1338       if (x->array[1])
1339         return 0;
1340     case 1:
1341       return !x->array[0];
1342     default:
1343       abort ();
1344     }
1345 }
1346
1347 static INLINE void
1348 operand_type_set (union i386_operand_type *x, unsigned int v)
1349 {
1350   switch (ARRAY_SIZE(x->array))
1351     {
1352     case 3:
1353       x->array[2] = v;
1354     case 2:
1355       x->array[1] = v;
1356     case 1:
1357       x->array[0] = v;
1358       break;
1359     default:
1360       abort ();
1361     }
1362 }
1363
1364 static INLINE int
1365 operand_type_equal (const union i386_operand_type *x,
1366                     const union i386_operand_type *y)
1367 {
1368   switch (ARRAY_SIZE(x->array))
1369     {
1370     case 3:
1371       if (x->array[2] != y->array[2])
1372         return 0;
1373     case 2:
1374       if (x->array[1] != y->array[1])
1375         return 0;
1376     case 1:
1377       return x->array[0] == y->array[0];
1378       break;
1379     default:
1380       abort ();
1381     }
1382 }
1383
1384 static INLINE int
1385 cpu_flags_all_zero (const union i386_cpu_flags *x)
1386 {
1387   switch (ARRAY_SIZE(x->array))
1388     {
1389     case 3:
1390       if (x->array[2])
1391         return 0;
1392     case 2:
1393       if (x->array[1])
1394         return 0;
1395     case 1:
1396       return !x->array[0];
1397     default:
1398       abort ();
1399     }
1400 }
1401
1402 static INLINE int
1403 cpu_flags_equal (const union i386_cpu_flags *x,
1404                  const union i386_cpu_flags *y)
1405 {
1406   switch (ARRAY_SIZE(x->array))
1407     {
1408     case 3:
1409       if (x->array[2] != y->array[2])
1410         return 0;
1411     case 2:
1412       if (x->array[1] != y->array[1])
1413         return 0;
1414     case 1:
1415       return x->array[0] == y->array[0];
1416       break;
1417     default:
1418       abort ();
1419     }
1420 }
1421
1422 static INLINE int
1423 cpu_flags_check_cpu64 (i386_cpu_flags f)
1424 {
1425   return !((flag_code == CODE_64BIT && f.bitfield.cpuno64)
1426            || (flag_code != CODE_64BIT && f.bitfield.cpu64));
1427 }
1428
1429 static INLINE i386_cpu_flags
1430 cpu_flags_and (i386_cpu_flags x, i386_cpu_flags y)
1431 {
1432   switch (ARRAY_SIZE (x.array))
1433     {
1434     case 3:
1435       x.array [2] &= y.array [2];
1436     case 2:
1437       x.array [1] &= y.array [1];
1438     case 1:
1439       x.array [0] &= y.array [0];
1440       break;
1441     default:
1442       abort ();
1443     }
1444   return x;
1445 }
1446
1447 static INLINE i386_cpu_flags
1448 cpu_flags_or (i386_cpu_flags x, i386_cpu_flags y)
1449 {
1450   switch (ARRAY_SIZE (x.array))
1451     {
1452     case 3:
1453       x.array [2] |= y.array [2];
1454     case 2:
1455       x.array [1] |= y.array [1];
1456     case 1:
1457       x.array [0] |= y.array [0];
1458       break;
1459     default:
1460       abort ();
1461     }
1462   return x;
1463 }
1464
1465 static INLINE i386_cpu_flags
1466 cpu_flags_and_not (i386_cpu_flags x, i386_cpu_flags y)
1467 {
1468   switch (ARRAY_SIZE (x.array))
1469     {
1470     case 3:
1471       x.array [2] &= ~y.array [2];
1472     case 2:
1473       x.array [1] &= ~y.array [1];
1474     case 1:
1475       x.array [0] &= ~y.array [0];
1476       break;
1477     default:
1478       abort ();
1479     }
1480   return x;
1481 }
1482
1483 static int
1484 valid_iamcu_cpu_flags (const i386_cpu_flags *flags)
1485 {
1486   if (cpu_arch_isa == PROCESSOR_IAMCU)
1487     {
1488       static const i386_cpu_flags iamcu_flags = CPU_IAMCU_COMPAT_FLAGS;
1489       i386_cpu_flags compat_flags;
1490       compat_flags = cpu_flags_and_not (*flags, iamcu_flags);
1491       return cpu_flags_all_zero (&compat_flags);
1492     }
1493   else
1494     return 1;
1495 }
1496
1497 #define CPU_FLAGS_ARCH_MATCH            0x1
1498 #define CPU_FLAGS_64BIT_MATCH           0x2
1499 #define CPU_FLAGS_AES_MATCH             0x4
1500 #define CPU_FLAGS_PCLMUL_MATCH          0x8
1501 #define CPU_FLAGS_AVX_MATCH            0x10
1502
1503 #define CPU_FLAGS_32BIT_MATCH \
1504   (CPU_FLAGS_ARCH_MATCH | CPU_FLAGS_AES_MATCH \
1505    | CPU_FLAGS_PCLMUL_MATCH | CPU_FLAGS_AVX_MATCH)
1506 #define CPU_FLAGS_PERFECT_MATCH \
1507   (CPU_FLAGS_32BIT_MATCH | CPU_FLAGS_64BIT_MATCH)
1508
1509 /* Return CPU flags match bits. */
1510
1511 static int
1512 cpu_flags_match (const insn_template *t)
1513 {
1514   i386_cpu_flags x = t->cpu_flags;
1515   int match = cpu_flags_check_cpu64 (x) ? CPU_FLAGS_64BIT_MATCH : 0;
1516
1517   x.bitfield.cpu64 = 0;
1518   x.bitfield.cpuno64 = 0;
1519
1520   if (cpu_flags_all_zero (&x))
1521     {
1522       /* This instruction is available on all archs.  */
1523       match |= CPU_FLAGS_32BIT_MATCH;
1524     }
1525   else
1526     {
1527       /* This instruction is available only on some archs.  */
1528       i386_cpu_flags cpu = cpu_arch_flags;
1529
1530       cpu.bitfield.cpu64 = 0;
1531       cpu.bitfield.cpuno64 = 0;
1532       cpu = cpu_flags_and (x, cpu);
1533       if (!cpu_flags_all_zero (&cpu))
1534         {
1535           if (x.bitfield.cpuavx)
1536             {
1537               /* We only need to check AES/PCLMUL/SSE2AVX with AVX.  */
1538               if (cpu.bitfield.cpuavx)
1539                 {
1540                   /* Check SSE2AVX.  */
1541                   if (!t->opcode_modifier.sse2avx|| sse2avx)
1542                     {
1543                       match |= (CPU_FLAGS_ARCH_MATCH
1544                                 | CPU_FLAGS_AVX_MATCH);
1545                       /* Check AES.  */
1546                       if (!x.bitfield.cpuaes || cpu.bitfield.cpuaes)
1547                         match |= CPU_FLAGS_AES_MATCH;
1548                       /* Check PCLMUL.  */
1549                       if (!x.bitfield.cpupclmul
1550                           || cpu.bitfield.cpupclmul)
1551                         match |= CPU_FLAGS_PCLMUL_MATCH;
1552                     }
1553                 }
1554               else
1555                 match |= CPU_FLAGS_ARCH_MATCH;
1556             }
1557           else
1558             match |= CPU_FLAGS_32BIT_MATCH;
1559         }
1560     }
1561   return match;
1562 }
1563
1564 static INLINE i386_operand_type
1565 operand_type_and (i386_operand_type x, i386_operand_type y)
1566 {
1567   switch (ARRAY_SIZE (x.array))
1568     {
1569     case 3:
1570       x.array [2] &= y.array [2];
1571     case 2:
1572       x.array [1] &= y.array [1];
1573     case 1:
1574       x.array [0] &= y.array [0];
1575       break;
1576     default:
1577       abort ();
1578     }
1579   return x;
1580 }
1581
1582 static INLINE i386_operand_type
1583 operand_type_or (i386_operand_type x, i386_operand_type y)
1584 {
1585   switch (ARRAY_SIZE (x.array))
1586     {
1587     case 3:
1588       x.array [2] |= y.array [2];
1589     case 2:
1590       x.array [1] |= y.array [1];
1591     case 1:
1592       x.array [0] |= y.array [0];
1593       break;
1594     default:
1595       abort ();
1596     }
1597   return x;
1598 }
1599
1600 static INLINE i386_operand_type
1601 operand_type_xor (i386_operand_type x, i386_operand_type y)
1602 {
1603   switch (ARRAY_SIZE (x.array))
1604     {
1605     case 3:
1606       x.array [2] ^= y.array [2];
1607     case 2:
1608       x.array [1] ^= y.array [1];
1609     case 1:
1610       x.array [0] ^= y.array [0];
1611       break;
1612     default:
1613       abort ();
1614     }
1615   return x;
1616 }
1617
1618 static const i386_operand_type acc32 = OPERAND_TYPE_ACC32;
1619 static const i386_operand_type acc64 = OPERAND_TYPE_ACC64;
1620 static const i386_operand_type control = OPERAND_TYPE_CONTROL;
1621 static const i386_operand_type inoutportreg
1622   = OPERAND_TYPE_INOUTPORTREG;
1623 static const i386_operand_type reg16_inoutportreg
1624   = OPERAND_TYPE_REG16_INOUTPORTREG;
1625 static const i386_operand_type disp16 = OPERAND_TYPE_DISP16;
1626 static const i386_operand_type disp32 = OPERAND_TYPE_DISP32;
1627 static const i386_operand_type disp32s = OPERAND_TYPE_DISP32S;
1628 static const i386_operand_type disp16_32 = OPERAND_TYPE_DISP16_32;
1629 static const i386_operand_type anydisp
1630   = OPERAND_TYPE_ANYDISP;
1631 static const i386_operand_type regxmm = OPERAND_TYPE_REGXMM;
1632 static const i386_operand_type regymm = OPERAND_TYPE_REGYMM;
1633 static const i386_operand_type regzmm = OPERAND_TYPE_REGZMM;
1634 static const i386_operand_type regmask = OPERAND_TYPE_REGMASK;
1635 static const i386_operand_type imm8 = OPERAND_TYPE_IMM8;
1636 static const i386_operand_type imm8s = OPERAND_TYPE_IMM8S;
1637 static const i386_operand_type imm16 = OPERAND_TYPE_IMM16;
1638 static const i386_operand_type imm32 = OPERAND_TYPE_IMM32;
1639 static const i386_operand_type imm32s = OPERAND_TYPE_IMM32S;
1640 static const i386_operand_type imm64 = OPERAND_TYPE_IMM64;
1641 static const i386_operand_type imm16_32 = OPERAND_TYPE_IMM16_32;
1642 static const i386_operand_type imm16_32s = OPERAND_TYPE_IMM16_32S;
1643 static const i386_operand_type imm16_32_32s = OPERAND_TYPE_IMM16_32_32S;
1644 static const i386_operand_type vec_imm4 = OPERAND_TYPE_VEC_IMM4;
1645
1646 enum operand_type
1647 {
1648   reg,
1649   imm,
1650   disp,
1651   anymem
1652 };
1653
1654 static INLINE int
1655 operand_type_check (i386_operand_type t, enum operand_type c)
1656 {
1657   switch (c)
1658     {
1659     case reg:
1660       return (t.bitfield.reg8
1661               || t.bitfield.reg16
1662               || t.bitfield.reg32
1663               || t.bitfield.reg64);
1664
1665     case imm:
1666       return (t.bitfield.imm8
1667               || t.bitfield.imm8s
1668               || t.bitfield.imm16
1669               || t.bitfield.imm32
1670               || t.bitfield.imm32s
1671               || t.bitfield.imm64);
1672
1673     case disp:
1674       return (t.bitfield.disp8
1675               || t.bitfield.disp16
1676               || t.bitfield.disp32
1677               || t.bitfield.disp32s
1678               || t.bitfield.disp64);
1679
1680     case anymem:
1681       return (t.bitfield.disp8
1682               || t.bitfield.disp16
1683               || t.bitfield.disp32
1684               || t.bitfield.disp32s
1685               || t.bitfield.disp64
1686               || t.bitfield.baseindex);
1687
1688     default:
1689       abort ();
1690     }
1691
1692   return 0;
1693 }
1694
1695 /* Return 1 if there is no conflict in 8bit/16bit/32bit/64bit on
1696    operand J for instruction template T.  */
1697
1698 static INLINE int
1699 match_reg_size (const insn_template *t, unsigned int j)
1700 {
1701   return !((i.types[j].bitfield.byte
1702             && !t->operand_types[j].bitfield.byte)
1703            || (i.types[j].bitfield.word
1704                && !t->operand_types[j].bitfield.word)
1705            || (i.types[j].bitfield.dword
1706                && !t->operand_types[j].bitfield.dword)
1707            || (i.types[j].bitfield.qword
1708                && !t->operand_types[j].bitfield.qword));
1709 }
1710
1711 /* Return 1 if there is no conflict in any size on operand J for
1712    instruction template T.  */
1713
1714 static INLINE int
1715 match_mem_size (const insn_template *t, unsigned int j)
1716 {
1717   return (match_reg_size (t, j)
1718           && !((i.types[j].bitfield.unspecified
1719                 && !i.broadcast
1720                 && !t->operand_types[j].bitfield.unspecified)
1721                || (i.types[j].bitfield.fword
1722                    && !t->operand_types[j].bitfield.fword)
1723                || (i.types[j].bitfield.tbyte
1724                    && !t->operand_types[j].bitfield.tbyte)
1725                || (i.types[j].bitfield.xmmword
1726                    && !t->operand_types[j].bitfield.xmmword)
1727                || (i.types[j].bitfield.ymmword
1728                    && !t->operand_types[j].bitfield.ymmword)
1729                || (i.types[j].bitfield.zmmword
1730                    && !t->operand_types[j].bitfield.zmmword)));
1731 }
1732
1733 /* Return 1 if there is no size conflict on any operands for
1734    instruction template T.  */
1735
1736 static INLINE int
1737 operand_size_match (const insn_template *t)
1738 {
1739   unsigned int j;
1740   int match = 1;
1741
1742   /* Don't check jump instructions.  */
1743   if (t->opcode_modifier.jump
1744       || t->opcode_modifier.jumpbyte
1745       || t->opcode_modifier.jumpdword
1746       || t->opcode_modifier.jumpintersegment)
1747     return match;
1748
1749   /* Check memory and accumulator operand size.  */
1750   for (j = 0; j < i.operands; j++)
1751     {
1752       if (t->operand_types[j].bitfield.anysize)
1753         continue;
1754
1755       if (t->operand_types[j].bitfield.acc && !match_reg_size (t, j))
1756         {
1757           match = 0;
1758           break;
1759         }
1760
1761       if (i.types[j].bitfield.mem && !match_mem_size (t, j))
1762         {
1763           match = 0;
1764           break;
1765         }
1766     }
1767
1768   if (match)
1769     return match;
1770   else if (!t->opcode_modifier.d && !t->opcode_modifier.floatd)
1771     {
1772 mismatch:
1773       i.error = operand_size_mismatch;
1774       return 0;
1775     }
1776
1777   /* Check reverse.  */
1778   gas_assert (i.operands == 2);
1779
1780   match = 1;
1781   for (j = 0; j < 2; j++)
1782     {
1783       if (t->operand_types[j].bitfield.acc
1784           && !match_reg_size (t, j ? 0 : 1))
1785         goto mismatch;
1786
1787       if (i.types[j].bitfield.mem
1788           && !match_mem_size (t, j ? 0 : 1))
1789         goto mismatch;
1790     }
1791
1792   return match;
1793 }
1794
1795 static INLINE int
1796 operand_type_match (i386_operand_type overlap,
1797                     i386_operand_type given)
1798 {
1799   i386_operand_type temp = overlap;
1800
1801   temp.bitfield.jumpabsolute = 0;
1802   temp.bitfield.unspecified = 0;
1803   temp.bitfield.byte = 0;
1804   temp.bitfield.word = 0;
1805   temp.bitfield.dword = 0;
1806   temp.bitfield.fword = 0;
1807   temp.bitfield.qword = 0;
1808   temp.bitfield.tbyte = 0;
1809   temp.bitfield.xmmword = 0;
1810   temp.bitfield.ymmword = 0;
1811   temp.bitfield.zmmword = 0;
1812   if (operand_type_all_zero (&temp))
1813     goto mismatch;
1814
1815   if (given.bitfield.baseindex == overlap.bitfield.baseindex
1816       && given.bitfield.jumpabsolute == overlap.bitfield.jumpabsolute)
1817     return 1;
1818
1819 mismatch:
1820   i.error = operand_type_mismatch;
1821   return 0;
1822 }
1823
1824 /* If given types g0 and g1 are registers they must be of the same type
1825    unless the expected operand type register overlap is null.
1826    Note that Acc in a template matches every size of reg.  */
1827
1828 static INLINE int
1829 operand_type_register_match (i386_operand_type m0,
1830                              i386_operand_type g0,
1831                              i386_operand_type t0,
1832                              i386_operand_type m1,
1833                              i386_operand_type g1,
1834                              i386_operand_type t1)
1835 {
1836   if (!operand_type_check (g0, reg))
1837     return 1;
1838
1839   if (!operand_type_check (g1, reg))
1840     return 1;
1841
1842   if (g0.bitfield.reg8 == g1.bitfield.reg8
1843       && g0.bitfield.reg16 == g1.bitfield.reg16
1844       && g0.bitfield.reg32 == g1.bitfield.reg32
1845       && g0.bitfield.reg64 == g1.bitfield.reg64)
1846     return 1;
1847
1848   if (m0.bitfield.acc)
1849     {
1850       t0.bitfield.reg8 = 1;
1851       t0.bitfield.reg16 = 1;
1852       t0.bitfield.reg32 = 1;
1853       t0.bitfield.reg64 = 1;
1854     }
1855
1856   if (m1.bitfield.acc)
1857     {
1858       t1.bitfield.reg8 = 1;
1859       t1.bitfield.reg16 = 1;
1860       t1.bitfield.reg32 = 1;
1861       t1.bitfield.reg64 = 1;
1862     }
1863
1864   if (!(t0.bitfield.reg8 & t1.bitfield.reg8)
1865       && !(t0.bitfield.reg16 & t1.bitfield.reg16)
1866       && !(t0.bitfield.reg32 & t1.bitfield.reg32)
1867       && !(t0.bitfield.reg64 & t1.bitfield.reg64))
1868     return 1;
1869
1870   i.error = register_type_mismatch;
1871
1872   return 0;
1873 }
1874
1875 static INLINE unsigned int
1876 register_number (const reg_entry *r)
1877 {
1878   unsigned int nr = r->reg_num;
1879
1880   if (r->reg_flags & RegRex)
1881     nr += 8;
1882
1883   if (r->reg_flags & RegVRex)
1884     nr += 16;
1885
1886   return nr;
1887 }
1888
1889 static INLINE unsigned int
1890 mode_from_disp_size (i386_operand_type t)
1891 {
1892   if (t.bitfield.disp8 || t.bitfield.vec_disp8)
1893     return 1;
1894   else if (t.bitfield.disp16
1895            || t.bitfield.disp32
1896            || t.bitfield.disp32s)
1897     return 2;
1898   else
1899     return 0;
1900 }
1901
1902 static INLINE int
1903 fits_in_signed_byte (addressT num)
1904 {
1905   return num + 0x80 <= 0xff;
1906 }
1907
1908 static INLINE int
1909 fits_in_unsigned_byte (addressT num)
1910 {
1911   return num <= 0xff;
1912 }
1913
1914 static INLINE int
1915 fits_in_unsigned_word (addressT num)
1916 {
1917   return num <= 0xffff;
1918 }
1919
1920 static INLINE int
1921 fits_in_signed_word (addressT num)
1922 {
1923   return num + 0x8000 <= 0xffff;
1924 }
1925
1926 static INLINE int
1927 fits_in_signed_long (addressT num ATTRIBUTE_UNUSED)
1928 {
1929 #ifndef BFD64
1930   return 1;
1931 #else
1932   return num + 0x80000000 <= 0xffffffff;
1933 #endif
1934 }                               /* fits_in_signed_long() */
1935
1936 static INLINE int
1937 fits_in_unsigned_long (addressT num ATTRIBUTE_UNUSED)
1938 {
1939 #ifndef BFD64
1940   return 1;
1941 #else
1942   return num <= 0xffffffff;
1943 #endif
1944 }                               /* fits_in_unsigned_long() */
1945
1946 static INLINE int
1947 fits_in_vec_disp8 (offsetT num)
1948 {
1949   int shift = i.memshift;
1950   unsigned int mask;
1951
1952   if (shift == -1)
1953     abort ();
1954
1955   mask = (1 << shift) - 1;
1956
1957   /* Return 0 if NUM isn't properly aligned.  */
1958   if ((num & mask))
1959     return 0;
1960
1961   /* Check if NUM will fit in 8bit after shift.  */
1962   return fits_in_signed_byte (num >> shift);
1963 }
1964
1965 static INLINE int
1966 fits_in_imm4 (offsetT num)
1967 {
1968   return (num & 0xf) == num;
1969 }
1970
1971 static i386_operand_type
1972 smallest_imm_type (offsetT num)
1973 {
1974   i386_operand_type t;
1975
1976   operand_type_set (&t, 0);
1977   t.bitfield.imm64 = 1;
1978
1979   if (cpu_arch_tune != PROCESSOR_I486 && num == 1)
1980     {
1981       /* This code is disabled on the 486 because all the Imm1 forms
1982          in the opcode table are slower on the i486.  They're the
1983          versions with the implicitly specified single-position
1984          displacement, which has another syntax if you really want to
1985          use that form.  */
1986       t.bitfield.imm1 = 1;
1987       t.bitfield.imm8 = 1;
1988       t.bitfield.imm8s = 1;
1989       t.bitfield.imm16 = 1;
1990       t.bitfield.imm32 = 1;
1991       t.bitfield.imm32s = 1;
1992     }
1993   else if (fits_in_signed_byte (num))
1994     {
1995       t.bitfield.imm8 = 1;
1996       t.bitfield.imm8s = 1;
1997       t.bitfield.imm16 = 1;
1998       t.bitfield.imm32 = 1;
1999       t.bitfield.imm32s = 1;
2000     }
2001   else if (fits_in_unsigned_byte (num))
2002     {
2003       t.bitfield.imm8 = 1;
2004       t.bitfield.imm16 = 1;
2005       t.bitfield.imm32 = 1;
2006       t.bitfield.imm32s = 1;
2007     }
2008   else if (fits_in_signed_word (num) || fits_in_unsigned_word (num))
2009     {
2010       t.bitfield.imm16 = 1;
2011       t.bitfield.imm32 = 1;
2012       t.bitfield.imm32s = 1;
2013     }
2014   else if (fits_in_signed_long (num))
2015     {
2016       t.bitfield.imm32 = 1;
2017       t.bitfield.imm32s = 1;
2018     }
2019   else if (fits_in_unsigned_long (num))
2020     t.bitfield.imm32 = 1;
2021
2022   return t;
2023 }
2024
2025 static offsetT
2026 offset_in_range (offsetT val, int size)
2027 {
2028   addressT mask;
2029
2030   switch (size)
2031     {
2032     case 1: mask = ((addressT) 1 <<  8) - 1; break;
2033     case 2: mask = ((addressT) 1 << 16) - 1; break;
2034     case 4: mask = ((addressT) 2 << 31) - 1; break;
2035 #ifdef BFD64
2036     case 8: mask = ((addressT) 2 << 63) - 1; break;
2037 #endif
2038     default: abort ();
2039     }
2040
2041 #ifdef BFD64
2042   /* If BFD64, sign extend val for 32bit address mode.  */
2043   if (flag_code != CODE_64BIT
2044       || i.prefix[ADDR_PREFIX])
2045     if ((val & ~(((addressT) 2 << 31) - 1)) == 0)
2046       val = (val ^ ((addressT) 1 << 31)) - ((addressT) 1 << 31);
2047 #endif
2048
2049   if ((val & ~mask) != 0 && (val & ~mask) != ~mask)
2050     {
2051       char buf1[40], buf2[40];
2052
2053       sprint_value (buf1, val);
2054       sprint_value (buf2, val & mask);
2055       as_warn (_("%s shortened to %s"), buf1, buf2);
2056     }
2057   return val & mask;
2058 }
2059
2060 enum PREFIX_GROUP
2061 {
2062   PREFIX_EXIST = 0,
2063   PREFIX_LOCK,
2064   PREFIX_REP,
2065   PREFIX_OTHER
2066 };
2067
2068 /* Returns
2069    a. PREFIX_EXIST if attempting to add a prefix where one from the
2070    same class already exists.
2071    b. PREFIX_LOCK if lock prefix is added.
2072    c. PREFIX_REP if rep/repne prefix is added.
2073    d. PREFIX_OTHER if other prefix is added.
2074  */
2075
2076 static enum PREFIX_GROUP
2077 add_prefix (unsigned int prefix)
2078 {
2079   enum PREFIX_GROUP ret = PREFIX_OTHER;
2080   unsigned int q;
2081
2082   if (prefix >= REX_OPCODE && prefix < REX_OPCODE + 16
2083       && flag_code == CODE_64BIT)
2084     {
2085       if ((i.prefix[REX_PREFIX] & prefix & REX_W)
2086           || ((i.prefix[REX_PREFIX] & (REX_R | REX_X | REX_B))
2087               && (prefix & (REX_R | REX_X | REX_B))))
2088         ret = PREFIX_EXIST;
2089       q = REX_PREFIX;
2090     }
2091   else
2092     {
2093       switch (prefix)
2094         {
2095         default:
2096           abort ();
2097
2098         case CS_PREFIX_OPCODE:
2099         case DS_PREFIX_OPCODE:
2100         case ES_PREFIX_OPCODE:
2101         case FS_PREFIX_OPCODE:
2102         case GS_PREFIX_OPCODE:
2103         case SS_PREFIX_OPCODE:
2104           q = SEG_PREFIX;
2105           break;
2106
2107         case REPNE_PREFIX_OPCODE:
2108         case REPE_PREFIX_OPCODE:
2109           q = REP_PREFIX;
2110           ret = PREFIX_REP;
2111           break;
2112
2113         case LOCK_PREFIX_OPCODE:
2114           q = LOCK_PREFIX;
2115           ret = PREFIX_LOCK;
2116           break;
2117
2118         case FWAIT_OPCODE:
2119           q = WAIT_PREFIX;
2120           break;
2121
2122         case ADDR_PREFIX_OPCODE:
2123           q = ADDR_PREFIX;
2124           break;
2125
2126         case DATA_PREFIX_OPCODE:
2127           q = DATA_PREFIX;
2128           break;
2129         }
2130       if (i.prefix[q] != 0)
2131         ret = PREFIX_EXIST;
2132     }
2133
2134   if (ret)
2135     {
2136       if (!i.prefix[q])
2137         ++i.prefixes;
2138       i.prefix[q] |= prefix;
2139     }
2140   else
2141     as_bad (_("same type of prefix used twice"));
2142
2143   return ret;
2144 }
2145
2146 static void
2147 update_code_flag (int value, int check)
2148 {
2149   PRINTF_LIKE ((*as_error));
2150
2151   flag_code = (enum flag_code) value;
2152   if (flag_code == CODE_64BIT)
2153     {
2154       cpu_arch_flags.bitfield.cpu64 = 1;
2155       cpu_arch_flags.bitfield.cpuno64 = 0;
2156     }
2157   else
2158     {
2159       cpu_arch_flags.bitfield.cpu64 = 0;
2160       cpu_arch_flags.bitfield.cpuno64 = 1;
2161     }
2162   if (value == CODE_64BIT && !cpu_arch_flags.bitfield.cpulm )
2163     {
2164       if (check)
2165         as_error = as_fatal;
2166       else
2167         as_error = as_bad;
2168       (*as_error) (_("64bit mode not supported on `%s'."),
2169                    cpu_arch_name ? cpu_arch_name : default_arch);
2170     }
2171   if (value == CODE_32BIT && !cpu_arch_flags.bitfield.cpui386)
2172     {
2173       if (check)
2174         as_error = as_fatal;
2175       else
2176         as_error = as_bad;
2177       (*as_error) (_("32bit mode not supported on `%s'."),
2178                    cpu_arch_name ? cpu_arch_name : default_arch);
2179     }
2180   stackop_size = '\0';
2181 }
2182
2183 static void
2184 set_code_flag (int value)
2185 {
2186   update_code_flag (value, 0);
2187 }
2188
2189 static void
2190 set_16bit_gcc_code_flag (int new_code_flag)
2191 {
2192   flag_code = (enum flag_code) new_code_flag;
2193   if (flag_code != CODE_16BIT)
2194     abort ();
2195   cpu_arch_flags.bitfield.cpu64 = 0;
2196   cpu_arch_flags.bitfield.cpuno64 = 1;
2197   stackop_size = LONG_MNEM_SUFFIX;
2198 }
2199
2200 static void
2201 set_intel_syntax (int syntax_flag)
2202 {
2203   /* Find out if register prefixing is specified.  */
2204   int ask_naked_reg = 0;
2205
2206   SKIP_WHITESPACE ();
2207   if (!is_end_of_line[(unsigned char) *input_line_pointer])
2208     {
2209       char *string;
2210       int e = get_symbol_name (&string);
2211
2212       if (strcmp (string, "prefix") == 0)
2213         ask_naked_reg = 1;
2214       else if (strcmp (string, "noprefix") == 0)
2215         ask_naked_reg = -1;
2216       else
2217         as_bad (_("bad argument to syntax directive."));
2218       (void) restore_line_pointer (e);
2219     }
2220   demand_empty_rest_of_line ();
2221
2222   intel_syntax = syntax_flag;
2223
2224   if (ask_naked_reg == 0)
2225     allow_naked_reg = (intel_syntax
2226                        && (bfd_get_symbol_leading_char (stdoutput) != '\0'));
2227   else
2228     allow_naked_reg = (ask_naked_reg < 0);
2229
2230   expr_set_rank (O_full_ptr, syntax_flag ? 10 : 0);
2231
2232   identifier_chars['%'] = intel_syntax && allow_naked_reg ? '%' : 0;
2233   identifier_chars['$'] = intel_syntax ? '$' : 0;
2234   register_prefix = allow_naked_reg ? "" : "%";
2235 }
2236
2237 static void
2238 set_intel_mnemonic (int mnemonic_flag)
2239 {
2240   intel_mnemonic = mnemonic_flag;
2241 }
2242
2243 static void
2244 set_allow_index_reg (int flag)
2245 {
2246   allow_index_reg = flag;
2247 }
2248
2249 static void
2250 set_check (int what)
2251 {
2252   enum check_kind *kind;
2253   const char *str;
2254
2255   if (what)
2256     {
2257       kind = &operand_check;
2258       str = "operand";
2259     }
2260   else
2261     {
2262       kind = &sse_check;
2263       str = "sse";
2264     }
2265
2266   SKIP_WHITESPACE ();
2267
2268   if (!is_end_of_line[(unsigned char) *input_line_pointer])
2269     {
2270       char *string;
2271       int e = get_symbol_name (&string);
2272
2273       if (strcmp (string, "none") == 0)
2274         *kind = check_none;
2275       else if (strcmp (string, "warning") == 0)
2276         *kind = check_warning;
2277       else if (strcmp (string, "error") == 0)
2278         *kind = check_error;
2279       else
2280         as_bad (_("bad argument to %s_check directive."), str);
2281       (void) restore_line_pointer (e);
2282     }
2283   else
2284     as_bad (_("missing argument for %s_check directive"), str);
2285
2286   demand_empty_rest_of_line ();
2287 }
2288
2289 static void
2290 check_cpu_arch_compatible (const char *name ATTRIBUTE_UNUSED,
2291                            i386_cpu_flags new_flag ATTRIBUTE_UNUSED)
2292 {
2293 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
2294   static const char *arch;
2295
2296   /* Intel LIOM is only supported on ELF.  */
2297   if (!IS_ELF)
2298     return;
2299
2300   if (!arch)
2301     {
2302       /* Use cpu_arch_name if it is set in md_parse_option.  Otherwise
2303          use default_arch.  */
2304       arch = cpu_arch_name;
2305       if (!arch)
2306         arch = default_arch;
2307     }
2308
2309   /* If we are targeting Intel MCU, we must enable it.  */
2310   if (get_elf_backend_data (stdoutput)->elf_machine_code != EM_IAMCU
2311       || new_flag.bitfield.cpuiamcu)
2312     return;
2313
2314   /* If we are targeting Intel L1OM, we must enable it.  */
2315   if (get_elf_backend_data (stdoutput)->elf_machine_code != EM_L1OM
2316       || new_flag.bitfield.cpul1om)
2317     return;
2318
2319   /* If we are targeting Intel K1OM, we must enable it.  */
2320   if (get_elf_backend_data (stdoutput)->elf_machine_code != EM_K1OM
2321       || new_flag.bitfield.cpuk1om)
2322     return;
2323
2324   as_bad (_("`%s' is not supported on `%s'"), name, arch);
2325 #endif
2326 }
2327
2328 static void
2329 set_cpu_arch (int dummy ATTRIBUTE_UNUSED)
2330 {
2331   SKIP_WHITESPACE ();
2332
2333   if (!is_end_of_line[(unsigned char) *input_line_pointer])
2334     {
2335       char *string;
2336       int e = get_symbol_name (&string);
2337       unsigned int j;
2338       i386_cpu_flags flags;
2339
2340       for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
2341         {
2342           if (strcmp (string, cpu_arch[j].name) == 0)
2343             {
2344               check_cpu_arch_compatible (string, cpu_arch[j].flags);
2345
2346               if (*string != '.')
2347                 {
2348                   cpu_arch_name = cpu_arch[j].name;
2349                   cpu_sub_arch_name = NULL;
2350                   cpu_arch_flags = cpu_arch[j].flags;
2351                   if (flag_code == CODE_64BIT)
2352                     {
2353                       cpu_arch_flags.bitfield.cpu64 = 1;
2354                       cpu_arch_flags.bitfield.cpuno64 = 0;
2355                     }
2356                   else
2357                     {
2358                       cpu_arch_flags.bitfield.cpu64 = 0;
2359                       cpu_arch_flags.bitfield.cpuno64 = 1;
2360                     }
2361                   cpu_arch_isa = cpu_arch[j].type;
2362                   cpu_arch_isa_flags = cpu_arch[j].flags;
2363                   if (!cpu_arch_tune_set)
2364                     {
2365                       cpu_arch_tune = cpu_arch_isa;
2366                       cpu_arch_tune_flags = cpu_arch_isa_flags;
2367                     }
2368                   break;
2369                 }
2370
2371               if (!cpu_arch[j].negated)
2372                 flags = cpu_flags_or (cpu_arch_flags,
2373                                       cpu_arch[j].flags);
2374               else
2375                 flags = cpu_flags_and_not (cpu_arch_flags,
2376                                            cpu_arch[j].flags);
2377
2378               if (!valid_iamcu_cpu_flags (&flags))
2379                 as_fatal (_("`%s' isn't valid for Intel MCU"),
2380                           cpu_arch[j].name);
2381               else if (!cpu_flags_equal (&flags, &cpu_arch_flags))
2382                 {
2383                   if (cpu_sub_arch_name)
2384                     {
2385                       char *name = cpu_sub_arch_name;
2386                       cpu_sub_arch_name = concat (name,
2387                                                   cpu_arch[j].name,
2388                                                   (const char *) NULL);
2389                       free (name);
2390                     }
2391                   else
2392                     cpu_sub_arch_name = xstrdup (cpu_arch[j].name);
2393                   cpu_arch_flags = flags;
2394                   cpu_arch_isa_flags = flags;
2395                 }
2396               (void) restore_line_pointer (e);
2397               demand_empty_rest_of_line ();
2398               return;
2399             }
2400         }
2401       if (j >= ARRAY_SIZE (cpu_arch))
2402         as_bad (_("no such architecture: `%s'"), string);
2403
2404       *input_line_pointer = e;
2405     }
2406   else
2407     as_bad (_("missing cpu architecture"));
2408
2409   no_cond_jump_promotion = 0;
2410   if (*input_line_pointer == ','
2411       && !is_end_of_line[(unsigned char) input_line_pointer[1]])
2412     {
2413       char *string;
2414       char e;
2415
2416       ++input_line_pointer;
2417       e = get_symbol_name (&string);
2418
2419       if (strcmp (string, "nojumps") == 0)
2420         no_cond_jump_promotion = 1;
2421       else if (strcmp (string, "jumps") == 0)
2422         ;
2423       else
2424         as_bad (_("no such architecture modifier: `%s'"), string);
2425
2426       (void) restore_line_pointer (e);
2427     }
2428
2429   demand_empty_rest_of_line ();
2430 }
2431
2432 enum bfd_architecture
2433 i386_arch (void)
2434 {
2435   if (cpu_arch_isa == PROCESSOR_L1OM)
2436     {
2437       if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2438           || flag_code != CODE_64BIT)
2439         as_fatal (_("Intel L1OM is 64bit ELF only"));
2440       return bfd_arch_l1om;
2441     }
2442   else if (cpu_arch_isa == PROCESSOR_K1OM)
2443     {
2444       if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2445           || flag_code != CODE_64BIT)
2446         as_fatal (_("Intel K1OM is 64bit ELF only"));
2447       return bfd_arch_k1om;
2448     }
2449   else if (cpu_arch_isa == PROCESSOR_IAMCU)
2450     {
2451       if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2452           || flag_code == CODE_64BIT)
2453         as_fatal (_("Intel MCU is 32bit ELF only"));
2454       return bfd_arch_iamcu;
2455     }
2456   else
2457     return bfd_arch_i386;
2458 }
2459
2460 unsigned long
2461 i386_mach (void)
2462 {
2463   if (!strncmp (default_arch, "x86_64", 6))
2464     {
2465       if (cpu_arch_isa == PROCESSOR_L1OM)
2466         {
2467           if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2468               || default_arch[6] != '\0')
2469             as_fatal (_("Intel L1OM is 64bit ELF only"));
2470           return bfd_mach_l1om;
2471         }
2472       else if (cpu_arch_isa == PROCESSOR_K1OM)
2473         {
2474           if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2475               || default_arch[6] != '\0')
2476             as_fatal (_("Intel K1OM is 64bit ELF only"));
2477           return bfd_mach_k1om;
2478         }
2479       else if (default_arch[6] == '\0')
2480         return bfd_mach_x86_64;
2481       else
2482         return bfd_mach_x64_32;
2483     }
2484   else if (!strcmp (default_arch, "i386")
2485            || !strcmp (default_arch, "iamcu"))
2486     {
2487       if (cpu_arch_isa == PROCESSOR_IAMCU)
2488         {
2489           if (OUTPUT_FLAVOR != bfd_target_elf_flavour)
2490             as_fatal (_("Intel MCU is 32bit ELF only"));
2491           return bfd_mach_i386_iamcu;
2492         }
2493       else
2494         return bfd_mach_i386_i386;
2495     }
2496   else
2497     as_fatal (_("unknown architecture"));
2498 }
2499 \f
2500 void
2501 md_begin (void)
2502 {
2503   const char *hash_err;
2504
2505   /* Initialize op_hash hash table.  */
2506   op_hash = hash_new ();
2507
2508   {
2509     const insn_template *optab;
2510     templates *core_optab;
2511
2512     /* Setup for loop.  */
2513     optab = i386_optab;
2514     core_optab = (templates *) xmalloc (sizeof (templates));
2515     core_optab->start = optab;
2516
2517     while (1)
2518       {
2519         ++optab;
2520         if (optab->name == NULL
2521             || strcmp (optab->name, (optab - 1)->name) != 0)
2522           {
2523             /* different name --> ship out current template list;
2524                add to hash table; & begin anew.  */
2525             core_optab->end = optab;
2526             hash_err = hash_insert (op_hash,
2527                                     (optab - 1)->name,
2528                                     (void *) core_optab);
2529             if (hash_err)
2530               {
2531                 as_fatal (_("can't hash %s: %s"),
2532                           (optab - 1)->name,
2533                           hash_err);
2534               }
2535             if (optab->name == NULL)
2536               break;
2537             core_optab = (templates *) xmalloc (sizeof (templates));
2538             core_optab->start = optab;
2539           }
2540       }
2541   }
2542
2543   /* Initialize reg_hash hash table.  */
2544   reg_hash = hash_new ();
2545   {
2546     const reg_entry *regtab;
2547     unsigned int regtab_size = i386_regtab_size;
2548
2549     for (regtab = i386_regtab; regtab_size--; regtab++)
2550       {
2551         hash_err = hash_insert (reg_hash, regtab->reg_name, (void *) regtab);
2552         if (hash_err)
2553           as_fatal (_("can't hash %s: %s"),
2554                     regtab->reg_name,
2555                     hash_err);
2556       }
2557   }
2558
2559   /* Fill in lexical tables:  mnemonic_chars, operand_chars.  */
2560   {
2561     int c;
2562     char *p;
2563
2564     for (c = 0; c < 256; c++)
2565       {
2566         if (ISDIGIT (c))
2567           {
2568             digit_chars[c] = c;
2569             mnemonic_chars[c] = c;
2570             register_chars[c] = c;
2571             operand_chars[c] = c;
2572           }
2573         else if (ISLOWER (c))
2574           {
2575             mnemonic_chars[c] = c;
2576             register_chars[c] = c;
2577             operand_chars[c] = c;
2578           }
2579         else if (ISUPPER (c))
2580           {
2581             mnemonic_chars[c] = TOLOWER (c);
2582             register_chars[c] = mnemonic_chars[c];
2583             operand_chars[c] = c;
2584           }
2585         else if (c == '{' || c == '}')
2586           operand_chars[c] = c;
2587
2588         if (ISALPHA (c) || ISDIGIT (c))
2589           identifier_chars[c] = c;
2590         else if (c >= 128)
2591           {
2592             identifier_chars[c] = c;
2593             operand_chars[c] = c;
2594           }
2595       }
2596
2597 #ifdef LEX_AT
2598     identifier_chars['@'] = '@';
2599 #endif
2600 #ifdef LEX_QM
2601     identifier_chars['?'] = '?';
2602     operand_chars['?'] = '?';
2603 #endif
2604     digit_chars['-'] = '-';
2605     mnemonic_chars['_'] = '_';
2606     mnemonic_chars['-'] = '-';
2607     mnemonic_chars['.'] = '.';
2608     identifier_chars['_'] = '_';
2609     identifier_chars['.'] = '.';
2610
2611     for (p = operand_special_chars; *p != '\0'; p++)
2612       operand_chars[(unsigned char) *p] = *p;
2613   }
2614
2615   if (flag_code == CODE_64BIT)
2616     {
2617 #if defined (OBJ_COFF) && defined (TE_PE)
2618       x86_dwarf2_return_column = (OUTPUT_FLAVOR == bfd_target_coff_flavour
2619                                   ? 32 : 16);
2620 #else
2621       x86_dwarf2_return_column = 16;
2622 #endif
2623       x86_cie_data_alignment = -8;
2624     }
2625   else
2626     {
2627       x86_dwarf2_return_column = 8;
2628       x86_cie_data_alignment = -4;
2629     }
2630 }
2631
2632 void
2633 i386_print_statistics (FILE *file)
2634 {
2635   hash_print_statistics (file, "i386 opcode", op_hash);
2636   hash_print_statistics (file, "i386 register", reg_hash);
2637 }
2638 \f
2639 #ifdef DEBUG386
2640
2641 /* Debugging routines for md_assemble.  */
2642 static void pte (insn_template *);
2643 static void pt (i386_operand_type);
2644 static void pe (expressionS *);
2645 static void ps (symbolS *);
2646
2647 static void
2648 pi (char *line, i386_insn *x)
2649 {
2650   unsigned int j;
2651
2652   fprintf (stdout, "%s: template ", line);
2653   pte (&x->tm);
2654   fprintf (stdout, "  address: base %s  index %s  scale %x\n",
2655            x->base_reg ? x->base_reg->reg_name : "none",
2656            x->index_reg ? x->index_reg->reg_name : "none",
2657            x->log2_scale_factor);
2658   fprintf (stdout, "  modrm:  mode %x  reg %x  reg/mem %x\n",
2659            x->rm.mode, x->rm.reg, x->rm.regmem);
2660   fprintf (stdout, "  sib:  base %x  index %x  scale %x\n",
2661            x->sib.base, x->sib.index, x->sib.scale);
2662   fprintf (stdout, "  rex: 64bit %x  extX %x  extY %x  extZ %x\n",
2663            (x->rex & REX_W) != 0,
2664            (x->rex & REX_R) != 0,
2665            (x->rex & REX_X) != 0,
2666            (x->rex & REX_B) != 0);
2667   for (j = 0; j < x->operands; j++)
2668     {
2669       fprintf (stdout, "    #%d:  ", j + 1);
2670       pt (x->types[j]);
2671       fprintf (stdout, "\n");
2672       if (x->types[j].bitfield.reg8
2673           || x->types[j].bitfield.reg16
2674           || x->types[j].bitfield.reg32
2675           || x->types[j].bitfield.reg64
2676           || x->types[j].bitfield.regmmx
2677           || x->types[j].bitfield.regxmm
2678           || x->types[j].bitfield.regymm
2679           || x->types[j].bitfield.regzmm
2680           || x->types[j].bitfield.sreg2
2681           || x->types[j].bitfield.sreg3
2682           || x->types[j].bitfield.control
2683           || x->types[j].bitfield.debug
2684           || x->types[j].bitfield.test)
2685         fprintf (stdout, "%s\n", x->op[j].regs->reg_name);
2686       if (operand_type_check (x->types[j], imm))
2687         pe (x->op[j].imms);
2688       if (operand_type_check (x->types[j], disp))
2689         pe (x->op[j].disps);
2690     }
2691 }
2692
2693 static void
2694 pte (insn_template *t)
2695 {
2696   unsigned int j;
2697   fprintf (stdout, " %d operands ", t->operands);
2698   fprintf (stdout, "opcode %x ", t->base_opcode);
2699   if (t->extension_opcode != None)
2700     fprintf (stdout, "ext %x ", t->extension_opcode);
2701   if (t->opcode_modifier.d)
2702     fprintf (stdout, "D");
2703   if (t->opcode_modifier.w)
2704     fprintf (stdout, "W");
2705   fprintf (stdout, "\n");
2706   for (j = 0; j < t->operands; j++)
2707     {
2708       fprintf (stdout, "    #%d type ", j + 1);
2709       pt (t->operand_types[j]);
2710       fprintf (stdout, "\n");
2711     }
2712 }
2713
2714 static void
2715 pe (expressionS *e)
2716 {
2717   fprintf (stdout, "    operation     %d\n", e->X_op);
2718   fprintf (stdout, "    add_number    %ld (%lx)\n",
2719            (long) e->X_add_number, (long) e->X_add_number);
2720   if (e->X_add_symbol)
2721     {
2722       fprintf (stdout, "    add_symbol    ");
2723       ps (e->X_add_symbol);
2724       fprintf (stdout, "\n");
2725     }
2726   if (e->X_op_symbol)
2727     {
2728       fprintf (stdout, "    op_symbol    ");
2729       ps (e->X_op_symbol);
2730       fprintf (stdout, "\n");
2731     }
2732 }
2733
2734 static void
2735 ps (symbolS *s)
2736 {
2737   fprintf (stdout, "%s type %s%s",
2738            S_GET_NAME (s),
2739            S_IS_EXTERNAL (s) ? "EXTERNAL " : "",
2740            segment_name (S_GET_SEGMENT (s)));
2741 }
2742
2743 static struct type_name
2744   {
2745     i386_operand_type mask;
2746     const char *name;
2747   }
2748 const type_names[] =
2749 {
2750   { OPERAND_TYPE_REG8, "r8" },
2751   { OPERAND_TYPE_REG16, "r16" },
2752   { OPERAND_TYPE_REG32, "r32" },
2753   { OPERAND_TYPE_REG64, "r64" },
2754   { OPERAND_TYPE_IMM8, "i8" },
2755   { OPERAND_TYPE_IMM8, "i8s" },
2756   { OPERAND_TYPE_IMM16, "i16" },
2757   { OPERAND_TYPE_IMM32, "i32" },
2758   { OPERAND_TYPE_IMM32S, "i32s" },
2759   { OPERAND_TYPE_IMM64, "i64" },
2760   { OPERAND_TYPE_IMM1, "i1" },
2761   { OPERAND_TYPE_BASEINDEX, "BaseIndex" },
2762   { OPERAND_TYPE_DISP8, "d8" },
2763   { OPERAND_TYPE_DISP16, "d16" },
2764   { OPERAND_TYPE_DISP32, "d32" },
2765   { OPERAND_TYPE_DISP32S, "d32s" },
2766   { OPERAND_TYPE_DISP64, "d64" },
2767   { OPERAND_TYPE_VEC_DISP8, "Vector d8" },
2768   { OPERAND_TYPE_INOUTPORTREG, "InOutPortReg" },
2769   { OPERAND_TYPE_SHIFTCOUNT, "ShiftCount" },
2770   { OPERAND_TYPE_CONTROL, "control reg" },
2771   { OPERAND_TYPE_TEST, "test reg" },
2772   { OPERAND_TYPE_DEBUG, "debug reg" },
2773   { OPERAND_TYPE_FLOATREG, "FReg" },
2774   { OPERAND_TYPE_FLOATACC, "FAcc" },
2775   { OPERAND_TYPE_SREG2, "SReg2" },
2776   { OPERAND_TYPE_SREG3, "SReg3" },
2777   { OPERAND_TYPE_ACC, "Acc" },
2778   { OPERAND_TYPE_JUMPABSOLUTE, "Jump Absolute" },
2779   { OPERAND_TYPE_REGMMX, "rMMX" },
2780   { OPERAND_TYPE_REGXMM, "rXMM" },
2781   { OPERAND_TYPE_REGYMM, "rYMM" },
2782   { OPERAND_TYPE_REGZMM, "rZMM" },
2783   { OPERAND_TYPE_REGMASK, "Mask reg" },
2784   { OPERAND_TYPE_ESSEG, "es" },
2785 };
2786
2787 static void
2788 pt (i386_operand_type t)
2789 {
2790   unsigned int j;
2791   i386_operand_type a;
2792
2793   for (j = 0; j < ARRAY_SIZE (type_names); j++)
2794     {
2795       a = operand_type_and (t, type_names[j].mask);
2796       if (!operand_type_all_zero (&a))
2797         fprintf (stdout, "%s, ",  type_names[j].name);
2798     }
2799   fflush (stdout);
2800 }
2801
2802 #endif /* DEBUG386 */
2803 \f
2804 static bfd_reloc_code_real_type
2805 reloc (unsigned int size,
2806        int pcrel,
2807        int sign,
2808        bfd_reloc_code_real_type other)
2809 {
2810   if (other != NO_RELOC)
2811     {
2812       reloc_howto_type *rel;
2813
2814       if (size == 8)
2815         switch (other)
2816           {
2817           case BFD_RELOC_X86_64_GOT32:
2818             return BFD_RELOC_X86_64_GOT64;
2819             break;
2820           case BFD_RELOC_X86_64_GOTPLT64:
2821             return BFD_RELOC_X86_64_GOTPLT64;
2822             break;
2823           case BFD_RELOC_X86_64_PLTOFF64:
2824             return BFD_RELOC_X86_64_PLTOFF64;
2825             break;
2826           case BFD_RELOC_X86_64_GOTPC32:
2827             other = BFD_RELOC_X86_64_GOTPC64;
2828             break;
2829           case BFD_RELOC_X86_64_GOTPCREL:
2830             other = BFD_RELOC_X86_64_GOTPCREL64;
2831             break;
2832           case BFD_RELOC_X86_64_TPOFF32:
2833             other = BFD_RELOC_X86_64_TPOFF64;
2834             break;
2835           case BFD_RELOC_X86_64_DTPOFF32:
2836             other = BFD_RELOC_X86_64_DTPOFF64;
2837             break;
2838           default:
2839             break;
2840           }
2841
2842 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
2843       if (other == BFD_RELOC_SIZE32)
2844         {
2845           if (size == 8)
2846             other = BFD_RELOC_SIZE64;
2847           if (pcrel)
2848             {
2849               as_bad (_("there are no pc-relative size relocations"));
2850               return NO_RELOC;
2851             }
2852         }
2853 #endif
2854
2855       /* Sign-checking 4-byte relocations in 16-/32-bit code is pointless.  */
2856       if (size == 4 && (flag_code != CODE_64BIT || disallow_64bit_reloc))
2857         sign = -1;
2858
2859       rel = bfd_reloc_type_lookup (stdoutput, other);
2860       if (!rel)
2861         as_bad (_("unknown relocation (%u)"), other);
2862       else if (size != bfd_get_reloc_size (rel))
2863         as_bad (_("%u-byte relocation cannot be applied to %u-byte field"),
2864                 bfd_get_reloc_size (rel),
2865                 size);
2866       else if (pcrel && !rel->pc_relative)
2867         as_bad (_("non-pc-relative relocation for pc-relative field"));
2868       else if ((rel->complain_on_overflow == complain_overflow_signed
2869                 && !sign)
2870                || (rel->complain_on_overflow == complain_overflow_unsigned
2871                    && sign > 0))
2872         as_bad (_("relocated field and relocation type differ in signedness"));
2873       else
2874         return other;
2875       return NO_RELOC;
2876     }
2877
2878   if (pcrel)
2879     {
2880       if (!sign)
2881         as_bad (_("there are no unsigned pc-relative relocations"));
2882       switch (size)
2883         {
2884         case 1: return BFD_RELOC_8_PCREL;
2885         case 2: return BFD_RELOC_16_PCREL;
2886         case 4: return BFD_RELOC_32_PCREL;
2887         case 8: return BFD_RELOC_64_PCREL;
2888         }
2889       as_bad (_("cannot do %u byte pc-relative relocation"), size);
2890     }
2891   else
2892     {
2893       if (sign > 0)
2894         switch (size)
2895           {
2896           case 4: return BFD_RELOC_X86_64_32S;
2897           }
2898       else
2899         switch (size)
2900           {
2901           case 1: return BFD_RELOC_8;
2902           case 2: return BFD_RELOC_16;
2903           case 4: return BFD_RELOC_32;
2904           case 8: return BFD_RELOC_64;
2905           }
2906       as_bad (_("cannot do %s %u byte relocation"),
2907               sign > 0 ? "signed" : "unsigned", size);
2908     }
2909
2910   return NO_RELOC;
2911 }
2912
2913 /* Here we decide which fixups can be adjusted to make them relative to
2914    the beginning of the section instead of the symbol.  Basically we need
2915    to make sure that the dynamic relocations are done correctly, so in
2916    some cases we force the original symbol to be used.  */
2917
2918 int
2919 tc_i386_fix_adjustable (fixS *fixP ATTRIBUTE_UNUSED)
2920 {
2921 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
2922   if (!IS_ELF)
2923     return 1;
2924
2925   /* Don't adjust pc-relative references to merge sections in 64-bit
2926      mode.  */
2927   if (use_rela_relocations
2928       && (S_GET_SEGMENT (fixP->fx_addsy)->flags & SEC_MERGE) != 0
2929       && fixP->fx_pcrel)
2930     return 0;
2931
2932   /* The x86_64 GOTPCREL are represented as 32bit PCrel relocations
2933      and changed later by validate_fix.  */
2934   if (GOT_symbol && fixP->fx_subsy == GOT_symbol
2935       && fixP->fx_r_type == BFD_RELOC_32_PCREL)
2936     return 0;
2937
2938   /* Adjust_reloc_syms doesn't know about the GOT.  Need to keep symbol
2939      for size relocations.  */
2940   if (fixP->fx_r_type == BFD_RELOC_SIZE32
2941       || fixP->fx_r_type == BFD_RELOC_SIZE64
2942       || fixP->fx_r_type == BFD_RELOC_386_GOTOFF
2943       || fixP->fx_r_type == BFD_RELOC_386_PLT32
2944       || fixP->fx_r_type == BFD_RELOC_386_GOT32
2945       || fixP->fx_r_type == BFD_RELOC_386_GOT32X
2946       || fixP->fx_r_type == BFD_RELOC_386_TLS_GD
2947       || fixP->fx_r_type == BFD_RELOC_386_TLS_LDM
2948       || fixP->fx_r_type == BFD_RELOC_386_TLS_LDO_32
2949       || fixP->fx_r_type == BFD_RELOC_386_TLS_IE_32
2950       || fixP->fx_r_type == BFD_RELOC_386_TLS_IE
2951       || fixP->fx_r_type == BFD_RELOC_386_TLS_GOTIE
2952       || fixP->fx_r_type == BFD_RELOC_386_TLS_LE_32
2953       || fixP->fx_r_type == BFD_RELOC_386_TLS_LE
2954       || fixP->fx_r_type == BFD_RELOC_386_TLS_GOTDESC
2955       || fixP->fx_r_type == BFD_RELOC_386_TLS_DESC_CALL
2956       || fixP->fx_r_type == BFD_RELOC_X86_64_PLT32
2957       || fixP->fx_r_type == BFD_RELOC_X86_64_GOT32
2958       || fixP->fx_r_type == BFD_RELOC_X86_64_GOTPCREL
2959       || fixP->fx_r_type == BFD_RELOC_X86_64_GOTPCRELX
2960       || fixP->fx_r_type == BFD_RELOC_X86_64_REX_GOTPCRELX
2961       || fixP->fx_r_type == BFD_RELOC_X86_64_TLSGD
2962       || fixP->fx_r_type == BFD_RELOC_X86_64_TLSLD
2963       || fixP->fx_r_type == BFD_RELOC_X86_64_DTPOFF32
2964       || fixP->fx_r_type == BFD_RELOC_X86_64_DTPOFF64
2965       || fixP->fx_r_type == BFD_RELOC_X86_64_GOTTPOFF
2966       || fixP->fx_r_type == BFD_RELOC_X86_64_TPOFF32
2967       || fixP->fx_r_type == BFD_RELOC_X86_64_TPOFF64
2968       || fixP->fx_r_type == BFD_RELOC_X86_64_GOTOFF64
2969       || fixP->fx_r_type == BFD_RELOC_X86_64_GOTPC32_TLSDESC
2970       || fixP->fx_r_type == BFD_RELOC_X86_64_TLSDESC_CALL
2971       || fixP->fx_r_type == BFD_RELOC_VTABLE_INHERIT
2972       || fixP->fx_r_type == BFD_RELOC_VTABLE_ENTRY)
2973     return 0;
2974 #endif
2975   return 1;
2976 }
2977
2978 static int
2979 intel_float_operand (const char *mnemonic)
2980 {
2981   /* Note that the value returned is meaningful only for opcodes with (memory)
2982      operands, hence the code here is free to improperly handle opcodes that
2983      have no operands (for better performance and smaller code). */
2984
2985   if (mnemonic[0] != 'f')
2986     return 0; /* non-math */
2987
2988   switch (mnemonic[1])
2989     {
2990     /* fclex, fdecstp, fdisi, femms, feni, fincstp, finit, fsetpm, and
2991        the fs segment override prefix not currently handled because no
2992        call path can make opcodes without operands get here */
2993     case 'i':
2994       return 2 /* integer op */;
2995     case 'l':
2996       if (mnemonic[2] == 'd' && (mnemonic[3] == 'c' || mnemonic[3] == 'e'))
2997         return 3; /* fldcw/fldenv */
2998       break;
2999     case 'n':
3000       if (mnemonic[2] != 'o' /* fnop */)
3001         return 3; /* non-waiting control op */
3002       break;
3003     case 'r':
3004       if (mnemonic[2] == 's')
3005         return 3; /* frstor/frstpm */
3006       break;
3007     case 's':
3008       if (mnemonic[2] == 'a')
3009         return 3; /* fsave */
3010       if (mnemonic[2] == 't')
3011         {
3012           switch (mnemonic[3])
3013             {
3014             case 'c': /* fstcw */
3015             case 'd': /* fstdw */
3016             case 'e': /* fstenv */
3017             case 's': /* fsts[gw] */
3018               return 3;
3019             }
3020         }
3021       break;
3022     case 'x':
3023       if (mnemonic[2] == 'r' || mnemonic[2] == 's')
3024         return 0; /* fxsave/fxrstor are not really math ops */
3025       break;
3026     }
3027
3028   return 1;
3029 }
3030
3031 /* Build the VEX prefix.  */
3032
3033 static void
3034 build_vex_prefix (const insn_template *t)
3035 {
3036   unsigned int register_specifier;
3037   unsigned int implied_prefix;
3038   unsigned int vector_length;
3039
3040   /* Check register specifier.  */
3041   if (i.vex.register_specifier)
3042     {
3043       register_specifier =
3044         ~register_number (i.vex.register_specifier) & 0xf;
3045       gas_assert ((i.vex.register_specifier->reg_flags & RegVRex) == 0);
3046     }
3047   else
3048     register_specifier = 0xf;
3049
3050   /* Use 2-byte VEX prefix by swappping destination and source
3051      operand.  */
3052   if (!i.swap_operand
3053       && i.operands == i.reg_operands
3054       && i.tm.opcode_modifier.vexopcode == VEX0F
3055       && i.tm.opcode_modifier.s
3056       && i.rex == REX_B)
3057     {
3058       unsigned int xchg = i.operands - 1;
3059       union i386_op temp_op;
3060       i386_operand_type temp_type;
3061
3062       temp_type = i.types[xchg];
3063       i.types[xchg] = i.types[0];
3064       i.types[0] = temp_type;
3065       temp_op = i.op[xchg];
3066       i.op[xchg] = i.op[0];
3067       i.op[0] = temp_op;
3068
3069       gas_assert (i.rm.mode == 3);
3070
3071       i.rex = REX_R;
3072       xchg = i.rm.regmem;
3073       i.rm.regmem = i.rm.reg;
3074       i.rm.reg = xchg;
3075
3076       /* Use the next insn.  */
3077       i.tm = t[1];
3078     }
3079
3080   if (i.tm.opcode_modifier.vex == VEXScalar)
3081     vector_length = avxscalar;
3082   else
3083     vector_length = i.tm.opcode_modifier.vex == VEX256 ? 1 : 0;
3084
3085   switch ((i.tm.base_opcode >> 8) & 0xff)
3086     {
3087     case 0:
3088       implied_prefix = 0;
3089       break;
3090     case DATA_PREFIX_OPCODE:
3091       implied_prefix = 1;
3092       break;
3093     case REPE_PREFIX_OPCODE:
3094       implied_prefix = 2;
3095       break;
3096     case REPNE_PREFIX_OPCODE:
3097       implied_prefix = 3;
3098       break;
3099     default:
3100       abort ();
3101     }
3102
3103   /* Use 2-byte VEX prefix if possible.  */
3104   if (i.tm.opcode_modifier.vexopcode == VEX0F
3105       && i.tm.opcode_modifier.vexw != VEXW1
3106       && (i.rex & (REX_W | REX_X | REX_B)) == 0)
3107     {
3108       /* 2-byte VEX prefix.  */
3109       unsigned int r;
3110
3111       i.vex.length = 2;
3112       i.vex.bytes[0] = 0xc5;
3113
3114       /* Check the REX.R bit.  */
3115       r = (i.rex & REX_R) ? 0 : 1;
3116       i.vex.bytes[1] = (r << 7
3117                         | register_specifier << 3
3118                         | vector_length << 2
3119                         | implied_prefix);
3120     }
3121   else
3122     {
3123       /* 3-byte VEX prefix.  */
3124       unsigned int m, w;
3125
3126       i.vex.length = 3;
3127
3128       switch (i.tm.opcode_modifier.vexopcode)
3129         {
3130         case VEX0F:
3131           m = 0x1;
3132           i.vex.bytes[0] = 0xc4;
3133           break;
3134         case VEX0F38:
3135           m = 0x2;
3136           i.vex.bytes[0] = 0xc4;
3137           break;
3138         case VEX0F3A:
3139           m = 0x3;
3140           i.vex.bytes[0] = 0xc4;
3141           break;
3142         case XOP08:
3143           m = 0x8;
3144           i.vex.bytes[0] = 0x8f;
3145           break;
3146         case XOP09:
3147           m = 0x9;
3148           i.vex.bytes[0] = 0x8f;
3149           break;
3150         case XOP0A:
3151           m = 0xa;
3152           i.vex.bytes[0] = 0x8f;
3153           break;
3154         default:
3155           abort ();
3156         }
3157
3158       /* The high 3 bits of the second VEX byte are 1's compliment
3159          of RXB bits from REX.  */
3160       i.vex.bytes[1] = (~i.rex & 0x7) << 5 | m;
3161
3162       /* Check the REX.W bit.  */
3163       w = (i.rex & REX_W) ? 1 : 0;
3164       if (i.tm.opcode_modifier.vexw == VEXW1)
3165         w = 1;
3166
3167       i.vex.bytes[2] = (w << 7
3168                         | register_specifier << 3
3169                         | vector_length << 2
3170                         | implied_prefix);
3171     }
3172 }
3173
3174 /* Build the EVEX prefix.  */
3175
3176 static void
3177 build_evex_prefix (void)
3178 {
3179   unsigned int register_specifier;
3180   unsigned int implied_prefix;
3181   unsigned int m, w;
3182   rex_byte vrex_used = 0;
3183
3184   /* Check register specifier.  */
3185   if (i.vex.register_specifier)
3186     {
3187       gas_assert ((i.vrex & REX_X) == 0);
3188
3189       register_specifier = i.vex.register_specifier->reg_num;
3190       if ((i.vex.register_specifier->reg_flags & RegRex))
3191         register_specifier += 8;
3192       /* The upper 16 registers are encoded in the fourth byte of the
3193          EVEX prefix.  */
3194       if (!(i.vex.register_specifier->reg_flags & RegVRex))
3195         i.vex.bytes[3] = 0x8;
3196       register_specifier = ~register_specifier & 0xf;
3197     }
3198   else
3199     {
3200       register_specifier = 0xf;
3201
3202       /* Encode upper 16 vector index register in the fourth byte of
3203          the EVEX prefix.  */
3204       if (!(i.vrex & REX_X))
3205         i.vex.bytes[3] = 0x8;
3206       else
3207         vrex_used |= REX_X;
3208     }
3209
3210   switch ((i.tm.base_opcode >> 8) & 0xff)
3211     {
3212     case 0:
3213       implied_prefix = 0;
3214       break;
3215     case DATA_PREFIX_OPCODE:
3216       implied_prefix = 1;
3217       break;
3218     case REPE_PREFIX_OPCODE:
3219       implied_prefix = 2;
3220       break;
3221     case REPNE_PREFIX_OPCODE:
3222       implied_prefix = 3;
3223       break;
3224     default:
3225       abort ();
3226     }
3227
3228   /* 4 byte EVEX prefix.  */
3229   i.vex.length = 4;
3230   i.vex.bytes[0] = 0x62;
3231
3232   /* mmmm bits.  */
3233   switch (i.tm.opcode_modifier.vexopcode)
3234     {
3235     case VEX0F:
3236       m = 1;
3237       break;
3238     case VEX0F38:
3239       m = 2;
3240       break;
3241     case VEX0F3A:
3242       m = 3;
3243       break;
3244     default:
3245       abort ();
3246       break;
3247     }
3248
3249   /* The high 3 bits of the second EVEX byte are 1's compliment of RXB
3250      bits from REX.  */
3251   i.vex.bytes[1] = (~i.rex & 0x7) << 5 | m;
3252
3253   /* The fifth bit of the second EVEX byte is 1's compliment of the
3254      REX_R bit in VREX.  */
3255   if (!(i.vrex & REX_R))
3256     i.vex.bytes[1] |= 0x10;
3257   else
3258     vrex_used |= REX_R;
3259
3260   if ((i.reg_operands + i.imm_operands) == i.operands)
3261     {
3262       /* When all operands are registers, the REX_X bit in REX is not
3263          used.  We reuse it to encode the upper 16 registers, which is
3264          indicated by the REX_B bit in VREX.  The REX_X bit is encoded
3265          as 1's compliment.  */
3266       if ((i.vrex & REX_B))
3267         {
3268           vrex_used |= REX_B;
3269           i.vex.bytes[1] &= ~0x40;
3270         }
3271     }
3272
3273   /* EVEX instructions shouldn't need the REX prefix.  */
3274   i.vrex &= ~vrex_used;
3275   gas_assert (i.vrex == 0);
3276
3277   /* Check the REX.W bit.  */
3278   w = (i.rex & REX_W) ? 1 : 0;
3279   if (i.tm.opcode_modifier.vexw)
3280     {
3281       if (i.tm.opcode_modifier.vexw == VEXW1)
3282         w = 1;
3283     }
3284   /* If w is not set it means we are dealing with WIG instruction.  */
3285   else if (!w)
3286     {
3287       if (evexwig == evexw1)
3288         w = 1;
3289     }
3290
3291   /* Encode the U bit.  */
3292   implied_prefix |= 0x4;
3293
3294   /* The third byte of the EVEX prefix.  */
3295   i.vex.bytes[2] = (w << 7 | register_specifier << 3 | implied_prefix);
3296
3297   /* The fourth byte of the EVEX prefix.  */
3298   /* The zeroing-masking bit.  */
3299   if (i.mask && i.mask->zeroing)
3300     i.vex.bytes[3] |= 0x80;
3301
3302   /* Don't always set the broadcast bit if there is no RC.  */
3303   if (!i.rounding)
3304     {
3305       /* Encode the vector length.  */
3306       unsigned int vec_length;
3307
3308       switch (i.tm.opcode_modifier.evex)
3309         {
3310         case EVEXLIG: /* LL' is ignored */
3311           vec_length = evexlig << 5;
3312           break;
3313         case EVEX128:
3314           vec_length = 0 << 5;
3315           break;
3316         case EVEX256:
3317           vec_length = 1 << 5;
3318           break;
3319         case EVEX512:
3320           vec_length = 2 << 5;
3321           break;
3322         default:
3323           abort ();
3324           break;
3325         }
3326       i.vex.bytes[3] |= vec_length;
3327       /* Encode the broadcast bit.  */
3328       if (i.broadcast)
3329         i.vex.bytes[3] |= 0x10;
3330     }
3331   else
3332     {
3333       if (i.rounding->type != saeonly)
3334         i.vex.bytes[3] |= 0x10 | (i.rounding->type << 5);
3335       else
3336         i.vex.bytes[3] |= 0x10 | (evexrcig << 5);
3337     }
3338
3339   if (i.mask && i.mask->mask)
3340     i.vex.bytes[3] |= i.mask->mask->reg_num;
3341 }
3342
3343 static void
3344 process_immext (void)
3345 {
3346   expressionS *exp;
3347
3348   if ((i.tm.cpu_flags.bitfield.cpusse3 || i.tm.cpu_flags.bitfield.cpusvme)
3349       && i.operands > 0)
3350     {
3351       /* MONITOR/MWAIT as well as SVME instructions have fixed operands
3352          with an opcode suffix which is coded in the same place as an
3353          8-bit immediate field would be.
3354          Here we check those operands and remove them afterwards.  */
3355       unsigned int x;
3356
3357       for (x = 0; x < i.operands; x++)
3358         if (register_number (i.op[x].regs) != x)
3359           as_bad (_("can't use register '%s%s' as operand %d in '%s'."),
3360                   register_prefix, i.op[x].regs->reg_name, x + 1,
3361                   i.tm.name);
3362
3363       i.operands = 0;
3364     }
3365
3366   if (i.tm.cpu_flags.bitfield.cpumwaitx && i.operands > 0)
3367     {
3368       /* MONITORX/MWAITX instructions have fixed operands with an opcode
3369          suffix which is coded in the same place as an 8-bit immediate
3370          field would be.
3371          Here we check those operands and remove them afterwards.  */
3372       unsigned int x;
3373
3374       if (i.operands != 3)
3375         abort();
3376
3377       for (x = 0; x < 2; x++)
3378         if (register_number (i.op[x].regs) != x)
3379           goto bad_register_operand;
3380
3381       /* Check for third operand for mwaitx/monitorx insn.  */
3382       if (register_number (i.op[x].regs)
3383           != (x + (i.tm.extension_opcode == 0xfb)))
3384         {
3385 bad_register_operand:
3386           as_bad (_("can't use register '%s%s' as operand %d in '%s'."),
3387                   register_prefix, i.op[x].regs->reg_name, x+1,
3388                   i.tm.name);
3389         }
3390
3391       i.operands = 0;
3392     }
3393
3394   /* These AMD 3DNow! and SSE2 instructions have an opcode suffix
3395      which is coded in the same place as an 8-bit immediate field
3396      would be.  Here we fake an 8-bit immediate operand from the
3397      opcode suffix stored in tm.extension_opcode.
3398
3399      AVX instructions also use this encoding, for some of
3400      3 argument instructions.  */
3401
3402   gas_assert (i.imm_operands <= 1
3403               && (i.operands <= 2
3404                   || ((i.tm.opcode_modifier.vex
3405                        || i.tm.opcode_modifier.evex)
3406                       && i.operands <= 4)));
3407
3408   exp = &im_expressions[i.imm_operands++];
3409   i.op[i.operands].imms = exp;
3410   i.types[i.operands] = imm8;
3411   i.operands++;
3412   exp->X_op = O_constant;
3413   exp->X_add_number = i.tm.extension_opcode;
3414   i.tm.extension_opcode = None;
3415 }
3416
3417
3418 static int
3419 check_hle (void)
3420 {
3421   switch (i.tm.opcode_modifier.hleprefixok)
3422     {
3423     default:
3424       abort ();
3425     case HLEPrefixNone:
3426       as_bad (_("invalid instruction `%s' after `%s'"),
3427               i.tm.name, i.hle_prefix);
3428       return 0;
3429     case HLEPrefixLock:
3430       if (i.prefix[LOCK_PREFIX])
3431         return 1;
3432       as_bad (_("missing `lock' with `%s'"), i.hle_prefix);
3433       return 0;
3434     case HLEPrefixAny:
3435       return 1;
3436     case HLEPrefixRelease:
3437       if (i.prefix[HLE_PREFIX] != XRELEASE_PREFIX_OPCODE)
3438         {
3439           as_bad (_("instruction `%s' after `xacquire' not allowed"),
3440                   i.tm.name);
3441           return 0;
3442         }
3443       if (i.mem_operands == 0
3444           || !operand_type_check (i.types[i.operands - 1], anymem))
3445         {
3446           as_bad (_("memory destination needed for instruction `%s'"
3447                     " after `xrelease'"), i.tm.name);
3448           return 0;
3449         }
3450       return 1;
3451     }
3452 }
3453
3454 /* This is the guts of the machine-dependent assembler.  LINE points to a
3455    machine dependent instruction.  This function is supposed to emit
3456    the frags/bytes it assembles to.  */
3457
3458 void
3459 md_assemble (char *line)
3460 {
3461   unsigned int j;
3462   char mnemonic[MAX_MNEM_SIZE];
3463   const insn_template *t;
3464
3465   /* Initialize globals.  */
3466   memset (&i, '\0', sizeof (i));
3467   for (j = 0; j < MAX_OPERANDS; j++)
3468     i.reloc[j] = NO_RELOC;
3469   memset (disp_expressions, '\0', sizeof (disp_expressions));
3470   memset (im_expressions, '\0', sizeof (im_expressions));
3471   save_stack_p = save_stack;
3472
3473   /* First parse an instruction mnemonic & call i386_operand for the operands.
3474      We assume that the scrubber has arranged it so that line[0] is the valid
3475      start of a (possibly prefixed) mnemonic.  */
3476
3477   line = parse_insn (line, mnemonic);
3478   if (line == NULL)
3479     return;
3480
3481   line = parse_operands (line, mnemonic);
3482   this_operand = -1;
3483   if (line == NULL)
3484     return;
3485
3486   /* Now we've parsed the mnemonic into a set of templates, and have the
3487      operands at hand.  */
3488
3489   /* All intel opcodes have reversed operands except for "bound" and
3490      "enter".  We also don't reverse intersegment "jmp" and "call"
3491      instructions with 2 immediate operands so that the immediate segment
3492      precedes the offset, as it does when in AT&T mode. */
3493   if (intel_syntax
3494       && i.operands > 1
3495       && (strcmp (mnemonic, "bound") != 0)
3496       && (strcmp (mnemonic, "invlpga") != 0)
3497       && !(operand_type_check (i.types[0], imm)
3498            && operand_type_check (i.types[1], imm)))
3499     swap_operands ();
3500
3501   /* The order of the immediates should be reversed
3502      for 2 immediates extrq and insertq instructions */
3503   if (i.imm_operands == 2
3504       && (strcmp (mnemonic, "extrq") == 0
3505           || strcmp (mnemonic, "insertq") == 0))
3506       swap_2_operands (0, 1);
3507
3508   if (i.imm_operands)
3509     optimize_imm ();
3510
3511   /* Don't optimize displacement for movabs since it only takes 64bit
3512      displacement.  */
3513   if (i.disp_operands
3514       && i.disp_encoding != disp_encoding_32bit
3515       && (flag_code != CODE_64BIT
3516           || strcmp (mnemonic, "movabs") != 0))
3517     optimize_disp ();
3518
3519   /* Next, we find a template that matches the given insn,
3520      making sure the overlap of the given operands types is consistent
3521      with the template operand types.  */
3522
3523   if (!(t = match_template ()))
3524     return;
3525
3526   if (sse_check != check_none
3527       && !i.tm.opcode_modifier.noavx
3528       && (i.tm.cpu_flags.bitfield.cpusse
3529           || i.tm.cpu_flags.bitfield.cpusse2
3530           || i.tm.cpu_flags.bitfield.cpusse3
3531           || i.tm.cpu_flags.bitfield.cpussse3
3532           || i.tm.cpu_flags.bitfield.cpusse4_1
3533           || i.tm.cpu_flags.bitfield.cpusse4_2))
3534     {
3535       (sse_check == check_warning
3536        ? as_warn
3537        : as_bad) (_("SSE instruction `%s' is used"), i.tm.name);
3538     }
3539
3540   /* Zap movzx and movsx suffix.  The suffix has been set from
3541      "word ptr" or "byte ptr" on the source operand in Intel syntax
3542      or extracted from mnemonic in AT&T syntax.  But we'll use
3543      the destination register to choose the suffix for encoding.  */
3544   if ((i.tm.base_opcode & ~9) == 0x0fb6)
3545     {
3546       /* In Intel syntax, there must be a suffix.  In AT&T syntax, if
3547          there is no suffix, the default will be byte extension.  */
3548       if (i.reg_operands != 2
3549           && !i.suffix
3550           && intel_syntax)
3551         as_bad (_("ambiguous operand size for `%s'"), i.tm.name);
3552
3553       i.suffix = 0;
3554     }
3555
3556   if (i.tm.opcode_modifier.fwait)
3557     if (!add_prefix (FWAIT_OPCODE))
3558       return;
3559
3560   /* Check if REP prefix is OK.  */
3561   if (i.rep_prefix && !i.tm.opcode_modifier.repprefixok)
3562     {
3563       as_bad (_("invalid instruction `%s' after `%s'"),
3564                 i.tm.name, i.rep_prefix);
3565       return;
3566     }
3567
3568   /* Check for lock without a lockable instruction.  Destination operand
3569      must be memory unless it is xchg (0x86).  */
3570   if (i.prefix[LOCK_PREFIX]
3571       && (!i.tm.opcode_modifier.islockable
3572           || i.mem_operands == 0
3573           || (i.tm.base_opcode != 0x86
3574               && !operand_type_check (i.types[i.operands - 1], anymem))))
3575     {
3576       as_bad (_("expecting lockable instruction after `lock'"));
3577       return;
3578     }
3579
3580   /* Check if HLE prefix is OK.  */
3581   if (i.hle_prefix && !check_hle ())
3582     return;
3583
3584   /* Check BND prefix.  */
3585   if (i.bnd_prefix && !i.tm.opcode_modifier.bndprefixok)
3586     as_bad (_("expecting valid branch instruction after `bnd'"));
3587
3588   if (i.tm.cpu_flags.bitfield.cpumpx
3589       && flag_code == CODE_64BIT
3590       && i.prefix[ADDR_PREFIX])
3591     as_bad (_("32-bit address isn't allowed in 64-bit MPX instructions."));
3592
3593   /* Insert BND prefix.  */
3594   if (add_bnd_prefix
3595       && i.tm.opcode_modifier.bndprefixok
3596       && !i.prefix[BND_PREFIX])
3597     add_prefix (BND_PREFIX_OPCODE);
3598
3599   /* Check string instruction segment overrides.  */
3600   if (i.tm.opcode_modifier.isstring && i.mem_operands != 0)
3601     {
3602       if (!check_string ())
3603         return;
3604       i.disp_operands = 0;
3605     }
3606
3607   if (!process_suffix ())
3608     return;
3609
3610   /* Update operand types.  */
3611   for (j = 0; j < i.operands; j++)
3612     i.types[j] = operand_type_and (i.types[j], i.tm.operand_types[j]);
3613
3614   /* Make still unresolved immediate matches conform to size of immediate
3615      given in i.suffix.  */
3616   if (!finalize_imm ())
3617     return;
3618
3619   if (i.types[0].bitfield.imm1)
3620     i.imm_operands = 0; /* kludge for shift insns.  */
3621
3622   /* We only need to check those implicit registers for instructions
3623      with 3 operands or less.  */
3624   if (i.operands <= 3)
3625     for (j = 0; j < i.operands; j++)
3626       if (i.types[j].bitfield.inoutportreg
3627           || i.types[j].bitfield.shiftcount
3628           || i.types[j].bitfield.acc
3629           || i.types[j].bitfield.floatacc)
3630         i.reg_operands--;
3631
3632   /* ImmExt should be processed after SSE2AVX.  */
3633   if (!i.tm.opcode_modifier.sse2avx
3634       && i.tm.opcode_modifier.immext)
3635     process_immext ();
3636
3637   /* For insns with operands there are more diddles to do to the opcode.  */
3638   if (i.operands)
3639     {
3640       if (!process_operands ())
3641         return;
3642     }
3643   else if (!quiet_warnings && i.tm.opcode_modifier.ugh)
3644     {
3645       /* UnixWare fsub no args is alias for fsubp, fadd -> faddp, etc.  */
3646       as_warn (_("translating to `%sp'"), i.tm.name);
3647     }
3648
3649   if (i.tm.opcode_modifier.vex || i.tm.opcode_modifier.evex)
3650     {
3651       if (flag_code == CODE_16BIT)
3652         {
3653           as_bad (_("instruction `%s' isn't supported in 16-bit mode."),
3654                   i.tm.name);
3655           return;
3656         }
3657
3658       if (i.tm.opcode_modifier.vex)
3659         build_vex_prefix (t);
3660       else
3661         build_evex_prefix ();
3662     }
3663
3664   /* Handle conversion of 'int $3' --> special int3 insn.  XOP or FMA4
3665      instructions may define INT_OPCODE as well, so avoid this corner
3666      case for those instructions that use MODRM.  */
3667   if (i.tm.base_opcode == INT_OPCODE
3668       && !i.tm.opcode_modifier.modrm
3669       && i.op[0].imms->X_add_number == 3)
3670     {
3671       i.tm.base_opcode = INT3_OPCODE;
3672       i.imm_operands = 0;
3673     }
3674
3675   if ((i.tm.opcode_modifier.jump
3676        || i.tm.opcode_modifier.jumpbyte
3677        || i.tm.opcode_modifier.jumpdword)
3678       && i.op[0].disps->X_op == O_constant)
3679     {
3680       /* Convert "jmp constant" (and "call constant") to a jump (call) to
3681          the absolute address given by the constant.  Since ix86 jumps and
3682          calls are pc relative, we need to generate a reloc.  */
3683       i.op[0].disps->X_add_symbol = &abs_symbol;
3684       i.op[0].disps->X_op = O_symbol;
3685     }
3686
3687   if (i.tm.opcode_modifier.rex64)
3688     i.rex |= REX_W;
3689
3690   /* For 8 bit registers we need an empty rex prefix.  Also if the
3691      instruction already has a prefix, we need to convert old
3692      registers to new ones.  */
3693
3694   if ((i.types[0].bitfield.reg8
3695        && (i.op[0].regs->reg_flags & RegRex64) != 0)
3696       || (i.types[1].bitfield.reg8
3697           && (i.op[1].regs->reg_flags & RegRex64) != 0)
3698       || ((i.types[0].bitfield.reg8
3699            || i.types[1].bitfield.reg8)
3700           && i.rex != 0))
3701     {
3702       int x;
3703
3704       i.rex |= REX_OPCODE;
3705       for (x = 0; x < 2; x++)
3706         {
3707           /* Look for 8 bit operand that uses old registers.  */
3708           if (i.types[x].bitfield.reg8
3709               && (i.op[x].regs->reg_flags & RegRex64) == 0)
3710             {
3711               /* In case it is "hi" register, give up.  */
3712               if (i.op[x].regs->reg_num > 3)
3713                 as_bad (_("can't encode register '%s%s' in an "
3714                           "instruction requiring REX prefix."),
3715                         register_prefix, i.op[x].regs->reg_name);
3716
3717               /* Otherwise it is equivalent to the extended register.
3718                  Since the encoding doesn't change this is merely
3719                  cosmetic cleanup for debug output.  */
3720
3721               i.op[x].regs = i.op[x].regs + 8;
3722             }
3723         }
3724     }
3725
3726   if (i.rex != 0)
3727     add_prefix (REX_OPCODE | i.rex);
3728
3729   /* We are ready to output the insn.  */
3730   output_insn ();
3731 }
3732
3733 static char *
3734 parse_insn (char *line, char *mnemonic)
3735 {
3736   char *l = line;
3737   char *token_start = l;
3738   char *mnem_p;
3739   int supported;
3740   const insn_template *t;
3741   char *dot_p = NULL;
3742
3743   while (1)
3744     {
3745       mnem_p = mnemonic;
3746       while ((*mnem_p = mnemonic_chars[(unsigned char) *l]) != 0)
3747         {
3748           if (*mnem_p == '.')
3749             dot_p = mnem_p;
3750           mnem_p++;
3751           if (mnem_p >= mnemonic + MAX_MNEM_SIZE)
3752             {
3753               as_bad (_("no such instruction: `%s'"), token_start);
3754               return NULL;
3755             }
3756           l++;
3757         }
3758       if (!is_space_char (*l)
3759           && *l != END_OF_INSN
3760           && (intel_syntax
3761               || (*l != PREFIX_SEPARATOR
3762                   && *l != ',')))
3763         {
3764           as_bad (_("invalid character %s in mnemonic"),
3765                   output_invalid (*l));
3766           return NULL;
3767         }
3768       if (token_start == l)
3769         {
3770           if (!intel_syntax && *l == PREFIX_SEPARATOR)
3771             as_bad (_("expecting prefix; got nothing"));
3772           else
3773             as_bad (_("expecting mnemonic; got nothing"));
3774           return NULL;
3775         }
3776
3777       /* Look up instruction (or prefix) via hash table.  */
3778       current_templates = (const templates *) hash_find (op_hash, mnemonic);
3779
3780       if (*l != END_OF_INSN
3781           && (!is_space_char (*l) || l[1] != END_OF_INSN)
3782           && current_templates
3783           && current_templates->start->opcode_modifier.isprefix)
3784         {
3785           if (!cpu_flags_check_cpu64 (current_templates->start->cpu_flags))
3786             {
3787               as_bad ((flag_code != CODE_64BIT
3788                        ? _("`%s' is only supported in 64-bit mode")
3789                        : _("`%s' is not supported in 64-bit mode")),
3790                       current_templates->start->name);
3791               return NULL;
3792             }
3793           /* If we are in 16-bit mode, do not allow addr16 or data16.
3794              Similarly, in 32-bit mode, do not allow addr32 or data32.  */
3795           if ((current_templates->start->opcode_modifier.size16
3796                || current_templates->start->opcode_modifier.size32)
3797               && flag_code != CODE_64BIT
3798               && (current_templates->start->opcode_modifier.size32
3799                   ^ (flag_code == CODE_16BIT)))
3800             {
3801               as_bad (_("redundant %s prefix"),
3802                       current_templates->start->name);
3803               return NULL;
3804             }
3805           /* Add prefix, checking for repeated prefixes.  */
3806           switch (add_prefix (current_templates->start->base_opcode))
3807             {
3808             case PREFIX_EXIST:
3809               return NULL;
3810             case PREFIX_REP:
3811               if (current_templates->start->cpu_flags.bitfield.cpuhle)
3812                 i.hle_prefix = current_templates->start->name;
3813               else if (current_templates->start->cpu_flags.bitfield.cpumpx)
3814                 i.bnd_prefix = current_templates->start->name;
3815               else
3816                 i.rep_prefix = current_templates->start->name;
3817               break;
3818             default:
3819               break;
3820             }
3821           /* Skip past PREFIX_SEPARATOR and reset token_start.  */
3822           token_start = ++l;
3823         }
3824       else
3825         break;
3826     }
3827
3828   if (!current_templates)
3829     {
3830       /* Check if we should swap operand or force 32bit displacement in
3831          encoding.  */
3832       if (mnem_p - 2 == dot_p && dot_p[1] == 's')
3833         i.swap_operand = 1;
3834       else if (mnem_p - 3 == dot_p
3835                && dot_p[1] == 'd'
3836                && dot_p[2] == '8')
3837         i.disp_encoding = disp_encoding_8bit;
3838       else if (mnem_p - 4 == dot_p
3839                && dot_p[1] == 'd'
3840                && dot_p[2] == '3'
3841                && dot_p[3] == '2')
3842         i.disp_encoding = disp_encoding_32bit;
3843       else
3844         goto check_suffix;
3845       mnem_p = dot_p;
3846       *dot_p = '\0';
3847       current_templates = (const templates *) hash_find (op_hash, mnemonic);
3848     }
3849
3850   if (!current_templates)
3851     {
3852 check_suffix:
3853       /* See if we can get a match by trimming off a suffix.  */
3854       switch (mnem_p[-1])
3855         {
3856         case WORD_MNEM_SUFFIX:
3857           if (intel_syntax && (intel_float_operand (mnemonic) & 2))
3858             i.suffix = SHORT_MNEM_SUFFIX;
3859           else
3860         case BYTE_MNEM_SUFFIX:
3861         case QWORD_MNEM_SUFFIX:
3862           i.suffix = mnem_p[-1];
3863           mnem_p[-1] = '\0';
3864           current_templates = (const templates *) hash_find (op_hash,
3865                                                              mnemonic);
3866           break;
3867         case SHORT_MNEM_SUFFIX:
3868         case LONG_MNEM_SUFFIX:
3869           if (!intel_syntax)
3870             {
3871               i.suffix = mnem_p[-1];
3872               mnem_p[-1] = '\0';
3873               current_templates = (const templates *) hash_find (op_hash,
3874                                                                  mnemonic);
3875             }
3876           break;
3877
3878           /* Intel Syntax.  */
3879         case 'd':
3880           if (intel_syntax)
3881             {
3882               if (intel_float_operand (mnemonic) == 1)
3883                 i.suffix = SHORT_MNEM_SUFFIX;
3884               else
3885                 i.suffix = LONG_MNEM_SUFFIX;
3886               mnem_p[-1] = '\0';
3887               current_templates = (const templates *) hash_find (op_hash,
3888                                                                  mnemonic);
3889             }
3890           break;
3891         }
3892       if (!current_templates)
3893         {
3894           as_bad (_("no such instruction: `%s'"), token_start);
3895           return NULL;
3896         }
3897     }
3898
3899   if (current_templates->start->opcode_modifier.jump
3900       || current_templates->start->opcode_modifier.jumpbyte)
3901     {
3902       /* Check for a branch hint.  We allow ",pt" and ",pn" for
3903          predict taken and predict not taken respectively.
3904          I'm not sure that branch hints actually do anything on loop
3905          and jcxz insns (JumpByte) for current Pentium4 chips.  They
3906          may work in the future and it doesn't hurt to accept them
3907          now.  */
3908       if (l[0] == ',' && l[1] == 'p')
3909         {
3910           if (l[2] == 't')
3911             {
3912               if (!add_prefix (DS_PREFIX_OPCODE))
3913                 return NULL;
3914               l += 3;
3915             }
3916           else if (l[2] == 'n')
3917             {
3918               if (!add_prefix (CS_PREFIX_OPCODE))
3919                 return NULL;
3920               l += 3;
3921             }
3922         }
3923     }
3924   /* Any other comma loses.  */
3925   if (*l == ',')
3926     {
3927       as_bad (_("invalid character %s in mnemonic"),
3928               output_invalid (*l));
3929       return NULL;
3930     }
3931
3932   /* Check if instruction is supported on specified architecture.  */
3933   supported = 0;
3934   for (t = current_templates->start; t < current_templates->end; ++t)
3935     {
3936       supported |= cpu_flags_match (t);
3937       if (supported == CPU_FLAGS_PERFECT_MATCH)
3938         goto skip;
3939     }
3940
3941   if (!(supported & CPU_FLAGS_64BIT_MATCH))
3942     {
3943       as_bad (flag_code == CODE_64BIT
3944               ? _("`%s' is not supported in 64-bit mode")
3945               : _("`%s' is only supported in 64-bit mode"),
3946               current_templates->start->name);
3947       return NULL;
3948     }
3949   if (supported != CPU_FLAGS_PERFECT_MATCH)
3950     {
3951       as_bad (_("`%s' is not supported on `%s%s'"),
3952               current_templates->start->name,
3953               cpu_arch_name ? cpu_arch_name : default_arch,
3954               cpu_sub_arch_name ? cpu_sub_arch_name : "");
3955       return NULL;
3956     }
3957
3958 skip:
3959   if (!cpu_arch_flags.bitfield.cpui386
3960            && (flag_code != CODE_16BIT))
3961     {
3962       as_warn (_("use .code16 to ensure correct addressing mode"));
3963     }
3964
3965   return l;
3966 }
3967
3968 static char *
3969 parse_operands (char *l, const char *mnemonic)
3970 {
3971   char *token_start;
3972
3973   /* 1 if operand is pending after ','.  */
3974   unsigned int expecting_operand = 0;
3975
3976   /* Non-zero if operand parens not balanced.  */
3977   unsigned int paren_not_balanced;
3978
3979   while (*l != END_OF_INSN)
3980     {
3981       /* Skip optional white space before operand.  */
3982       if (is_space_char (*l))
3983         ++l;
3984       if (!is_operand_char (*l) && *l != END_OF_INSN && *l != '"')
3985         {
3986           as_bad (_("invalid character %s before operand %d"),
3987                   output_invalid (*l),
3988                   i.operands + 1);
3989           return NULL;
3990         }
3991       token_start = l;  /* After white space.  */
3992       paren_not_balanced = 0;
3993       while (paren_not_balanced || *l != ',')
3994         {
3995           if (*l == END_OF_INSN)
3996             {
3997               if (paren_not_balanced)
3998                 {
3999                   if (!intel_syntax)
4000                     as_bad (_("unbalanced parenthesis in operand %d."),
4001                             i.operands + 1);
4002                   else
4003                     as_bad (_("unbalanced brackets in operand %d."),
4004                             i.operands + 1);
4005                   return NULL;
4006                 }
4007               else
4008                 break;  /* we are done */
4009             }
4010           else if (!is_operand_char (*l) && !is_space_char (*l) && *l != '"')
4011             {
4012               as_bad (_("invalid character %s in operand %d"),
4013                       output_invalid (*l),
4014                       i.operands + 1);
4015               return NULL;
4016             }
4017           if (!intel_syntax)
4018             {
4019               if (*l == '(')
4020                 ++paren_not_balanced;
4021               if (*l == ')')
4022                 --paren_not_balanced;
4023             }
4024           else
4025             {
4026               if (*l == '[')
4027                 ++paren_not_balanced;
4028               if (*l == ']')
4029                 --paren_not_balanced;
4030             }
4031           l++;
4032         }
4033       if (l != token_start)
4034         {                       /* Yes, we've read in another operand.  */
4035           unsigned int operand_ok;
4036           this_operand = i.operands++;
4037           i.types[this_operand].bitfield.unspecified = 1;
4038           if (i.operands > MAX_OPERANDS)
4039             {
4040               as_bad (_("spurious operands; (%d operands/instruction max)"),
4041                       MAX_OPERANDS);
4042               return NULL;
4043             }
4044           /* Now parse operand adding info to 'i' as we go along.  */
4045           END_STRING_AND_SAVE (l);
4046
4047           if (intel_syntax)
4048             operand_ok =
4049               i386_intel_operand (token_start,
4050                                   intel_float_operand (mnemonic));
4051           else
4052             operand_ok = i386_att_operand (token_start);
4053
4054           RESTORE_END_STRING (l);
4055           if (!operand_ok)
4056             return NULL;
4057         }
4058       else
4059         {
4060           if (expecting_operand)
4061             {
4062             expecting_operand_after_comma:
4063               as_bad (_("expecting operand after ','; got nothing"));
4064               return NULL;
4065             }
4066           if (*l == ',')
4067             {
4068               as_bad (_("expecting operand before ','; got nothing"));
4069               return NULL;
4070             }
4071         }
4072
4073       /* Now *l must be either ',' or END_OF_INSN.  */
4074       if (*l == ',')
4075         {
4076           if (*++l == END_OF_INSN)
4077             {
4078               /* Just skip it, if it's \n complain.  */
4079               goto expecting_operand_after_comma;
4080             }
4081           expecting_operand = 1;
4082         }
4083     }
4084   return l;
4085 }
4086
4087 static void
4088 swap_2_operands (int xchg1, int xchg2)
4089 {
4090   union i386_op temp_op;
4091   i386_operand_type temp_type;
4092   enum bfd_reloc_code_real temp_reloc;
4093
4094   temp_type = i.types[xchg2];
4095   i.types[xchg2] = i.types[xchg1];
4096   i.types[xchg1] = temp_type;
4097   temp_op = i.op[xchg2];
4098   i.op[xchg2] = i.op[xchg1];
4099   i.op[xchg1] = temp_op;
4100   temp_reloc = i.reloc[xchg2];
4101   i.reloc[xchg2] = i.reloc[xchg1];
4102   i.reloc[xchg1] = temp_reloc;
4103
4104   if (i.mask)
4105     {
4106       if (i.mask->operand == xchg1)
4107         i.mask->operand = xchg2;
4108       else if (i.mask->operand == xchg2)
4109         i.mask->operand = xchg1;
4110     }
4111   if (i.broadcast)
4112     {
4113       if (i.broadcast->operand == xchg1)
4114         i.broadcast->operand = xchg2;
4115       else if (i.broadcast->operand == xchg2)
4116         i.broadcast->operand = xchg1;
4117     }
4118   if (i.rounding)
4119     {
4120       if (i.rounding->operand == xchg1)
4121         i.rounding->operand = xchg2;
4122       else if (i.rounding->operand == xchg2)
4123         i.rounding->operand = xchg1;
4124     }
4125 }
4126
4127 static void
4128 swap_operands (void)
4129 {
4130   switch (i.operands)
4131     {
4132     case 5:
4133     case 4:
4134       swap_2_operands (1, i.operands - 2);
4135     case 3:
4136     case 2:
4137       swap_2_operands (0, i.operands - 1);
4138       break;
4139     default:
4140       abort ();
4141     }
4142
4143   if (i.mem_operands == 2)
4144     {
4145       const seg_entry *temp_seg;
4146       temp_seg = i.seg[0];
4147       i.seg[0] = i.seg[1];
4148       i.seg[1] = temp_seg;
4149     }
4150 }
4151
4152 /* Try to ensure constant immediates are represented in the smallest
4153    opcode possible.  */
4154 static void
4155 optimize_imm (void)
4156 {
4157   char guess_suffix = 0;
4158   int op;
4159
4160   if (i.suffix)
4161     guess_suffix = i.suffix;
4162   else if (i.reg_operands)
4163     {
4164       /* Figure out a suffix from the last register operand specified.
4165          We can't do this properly yet, ie. excluding InOutPortReg,
4166          but the following works for instructions with immediates.
4167          In any case, we can't set i.suffix yet.  */
4168       for (op = i.operands; --op >= 0;)
4169         if (i.types[op].bitfield.reg8)
4170           {
4171             guess_suffix = BYTE_MNEM_SUFFIX;
4172             break;
4173           }
4174         else if (i.types[op].bitfield.reg16)
4175           {
4176             guess_suffix = WORD_MNEM_SUFFIX;
4177             break;
4178           }
4179         else if (i.types[op].bitfield.reg32)
4180           {
4181             guess_suffix = LONG_MNEM_SUFFIX;
4182             break;
4183           }
4184         else if (i.types[op].bitfield.reg64)
4185           {
4186             guess_suffix = QWORD_MNEM_SUFFIX;
4187             break;
4188           }
4189     }
4190   else if ((flag_code == CODE_16BIT) ^ (i.prefix[DATA_PREFIX] != 0))
4191     guess_suffix = WORD_MNEM_SUFFIX;
4192
4193   for (op = i.operands; --op >= 0;)
4194     if (operand_type_check (i.types[op], imm))
4195       {
4196         switch (i.op[op].imms->X_op)
4197           {
4198           case O_constant:
4199             /* If a suffix is given, this operand may be shortened.  */
4200             switch (guess_suffix)
4201               {
4202               case LONG_MNEM_SUFFIX:
4203                 i.types[op].bitfield.imm32 = 1;
4204                 i.types[op].bitfield.imm64 = 1;
4205                 break;
4206               case WORD_MNEM_SUFFIX:
4207                 i.types[op].bitfield.imm16 = 1;
4208                 i.types[op].bitfield.imm32 = 1;
4209                 i.types[op].bitfield.imm32s = 1;
4210                 i.types[op].bitfield.imm64 = 1;
4211                 break;
4212               case BYTE_MNEM_SUFFIX:
4213                 i.types[op].bitfield.imm8 = 1;
4214                 i.types[op].bitfield.imm8s = 1;
4215                 i.types[op].bitfield.imm16 = 1;
4216                 i.types[op].bitfield.imm32 = 1;
4217                 i.types[op].bitfield.imm32s = 1;
4218                 i.types[op].bitfield.imm64 = 1;
4219                 break;
4220               }
4221
4222             /* If this operand is at most 16 bits, convert it
4223                to a signed 16 bit number before trying to see
4224                whether it will fit in an even smaller size.
4225                This allows a 16-bit operand such as $0xffe0 to
4226                be recognised as within Imm8S range.  */
4227             if ((i.types[op].bitfield.imm16)
4228                 && (i.op[op].imms->X_add_number & ~(offsetT) 0xffff) == 0)
4229               {
4230                 i.op[op].imms->X_add_number =
4231                   (((i.op[op].imms->X_add_number & 0xffff) ^ 0x8000) - 0x8000);
4232               }
4233 #ifdef BFD64
4234             /* Store 32-bit immediate in 64-bit for 64-bit BFD.  */
4235             if ((i.types[op].bitfield.imm32)
4236                 && ((i.op[op].imms->X_add_number & ~(((offsetT) 2 << 31) - 1))
4237                     == 0))
4238               {
4239                 i.op[op].imms->X_add_number = ((i.op[op].imms->X_add_number
4240                                                 ^ ((offsetT) 1 << 31))
4241                                                - ((offsetT) 1 << 31));
4242               }
4243 #endif
4244             i.types[op]
4245               = operand_type_or (i.types[op],
4246                                  smallest_imm_type (i.op[op].imms->X_add_number));
4247
4248             /* We must avoid matching of Imm32 templates when 64bit
4249                only immediate is available.  */
4250             if (guess_suffix == QWORD_MNEM_SUFFIX)
4251               i.types[op].bitfield.imm32 = 0;
4252             break;
4253
4254           case O_absent:
4255           case O_register:
4256             abort ();
4257
4258             /* Symbols and expressions.  */
4259           default:
4260             /* Convert symbolic operand to proper sizes for matching, but don't
4261                prevent matching a set of insns that only supports sizes other
4262                than those matching the insn suffix.  */
4263             {
4264               i386_operand_type mask, allowed;
4265               const insn_template *t;
4266
4267               operand_type_set (&mask, 0);
4268               operand_type_set (&allowed, 0);
4269
4270               for (t = current_templates->start;
4271                    t < current_templates->end;
4272                    ++t)
4273                 allowed = operand_type_or (allowed,
4274                                            t->operand_types[op]);
4275               switch (guess_suffix)
4276                 {
4277                 case QWORD_MNEM_SUFFIX:
4278                   mask.bitfield.imm64 = 1;
4279                   mask.bitfield.imm32s = 1;
4280                   break;
4281                 case LONG_MNEM_SUFFIX:
4282                   mask.bitfield.imm32 = 1;
4283                   break;
4284                 case WORD_MNEM_SUFFIX:
4285                   mask.bitfield.imm16 = 1;
4286                   break;
4287                 case BYTE_MNEM_SUFFIX:
4288                   mask.bitfield.imm8 = 1;
4289                   break;
4290                 default:
4291                   break;
4292                 }
4293               allowed = operand_type_and (mask, allowed);
4294               if (!operand_type_all_zero (&allowed))
4295                 i.types[op] = operand_type_and (i.types[op], mask);
4296             }
4297             break;
4298           }
4299       }
4300 }
4301
4302 /* Try to use the smallest displacement type too.  */
4303 static void
4304 optimize_disp (void)
4305 {
4306   int op;
4307
4308   for (op = i.operands; --op >= 0;)
4309     if (operand_type_check (i.types[op], disp))
4310       {
4311         if (i.op[op].disps->X_op == O_constant)
4312           {
4313             offsetT op_disp = i.op[op].disps->X_add_number;
4314
4315             if (i.types[op].bitfield.disp16
4316                 && (op_disp & ~(offsetT) 0xffff) == 0)
4317               {
4318                 /* If this operand is at most 16 bits, convert
4319                    to a signed 16 bit number and don't use 64bit
4320                    displacement.  */
4321                 op_disp = (((op_disp & 0xffff) ^ 0x8000) - 0x8000);
4322                 i.types[op].bitfield.disp64 = 0;
4323               }
4324 #ifdef BFD64
4325             /* Optimize 64-bit displacement to 32-bit for 64-bit BFD.  */
4326             if (i.types[op].bitfield.disp32
4327                 && (op_disp & ~(((offsetT) 2 << 31) - 1)) == 0)
4328               {
4329                 /* If this operand is at most 32 bits, convert
4330                    to a signed 32 bit number and don't use 64bit
4331                    displacement.  */
4332                 op_disp &= (((offsetT) 2 << 31) - 1);
4333                 op_disp = (op_disp ^ ((offsetT) 1 << 31)) - ((addressT) 1 << 31);
4334                 i.types[op].bitfield.disp64 = 0;
4335               }
4336 #endif
4337             if (!op_disp && i.types[op].bitfield.baseindex)
4338               {
4339                 i.types[op].bitfield.disp8 = 0;
4340                 i.types[op].bitfield.disp16 = 0;
4341                 i.types[op].bitfield.disp32 = 0;
4342                 i.types[op].bitfield.disp32s = 0;
4343                 i.types[op].bitfield.disp64 = 0;
4344                 i.op[op].disps = 0;
4345                 i.disp_operands--;
4346               }
4347             else if (flag_code == CODE_64BIT)
4348               {
4349                 if (fits_in_signed_long (op_disp))
4350                   {
4351                     i.types[op].bitfield.disp64 = 0;
4352                     i.types[op].bitfield.disp32s = 1;
4353                   }
4354                 if (i.prefix[ADDR_PREFIX]
4355                     && fits_in_unsigned_long (op_disp))
4356                   i.types[op].bitfield.disp32 = 1;
4357               }
4358             if ((i.types[op].bitfield.disp32
4359                  || i.types[op].bitfield.disp32s
4360                  || i.types[op].bitfield.disp16)
4361                 && fits_in_signed_byte (op_disp))
4362               i.types[op].bitfield.disp8 = 1;
4363           }
4364         else if (i.reloc[op] == BFD_RELOC_386_TLS_DESC_CALL
4365                  || i.reloc[op] == BFD_RELOC_X86_64_TLSDESC_CALL)
4366           {
4367             fix_new_exp (frag_now, frag_more (0) - frag_now->fr_literal, 0,
4368                          i.op[op].disps, 0, i.reloc[op]);
4369             i.types[op].bitfield.disp8 = 0;
4370             i.types[op].bitfield.disp16 = 0;
4371             i.types[op].bitfield.disp32 = 0;
4372             i.types[op].bitfield.disp32s = 0;
4373             i.types[op].bitfield.disp64 = 0;
4374           }
4375         else
4376           /* We only support 64bit displacement on constants.  */
4377           i.types[op].bitfield.disp64 = 0;
4378       }
4379 }
4380
4381 /* Check if operands are valid for the instruction.  */
4382
4383 static int
4384 check_VecOperands (const insn_template *t)
4385 {
4386   unsigned int op;
4387
4388   /* Without VSIB byte, we can't have a vector register for index.  */
4389   if (!t->opcode_modifier.vecsib
4390       && i.index_reg
4391       && (i.index_reg->reg_type.bitfield.regxmm
4392           || i.index_reg->reg_type.bitfield.regymm
4393           || i.index_reg->reg_type.bitfield.regzmm))
4394     {
4395       i.error = unsupported_vector_index_register;
4396       return 1;
4397     }
4398
4399   /* Check if default mask is allowed.  */
4400   if (t->opcode_modifier.nodefmask
4401       && (!i.mask || i.mask->mask->reg_num == 0))
4402     {
4403       i.error = no_default_mask;
4404       return 1;
4405     }
4406
4407   /* For VSIB byte, we need a vector register for index, and all vector
4408      registers must be distinct.  */
4409   if (t->opcode_modifier.vecsib)
4410     {
4411       if (!i.index_reg
4412           || !((t->opcode_modifier.vecsib == VecSIB128
4413                 && i.index_reg->reg_type.bitfield.regxmm)
4414                || (t->opcode_modifier.vecsib == VecSIB256
4415                    && i.index_reg->reg_type.bitfield.regymm)
4416                || (t->opcode_modifier.vecsib == VecSIB512
4417                    && i.index_reg->reg_type.bitfield.regzmm)))
4418       {
4419         i.error = invalid_vsib_address;
4420         return 1;
4421       }
4422
4423       gas_assert (i.reg_operands == 2 || i.mask);
4424       if (i.reg_operands == 2 && !i.mask)
4425         {
4426           gas_assert (i.types[0].bitfield.regxmm
4427                       || i.types[0].bitfield.regymm);
4428           gas_assert (i.types[2].bitfield.regxmm
4429                       || i.types[2].bitfield.regymm);
4430           if (operand_check == check_none)
4431             return 0;
4432           if (register_number (i.op[0].regs)
4433               != register_number (i.index_reg)
4434               && register_number (i.op[2].regs)
4435                  != register_number (i.index_reg)
4436               && register_number (i.op[0].regs)
4437                  != register_number (i.op[2].regs))
4438             return 0;
4439           if (operand_check == check_error)
4440             {
4441               i.error = invalid_vector_register_set;
4442               return 1;
4443             }
4444           as_warn (_("mask, index, and destination registers should be distinct"));
4445         }
4446       else if (i.reg_operands == 1 && i.mask)
4447         {
4448           if ((i.types[1].bitfield.regymm
4449                || i.types[1].bitfield.regzmm)
4450               && (register_number (i.op[1].regs)
4451                   == register_number (i.index_reg)))
4452             {
4453               if (operand_check == check_error)
4454                 {
4455                   i.error = invalid_vector_register_set;
4456                   return 1;
4457                 }
4458               if (operand_check != check_none)
4459                 as_warn (_("index and destination registers should be distinct"));
4460             }
4461         }
4462     }
4463
4464   /* Check if broadcast is supported by the instruction and is applied
4465      to the memory operand.  */
4466   if (i.broadcast)
4467     {
4468       int broadcasted_opnd_size;
4469
4470       /* Check if specified broadcast is supported in this instruction,
4471          and it's applied to memory operand of DWORD or QWORD type,
4472          depending on VecESize.  */
4473       if (i.broadcast->type != t->opcode_modifier.broadcast
4474           || !i.types[i.broadcast->operand].bitfield.mem
4475           || (t->opcode_modifier.vecesize == 0
4476               && !i.types[i.broadcast->operand].bitfield.dword
4477               && !i.types[i.broadcast->operand].bitfield.unspecified)
4478           || (t->opcode_modifier.vecesize == 1
4479               && !i.types[i.broadcast->operand].bitfield.qword
4480               && !i.types[i.broadcast->operand].bitfield.unspecified))
4481         goto bad_broadcast;
4482
4483       broadcasted_opnd_size = t->opcode_modifier.vecesize ? 64 : 32;
4484       if (i.broadcast->type == BROADCAST_1TO16)
4485         broadcasted_opnd_size <<= 4; /* Broadcast 1to16.  */
4486       else if (i.broadcast->type == BROADCAST_1TO8)
4487         broadcasted_opnd_size <<= 3; /* Broadcast 1to8.  */
4488       else if (i.broadcast->type == BROADCAST_1TO4)
4489         broadcasted_opnd_size <<= 2; /* Broadcast 1to4.  */
4490       else if (i.broadcast->type == BROADCAST_1TO2)
4491         broadcasted_opnd_size <<= 1; /* Broadcast 1to2.  */
4492       else
4493         goto bad_broadcast;
4494
4495       if ((broadcasted_opnd_size == 256
4496            && !t->operand_types[i.broadcast->operand].bitfield.ymmword)
4497           || (broadcasted_opnd_size == 512
4498               && !t->operand_types[i.broadcast->operand].bitfield.zmmword))
4499         {
4500         bad_broadcast:
4501           i.error = unsupported_broadcast;
4502           return 1;
4503         }
4504     }
4505   /* If broadcast is supported in this instruction, we need to check if
4506      operand of one-element size isn't specified without broadcast.  */
4507   else if (t->opcode_modifier.broadcast && i.mem_operands)
4508     {
4509       /* Find memory operand.  */
4510       for (op = 0; op < i.operands; op++)
4511         if (operand_type_check (i.types[op], anymem))
4512           break;
4513       gas_assert (op < i.operands);
4514       /* Check size of the memory operand.  */
4515       if ((t->opcode_modifier.vecesize == 0
4516            && i.types[op].bitfield.dword)
4517           || (t->opcode_modifier.vecesize == 1
4518               && i.types[op].bitfield.qword))
4519         {
4520           i.error = broadcast_needed;
4521           return 1;
4522         }
4523     }
4524
4525   /* Check if requested masking is supported.  */
4526   if (i.mask
4527       && (!t->opcode_modifier.masking
4528           || (i.mask->zeroing
4529               && t->opcode_modifier.masking == MERGING_MASKING)))
4530     {
4531       i.error = unsupported_masking;
4532       return 1;
4533     }
4534
4535   /* Check if masking is applied to dest operand.  */
4536   if (i.mask && (i.mask->operand != (int) (i.operands - 1)))
4537     {
4538       i.error = mask_not_on_destination;
4539       return 1;
4540     }
4541
4542   /* Check RC/SAE.  */
4543   if (i.rounding)
4544     {
4545       if ((i.rounding->type != saeonly
4546            && !t->opcode_modifier.staticrounding)
4547           || (i.rounding->type == saeonly
4548               && (t->opcode_modifier.staticrounding
4549                   || !t->opcode_modifier.sae)))
4550         {
4551           i.error = unsupported_rc_sae;
4552           return 1;
4553         }
4554       /* If the instruction has several immediate operands and one of
4555          them is rounding, the rounding operand should be the last
4556          immediate operand.  */
4557       if (i.imm_operands > 1
4558           && i.rounding->operand != (int) (i.imm_operands - 1))
4559         {
4560           i.error = rc_sae_operand_not_last_imm;
4561           return 1;
4562         }
4563     }
4564
4565   /* Check vector Disp8 operand.  */
4566   if (t->opcode_modifier.disp8memshift)
4567     {
4568       if (i.broadcast)
4569         i.memshift = t->opcode_modifier.vecesize ? 3 : 2;
4570       else
4571         i.memshift = t->opcode_modifier.disp8memshift;
4572
4573       for (op = 0; op < i.operands; op++)
4574         if (operand_type_check (i.types[op], disp)
4575             && i.op[op].disps->X_op == O_constant)
4576           {
4577             offsetT value = i.op[op].disps->X_add_number;
4578             int vec_disp8_ok
4579               = (i.disp_encoding != disp_encoding_32bit
4580                  && fits_in_vec_disp8 (value));
4581             if (t->operand_types [op].bitfield.vec_disp8)
4582               {
4583                 if (vec_disp8_ok)
4584                   i.types[op].bitfield.vec_disp8 = 1;
4585                 else
4586                   {
4587                     /* Vector insn can only have Vec_Disp8/Disp32 in
4588                        32/64bit modes, and Vec_Disp8/Disp16 in 16bit
4589                        mode.  */
4590                     i.types[op].bitfield.disp8 = 0;
4591                     if (flag_code != CODE_16BIT)
4592                       i.types[op].bitfield.disp16 = 0;
4593                   }
4594               }
4595             else if (flag_code != CODE_16BIT)
4596               {
4597                 /* One form of this instruction supports vector Disp8.
4598                    Try vector Disp8 if we need to use Disp32.  */
4599                 if (vec_disp8_ok && !fits_in_signed_byte (value))
4600                   {
4601                     i.error = try_vector_disp8;
4602                     return 1;
4603                   }
4604               }
4605           }
4606     }
4607   else
4608     i.memshift = -1;
4609
4610   return 0;
4611 }
4612
4613 /* Check if operands are valid for the instruction.  Update VEX
4614    operand types.  */
4615
4616 static int
4617 VEX_check_operands (const insn_template *t)
4618 {
4619   /* VREX is only valid with EVEX prefix.  */
4620   if (i.need_vrex && !t->opcode_modifier.evex)
4621     {
4622       i.error = invalid_register_operand;
4623       return 1;
4624     }
4625
4626   if (!t->opcode_modifier.vex)
4627     return 0;
4628
4629   /* Only check VEX_Imm4, which must be the first operand.  */
4630   if (t->operand_types[0].bitfield.vec_imm4)
4631     {
4632       if (i.op[0].imms->X_op != O_constant
4633           || !fits_in_imm4 (i.op[0].imms->X_add_number))
4634         {
4635           i.error = bad_imm4;
4636           return 1;
4637         }
4638
4639       /* Turn off Imm8 so that update_imm won't complain.  */
4640       i.types[0] = vec_imm4;
4641     }
4642
4643   return 0;
4644 }
4645
4646 static const insn_template *
4647 match_template (void)
4648 {
4649   /* Points to template once we've found it.  */
4650   const insn_template *t;
4651   i386_operand_type overlap0, overlap1, overlap2, overlap3;
4652   i386_operand_type overlap4;
4653   unsigned int found_reverse_match;
4654   i386_opcode_modifier suffix_check;
4655   i386_operand_type operand_types [MAX_OPERANDS];
4656   int addr_prefix_disp;
4657   unsigned int j;
4658   unsigned int found_cpu_match;
4659   unsigned int check_register;
4660   enum i386_error specific_error = 0;
4661
4662 #if MAX_OPERANDS != 5
4663 # error "MAX_OPERANDS must be 5."
4664 #endif
4665
4666   found_reverse_match = 0;
4667   addr_prefix_disp = -1;
4668
4669   memset (&suffix_check, 0, sizeof (suffix_check));
4670   if (i.suffix == BYTE_MNEM_SUFFIX)
4671     suffix_check.no_bsuf = 1;
4672   else if (i.suffix == WORD_MNEM_SUFFIX)
4673     suffix_check.no_wsuf = 1;
4674   else if (i.suffix == SHORT_MNEM_SUFFIX)
4675     suffix_check.no_ssuf = 1;
4676   else if (i.suffix == LONG_MNEM_SUFFIX)
4677     suffix_check.no_lsuf = 1;
4678   else if (i.suffix == QWORD_MNEM_SUFFIX)
4679     suffix_check.no_qsuf = 1;
4680   else if (i.suffix == LONG_DOUBLE_MNEM_SUFFIX)
4681     suffix_check.no_ldsuf = 1;
4682
4683   /* Must have right number of operands.  */
4684   i.error = number_of_operands_mismatch;
4685
4686   for (t = current_templates->start; t < current_templates->end; t++)
4687     {
4688       addr_prefix_disp = -1;
4689
4690       if (i.operands != t->operands)
4691         continue;
4692
4693       /* Check processor support.  */
4694       i.error = unsupported;
4695       found_cpu_match = (cpu_flags_match (t)
4696                          == CPU_FLAGS_PERFECT_MATCH);
4697       if (!found_cpu_match)
4698         continue;
4699
4700       /* Check old gcc support. */
4701       i.error = old_gcc_only;
4702       if (!old_gcc && t->opcode_modifier.oldgcc)
4703         continue;
4704
4705       /* Check AT&T mnemonic.   */
4706       i.error = unsupported_with_intel_mnemonic;
4707       if (intel_mnemonic && t->opcode_modifier.attmnemonic)
4708         continue;
4709
4710       /* Check AT&T/Intel syntax.   */
4711       i.error = unsupported_syntax;
4712       if ((intel_syntax && t->opcode_modifier.attsyntax)
4713           || (!intel_syntax && t->opcode_modifier.intelsyntax))
4714         continue;
4715
4716       /* Check the suffix, except for some instructions in intel mode.  */
4717       i.error = invalid_instruction_suffix;
4718       if ((!intel_syntax || !t->opcode_modifier.ignoresize)
4719           && ((t->opcode_modifier.no_bsuf && suffix_check.no_bsuf)
4720               || (t->opcode_modifier.no_wsuf && suffix_check.no_wsuf)
4721               || (t->opcode_modifier.no_lsuf && suffix_check.no_lsuf)
4722               || (t->opcode_modifier.no_ssuf && suffix_check.no_ssuf)
4723               || (t->opcode_modifier.no_qsuf && suffix_check.no_qsuf)
4724               || (t->opcode_modifier.no_ldsuf && suffix_check.no_ldsuf)))
4725         continue;
4726
4727       if (!operand_size_match (t))
4728         continue;
4729
4730       for (j = 0; j < MAX_OPERANDS; j++)
4731         operand_types[j] = t->operand_types[j];
4732
4733       /* In general, don't allow 64-bit operands in 32-bit mode.  */
4734       if (i.suffix == QWORD_MNEM_SUFFIX
4735           && flag_code != CODE_64BIT
4736           && (intel_syntax
4737               ? (!t->opcode_modifier.ignoresize
4738                  && !intel_float_operand (t->name))
4739               : intel_float_operand (t->name) != 2)
4740           && ((!operand_types[0].bitfield.regmmx
4741                && !operand_types[0].bitfield.regxmm
4742                && !operand_types[0].bitfield.regymm
4743                && !operand_types[0].bitfield.regzmm)
4744               || (!operand_types[t->operands > 1].bitfield.regmmx
4745                   && operand_types[t->operands > 1].bitfield.regxmm
4746                   && operand_types[t->operands > 1].bitfield.regymm
4747                   && operand_types[t->operands > 1].bitfield.regzmm))
4748           && (t->base_opcode != 0x0fc7
4749               || t->extension_opcode != 1 /* cmpxchg8b */))
4750         continue;
4751
4752       /* In general, don't allow 32-bit operands on pre-386.  */
4753       else if (i.suffix == LONG_MNEM_SUFFIX
4754                && !cpu_arch_flags.bitfield.cpui386
4755                && (intel_syntax
4756                    ? (!t->opcode_modifier.ignoresize
4757                       && !intel_float_operand (t->name))
4758                    : intel_float_operand (t->name) != 2)
4759                && ((!operand_types[0].bitfield.regmmx
4760                     && !operand_types[0].bitfield.regxmm)
4761                    || (!operand_types[t->operands > 1].bitfield.regmmx
4762                        && operand_types[t->operands > 1].bitfield.regxmm)))
4763         continue;
4764
4765       /* Do not verify operands when there are none.  */
4766       else
4767         {
4768           if (!t->operands)
4769             /* We've found a match; break out of loop.  */
4770             break;
4771         }
4772
4773       /* Address size prefix will turn Disp64/Disp32/Disp16 operand
4774          into Disp32/Disp16/Disp32 operand.  */
4775       if (i.prefix[ADDR_PREFIX] != 0)
4776           {
4777             /* There should be only one Disp operand.  */
4778             switch (flag_code)
4779             {
4780             case CODE_16BIT:
4781               for (j = 0; j < MAX_OPERANDS; j++)
4782                 {
4783                   if (operand_types[j].bitfield.disp16)
4784                     {
4785                       addr_prefix_disp = j;
4786                       operand_types[j].bitfield.disp32 = 1;
4787                       operand_types[j].bitfield.disp16 = 0;
4788                       break;
4789                     }
4790                 }
4791               break;
4792             case CODE_32BIT:
4793               for (j = 0; j < MAX_OPERANDS; j++)
4794                 {
4795                   if (operand_types[j].bitfield.disp32)
4796                     {
4797                       addr_prefix_disp = j;
4798                       operand_types[j].bitfield.disp32 = 0;
4799                       operand_types[j].bitfield.disp16 = 1;
4800                       break;
4801                     }
4802                 }
4803               break;
4804             case CODE_64BIT:
4805               for (j = 0; j < MAX_OPERANDS; j++)
4806                 {
4807                   if (operand_types[j].bitfield.disp64)
4808                     {
4809                       addr_prefix_disp = j;
4810                       operand_types[j].bitfield.disp64 = 0;
4811                       operand_types[j].bitfield.disp32 = 1;
4812                       break;
4813                     }
4814                 }
4815               break;
4816             }
4817           }
4818
4819       /* Force 0x8b encoding for "mov foo@GOT, %eax".  */
4820       if (i.reloc[0] == BFD_RELOC_386_GOT32 && t->base_opcode == 0xa0)
4821         continue;
4822
4823       /* We check register size if needed.  */
4824       check_register = t->opcode_modifier.checkregsize;
4825       overlap0 = operand_type_and (i.types[0], operand_types[0]);
4826       switch (t->operands)
4827         {
4828         case 1:
4829           if (!operand_type_match (overlap0, i.types[0]))
4830             continue;
4831           break;
4832         case 2:
4833           /* xchg %eax, %eax is a special case. It is an aliase for nop
4834              only in 32bit mode and we can use opcode 0x90.  In 64bit
4835              mode, we can't use 0x90 for xchg %eax, %eax since it should
4836              zero-extend %eax to %rax.  */
4837           if (flag_code == CODE_64BIT
4838               && t->base_opcode == 0x90
4839               && operand_type_equal (&i.types [0], &acc32)
4840               && operand_type_equal (&i.types [1], &acc32))
4841             continue;
4842           if (i.swap_operand)
4843             {
4844               /* If we swap operand in encoding, we either match
4845                  the next one or reverse direction of operands.  */
4846               if (t->opcode_modifier.s)
4847                 continue;
4848               else if (t->opcode_modifier.d)
4849                 goto check_reverse;
4850             }
4851
4852         case 3:
4853           /* If we swap operand in encoding, we match the next one.  */
4854           if (i.swap_operand && t->opcode_modifier.s)
4855             continue;
4856         case 4:
4857         case 5:
4858           overlap1 = operand_type_and (i.types[1], operand_types[1]);
4859           if (!operand_type_match (overlap0, i.types[0])
4860               || !operand_type_match (overlap1, i.types[1])
4861               || (check_register
4862                   && !operand_type_register_match (overlap0, i.types[0],
4863                                                    operand_types[0],
4864                                                    overlap1, i.types[1],
4865                                                    operand_types[1])))
4866             {
4867               /* Check if other direction is valid ...  */
4868               if (!t->opcode_modifier.d && !t->opcode_modifier.floatd)
4869                 continue;
4870
4871 check_reverse:
4872               /* Try reversing direction of operands.  */
4873               overlap0 = operand_type_and (i.types[0], operand_types[1]);
4874               overlap1 = operand_type_and (i.types[1], operand_types[0]);
4875               if (!operand_type_match (overlap0, i.types[0])
4876                   || !operand_type_match (overlap1, i.types[1])
4877                   || (check_register
4878                       && !operand_type_register_match (overlap0,
4879                                                        i.types[0],
4880                                                        operand_types[1],
4881                                                        overlap1,
4882                                                        i.types[1],
4883                                                        operand_types[0])))
4884                 {
4885                   /* Does not match either direction.  */
4886                   continue;
4887                 }
4888               /* found_reverse_match holds which of D or FloatDR
4889                  we've found.  */
4890               if (t->opcode_modifier.d)
4891                 found_reverse_match = Opcode_D;
4892               else if (t->opcode_modifier.floatd)
4893                 found_reverse_match = Opcode_FloatD;
4894               else
4895                 found_reverse_match = 0;
4896               if (t->opcode_modifier.floatr)
4897                 found_reverse_match |= Opcode_FloatR;
4898             }
4899           else
4900             {
4901               /* Found a forward 2 operand match here.  */
4902               switch (t->operands)
4903                 {
4904                 case 5:
4905                   overlap4 = operand_type_and (i.types[4],
4906                                                operand_types[4]);
4907                 case 4:
4908                   overlap3 = operand_type_and (i.types[3],
4909                                                operand_types[3]);
4910                 case 3:
4911                   overlap2 = operand_type_and (i.types[2],
4912                                                operand_types[2]);
4913                   break;
4914                 }
4915
4916               switch (t->operands)
4917                 {
4918                 case 5:
4919                   if (!operand_type_match (overlap4, i.types[4])
4920                       || !operand_type_register_match (overlap3,
4921                                                        i.types[3],
4922                                                        operand_types[3],
4923                                                        overlap4,
4924                                                        i.types[4],
4925                                                        operand_types[4]))
4926                     continue;
4927                 case 4:
4928                   if (!operand_type_match (overlap3, i.types[3])
4929                       || (check_register
4930                           && !operand_type_register_match (overlap2,
4931                                                            i.types[2],
4932                                                            operand_types[2],
4933                                                            overlap3,
4934                                                            i.types[3],
4935                                                            operand_types[3])))
4936                     continue;
4937                 case 3:
4938                   /* Here we make use of the fact that there are no
4939                      reverse match 3 operand instructions, and all 3
4940                      operand instructions only need to be checked for
4941                      register consistency between operands 2 and 3.  */
4942                   if (!operand_type_match (overlap2, i.types[2])
4943                       || (check_register
4944                           && !operand_type_register_match (overlap1,
4945                                                            i.types[1],
4946                                                            operand_types[1],
4947                                                            overlap2,
4948                                                            i.types[2],
4949                                                            operand_types[2])))
4950                     continue;
4951                   break;
4952                 }
4953             }
4954           /* Found either forward/reverse 2, 3 or 4 operand match here:
4955              slip through to break.  */
4956         }
4957       if (!found_cpu_match)
4958         {
4959           found_reverse_match = 0;
4960           continue;
4961         }
4962
4963       /* Check if vector and VEX operands are valid.  */
4964       if (check_VecOperands (t) || VEX_check_operands (t))
4965         {
4966           specific_error = i.error;
4967           continue;
4968         }
4969
4970       /* We've found a match; break out of loop.  */
4971       break;
4972     }
4973
4974   if (t == current_templates->end)
4975     {
4976       /* We found no match.  */
4977       const char *err_msg;
4978       switch (specific_error ? specific_error : i.error)
4979         {
4980         default:
4981           abort ();
4982         case operand_size_mismatch:
4983           err_msg = _("operand size mismatch");
4984           break;
4985         case operand_type_mismatch:
4986           err_msg = _("operand type mismatch");
4987           break;
4988         case register_type_mismatch:
4989           err_msg = _("register type mismatch");
4990           break;
4991         case number_of_operands_mismatch:
4992           err_msg = _("number of operands mismatch");
4993           break;
4994         case invalid_instruction_suffix:
4995           err_msg = _("invalid instruction suffix");
4996           break;
4997         case bad_imm4:
4998           err_msg = _("constant doesn't fit in 4 bits");
4999           break;
5000         case old_gcc_only:
5001           err_msg = _("only supported with old gcc");
5002           break;
5003         case unsupported_with_intel_mnemonic:
5004           err_msg = _("unsupported with Intel mnemonic");
5005           break;
5006         case unsupported_syntax:
5007           err_msg = _("unsupported syntax");
5008           break;
5009         case unsupported:
5010           as_bad (_("unsupported instruction `%s'"),
5011                   current_templates->start->name);
5012           return NULL;
5013         case invalid_vsib_address:
5014           err_msg = _("invalid VSIB address");
5015           break;
5016         case invalid_vector_register_set:
5017           err_msg = _("mask, index, and destination registers must be distinct");
5018           break;
5019         case unsupported_vector_index_register:
5020           err_msg = _("unsupported vector index register");
5021           break;
5022         case unsupported_broadcast:
5023           err_msg = _("unsupported broadcast");
5024           break;
5025         case broadcast_not_on_src_operand:
5026           err_msg = _("broadcast not on source memory operand");
5027           break;
5028         case broadcast_needed:
5029           err_msg = _("broadcast is needed for operand of such type");
5030           break;
5031         case unsupported_masking:
5032           err_msg = _("unsupported masking");
5033           break;
5034         case mask_not_on_destination:
5035           err_msg = _("mask not on destination operand");
5036           break;
5037         case no_default_mask:
5038           err_msg = _("default mask isn't allowed");
5039           break;
5040         case unsupported_rc_sae:
5041           err_msg = _("unsupported static rounding/sae");
5042           break;
5043         case rc_sae_operand_not_last_imm:
5044           if (intel_syntax)
5045             err_msg = _("RC/SAE operand must precede immediate operands");
5046           else
5047             err_msg = _("RC/SAE operand must follow immediate operands");
5048           break;
5049         case invalid_register_operand:
5050           err_msg = _("invalid register operand");
5051           break;
5052         }
5053       as_bad (_("%s for `%s'"), err_msg,
5054               current_templates->start->name);
5055       return NULL;
5056     }
5057
5058   if (!quiet_warnings)
5059     {
5060       if (!intel_syntax
5061           && (i.types[0].bitfield.jumpabsolute
5062               != operand_types[0].bitfield.jumpabsolute))
5063         {
5064           as_warn (_("indirect %s without `*'"), t->name);
5065         }
5066
5067       if (t->opcode_modifier.isprefix
5068           && t->opcode_modifier.ignoresize)
5069         {
5070           /* Warn them that a data or address size prefix doesn't
5071              affect assembly of the next line of code.  */
5072           as_warn (_("stand-alone `%s' prefix"), t->name);
5073         }
5074     }
5075
5076   /* Copy the template we found.  */
5077   i.tm = *t;
5078
5079   if (addr_prefix_disp != -1)
5080     i.tm.operand_types[addr_prefix_disp]
5081       = operand_types[addr_prefix_disp];
5082
5083   if (found_reverse_match)
5084     {
5085       /* If we found a reverse match we must alter the opcode
5086          direction bit.  found_reverse_match holds bits to change
5087          (different for int & float insns).  */
5088
5089       i.tm.base_opcode ^= found_reverse_match;
5090
5091       i.tm.operand_types[0] = operand_types[1];
5092       i.tm.operand_types[1] = operand_types[0];
5093     }
5094
5095   return t;
5096 }
5097
5098 static int
5099 check_string (void)
5100 {
5101   int mem_op = operand_type_check (i.types[0], anymem) ? 0 : 1;
5102   if (i.tm.operand_types[mem_op].bitfield.esseg)
5103     {
5104       if (i.seg[0] != NULL && i.seg[0] != &es)
5105         {
5106           as_bad (_("`%s' operand %d must use `%ses' segment"),
5107                   i.tm.name,
5108                   mem_op + 1,
5109                   register_prefix);
5110           return 0;
5111         }
5112       /* There's only ever one segment override allowed per instruction.
5113          This instruction possibly has a legal segment override on the
5114          second operand, so copy the segment to where non-string
5115          instructions store it, allowing common code.  */
5116       i.seg[0] = i.seg[1];
5117     }
5118   else if (i.tm.operand_types[mem_op + 1].bitfield.esseg)
5119     {
5120       if (i.seg[1] != NULL && i.seg[1] != &es)
5121         {
5122           as_bad (_("`%s' operand %d must use `%ses' segment"),
5123                   i.tm.name,
5124                   mem_op + 2,
5125                   register_prefix);
5126           return 0;
5127         }
5128     }
5129   return 1;
5130 }
5131
5132 static int
5133 process_suffix (void)
5134 {
5135   /* If matched instruction specifies an explicit instruction mnemonic
5136      suffix, use it.  */
5137   if (i.tm.opcode_modifier.size16)
5138     i.suffix = WORD_MNEM_SUFFIX;
5139   else if (i.tm.opcode_modifier.size32)
5140     i.suffix = LONG_MNEM_SUFFIX;
5141   else if (i.tm.opcode_modifier.size64)
5142     i.suffix = QWORD_MNEM_SUFFIX;
5143   else if (i.reg_operands)
5144     {
5145       /* If there's no instruction mnemonic suffix we try to invent one
5146          based on register operands.  */
5147       if (!i.suffix)
5148         {
5149           /* We take i.suffix from the last register operand specified,
5150              Destination register type is more significant than source
5151              register type.  crc32 in SSE4.2 prefers source register
5152              type. */
5153           if (i.tm.base_opcode == 0xf20f38f1)
5154             {
5155               if (i.types[0].bitfield.reg16)
5156                 i.suffix = WORD_MNEM_SUFFIX;
5157               else if (i.types[0].bitfield.reg32)
5158                 i.suffix = LONG_MNEM_SUFFIX;
5159               else if (i.types[0].bitfield.reg64)
5160                 i.suffix = QWORD_MNEM_SUFFIX;
5161             }
5162           else if (i.tm.base_opcode == 0xf20f38f0)
5163             {
5164               if (i.types[0].bitfield.reg8)
5165                 i.suffix = BYTE_MNEM_SUFFIX;
5166             }
5167
5168           if (!i.suffix)
5169             {
5170               int op;
5171
5172               if (i.tm.base_opcode == 0xf20f38f1
5173                   || i.tm.base_opcode == 0xf20f38f0)
5174                 {
5175                   /* We have to know the operand size for crc32.  */
5176                   as_bad (_("ambiguous memory operand size for `%s`"),
5177                           i.tm.name);
5178                   return 0;
5179                 }
5180
5181               for (op = i.operands; --op >= 0;)
5182                 if (!i.tm.operand_types[op].bitfield.inoutportreg)
5183                   {
5184                     if (i.types[op].bitfield.reg8)
5185                       {
5186                         i.suffix = BYTE_MNEM_SUFFIX;
5187                         break;
5188                       }
5189                     else if (i.types[op].bitfield.reg16)
5190                       {
5191                         i.suffix = WORD_MNEM_SUFFIX;
5192                         break;
5193                       }
5194                     else if (i.types[op].bitfield.reg32)
5195                       {
5196                         i.suffix = LONG_MNEM_SUFFIX;
5197                         break;
5198                       }
5199                     else if (i.types[op].bitfield.reg64)
5200                       {
5201                         i.suffix = QWORD_MNEM_SUFFIX;
5202                         break;
5203                       }
5204                   }
5205             }
5206         }
5207       else if (i.suffix == BYTE_MNEM_SUFFIX)
5208         {
5209           if (intel_syntax
5210               && i.tm.opcode_modifier.ignoresize
5211               && i.tm.opcode_modifier.no_bsuf)
5212             i.suffix = 0;
5213           else if (!check_byte_reg ())
5214             return 0;
5215         }
5216       else if (i.suffix == LONG_MNEM_SUFFIX)
5217         {
5218           if (intel_syntax
5219               && i.tm.opcode_modifier.ignoresize
5220               && i.tm.opcode_modifier.no_lsuf)
5221             i.suffix = 0;
5222           else if (!check_long_reg ())
5223             return 0;
5224         }
5225       else if (i.suffix == QWORD_MNEM_SUFFIX)
5226         {
5227           if (intel_syntax
5228               && i.tm.opcode_modifier.ignoresize
5229               && i.tm.opcode_modifier.no_qsuf)
5230             i.suffix = 0;
5231           else if (!check_qword_reg ())
5232             return 0;
5233         }
5234       else if (i.suffix == WORD_MNEM_SUFFIX)
5235         {
5236           if (intel_syntax
5237               && i.tm.opcode_modifier.ignoresize
5238               && i.tm.opcode_modifier.no_wsuf)
5239             i.suffix = 0;
5240           else if (!check_word_reg ())
5241             return 0;
5242         }
5243       else if (i.suffix == XMMWORD_MNEM_SUFFIX
5244                || i.suffix == YMMWORD_MNEM_SUFFIX
5245                || i.suffix == ZMMWORD_MNEM_SUFFIX)
5246         {
5247           /* Skip if the instruction has x/y/z suffix.  match_template
5248              should check if it is a valid suffix.  */
5249         }
5250       else if (intel_syntax && i.tm.opcode_modifier.ignoresize)
5251         /* Do nothing if the instruction is going to ignore the prefix.  */
5252         ;
5253       else
5254         abort ();
5255     }
5256   else if (i.tm.opcode_modifier.defaultsize
5257            && !i.suffix
5258            /* exclude fldenv/frstor/fsave/fstenv */
5259            && i.tm.opcode_modifier.no_ssuf)
5260     {
5261       i.suffix = stackop_size;
5262     }
5263   else if (intel_syntax
5264            && !i.suffix
5265            && (i.tm.operand_types[0].bitfield.jumpabsolute
5266                || i.tm.opcode_modifier.jumpbyte
5267                || i.tm.opcode_modifier.jumpintersegment
5268                || (i.tm.base_opcode == 0x0f01 /* [ls][gi]dt */
5269                    && i.tm.extension_opcode <= 3)))
5270     {
5271       switch (flag_code)
5272         {
5273         case CODE_64BIT:
5274           if (!i.tm.opcode_modifier.no_qsuf)
5275             {
5276               i.suffix = QWORD_MNEM_SUFFIX;
5277               break;
5278             }
5279         case CODE_32BIT:
5280           if (!i.tm.opcode_modifier.no_lsuf)
5281             i.suffix = LONG_MNEM_SUFFIX;
5282           break;
5283         case CODE_16BIT:
5284           if (!i.tm.opcode_modifier.no_wsuf)
5285             i.suffix = WORD_MNEM_SUFFIX;
5286           break;
5287         }
5288     }
5289
5290   if (!i.suffix)
5291     {
5292       if (!intel_syntax)
5293         {
5294           if (i.tm.opcode_modifier.w)
5295             {
5296               as_bad (_("no instruction mnemonic suffix given and "
5297                         "no register operands; can't size instruction"));
5298               return 0;
5299             }
5300         }
5301       else
5302         {
5303           unsigned int suffixes;
5304
5305           suffixes = !i.tm.opcode_modifier.no_bsuf;
5306           if (!i.tm.opcode_modifier.no_wsuf)
5307             suffixes |= 1 << 1;
5308           if (!i.tm.opcode_modifier.no_lsuf)
5309             suffixes |= 1 << 2;
5310           if (!i.tm.opcode_modifier.no_ldsuf)
5311             suffixes |= 1 << 3;
5312           if (!i.tm.opcode_modifier.no_ssuf)
5313             suffixes |= 1 << 4;
5314           if (!i.tm.opcode_modifier.no_qsuf)
5315             suffixes |= 1 << 5;
5316
5317           /* There are more than suffix matches.  */
5318           if (i.tm.opcode_modifier.w
5319               || ((suffixes & (suffixes - 1))
5320                   && !i.tm.opcode_modifier.defaultsize
5321                   && !i.tm.opcode_modifier.ignoresize))
5322             {
5323               as_bad (_("ambiguous operand size for `%s'"), i.tm.name);
5324               return 0;
5325             }
5326         }
5327     }
5328
5329   /* Change the opcode based on the operand size given by i.suffix;
5330      We don't need to change things for byte insns.  */
5331
5332   if (i.suffix
5333       && i.suffix != BYTE_MNEM_SUFFIX
5334       && i.suffix != XMMWORD_MNEM_SUFFIX
5335       && i.suffix != YMMWORD_MNEM_SUFFIX
5336       && i.suffix != ZMMWORD_MNEM_SUFFIX)
5337     {
5338       /* It's not a byte, select word/dword operation.  */
5339       if (i.tm.opcode_modifier.w)
5340         {
5341           if (i.tm.opcode_modifier.shortform)
5342             i.tm.base_opcode |= 8;
5343           else
5344             i.tm.base_opcode |= 1;
5345         }
5346
5347       /* Now select between word & dword operations via the operand
5348          size prefix, except for instructions that will ignore this
5349          prefix anyway.  */
5350       if (i.tm.opcode_modifier.addrprefixop0)
5351         {
5352           /* The address size override prefix changes the size of the
5353              first operand.  */
5354           if ((flag_code == CODE_32BIT
5355                && i.op->regs[0].reg_type.bitfield.reg16)
5356               || (flag_code != CODE_32BIT
5357                   && i.op->regs[0].reg_type.bitfield.reg32))
5358             if (!add_prefix (ADDR_PREFIX_OPCODE))
5359               return 0;
5360         }
5361       else if (i.suffix != QWORD_MNEM_SUFFIX
5362                && i.suffix != LONG_DOUBLE_MNEM_SUFFIX
5363                && !i.tm.opcode_modifier.ignoresize
5364                && !i.tm.opcode_modifier.floatmf
5365                && ((i.suffix == LONG_MNEM_SUFFIX) == (flag_code == CODE_16BIT)
5366                    || (flag_code == CODE_64BIT
5367                        && i.tm.opcode_modifier.jumpbyte)))
5368         {
5369           unsigned int prefix = DATA_PREFIX_OPCODE;
5370
5371           if (i.tm.opcode_modifier.jumpbyte) /* jcxz, loop */
5372             prefix = ADDR_PREFIX_OPCODE;
5373
5374           if (!add_prefix (prefix))
5375             return 0;
5376         }
5377
5378       /* Set mode64 for an operand.  */
5379       if (i.suffix == QWORD_MNEM_SUFFIX
5380           && flag_code == CODE_64BIT
5381           && !i.tm.opcode_modifier.norex64)
5382         {
5383           /* Special case for xchg %rax,%rax.  It is NOP and doesn't
5384              need rex64.  cmpxchg8b is also a special case. */
5385           if (! (i.operands == 2
5386                  && i.tm.base_opcode == 0x90
5387                  && i.tm.extension_opcode == None
5388                  && operand_type_equal (&i.types [0], &acc64)
5389                  && operand_type_equal (&i.types [1], &acc64))
5390               && ! (i.operands == 1
5391                     && i.tm.base_opcode == 0xfc7
5392                     && i.tm.extension_opcode == 1
5393                     && !operand_type_check (i.types [0], reg)
5394                     && operand_type_check (i.types [0], anymem)))
5395             i.rex |= REX_W;
5396         }
5397
5398       /* Size floating point instruction.  */
5399       if (i.suffix == LONG_MNEM_SUFFIX)
5400         if (i.tm.opcode_modifier.floatmf)
5401           i.tm.base_opcode ^= 4;
5402     }
5403
5404   return 1;
5405 }
5406
5407 static int
5408 check_byte_reg (void)
5409 {
5410   int op;
5411
5412   for (op = i.operands; --op >= 0;)
5413     {
5414       /* If this is an eight bit register, it's OK.  If it's the 16 or
5415          32 bit version of an eight bit register, we will just use the
5416          low portion, and that's OK too.  */
5417       if (i.types[op].bitfield.reg8)
5418         continue;
5419
5420       /* I/O port address operands are OK too.  */
5421       if (i.tm.operand_types[op].bitfield.inoutportreg)
5422         continue;
5423
5424       /* crc32 doesn't generate this warning.  */
5425       if (i.tm.base_opcode == 0xf20f38f0)
5426         continue;
5427
5428       if ((i.types[op].bitfield.reg16
5429            || i.types[op].bitfield.reg32
5430            || i.types[op].bitfield.reg64)
5431           && i.op[op].regs->reg_num < 4
5432           /* Prohibit these changes in 64bit mode, since the lowering
5433              would be more complicated.  */
5434           && flag_code != CODE_64BIT)
5435         {
5436 #if REGISTER_WARNINGS
5437           if (!quiet_warnings)
5438             as_warn (_("using `%s%s' instead of `%s%s' due to `%c' suffix"),
5439                      register_prefix,
5440                      (i.op[op].regs + (i.types[op].bitfield.reg16
5441                                        ? REGNAM_AL - REGNAM_AX
5442                                        : REGNAM_AL - REGNAM_EAX))->reg_name,
5443                      register_prefix,
5444                      i.op[op].regs->reg_name,
5445                      i.suffix);
5446 #endif
5447           continue;
5448         }
5449       /* Any other register is bad.  */
5450       if (i.types[op].bitfield.reg16
5451           || i.types[op].bitfield.reg32
5452           || i.types[op].bitfield.reg64
5453           || i.types[op].bitfield.regmmx
5454           || i.types[op].bitfield.regxmm
5455           || i.types[op].bitfield.regymm
5456           || i.types[op].bitfield.regzmm
5457           || i.types[op].bitfield.sreg2
5458           || i.types[op].bitfield.sreg3
5459           || i.types[op].bitfield.control
5460           || i.types[op].bitfield.debug
5461           || i.types[op].bitfield.test
5462           || i.types[op].bitfield.floatreg
5463           || i.types[op].bitfield.floatacc)
5464         {
5465           as_bad (_("`%s%s' not allowed with `%s%c'"),
5466                   register_prefix,
5467                   i.op[op].regs->reg_name,
5468                   i.tm.name,
5469                   i.suffix);
5470           return 0;
5471         }
5472     }
5473   return 1;
5474 }
5475
5476 static int
5477 check_long_reg (void)
5478 {
5479   int op;
5480
5481   for (op = i.operands; --op >= 0;)
5482     /* Reject eight bit registers, except where the template requires
5483        them. (eg. movzb)  */
5484     if (i.types[op].bitfield.reg8
5485         && (i.tm.operand_types[op].bitfield.reg16
5486             || i.tm.operand_types[op].bitfield.reg32
5487             || i.tm.operand_types[op].bitfield.acc))
5488       {
5489         as_bad (_("`%s%s' not allowed with `%s%c'"),
5490                 register_prefix,
5491                 i.op[op].regs->reg_name,
5492                 i.tm.name,
5493                 i.suffix);
5494         return 0;
5495       }
5496     /* Warn if the e prefix on a general reg is missing.  */
5497     else if ((!quiet_warnings || flag_code == CODE_64BIT)
5498              && i.types[op].bitfield.reg16
5499              && (i.tm.operand_types[op].bitfield.reg32
5500                  || i.tm.operand_types[op].bitfield.acc))
5501       {
5502         /* Prohibit these changes in the 64bit mode, since the
5503            lowering is more complicated.  */
5504         if (flag_code == CODE_64BIT)
5505           {
5506             as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
5507                     register_prefix, i.op[op].regs->reg_name,
5508                     i.suffix);
5509             return 0;
5510           }
5511 #if REGISTER_WARNINGS
5512         as_warn (_("using `%s%s' instead of `%s%s' due to `%c' suffix"),
5513                  register_prefix,
5514                  (i.op[op].regs + REGNAM_EAX - REGNAM_AX)->reg_name,
5515                  register_prefix, i.op[op].regs->reg_name, i.suffix);
5516 #endif
5517       }
5518     /* Warn if the r prefix on a general reg is present.  */
5519     else if (i.types[op].bitfield.reg64
5520              && (i.tm.operand_types[op].bitfield.reg32
5521                  || i.tm.operand_types[op].bitfield.acc))
5522       {
5523         if (intel_syntax
5524             && i.tm.opcode_modifier.toqword
5525             && !i.types[0].bitfield.regxmm)
5526           {
5527             /* Convert to QWORD.  We want REX byte. */
5528             i.suffix = QWORD_MNEM_SUFFIX;
5529           }
5530         else
5531           {
5532             as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
5533                     register_prefix, i.op[op].regs->reg_name,
5534                     i.suffix);
5535             return 0;
5536           }
5537       }
5538   return 1;
5539 }
5540
5541 static int
5542 check_qword_reg (void)
5543 {
5544   int op;
5545
5546   for (op = i.operands; --op >= 0; )
5547     /* Reject eight bit registers, except where the template requires
5548        them. (eg. movzb)  */
5549     if (i.types[op].bitfield.reg8
5550         && (i.tm.operand_types[op].bitfield.reg16
5551             || i.tm.operand_types[op].bitfield.reg32
5552             || i.tm.operand_types[op].bitfield.acc))
5553       {
5554         as_bad (_("`%s%s' not allowed with `%s%c'"),
5555                 register_prefix,
5556                 i.op[op].regs->reg_name,
5557                 i.tm.name,
5558                 i.suffix);
5559         return 0;
5560       }
5561     /* Warn if the r prefix on a general reg is missing.  */
5562     else if ((i.types[op].bitfield.reg16
5563               || i.types[op].bitfield.reg32)
5564              && (i.tm.operand_types[op].bitfield.reg32
5565                  || i.tm.operand_types[op].bitfield.acc))
5566       {
5567         /* Prohibit these changes in the 64bit mode, since the
5568            lowering is more complicated.  */
5569         if (intel_syntax
5570             && i.tm.opcode_modifier.todword
5571             && !i.types[0].bitfield.regxmm)
5572           {
5573             /* Convert to DWORD.  We don't want REX byte. */
5574             i.suffix = LONG_MNEM_SUFFIX;
5575           }
5576         else
5577           {
5578             as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
5579                     register_prefix, i.op[op].regs->reg_name,
5580                     i.suffix);
5581             return 0;
5582           }
5583       }
5584   return 1;
5585 }
5586
5587 static int
5588 check_word_reg (void)
5589 {
5590   int op;
5591   for (op = i.operands; --op >= 0;)
5592     /* Reject eight bit registers, except where the template requires
5593        them. (eg. movzb)  */
5594     if (i.types[op].bitfield.reg8
5595         && (i.tm.operand_types[op].bitfield.reg16
5596             || i.tm.operand_types[op].bitfield.reg32
5597             || i.tm.operand_types[op].bitfield.acc))
5598       {
5599         as_bad (_("`%s%s' not allowed with `%s%c'"),
5600                 register_prefix,
5601                 i.op[op].regs->reg_name,
5602                 i.tm.name,
5603                 i.suffix);
5604         return 0;
5605       }
5606     /* Warn if the e or r prefix on a general reg is present.  */
5607     else if ((!quiet_warnings || flag_code == CODE_64BIT)
5608              && (i.types[op].bitfield.reg32
5609                  || i.types[op].bitfield.reg64)
5610              && (i.tm.operand_types[op].bitfield.reg16
5611                  || i.tm.operand_types[op].bitfield.acc))
5612       {
5613         /* Prohibit these changes in the 64bit mode, since the
5614            lowering is more complicated.  */
5615         if (flag_code == CODE_64BIT)
5616           {
5617             as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
5618                     register_prefix, i.op[op].regs->reg_name,
5619                     i.suffix);
5620             return 0;
5621           }
5622 #if REGISTER_WARNINGS
5623         as_warn (_("using `%s%s' instead of `%s%s' due to `%c' suffix"),
5624                  register_prefix,
5625                  (i.op[op].regs + REGNAM_AX - REGNAM_EAX)->reg_name,
5626                  register_prefix, i.op[op].regs->reg_name, i.suffix);
5627 #endif
5628       }
5629   return 1;
5630 }
5631
5632 static int
5633 update_imm (unsigned int j)
5634 {
5635   i386_operand_type overlap = i.types[j];
5636   if ((overlap.bitfield.imm8
5637        || overlap.bitfield.imm8s
5638        || overlap.bitfield.imm16
5639        || overlap.bitfield.imm32
5640        || overlap.bitfield.imm32s
5641        || overlap.bitfield.imm64)
5642       && !operand_type_equal (&overlap, &imm8)
5643       && !operand_type_equal (&overlap, &imm8s)
5644       && !operand_type_equal (&overlap, &imm16)
5645       && !operand_type_equal (&overlap, &imm32)
5646       && !operand_type_equal (&overlap, &imm32s)
5647       && !operand_type_equal (&overlap, &imm64))
5648     {
5649       if (i.suffix)
5650         {
5651           i386_operand_type temp;
5652
5653           operand_type_set (&temp, 0);
5654           if (i.suffix == BYTE_MNEM_SUFFIX)
5655             {
5656               temp.bitfield.imm8 = overlap.bitfield.imm8;
5657               temp.bitfield.imm8s = overlap.bitfield.imm8s;
5658             }
5659           else if (i.suffix == WORD_MNEM_SUFFIX)
5660             temp.bitfield.imm16 = overlap.bitfield.imm16;
5661           else if (i.suffix == QWORD_MNEM_SUFFIX)
5662             {
5663               temp.bitfield.imm64 = overlap.bitfield.imm64;
5664               temp.bitfield.imm32s = overlap.bitfield.imm32s;
5665             }
5666           else
5667             temp.bitfield.imm32 = overlap.bitfield.imm32;
5668           overlap = temp;
5669         }
5670       else if (operand_type_equal (&overlap, &imm16_32_32s)
5671                || operand_type_equal (&overlap, &imm16_32)
5672                || operand_type_equal (&overlap, &imm16_32s))
5673         {
5674           if ((flag_code == CODE_16BIT) ^ (i.prefix[DATA_PREFIX] != 0))
5675             overlap = imm16;
5676           else
5677             overlap = imm32s;
5678         }
5679       if (!operand_type_equal (&overlap, &imm8)
5680           && !operand_type_equal (&overlap, &imm8s)
5681           && !operand_type_equal (&overlap, &imm16)
5682           && !operand_type_equal (&overlap, &imm32)
5683           && !operand_type_equal (&overlap, &imm32s)
5684           && !operand_type_equal (&overlap, &imm64))
5685         {
5686           as_bad (_("no instruction mnemonic suffix given; "
5687                     "can't determine immediate size"));
5688           return 0;
5689         }
5690     }
5691   i.types[j] = overlap;
5692
5693   return 1;
5694 }
5695
5696 static int
5697 finalize_imm (void)
5698 {
5699   unsigned int j, n;
5700
5701   /* Update the first 2 immediate operands.  */
5702   n = i.operands > 2 ? 2 : i.operands;
5703   if (n)
5704     {
5705       for (j = 0; j < n; j++)
5706         if (update_imm (j) == 0)
5707           return 0;
5708
5709       /* The 3rd operand can't be immediate operand.  */
5710       gas_assert (operand_type_check (i.types[2], imm) == 0);
5711     }
5712
5713   return 1;
5714 }
5715
5716 static int
5717 bad_implicit_operand (int xmm)
5718 {
5719   const char *ireg = xmm ? "xmm0" : "ymm0";
5720
5721   if (intel_syntax)
5722     as_bad (_("the last operand of `%s' must be `%s%s'"),
5723             i.tm.name, register_prefix, ireg);
5724   else
5725     as_bad (_("the first operand of `%s' must be `%s%s'"),
5726             i.tm.name, register_prefix, ireg);
5727   return 0;
5728 }
5729
5730 static int
5731 process_operands (void)
5732 {
5733   /* Default segment register this instruction will use for memory
5734      accesses.  0 means unknown.  This is only for optimizing out
5735      unnecessary segment overrides.  */
5736   const seg_entry *default_seg = 0;
5737
5738   if (i.tm.opcode_modifier.sse2avx && i.tm.opcode_modifier.vexvvvv)
5739     {
5740       unsigned int dupl = i.operands;
5741       unsigned int dest = dupl - 1;
5742       unsigned int j;
5743
5744       /* The destination must be an xmm register.  */
5745       gas_assert (i.reg_operands
5746                   && MAX_OPERANDS > dupl
5747                   && operand_type_equal (&i.types[dest], &regxmm));
5748
5749       if (i.tm.opcode_modifier.firstxmm0)
5750         {
5751           /* The first operand is implicit and must be xmm0.  */
5752           gas_assert (operand_type_equal (&i.types[0], &regxmm));
5753           if (register_number (i.op[0].regs) != 0)
5754             return bad_implicit_operand (1);
5755
5756           if (i.tm.opcode_modifier.vexsources == VEX3SOURCES)
5757             {
5758               /* Keep xmm0 for instructions with VEX prefix and 3
5759                  sources.  */
5760               goto duplicate;
5761             }
5762           else
5763             {
5764               /* We remove the first xmm0 and keep the number of
5765                  operands unchanged, which in fact duplicates the
5766                  destination.  */
5767               for (j = 1; j < i.operands; j++)
5768                 {
5769                   i.op[j - 1] = i.op[j];
5770                   i.types[j - 1] = i.types[j];
5771                   i.tm.operand_types[j - 1] = i.tm.operand_types[j];
5772                 }
5773             }
5774         }
5775       else if (i.tm.opcode_modifier.implicit1stxmm0)
5776         {
5777           gas_assert ((MAX_OPERANDS - 1) > dupl
5778                       && (i.tm.opcode_modifier.vexsources
5779                           == VEX3SOURCES));
5780
5781           /* Add the implicit xmm0 for instructions with VEX prefix
5782              and 3 sources.  */
5783           for (j = i.operands; j > 0; j--)
5784             {
5785               i.op[j] = i.op[j - 1];
5786               i.types[j] = i.types[j - 1];
5787               i.tm.operand_types[j] = i.tm.operand_types[j - 1];
5788             }
5789           i.op[0].regs
5790             = (const reg_entry *) hash_find (reg_hash, "xmm0");
5791           i.types[0] = regxmm;
5792           i.tm.operand_types[0] = regxmm;
5793
5794           i.operands += 2;
5795           i.reg_operands += 2;
5796           i.tm.operands += 2;
5797
5798           dupl++;
5799           dest++;
5800           i.op[dupl] = i.op[dest];
5801           i.types[dupl] = i.types[dest];
5802           i.tm.operand_types[dupl] = i.tm.operand_types[dest];
5803         }
5804       else
5805         {
5806 duplicate:
5807           i.operands++;
5808           i.reg_operands++;
5809           i.tm.operands++;
5810
5811           i.op[dupl] = i.op[dest];
5812           i.types[dupl] = i.types[dest];
5813           i.tm.operand_types[dupl] = i.tm.operand_types[dest];
5814         }
5815
5816        if (i.tm.opcode_modifier.immext)
5817          process_immext ();
5818     }
5819   else if (i.tm.opcode_modifier.firstxmm0)
5820     {
5821       unsigned int j;
5822
5823       /* The first operand is implicit and must be xmm0/ymm0/zmm0.  */
5824       gas_assert (i.reg_operands
5825                   && (operand_type_equal (&i.types[0], &regxmm)
5826                       || operand_type_equal (&i.types[0], &regymm)
5827                       || operand_type_equal (&i.types[0], &regzmm)));
5828       if (register_number (i.op[0].regs) != 0)
5829         return bad_implicit_operand (i.types[0].bitfield.regxmm);
5830
5831       for (j = 1; j < i.operands; j++)
5832         {
5833           i.op[j - 1] = i.op[j];
5834           i.types[j - 1] = i.types[j];
5835
5836           /* We need to adjust fields in i.tm since they are used by
5837              build_modrm_byte.  */
5838           i.tm.operand_types [j - 1] = i.tm.operand_types [j];
5839         }
5840
5841       i.operands--;
5842       i.reg_operands--;
5843       i.tm.operands--;
5844     }
5845   else if (i.tm.opcode_modifier.regkludge)
5846     {
5847       /* The imul $imm, %reg instruction is converted into
5848          imul $imm, %reg, %reg, and the clr %reg instruction
5849          is converted into xor %reg, %reg.  */
5850
5851       unsigned int first_reg_op;
5852
5853       if (operand_type_check (i.types[0], reg))
5854         first_reg_op = 0;
5855       else
5856         first_reg_op = 1;
5857       /* Pretend we saw the extra register operand.  */
5858       gas_assert (i.reg_operands == 1
5859                   && i.op[first_reg_op + 1].regs == 0);
5860       i.op[first_reg_op + 1].regs = i.op[first_reg_op].regs;
5861       i.types[first_reg_op + 1] = i.types[first_reg_op];
5862       i.operands++;
5863       i.reg_operands++;
5864     }
5865
5866   if (i.tm.opcode_modifier.shortform)
5867     {
5868       if (i.types[0].bitfield.sreg2
5869           || i.types[0].bitfield.sreg3)
5870         {
5871           if (i.tm.base_opcode == POP_SEG_SHORT
5872               && i.op[0].regs->reg_num == 1)
5873             {
5874               as_bad (_("you can't `pop %scs'"), register_prefix);
5875               return 0;
5876             }
5877           i.tm.base_opcode |= (i.op[0].regs->reg_num << 3);
5878           if ((i.op[0].regs->reg_flags & RegRex) != 0)
5879             i.rex |= REX_B;
5880         }
5881       else
5882         {
5883           /* The register or float register operand is in operand
5884              0 or 1.  */
5885           unsigned int op;
5886
5887           if (i.types[0].bitfield.floatreg
5888               || operand_type_check (i.types[0], reg))
5889             op = 0;
5890           else
5891             op = 1;
5892           /* Register goes in low 3 bits of opcode.  */
5893           i.tm.base_opcode |= i.op[op].regs->reg_num;
5894           if ((i.op[op].regs->reg_flags & RegRex) != 0)
5895             i.rex |= REX_B;
5896           if (!quiet_warnings && i.tm.opcode_modifier.ugh)
5897             {
5898               /* Warn about some common errors, but press on regardless.
5899                  The first case can be generated by gcc (<= 2.8.1).  */
5900               if (i.operands == 2)
5901                 {
5902                   /* Reversed arguments on faddp, fsubp, etc.  */
5903                   as_warn (_("translating to `%s %s%s,%s%s'"), i.tm.name,
5904                            register_prefix, i.op[!intel_syntax].regs->reg_name,
5905                            register_prefix, i.op[intel_syntax].regs->reg_name);
5906                 }
5907               else
5908                 {
5909                   /* Extraneous `l' suffix on fp insn.  */
5910                   as_warn (_("translating to `%s %s%s'"), i.tm.name,
5911                            register_prefix, i.op[0].regs->reg_name);
5912                 }
5913             }
5914         }
5915     }
5916   else if (i.tm.opcode_modifier.modrm)
5917     {
5918       /* The opcode is completed (modulo i.tm.extension_opcode which
5919          must be put into the modrm byte).  Now, we make the modrm and
5920          index base bytes based on all the info we've collected.  */
5921
5922       default_seg = build_modrm_byte ();
5923     }
5924   else if ((i.tm.base_opcode & ~0x3) == MOV_AX_DISP32)
5925     {
5926       default_seg = &ds;
5927     }
5928   else if (i.tm.opcode_modifier.isstring)
5929     {
5930       /* For the string instructions that allow a segment override
5931          on one of their operands, the default segment is ds.  */
5932       default_seg = &ds;
5933     }
5934
5935   if (i.tm.base_opcode == 0x8d /* lea */
5936       && i.seg[0]
5937       && !quiet_warnings)
5938     as_warn (_("segment override on `%s' is ineffectual"), i.tm.name);
5939
5940   /* If a segment was explicitly specified, and the specified segment
5941      is not the default, use an opcode prefix to select it.  If we
5942      never figured out what the default segment is, then default_seg
5943      will be zero at this point, and the specified segment prefix will
5944      always be used.  */
5945   if ((i.seg[0]) && (i.seg[0] != default_seg))
5946     {
5947       if (!add_prefix (i.seg[0]->seg_prefix))
5948         return 0;
5949     }
5950   return 1;
5951 }
5952
5953 static const seg_entry *
5954 build_modrm_byte (void)
5955 {
5956   const seg_entry *default_seg = 0;
5957   unsigned int source, dest;
5958   int vex_3_sources;
5959
5960   /* The first operand of instructions with VEX prefix and 3 sources
5961      must be VEX_Imm4.  */
5962   vex_3_sources = i.tm.opcode_modifier.vexsources == VEX3SOURCES;
5963   if (vex_3_sources)
5964     {
5965       unsigned int nds, reg_slot;
5966       expressionS *exp;
5967
5968       if (i.tm.opcode_modifier.veximmext
5969           && i.tm.opcode_modifier.immext)
5970         {
5971           dest = i.operands - 2;
5972           gas_assert (dest == 3);
5973         }
5974       else
5975         dest = i.operands - 1;
5976       nds = dest - 1;
5977
5978       /* There are 2 kinds of instructions:
5979          1. 5 operands: 4 register operands or 3 register operands
5980          plus 1 memory operand plus one Vec_Imm4 operand, VexXDS, and
5981          VexW0 or VexW1.  The destination must be either XMM, YMM or
5982          ZMM register.
5983          2. 4 operands: 4 register operands or 3 register operands
5984          plus 1 memory operand, VexXDS, and VexImmExt  */
5985       gas_assert ((i.reg_operands == 4
5986                    || (i.reg_operands == 3 && i.mem_operands == 1))
5987                   && i.tm.opcode_modifier.vexvvvv == VEXXDS
5988                   && (i.tm.opcode_modifier.veximmext
5989                       || (i.imm_operands == 1
5990                           && i.types[0].bitfield.vec_imm4
5991                           && (i.tm.opcode_modifier.vexw == VEXW0
5992                               || i.tm.opcode_modifier.vexw == VEXW1)
5993                           && (operand_type_equal (&i.tm.operand_types[dest], &regxmm)
5994                               || operand_type_equal (&i.tm.operand_types[dest], &regymm)
5995                               || operand_type_equal (&i.tm.operand_types[dest], &regzmm)))));
5996
5997       if (i.imm_operands == 0)
5998         {
5999           /* When there is no immediate operand, generate an 8bit
6000              immediate operand to encode the first operand.  */
6001           exp = &im_expressions[i.imm_operands++];
6002           i.op[i.operands].imms = exp;
6003           i.types[i.operands] = imm8;
6004           i.operands++;
6005           /* If VexW1 is set, the first operand is the source and
6006              the second operand is encoded in the immediate operand.  */
6007           if (i.tm.opcode_modifier.vexw == VEXW1)
6008             {
6009               source = 0;
6010               reg_slot = 1;
6011             }
6012           else
6013             {
6014               source = 1;
6015               reg_slot = 0;
6016             }
6017
6018           /* FMA swaps REG and NDS.  */
6019           if (i.tm.cpu_flags.bitfield.cpufma)
6020             {
6021               unsigned int tmp;
6022               tmp = reg_slot;
6023               reg_slot = nds;
6024               nds = tmp;
6025             }
6026
6027           gas_assert (operand_type_equal (&i.tm.operand_types[reg_slot],
6028                                           &regxmm)
6029                       || operand_type_equal (&i.tm.operand_types[reg_slot],
6030                                              &regymm)
6031                       || operand_type_equal (&i.tm.operand_types[reg_slot],
6032                                              &regzmm));
6033           exp->X_op = O_constant;
6034           exp->X_add_number = register_number (i.op[reg_slot].regs) << 4;
6035           gas_assert ((i.op[reg_slot].regs->reg_flags & RegVRex) == 0);
6036         }
6037       else
6038         {
6039           unsigned int imm_slot;
6040
6041           if (i.tm.opcode_modifier.vexw == VEXW0)
6042             {
6043               /* If VexW0 is set, the third operand is the source and
6044                  the second operand is encoded in the immediate
6045                  operand.  */
6046               source = 2;
6047               reg_slot = 1;
6048             }
6049           else
6050             {
6051               /* VexW1 is set, the second operand is the source and
6052                  the third operand is encoded in the immediate
6053                  operand.  */
6054               source = 1;
6055               reg_slot = 2;
6056             }
6057
6058           if (i.tm.opcode_modifier.immext)
6059             {
6060               /* When ImmExt is set, the immdiate byte is the last
6061                  operand.  */
6062               imm_slot = i.operands - 1;
6063               source--;
6064               reg_slot--;
6065             }
6066           else
6067             {
6068               imm_slot = 0;
6069
6070               /* Turn on Imm8 so that output_imm will generate it.  */
6071               i.types[imm_slot].bitfield.imm8 = 1;
6072             }
6073
6074           gas_assert (operand_type_equal (&i.tm.operand_types[reg_slot],
6075                                           &regxmm)
6076                       || operand_type_equal (&i.tm.operand_types[reg_slot],
6077                                              &regymm)
6078                       || operand_type_equal (&i.tm.operand_types[reg_slot],
6079                                              &regzmm));
6080           i.op[imm_slot].imms->X_add_number
6081               |= register_number (i.op[reg_slot].regs) << 4;
6082           gas_assert ((i.op[reg_slot].regs->reg_flags & RegVRex) == 0);
6083         }
6084
6085       gas_assert (operand_type_equal (&i.tm.operand_types[nds], &regxmm)
6086                   || operand_type_equal (&i.tm.operand_types[nds],
6087                                          &regymm)
6088                   || operand_type_equal (&i.tm.operand_types[nds],
6089                                          &regzmm));
6090       i.vex.register_specifier = i.op[nds].regs;
6091     }
6092   else
6093     source = dest = 0;
6094
6095   /* i.reg_operands MUST be the number of real register operands;
6096      implicit registers do not count.  If there are 3 register
6097      operands, it must be a instruction with VexNDS.  For a
6098      instruction with VexNDD, the destination register is encoded
6099      in VEX prefix.  If there are 4 register operands, it must be
6100      a instruction with VEX prefix and 3 sources.  */
6101   if (i.mem_operands == 0
6102       && ((i.reg_operands == 2
6103            && i.tm.opcode_modifier.vexvvvv <= VEXXDS)
6104           || (i.reg_operands == 3
6105               && i.tm.opcode_modifier.vexvvvv == VEXXDS)
6106           || (i.reg_operands == 4 && vex_3_sources)))
6107     {
6108       switch (i.operands)
6109         {
6110         case 2:
6111           source = 0;
6112           break;
6113         case 3:
6114           /* When there are 3 operands, one of them may be immediate,
6115              which may be the first or the last operand.  Otherwise,
6116              the first operand must be shift count register (cl) or it
6117              is an instruction with VexNDS. */
6118           gas_assert (i.imm_operands == 1
6119                       || (i.imm_operands == 0
6120                           && (i.tm.opcode_modifier.vexvvvv == VEXXDS
6121                               || i.types[0].bitfield.shiftcount)));
6122           if (operand_type_check (i.types[0], imm)
6123               || i.types[0].bitfield.shiftcount)
6124             source = 1;
6125           else
6126             source = 0;
6127           break;
6128         case 4:
6129           /* When there are 4 operands, the first two must be 8bit
6130              immediate operands. The source operand will be the 3rd
6131              one.
6132
6133              For instructions with VexNDS, if the first operand
6134              an imm8, the source operand is the 2nd one.  If the last
6135              operand is imm8, the source operand is the first one.  */
6136           gas_assert ((i.imm_operands == 2
6137                        && i.types[0].bitfield.imm8
6138                        && i.types[1].bitfield.imm8)
6139                       || (i.tm.opcode_modifier.vexvvvv == VEXXDS
6140                           && i.imm_operands == 1
6141                           && (i.types[0].bitfield.imm8
6142                               || i.types[i.operands - 1].bitfield.imm8
6143                               || i.rounding)));
6144           if (i.imm_operands == 2)
6145             source = 2;
6146           else
6147             {
6148               if (i.types[0].bitfield.imm8)
6149                 source = 1;
6150               else
6151                 source = 0;
6152             }
6153           break;
6154         case 5:
6155           if (i.tm.opcode_modifier.evex)
6156             {
6157               /* For EVEX instructions, when there are 5 operands, the
6158                  first one must be immediate operand.  If the second one
6159                  is immediate operand, the source operand is the 3th
6160                  one.  If the last one is immediate operand, the source
6161                  operand is the 2nd one.  */
6162               gas_assert (i.imm_operands == 2
6163                           && i.tm.opcode_modifier.sae
6164                           && operand_type_check (i.types[0], imm));
6165               if (operand_type_check (i.types[1], imm))
6166                 source = 2;
6167               else if (operand_type_check (i.types[4], imm))
6168                 source = 1;
6169               else
6170                 abort ();
6171             }
6172           break;
6173         default:
6174           abort ();
6175         }
6176
6177       if (!vex_3_sources)
6178         {
6179           dest = source + 1;
6180
6181           /* RC/SAE operand could be between DEST and SRC.  That happens
6182              when one operand is GPR and the other one is XMM/YMM/ZMM
6183              register.  */
6184           if (i.rounding && i.rounding->operand == (int) dest)
6185             dest++;
6186
6187           if (i.tm.opcode_modifier.vexvvvv == VEXXDS)
6188             {
6189               /* For instructions with VexNDS, the register-only source
6190                  operand must be 32/64bit integer, XMM, YMM or ZMM
6191                  register.  It is encoded in VEX prefix.  We need to
6192                  clear RegMem bit before calling operand_type_equal.  */
6193
6194               i386_operand_type op;
6195               unsigned int vvvv;
6196
6197               /* Check register-only source operand when two source
6198                  operands are swapped.  */
6199               if (!i.tm.operand_types[source].bitfield.baseindex
6200                   && i.tm.operand_types[dest].bitfield.baseindex)
6201                 {
6202                   vvvv = source;
6203                   source = dest;
6204                 }
6205               else
6206                 vvvv = dest;
6207
6208               op = i.tm.operand_types[vvvv];
6209               op.bitfield.regmem = 0;
6210               if ((dest + 1) >= i.operands
6211                   || (!op.bitfield.reg32
6212                       && op.bitfield.reg64
6213                       && !operand_type_equal (&op, &regxmm)
6214                       && !operand_type_equal (&op, &regymm)
6215                       && !operand_type_equal (&op, &regzmm)
6216                       && !operand_type_equal (&op, &regmask)))
6217                 abort ();
6218               i.vex.register_specifier = i.op[vvvv].regs;
6219               dest++;
6220             }
6221         }
6222
6223       i.rm.mode = 3;
6224       /* One of the register operands will be encoded in the i.tm.reg
6225          field, the other in the combined i.tm.mode and i.tm.regmem
6226          fields.  If no form of this instruction supports a memory
6227          destination operand, then we assume the source operand may
6228          sometimes be a memory operand and so we need to store the
6229          destination in the i.rm.reg field.  */
6230       if (!i.tm.operand_types[dest].bitfield.regmem
6231           && operand_type_check (i.tm.operand_types[dest], anymem) == 0)
6232         {
6233           i.rm.reg = i.op[dest].regs->reg_num;
6234           i.rm.regmem = i.op[source].regs->reg_num;
6235           if ((i.op[dest].regs->reg_flags & RegRex) != 0)
6236             i.rex |= REX_R;
6237           if ((i.op[dest].regs->reg_flags & RegVRex) != 0)
6238             i.vrex |= REX_R;
6239           if ((i.op[source].regs->reg_flags & RegRex) != 0)
6240             i.rex |= REX_B;
6241           if ((i.op[source].regs->reg_flags & RegVRex) != 0)
6242             i.vrex |= REX_B;
6243         }
6244       else
6245         {
6246           i.rm.reg = i.op[source].regs->reg_num;
6247           i.rm.regmem = i.op[dest].regs->reg_num;
6248           if ((i.op[dest].regs->reg_flags & RegRex) != 0)
6249             i.rex |= REX_B;
6250           if ((i.op[dest].regs->reg_flags & RegVRex) != 0)
6251             i.vrex |= REX_B;
6252           if ((i.op[source].regs->reg_flags & RegRex) != 0)
6253             i.rex |= REX_R;
6254           if ((i.op[source].regs->reg_flags & RegVRex) != 0)
6255             i.vrex |= REX_R;
6256         }
6257       if (flag_code != CODE_64BIT && (i.rex & (REX_R | REX_B)))
6258         {
6259           if (!i.types[0].bitfield.control
6260               && !i.types[1].bitfield.control)
6261             abort ();
6262           i.rex &= ~(REX_R | REX_B);
6263           add_prefix (LOCK_PREFIX_OPCODE);
6264         }
6265     }
6266   else
6267     {                   /* If it's not 2 reg operands...  */
6268       unsigned int mem;
6269
6270       if (i.mem_operands)
6271         {
6272           unsigned int fake_zero_displacement = 0;
6273           unsigned int op;
6274
6275           for (op = 0; op < i.operands; op++)
6276             if (operand_type_check (i.types[op], anymem))
6277               break;
6278           gas_assert (op < i.operands);
6279
6280           if (i.tm.opcode_modifier.vecsib)
6281             {
6282               if (i.index_reg->reg_num == RegEiz
6283                   || i.index_reg->reg_num == RegRiz)
6284                 abort ();
6285
6286               i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
6287               if (!i.base_reg)
6288                 {
6289                   i.sib.base = NO_BASE_REGISTER;
6290                   i.sib.scale = i.log2_scale_factor;
6291                   /* No Vec_Disp8 if there is no base.  */
6292                   i.types[op].bitfield.vec_disp8 = 0;
6293                   i.types[op].bitfield.disp8 = 0;
6294                   i.types[op].bitfield.disp16 = 0;
6295                   i.types[op].bitfield.disp64 = 0;
6296                   if (flag_code != CODE_64BIT)
6297                     {
6298                       /* Must be 32 bit */
6299                       i.types[op].bitfield.disp32 = 1;
6300                       i.types[op].bitfield.disp32s = 0;
6301                     }
6302                   else
6303                     {
6304                       i.types[op].bitfield.disp32 = 0;
6305                       i.types[op].bitfield.disp32s = 1;
6306                     }
6307                 }
6308               i.sib.index = i.index_reg->reg_num;
6309               if ((i.index_reg->reg_flags & RegRex) != 0)
6310                 i.rex |= REX_X;
6311               if ((i.index_reg->reg_flags & RegVRex) != 0)
6312                 i.vrex |= REX_X;
6313             }
6314
6315           default_seg = &ds;
6316
6317           if (i.base_reg == 0)
6318             {
6319               i.rm.mode = 0;
6320               if (!i.disp_operands)
6321                 {
6322                   fake_zero_displacement = 1;
6323                   /* Instructions with VSIB byte need 32bit displacement
6324                      if there is no base register.  */
6325                   if (i.tm.opcode_modifier.vecsib)
6326                     i.types[op].bitfield.disp32 = 1;
6327                 }
6328               if (i.index_reg == 0)
6329                 {
6330                   gas_assert (!i.tm.opcode_modifier.vecsib);
6331                   /* Operand is just <disp>  */
6332                   if (flag_code == CODE_64BIT)
6333                     {
6334                       /* 64bit mode overwrites the 32bit absolute
6335                          addressing by RIP relative addressing and
6336                          absolute addressing is encoded by one of the
6337                          redundant SIB forms.  */
6338                       i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
6339                       i.sib.base = NO_BASE_REGISTER;
6340                       i.sib.index = NO_INDEX_REGISTER;
6341                       i.types[op] = ((i.prefix[ADDR_PREFIX] == 0)
6342                                      ? disp32s : disp32);
6343                     }
6344                   else if ((flag_code == CODE_16BIT)
6345                            ^ (i.prefix[ADDR_PREFIX] != 0))
6346                     {
6347                       i.rm.regmem = NO_BASE_REGISTER_16;
6348                       i.types[op] = disp16;
6349                     }
6350                   else
6351                     {
6352                       i.rm.regmem = NO_BASE_REGISTER;
6353                       i.types[op] = disp32;
6354                     }
6355                 }
6356               else if (!i.tm.opcode_modifier.vecsib)
6357                 {
6358                   /* !i.base_reg && i.index_reg  */
6359                   if (i.index_reg->reg_num == RegEiz
6360                       || i.index_reg->reg_num == RegRiz)
6361                     i.sib.index = NO_INDEX_REGISTER;
6362                   else
6363                     i.sib.index = i.index_reg->reg_num;
6364                   i.sib.base = NO_BASE_REGISTER;
6365                   i.sib.scale = i.log2_scale_factor;
6366                   i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
6367                   /* No Vec_Disp8 if there is no base.  */
6368                   i.types[op].bitfield.vec_disp8 = 0;
6369                   i.types[op].bitfield.disp8 = 0;
6370                   i.types[op].bitfield.disp16 = 0;
6371                   i.types[op].bitfield.disp64 = 0;
6372                   if (flag_code != CODE_64BIT)
6373                     {
6374                       /* Must be 32 bit */
6375                       i.types[op].bitfield.disp32 = 1;
6376                       i.types[op].bitfield.disp32s = 0;
6377                     }
6378                   else
6379                     {
6380                       i.types[op].bitfield.disp32 = 0;
6381                       i.types[op].bitfield.disp32s = 1;
6382                     }
6383                   if ((i.index_reg->reg_flags & RegRex) != 0)
6384                     i.rex |= REX_X;
6385                 }
6386             }
6387           /* RIP addressing for 64bit mode.  */
6388           else if (i.base_reg->reg_num == RegRip ||
6389                    i.base_reg->reg_num == RegEip)
6390             {
6391               gas_assert (!i.tm.opcode_modifier.vecsib);
6392               i.rm.regmem = NO_BASE_REGISTER;
6393               i.types[op].bitfield.disp8 = 0;
6394               i.types[op].bitfield.disp16 = 0;
6395               i.types[op].bitfield.disp32 = 0;
6396               i.types[op].bitfield.disp32s = 1;
6397               i.types[op].bitfield.disp64 = 0;
6398               i.types[op].bitfield.vec_disp8 = 0;
6399               i.flags[op] |= Operand_PCrel;
6400               if (! i.disp_operands)
6401                 fake_zero_displacement = 1;
6402             }
6403           else if (i.base_reg->reg_type.bitfield.reg16)
6404             {
6405               gas_assert (!i.tm.opcode_modifier.vecsib);
6406               switch (i.base_reg->reg_num)
6407                 {
6408                 case 3: /* (%bx)  */
6409                   if (i.index_reg == 0)
6410                     i.rm.regmem = 7;
6411                   else /* (%bx,%si) -> 0, or (%bx,%di) -> 1  */
6412                     i.rm.regmem = i.index_reg->reg_num - 6;
6413                   break;
6414                 case 5: /* (%bp)  */
6415                   default_seg = &ss;
6416                   if (i.index_reg == 0)
6417                     {
6418                       i.rm.regmem = 6;
6419                       if (operand_type_check (i.types[op], disp) == 0)
6420                         {
6421                           /* fake (%bp) into 0(%bp)  */
6422                           if (i.tm.operand_types[op].bitfield.vec_disp8)
6423                             i.types[op].bitfield.vec_disp8 = 1;
6424                           else
6425                             i.types[op].bitfield.disp8 = 1;
6426                           fake_zero_displacement = 1;
6427                         }
6428                     }
6429                   else /* (%bp,%si) -> 2, or (%bp,%di) -> 3  */
6430                     i.rm.regmem = i.index_reg->reg_num - 6 + 2;
6431                   break;
6432                 default: /* (%si) -> 4 or (%di) -> 5  */
6433                   i.rm.regmem = i.base_reg->reg_num - 6 + 4;
6434                 }
6435               i.rm.mode = mode_from_disp_size (i.types[op]);
6436             }
6437           else /* i.base_reg and 32/64 bit mode  */
6438             {
6439               if (flag_code == CODE_64BIT
6440                   && operand_type_check (i.types[op], disp))
6441                 {
6442                   i386_operand_type temp;
6443                   operand_type_set (&temp, 0);
6444                   temp.bitfield.disp8 = i.types[op].bitfield.disp8;
6445                   temp.bitfield.vec_disp8
6446                     = i.types[op].bitfield.vec_disp8;
6447                   i.types[op] = temp;
6448                   if (i.prefix[ADDR_PREFIX] == 0)
6449                     i.types[op].bitfield.disp32s = 1;
6450                   else
6451                     i.types[op].bitfield.disp32 = 1;
6452                 }
6453
6454               if (!i.tm.opcode_modifier.vecsib)
6455                 i.rm.regmem = i.base_reg->reg_num;
6456               if ((i.base_reg->reg_flags & RegRex) != 0)
6457                 i.rex |= REX_B;
6458               i.sib.base = i.base_reg->reg_num;
6459               /* x86-64 ignores REX prefix bit here to avoid decoder
6460                  complications.  */
6461               if (!(i.base_reg->reg_flags & RegRex)
6462                   && (i.base_reg->reg_num == EBP_REG_NUM
6463                    || i.base_reg->reg_num == ESP_REG_NUM))
6464                   default_seg = &ss;
6465               if (i.base_reg->reg_num == 5 && i.disp_operands == 0)
6466                 {
6467                   fake_zero_displacement = 1;
6468                   if (i.tm.operand_types [op].bitfield.vec_disp8)
6469                     i.types[op].bitfield.vec_disp8 = 1;
6470                   else
6471                     i.types[op].bitfield.disp8 = 1;
6472                 }
6473               i.sib.scale = i.log2_scale_factor;
6474               if (i.index_reg == 0)
6475                 {
6476                   gas_assert (!i.tm.opcode_modifier.vecsib);
6477                   /* <disp>(%esp) becomes two byte modrm with no index
6478                      register.  We've already stored the code for esp
6479                      in i.rm.regmem ie. ESCAPE_TO_TWO_BYTE_ADDRESSING.
6480                      Any base register besides %esp will not use the
6481                      extra modrm byte.  */
6482                   i.sib.index = NO_INDEX_REGISTER;
6483                 }
6484               else if (!i.tm.opcode_modifier.vecsib)
6485                 {
6486                   if (i.index_reg->reg_num == RegEiz
6487                       || i.index_reg->reg_num == RegRiz)
6488                     i.sib.index = NO_INDEX_REGISTER;
6489                   else
6490                     i.sib.index = i.index_reg->reg_num;
6491                   i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
6492                   if ((i.index_reg->reg_flags & RegRex) != 0)
6493                     i.rex |= REX_X;
6494                 }
6495
6496               if (i.disp_operands
6497                   && (i.reloc[op] == BFD_RELOC_386_TLS_DESC_CALL
6498                       || i.reloc[op] == BFD_RELOC_X86_64_TLSDESC_CALL))
6499                 i.rm.mode = 0;
6500               else
6501                 {
6502                   if (!fake_zero_displacement
6503                       && !i.disp_operands
6504                       && i.disp_encoding)
6505                     {
6506                       fake_zero_displacement = 1;
6507                       if (i.disp_encoding == disp_encoding_8bit)
6508                         i.types[op].bitfield.disp8 = 1;
6509                       else
6510                         i.types[op].bitfield.disp32 = 1;
6511                     }
6512                   i.rm.mode = mode_from_disp_size (i.types[op]);
6513                 }
6514             }
6515
6516           if (fake_zero_displacement)
6517             {
6518               /* Fakes a zero displacement assuming that i.types[op]
6519                  holds the correct displacement size.  */
6520               expressionS *exp;
6521
6522               gas_assert (i.op[op].disps == 0);
6523               exp = &disp_expressions[i.disp_operands++];
6524               i.op[op].disps = exp;
6525               exp->X_op = O_constant;
6526               exp->X_add_number = 0;
6527               exp->X_add_symbol = (symbolS *) 0;
6528               exp->X_op_symbol = (symbolS *) 0;
6529             }
6530
6531           mem = op;
6532         }
6533       else
6534         mem = ~0;
6535
6536       if (i.tm.opcode_modifier.vexsources == XOP2SOURCES)
6537         {
6538           if (operand_type_check (i.types[0], imm))
6539             i.vex.register_specifier = NULL;
6540           else
6541             {
6542               /* VEX.vvvv encodes one of the sources when the first
6543                  operand is not an immediate.  */
6544               if (i.tm.opcode_modifier.vexw == VEXW0)
6545                 i.vex.register_specifier = i.op[0].regs;
6546               else
6547                 i.vex.register_specifier = i.op[1].regs;
6548             }
6549
6550           /* Destination is a XMM register encoded in the ModRM.reg
6551              and VEX.R bit.  */
6552           i.rm.reg = i.op[2].regs->reg_num;
6553           if ((i.op[2].regs->reg_flags & RegRex) != 0)
6554             i.rex |= REX_R;
6555
6556           /* ModRM.rm and VEX.B encodes the other source.  */
6557           if (!i.mem_operands)
6558             {
6559               i.rm.mode = 3;
6560
6561               if (i.tm.opcode_modifier.vexw == VEXW0)
6562                 i.rm.regmem = i.op[1].regs->reg_num;
6563               else
6564                 i.rm.regmem = i.op[0].regs->reg_num;
6565
6566               if ((i.op[1].regs->reg_flags & RegRex) != 0)
6567                 i.rex |= REX_B;
6568             }
6569         }
6570       else if (i.tm.opcode_modifier.vexvvvv == VEXLWP)
6571         {
6572           i.vex.register_specifier = i.op[2].regs;
6573           if (!i.mem_operands)
6574             {
6575               i.rm.mode = 3;
6576               i.rm.regmem = i.op[1].regs->reg_num;
6577               if ((i.op[1].regs->reg_flags & RegRex) != 0)
6578                 i.rex |= REX_B;
6579             }
6580         }
6581       /* Fill in i.rm.reg or i.rm.regmem field with register operand
6582          (if any) based on i.tm.extension_opcode.  Again, we must be
6583          careful to make sure that segment/control/debug/test/MMX
6584          registers are coded into the i.rm.reg field.  */
6585       else if (i.reg_operands)
6586         {
6587           unsigned int op;
6588           unsigned int vex_reg = ~0;
6589
6590           for (op = 0; op < i.operands; op++)
6591             if (i.types[op].bitfield.reg8
6592                 || i.types[op].bitfield.reg16
6593                 || i.types[op].bitfield.reg32
6594                 || i.types[op].bitfield.reg64
6595                 || i.types[op].bitfield.regmmx
6596                 || i.types[op].bitfield.regxmm
6597                 || i.types[op].bitfield.regymm
6598                 || i.types[op].bitfield.regbnd
6599                 || i.types[op].bitfield.regzmm
6600                 || i.types[op].bitfield.regmask
6601                 || i.types[op].bitfield.sreg2
6602                 || i.types[op].bitfield.sreg3
6603                 || i.types[op].bitfield.control
6604                 || i.types[op].bitfield.debug
6605                 || i.types[op].bitfield.test)
6606               break;
6607
6608           if (vex_3_sources)
6609             op = dest;
6610           else if (i.tm.opcode_modifier.vexvvvv == VEXXDS)
6611             {
6612               /* For instructions with VexNDS, the register-only
6613                  source operand is encoded in VEX prefix. */
6614               gas_assert (mem != (unsigned int) ~0);
6615
6616               if (op > mem)
6617                 {
6618                   vex_reg = op++;
6619                   gas_assert (op < i.operands);
6620                 }
6621               else
6622                 {
6623                   /* Check register-only source operand when two source
6624                      operands are swapped.  */
6625                   if (!i.tm.operand_types[op].bitfield.baseindex
6626                       && i.tm.operand_types[op + 1].bitfield.baseindex)
6627                     {
6628                       vex_reg = op;
6629                       op += 2;
6630                       gas_assert (mem == (vex_reg + 1)
6631                                   && op < i.operands);
6632                     }
6633                   else
6634                     {
6635                       vex_reg = op + 1;
6636                       gas_assert (vex_reg < i.operands);
6637                     }
6638                 }
6639             }
6640           else if (i.tm.opcode_modifier.vexvvvv == VEXNDD)
6641             {
6642               /* For instructions with VexNDD, the register destination
6643                  is encoded in VEX prefix.  */
6644               if (i.mem_operands == 0)
6645                 {
6646                   /* There is no memory operand.  */
6647                   gas_assert ((op + 2) == i.operands);
6648                   vex_reg = op + 1;
6649                 }
6650               else
6651                 {
6652                   /* There are only 2 operands.  */
6653                   gas_assert (op < 2 && i.operands == 2);
6654                   vex_reg = 1;
6655                 }
6656             }
6657           else
6658             gas_assert (op < i.operands);
6659
6660           if (vex_reg != (unsigned int) ~0)
6661             {
6662               i386_operand_type *type = &i.tm.operand_types[vex_reg];
6663
6664               if (type->bitfield.reg32 != 1
6665                   && type->bitfield.reg64 != 1
6666                   && !operand_type_equal (type, &regxmm)
6667                   && !operand_type_equal (type, &regymm)
6668                   && !operand_type_equal (type, &regzmm)
6669                   && !operand_type_equal (type, &regmask))
6670                 abort ();
6671
6672               i.vex.register_specifier = i.op[vex_reg].regs;
6673             }
6674
6675           /* Don't set OP operand twice.  */
6676           if (vex_reg != op)
6677             {
6678               /* If there is an extension opcode to put here, the
6679                  register number must be put into the regmem field.  */
6680               if (i.tm.extension_opcode != None)
6681                 {
6682                   i.rm.regmem = i.op[op].regs->reg_num;
6683                   if ((i.op[op].regs->reg_flags & RegRex) != 0)
6684                     i.rex |= REX_B;
6685                   if ((i.op[op].regs->reg_flags & RegVRex) != 0)
6686                     i.vrex |= REX_B;
6687                 }
6688               else
6689                 {
6690                   i.rm.reg = i.op[op].regs->reg_num;
6691                   if ((i.op[op].regs->reg_flags & RegRex) != 0)
6692                     i.rex |= REX_R;
6693                   if ((i.op[op].regs->reg_flags & RegVRex) != 0)
6694                     i.vrex |= REX_R;
6695                 }
6696             }
6697
6698           /* Now, if no memory operand has set i.rm.mode = 0, 1, 2 we
6699              must set it to 3 to indicate this is a register operand
6700              in the regmem field.  */
6701           if (!i.mem_operands)
6702             i.rm.mode = 3;
6703         }
6704
6705       /* Fill in i.rm.reg field with extension opcode (if any).  */
6706       if (i.tm.extension_opcode != None)
6707         i.rm.reg = i.tm.extension_opcode;
6708     }
6709   return default_seg;
6710 }
6711
6712 static void
6713 output_branch (void)
6714 {
6715   char *p;
6716   int size;
6717   int code16;
6718   int prefix;
6719   relax_substateT subtype;
6720   symbolS *sym;
6721   offsetT off;
6722
6723   code16 = flag_code == CODE_16BIT ? CODE16 : 0;
6724   size = i.disp_encoding == disp_encoding_32bit ? BIG : SMALL;
6725
6726   prefix = 0;
6727   if (i.prefix[DATA_PREFIX] != 0)
6728     {
6729       prefix = 1;
6730       i.prefixes -= 1;
6731       code16 ^= CODE16;
6732     }
6733   /* Pentium4 branch hints.  */
6734   if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE /* not taken */
6735       || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE /* taken */)
6736     {
6737       prefix++;
6738       i.prefixes--;
6739     }
6740   if (i.prefix[REX_PREFIX] != 0)
6741     {
6742       prefix++;
6743       i.prefixes--;
6744     }
6745
6746   /* BND prefixed jump.  */
6747   if (i.prefix[BND_PREFIX] != 0)
6748     {
6749       FRAG_APPEND_1_CHAR (i.prefix[BND_PREFIX]);
6750       i.prefixes -= 1;
6751     }
6752
6753   if (i.prefixes != 0 && !intel_syntax)
6754     as_warn (_("skipping prefixes on this instruction"));
6755
6756   /* It's always a symbol;  End frag & setup for relax.
6757      Make sure there is enough room in this frag for the largest
6758      instruction we may generate in md_convert_frag.  This is 2
6759      bytes for the opcode and room for the prefix and largest
6760      displacement.  */
6761   frag_grow (prefix + 2 + 4);
6762   /* Prefix and 1 opcode byte go in fr_fix.  */
6763   p = frag_more (prefix + 1);
6764   if (i.prefix[DATA_PREFIX] != 0)
6765     *p++ = DATA_PREFIX_OPCODE;
6766   if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE
6767       || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE)
6768     *p++ = i.prefix[SEG_PREFIX];
6769   if (i.prefix[REX_PREFIX] != 0)
6770     *p++ = i.prefix[REX_PREFIX];
6771   *p = i.tm.base_opcode;
6772
6773   if ((unsigned char) *p == JUMP_PC_RELATIVE)
6774     subtype = ENCODE_RELAX_STATE (UNCOND_JUMP, size);
6775   else if (cpu_arch_flags.bitfield.cpui386)
6776     subtype = ENCODE_RELAX_STATE (COND_JUMP, size);
6777   else
6778     subtype = ENCODE_RELAX_STATE (COND_JUMP86, size);
6779   subtype |= code16;
6780
6781   sym = i.op[0].disps->X_add_symbol;
6782   off = i.op[0].disps->X_add_number;
6783
6784   if (i.op[0].disps->X_op != O_constant
6785       && i.op[0].disps->X_op != O_symbol)
6786     {
6787       /* Handle complex expressions.  */
6788       sym = make_expr_symbol (i.op[0].disps);
6789       off = 0;
6790     }
6791
6792   /* 1 possible extra opcode + 4 byte displacement go in var part.
6793      Pass reloc in fr_var.  */
6794   frag_var (rs_machine_dependent, 5, i.reloc[0], subtype, sym, off, p);
6795 }
6796
6797 static void
6798 output_jump (void)
6799 {
6800   char *p;
6801   int size;
6802   fixS *fixP;
6803
6804   if (i.tm.opcode_modifier.jumpbyte)
6805     {
6806       /* This is a loop or jecxz type instruction.  */
6807       size = 1;
6808       if (i.prefix[ADDR_PREFIX] != 0)
6809         {
6810           FRAG_APPEND_1_CHAR (ADDR_PREFIX_OPCODE);
6811           i.prefixes -= 1;
6812         }
6813       /* Pentium4 branch hints.  */
6814       if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE /* not taken */
6815           || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE /* taken */)
6816         {
6817           FRAG_APPEND_1_CHAR (i.prefix[SEG_PREFIX]);
6818           i.prefixes--;
6819         }
6820     }
6821   else
6822     {
6823       int code16;
6824
6825       code16 = 0;
6826       if (flag_code == CODE_16BIT)
6827         code16 = CODE16;
6828
6829       if (i.prefix[DATA_PREFIX] != 0)
6830         {
6831           FRAG_APPEND_1_CHAR (DATA_PREFIX_OPCODE);
6832           i.prefixes -= 1;
6833           code16 ^= CODE16;
6834         }
6835
6836       size = 4;
6837       if (code16)
6838         size = 2;
6839     }
6840
6841   if (i.prefix[REX_PREFIX] != 0)
6842     {
6843       FRAG_APPEND_1_CHAR (i.prefix[REX_PREFIX]);
6844       i.prefixes -= 1;
6845     }
6846
6847   /* BND prefixed jump.  */
6848   if (i.prefix[BND_PREFIX] != 0)
6849     {
6850       FRAG_APPEND_1_CHAR (i.prefix[BND_PREFIX]);
6851       i.prefixes -= 1;
6852     }
6853
6854   if (i.prefixes != 0 && !intel_syntax)
6855     as_warn (_("skipping prefixes on this instruction"));
6856
6857   p = frag_more (i.tm.opcode_length + size);
6858   switch (i.tm.opcode_length)
6859     {
6860     case 2:
6861       *p++ = i.tm.base_opcode >> 8;
6862     case 1:
6863       *p++ = i.tm.base_opcode;
6864       break;
6865     default:
6866       abort ();
6867     }
6868
6869   fixP = fix_new_exp (frag_now, p - frag_now->fr_literal, size,
6870                       i.op[0].disps, 1, reloc (size, 1, 1, i.reloc[0]));
6871
6872   /* All jumps handled here are signed, but don't use a signed limit
6873      check for 32 and 16 bit jumps as we want to allow wrap around at
6874      4G and 64k respectively.  */
6875   if (size == 1)
6876     fixP->fx_signed = 1;
6877 }
6878
6879 static void
6880 output_interseg_jump (void)
6881 {
6882   char *p;
6883   int size;
6884   int prefix;
6885   int code16;
6886
6887   code16 = 0;
6888   if (flag_code == CODE_16BIT)
6889     code16 = CODE16;
6890
6891   prefix = 0;
6892   if (i.prefix[DATA_PREFIX] != 0)
6893     {
6894       prefix = 1;
6895       i.prefixes -= 1;
6896       code16 ^= CODE16;
6897     }
6898   if (i.prefix[REX_PREFIX] != 0)
6899     {
6900       prefix++;
6901       i.prefixes -= 1;
6902     }
6903
6904   size = 4;
6905   if (code16)
6906     size = 2;
6907
6908   if (i.prefixes != 0 && !intel_syntax)
6909     as_warn (_("skipping prefixes on this instruction"));
6910
6911   /* 1 opcode; 2 segment; offset  */
6912   p = frag_more (prefix + 1 + 2 + size);
6913
6914   if (i.prefix[DATA_PREFIX] != 0)
6915     *p++ = DATA_PREFIX_OPCODE;
6916
6917   if (i.prefix[REX_PREFIX] != 0)
6918     *p++ = i.prefix[REX_PREFIX];
6919
6920   *p++ = i.tm.base_opcode;
6921   if (i.op[1].imms->X_op == O_constant)
6922     {
6923       offsetT n = i.op[1].imms->X_add_number;
6924
6925       if (size == 2
6926           && !fits_in_unsigned_word (n)
6927           && !fits_in_signed_word (n))
6928         {
6929           as_bad (_("16-bit jump out of range"));
6930           return;
6931         }
6932       md_number_to_chars (p, n, size);
6933     }
6934   else
6935     fix_new_exp (frag_now, p - frag_now->fr_literal, size,
6936                  i.op[1].imms, 0, reloc (size, 0, 0, i.reloc[1]));
6937   if (i.op[0].imms->X_op != O_constant)
6938     as_bad (_("can't handle non absolute segment in `%s'"),
6939             i.tm.name);
6940   md_number_to_chars (p + size, (valueT) i.op[0].imms->X_add_number, 2);
6941 }
6942
6943 static void
6944 output_insn (void)
6945 {
6946   fragS *insn_start_frag;
6947   offsetT insn_start_off;
6948
6949   /* Tie dwarf2 debug info to the address at the start of the insn.
6950      We can't do this after the insn has been output as the current
6951      frag may have been closed off.  eg. by frag_var.  */
6952   dwarf2_emit_insn (0);
6953
6954   insn_start_frag = frag_now;
6955   insn_start_off = frag_now_fix ();
6956
6957   /* Output jumps.  */
6958   if (i.tm.opcode_modifier.jump)
6959     output_branch ();
6960   else if (i.tm.opcode_modifier.jumpbyte
6961            || i.tm.opcode_modifier.jumpdword)
6962     output_jump ();
6963   else if (i.tm.opcode_modifier.jumpintersegment)
6964     output_interseg_jump ();
6965   else
6966     {
6967       /* Output normal instructions here.  */
6968       char *p;
6969       unsigned char *q;
6970       unsigned int j;
6971       unsigned int prefix;
6972
6973       if (avoid_fence
6974          && i.tm.base_opcode == 0xfae
6975          && i.operands == 1
6976          && i.imm_operands == 1
6977          && (i.op[0].imms->X_add_number == 0xe8
6978              || i.op[0].imms->X_add_number == 0xf0
6979              || i.op[0].imms->X_add_number == 0xf8))
6980         {
6981           /* Encode lfence, mfence, and sfence as
6982              f0 83 04 24 00   lock addl $0x0, (%{re}sp).  */
6983           offsetT val = 0x240483f0ULL;
6984           p = frag_more (5);
6985           md_number_to_chars (p, val, 5);
6986           return;
6987         }
6988
6989       /* Some processors fail on LOCK prefix. This options makes
6990          assembler ignore LOCK prefix and serves as a workaround.  */
6991       if (omit_lock_prefix)
6992         {
6993           if (i.tm.base_opcode == LOCK_PREFIX_OPCODE)
6994             return;
6995           i.prefix[LOCK_PREFIX] = 0;
6996         }
6997
6998       /* Since the VEX/EVEX prefix contains the implicit prefix, we
6999          don't need the explicit prefix.  */
7000       if (!i.tm.opcode_modifier.vex && !i.tm.opcode_modifier.evex)
7001         {
7002           switch (i.tm.opcode_length)
7003             {
7004             case 3:
7005               if (i.tm.base_opcode & 0xff000000)
7006                 {
7007                   prefix = (i.tm.base_opcode >> 24) & 0xff;
7008                   goto check_prefix;
7009                 }
7010               break;
7011             case 2:
7012               if ((i.tm.base_opcode & 0xff0000) != 0)
7013                 {
7014                   prefix = (i.tm.base_opcode >> 16) & 0xff;
7015                   if (i.tm.cpu_flags.bitfield.cpupadlock)
7016                     {
7017 check_prefix:
7018                       if (prefix != REPE_PREFIX_OPCODE
7019                           || (i.prefix[REP_PREFIX]
7020                               != REPE_PREFIX_OPCODE))
7021                         add_prefix (prefix);
7022                     }
7023                   else
7024                     add_prefix (prefix);
7025                 }
7026               break;
7027             case 1:
7028               break;
7029             default:
7030               abort ();
7031             }
7032
7033 #if defined (OBJ_MAYBE_ELF) || defined (OBJ_ELF)
7034           /* For x32, add a dummy REX_OPCODE prefix for mov/add with
7035              R_X86_64_GOTTPOFF relocation so that linker can safely
7036              perform IE->LE optimization.  */
7037           if (x86_elf_abi == X86_64_X32_ABI
7038               && i.operands == 2
7039               && i.reloc[0] == BFD_RELOC_X86_64_GOTTPOFF
7040               && i.prefix[REX_PREFIX] == 0)
7041             add_prefix (REX_OPCODE);
7042 #endif
7043
7044           /* The prefix bytes.  */
7045           for (j = ARRAY_SIZE (i.prefix), q = i.prefix; j > 0; j--, q++)
7046             if (*q)
7047               FRAG_APPEND_1_CHAR (*q);
7048         }
7049       else
7050         {
7051           for (j = 0, q = i.prefix; j < ARRAY_SIZE (i.prefix); j++, q++)
7052             if (*q)
7053               switch (j)
7054                 {
7055                 case REX_PREFIX:
7056                   /* REX byte is encoded in VEX prefix.  */
7057                   break;
7058                 case SEG_PREFIX:
7059                 case ADDR_PREFIX:
7060                   FRAG_APPEND_1_CHAR (*q);
7061                   break;
7062                 default:
7063                   /* There should be no other prefixes for instructions
7064                      with VEX prefix.  */
7065                   abort ();
7066                 }
7067
7068           /* For EVEX instructions i.vrex should become 0 after
7069              build_evex_prefix.  For VEX instructions upper 16 registers
7070              aren't available, so VREX should be 0.  */
7071           if (i.vrex)
7072             abort ();
7073           /* Now the VEX prefix.  */
7074           p = frag_more (i.vex.length);
7075           for (j = 0; j < i.vex.length; j++)
7076             p[j] = i.vex.bytes[j];
7077         }
7078
7079       /* Now the opcode; be careful about word order here!  */
7080       if (i.tm.opcode_length == 1)
7081         {
7082           FRAG_APPEND_1_CHAR (i.tm.base_opcode);
7083         }
7084       else
7085         {
7086           switch (i.tm.opcode_length)
7087             {
7088             case 4:
7089               p = frag_more (4);
7090               *p++ = (i.tm.base_opcode >> 24) & 0xff;
7091               *p++ = (i.tm.base_opcode >> 16) & 0xff;
7092               break;
7093             case 3:
7094               p = frag_more (3);
7095               *p++ = (i.tm.base_opcode >> 16) & 0xff;
7096               break;
7097             case 2:
7098               p = frag_more (2);
7099               break;
7100             default:
7101               abort ();
7102               break;
7103             }
7104
7105           /* Put out high byte first: can't use md_number_to_chars!  */
7106           *p++ = (i.tm.base_opcode >> 8) & 0xff;
7107           *p = i.tm.base_opcode & 0xff;
7108         }
7109
7110       /* Now the modrm byte and sib byte (if present).  */
7111       if (i.tm.opcode_modifier.modrm)
7112         {
7113           FRAG_APPEND_1_CHAR ((i.rm.regmem << 0
7114                                | i.rm.reg << 3
7115                                | i.rm.mode << 6));
7116           /* If i.rm.regmem == ESP (4)
7117              && i.rm.mode != (Register mode)
7118              && not 16 bit
7119              ==> need second modrm byte.  */
7120           if (i.rm.regmem == ESCAPE_TO_TWO_BYTE_ADDRESSING
7121               && i.rm.mode != 3
7122               && !(i.base_reg && i.base_reg->reg_type.bitfield.reg16))
7123             FRAG_APPEND_1_CHAR ((i.sib.base << 0
7124                                  | i.sib.index << 3
7125                                  | i.sib.scale << 6));
7126         }
7127
7128       if (i.disp_operands)
7129         output_disp (insn_start_frag, insn_start_off);
7130
7131       if (i.imm_operands)
7132         output_imm (insn_start_frag, insn_start_off);
7133     }
7134
7135 #ifdef DEBUG386
7136   if (flag_debug)
7137     {
7138       pi ("" /*line*/, &i);
7139     }
7140 #endif /* DEBUG386  */
7141 }
7142
7143 /* Return the size of the displacement operand N.  */
7144
7145 static int
7146 disp_size (unsigned int n)
7147 {
7148   int size = 4;
7149
7150   /* Vec_Disp8 has to be 8bit.  */
7151   if (i.types[n].bitfield.vec_disp8)
7152     size = 1;
7153   else if (i.types[n].bitfield.disp64)
7154     size = 8;
7155   else if (i.types[n].bitfield.disp8)
7156     size = 1;
7157   else if (i.types[n].bitfield.disp16)
7158     size = 2;
7159   return size;
7160 }
7161
7162 /* Return the size of the immediate operand N.  */
7163
7164 static int
7165 imm_size (unsigned int n)
7166 {
7167   int size = 4;
7168   if (i.types[n].bitfield.imm64)
7169     size = 8;
7170   else if (i.types[n].bitfield.imm8 || i.types[n].bitfield.imm8s)
7171     size = 1;
7172   else if (i.types[n].bitfield.imm16)
7173     size = 2;
7174   return size;
7175 }
7176
7177 static void
7178 output_disp (fragS *insn_start_frag, offsetT insn_start_off)
7179 {
7180   char *p;
7181   unsigned int n;
7182
7183   for (n = 0; n < i.operands; n++)
7184     {
7185       if (i.types[n].bitfield.vec_disp8
7186           || operand_type_check (i.types[n], disp))
7187         {
7188           if (i.op[n].disps->X_op == O_constant)
7189             {
7190               int size = disp_size (n);
7191               offsetT val = i.op[n].disps->X_add_number;
7192
7193               if (i.types[n].bitfield.vec_disp8)
7194                 val >>= i.memshift;
7195               val = offset_in_range (val, size);
7196               p = frag_more (size);
7197               md_number_to_chars (p, val, size);
7198             }
7199           else
7200             {
7201               enum bfd_reloc_code_real reloc_type;
7202               int size = disp_size (n);
7203               int sign = i.types[n].bitfield.disp32s;
7204               int pcrel = (i.flags[n] & Operand_PCrel) != 0;
7205               fixS *fixP;
7206
7207               /* We can't have 8 bit displacement here.  */
7208               gas_assert (!i.types[n].bitfield.disp8);
7209
7210               /* The PC relative address is computed relative
7211                  to the instruction boundary, so in case immediate
7212                  fields follows, we need to adjust the value.  */
7213               if (pcrel && i.imm_operands)
7214                 {
7215                   unsigned int n1;
7216                   int sz = 0;
7217
7218                   for (n1 = 0; n1 < i.operands; n1++)
7219                     if (operand_type_check (i.types[n1], imm))
7220                       {
7221                         /* Only one immediate is allowed for PC
7222                            relative address.  */
7223                         gas_assert (sz == 0);
7224                         sz = imm_size (n1);
7225                         i.op[n].disps->X_add_number -= sz;
7226                       }
7227                   /* We should find the immediate.  */
7228                   gas_assert (sz != 0);
7229                 }
7230
7231               p = frag_more (size);
7232               reloc_type = reloc (size, pcrel, sign, i.reloc[n]);
7233               if (GOT_symbol
7234                   && GOT_symbol == i.op[n].disps->X_add_symbol
7235                   && (((reloc_type == BFD_RELOC_32
7236                         || reloc_type == BFD_RELOC_X86_64_32S
7237                         || (reloc_type == BFD_RELOC_64
7238                             && object_64bit))
7239                        && (i.op[n].disps->X_op == O_symbol
7240                            || (i.op[n].disps->X_op == O_add
7241                                && ((symbol_get_value_expression
7242                                     (i.op[n].disps->X_op_symbol)->X_op)
7243                                    == O_subtract))))
7244                       || reloc_type == BFD_RELOC_32_PCREL))
7245                 {
7246                   offsetT add;
7247
7248                   if (insn_start_frag == frag_now)
7249                     add = (p - frag_now->fr_literal) - insn_start_off;
7250                   else
7251                     {
7252                       fragS *fr;
7253
7254                       add = insn_start_frag->fr_fix - insn_start_off;
7255                       for (fr = insn_start_frag->fr_next;
7256                            fr && fr != frag_now; fr = fr->fr_next)
7257                         add += fr->fr_fix;
7258                       add += p - frag_now->fr_literal;
7259                     }
7260
7261                   if (!object_64bit)
7262                     {
7263                       reloc_type = BFD_RELOC_386_GOTPC;
7264                       i.op[n].imms->X_add_number += add;
7265                     }
7266                   else if (reloc_type == BFD_RELOC_64)
7267                     reloc_type = BFD_RELOC_X86_64_GOTPC64;
7268                   else
7269                     /* Don't do the adjustment for x86-64, as there
7270                        the pcrel addressing is relative to the _next_
7271                        insn, and that is taken care of in other code.  */
7272                     reloc_type = BFD_RELOC_X86_64_GOTPC32;
7273                 }
7274               fixP = fix_new_exp (frag_now, p - frag_now->fr_literal,
7275                                   size, i.op[n].disps, pcrel,
7276                                   reloc_type);
7277               /* Check for "call/jmp *mem", "mov mem, %reg",
7278                  "test %reg, mem" and "binop mem, %reg" where binop
7279                  is one of adc, add, and, cmp, or, sbb, sub, xor
7280                  instructions.  Always generate R_386_GOT32X for
7281                  "sym*GOT" operand in 32-bit mode.  */
7282               if ((generate_relax_relocations
7283                    || (!object_64bit
7284                        && i.rm.mode == 0
7285                        && i.rm.regmem == 5))
7286                   && (i.rm.mode == 2
7287                       || (i.rm.mode == 0 && i.rm.regmem == 5))
7288                   && ((i.operands == 1
7289                        && i.tm.base_opcode == 0xff
7290                        && (i.rm.reg == 2 || i.rm.reg == 4))
7291                       || (i.operands == 2
7292                           && (i.tm.base_opcode == 0x8b
7293                               || i.tm.base_opcode == 0x85
7294                               || (i.tm.base_opcode & 0xc7) == 0x03))))
7295                 {
7296                   if (object_64bit)
7297                     {
7298                       fixP->fx_tcbit = i.rex != 0;
7299                       if (i.base_reg
7300                           && (i.base_reg->reg_num == RegRip
7301                               || i.base_reg->reg_num == RegEip))
7302                       fixP->fx_tcbit2 = 1;
7303                     }
7304                   else
7305                     fixP->fx_tcbit2 = 1;
7306                 }
7307             }
7308         }
7309     }
7310 }
7311
7312 static void
7313 output_imm (fragS *insn_start_frag, offsetT insn_start_off)
7314 {
7315   char *p;
7316   unsigned int n;
7317
7318   for (n = 0; n < i.operands; n++)
7319     {
7320       /* Skip SAE/RC Imm operand in EVEX.  They are already handled.  */
7321       if (i.rounding && (int) n == i.rounding->operand)
7322         continue;
7323
7324       if (operand_type_check (i.types[n], imm))
7325         {
7326           if (i.op[n].imms->X_op == O_constant)
7327             {
7328               int size = imm_size (n);
7329               offsetT val;
7330
7331               val = offset_in_range (i.op[n].imms->X_add_number,
7332                                      size);
7333               p = frag_more (size);
7334               md_number_to_chars (p, val, size);
7335             }
7336           else
7337             {
7338               /* Not absolute_section.
7339                  Need a 32-bit fixup (don't support 8bit
7340                  non-absolute imms).  Try to support other
7341                  sizes ...  */
7342               enum bfd_reloc_code_real reloc_type;
7343               int size = imm_size (n);
7344               int sign;
7345
7346               if (i.types[n].bitfield.imm32s
7347                   && (i.suffix == QWORD_MNEM_SUFFIX
7348                       || (!i.suffix && i.tm.opcode_modifier.no_lsuf)))
7349                 sign = 1;
7350               else
7351                 sign = 0;
7352
7353               p = frag_more (size);
7354               reloc_type = reloc (size, 0, sign, i.reloc[n]);
7355
7356               /*   This is tough to explain.  We end up with this one if we
7357                * have operands that look like
7358                * "_GLOBAL_OFFSET_TABLE_+[.-.L284]".  The goal here is to
7359                * obtain the absolute address of the GOT, and it is strongly
7360                * preferable from a performance point of view to avoid using
7361                * a runtime relocation for this.  The actual sequence of
7362                * instructions often look something like:
7363                *
7364                *        call    .L66
7365                * .L66:
7366                *        popl    %ebx
7367                *        addl    $_GLOBAL_OFFSET_TABLE_+[.-.L66],%ebx
7368                *
7369                *   The call and pop essentially return the absolute address
7370                * of the label .L66 and store it in %ebx.  The linker itself
7371                * will ultimately change the first operand of the addl so
7372                * that %ebx points to the GOT, but to keep things simple, the
7373                * .o file must have this operand set so that it generates not
7374                * the absolute address of .L66, but the absolute address of
7375                * itself.  This allows the linker itself simply treat a GOTPC
7376                * relocation as asking for a pcrel offset to the GOT to be
7377                * added in, and the addend of the relocation is stored in the
7378                * operand field for the instruction itself.
7379                *
7380                *   Our job here is to fix the operand so that it would add
7381                * the correct offset so that %ebx would point to itself.  The
7382                * thing that is tricky is that .-.L66 will point to the
7383                * beginning of the instruction, so we need to further modify
7384                * the operand so that it will point to itself.  There are
7385                * other cases where you have something like:
7386                *
7387                *        .long   $_GLOBAL_OFFSET_TABLE_+[.-.L66]
7388                *
7389                * and here no correction would be required.  Internally in
7390                * the assembler we treat operands of this form as not being
7391                * pcrel since the '.' is explicitly mentioned, and I wonder
7392                * whether it would simplify matters to do it this way.  Who
7393                * knows.  In earlier versions of the PIC patches, the
7394                * pcrel_adjust field was used to store the correction, but
7395                * since the expression is not pcrel, I felt it would be
7396                * confusing to do it this way.  */
7397
7398               if ((reloc_type == BFD_RELOC_32
7399                    || reloc_type == BFD_RELOC_X86_64_32S
7400                    || reloc_type == BFD_RELOC_64)
7401                   && GOT_symbol
7402                   && GOT_symbol == i.op[n].imms->X_add_symbol
7403                   && (i.op[n].imms->X_op == O_symbol
7404                       || (i.op[n].imms->X_op == O_add
7405                           && ((symbol_get_value_expression
7406                                (i.op[n].imms->X_op_symbol)->X_op)
7407                               == O_subtract))))
7408                 {
7409                   offsetT add;
7410
7411                   if (insn_start_frag == frag_now)
7412                     add = (p - frag_now->fr_literal) - insn_start_off;
7413                   else
7414                     {
7415                       fragS *fr;
7416
7417                       add = insn_start_frag->fr_fix - insn_start_off;
7418                       for (fr = insn_start_frag->fr_next;
7419                            fr && fr != frag_now; fr = fr->fr_next)
7420                         add += fr->fr_fix;
7421                       add += p - frag_now->fr_literal;
7422                     }
7423
7424                   if (!object_64bit)
7425                     reloc_type = BFD_RELOC_386_GOTPC;
7426                   else if (size == 4)
7427                     reloc_type = BFD_RELOC_X86_64_GOTPC32;
7428                   else if (size == 8)
7429                     reloc_type = BFD_RELOC_X86_64_GOTPC64;
7430                   i.op[n].imms->X_add_number += add;
7431                 }
7432               fix_new_exp (frag_now, p - frag_now->fr_literal, size,
7433                            i.op[n].imms, 0, reloc_type);
7434             }
7435         }
7436     }
7437 }
7438 \f
7439 /* x86_cons_fix_new is called via the expression parsing code when a
7440    reloc is needed.  We use this hook to get the correct .got reloc.  */
7441 static int cons_sign = -1;
7442
7443 void
7444 x86_cons_fix_new (fragS *frag, unsigned int off, unsigned int len,
7445                   expressionS *exp, bfd_reloc_code_real_type r)
7446 {
7447   r = reloc (len, 0, cons_sign, r);
7448
7449 #ifdef TE_PE
7450   if (exp->X_op == O_secrel)
7451     {
7452       exp->X_op = O_symbol;
7453       r = BFD_RELOC_32_SECREL;
7454     }
7455 #endif
7456
7457   fix_new_exp (frag, off, len, exp, 0, r);
7458 }
7459
7460 /* Export the ABI address size for use by TC_ADDRESS_BYTES for the
7461    purpose of the `.dc.a' internal pseudo-op.  */
7462
7463 int
7464 x86_address_bytes (void)
7465 {
7466   if ((stdoutput->arch_info->mach & bfd_mach_x64_32))
7467     return 4;
7468   return stdoutput->arch_info->bits_per_address / 8;
7469 }
7470
7471 #if !(defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) || defined (OBJ_MACH_O)) \
7472     || defined (LEX_AT)
7473 # define lex_got(reloc, adjust, types) NULL
7474 #else
7475 /* Parse operands of the form
7476    <symbol>@GOTOFF+<nnn>
7477    and similar .plt or .got references.
7478
7479    If we find one, set up the correct relocation in RELOC and copy the
7480    input string, minus the `@GOTOFF' into a malloc'd buffer for
7481    parsing by the calling routine.  Return this buffer, and if ADJUST
7482    is non-null set it to the length of the string we removed from the
7483    input line.  Otherwise return NULL.  */
7484 static char *
7485 lex_got (enum bfd_reloc_code_real *rel,
7486          int *adjust,
7487          i386_operand_type *types)
7488 {
7489   /* Some of the relocations depend on the size of what field is to
7490      be relocated.  But in our callers i386_immediate and i386_displacement
7491      we don't yet know the operand size (this will be set by insn
7492      matching).  Hence we record the word32 relocation here,
7493      and adjust the reloc according to the real size in reloc().  */
7494   static const struct {
7495     const char *str;
7496     int len;
7497     const enum bfd_reloc_code_real rel[2];
7498     const i386_operand_type types64;
7499   } gotrel[] = {
7500 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
7501     { STRING_COMMA_LEN ("SIZE"),      { BFD_RELOC_SIZE32,
7502                                         BFD_RELOC_SIZE32 },
7503       OPERAND_TYPE_IMM32_64 },
7504 #endif
7505     { STRING_COMMA_LEN ("PLTOFF"),   { _dummy_first_bfd_reloc_code_real,
7506                                        BFD_RELOC_X86_64_PLTOFF64 },
7507       OPERAND_TYPE_IMM64 },
7508     { STRING_COMMA_LEN ("PLT"),      { BFD_RELOC_386_PLT32,
7509                                        BFD_RELOC_X86_64_PLT32    },
7510       OPERAND_TYPE_IMM32_32S_DISP32 },
7511     { STRING_COMMA_LEN ("GOTPLT"),   { _dummy_first_bfd_reloc_code_real,
7512                                        BFD_RELOC_X86_64_GOTPLT64 },
7513       OPERAND_TYPE_IMM64_DISP64 },
7514     { STRING_COMMA_LEN ("GOTOFF"),   { BFD_RELOC_386_GOTOFF,
7515                                        BFD_RELOC_X86_64_GOTOFF64 },
7516       OPERAND_TYPE_IMM64_DISP64 },
7517     { STRING_COMMA_LEN ("GOTPCREL"), { _dummy_first_bfd_reloc_code_real,
7518                                        BFD_RELOC_X86_64_GOTPCREL },
7519       OPERAND_TYPE_IMM32_32S_DISP32 },
7520     { STRING_COMMA_LEN ("TLSGD"),    { BFD_RELOC_386_TLS_GD,
7521                                        BFD_RELOC_X86_64_TLSGD    },
7522       OPERAND_TYPE_IMM32_32S_DISP32 },
7523     { STRING_COMMA_LEN ("TLSLDM"),   { BFD_RELOC_386_TLS_LDM,
7524                                        _dummy_first_bfd_reloc_code_real },
7525       OPERAND_TYPE_NONE },
7526     { STRING_COMMA_LEN ("TLSLD"),    { _dummy_first_bfd_reloc_code_real,
7527                                        BFD_RELOC_X86_64_TLSLD    },
7528       OPERAND_TYPE_IMM32_32S_DISP32 },
7529     { STRING_COMMA_LEN ("GOTTPOFF"), { BFD_RELOC_386_TLS_IE_32,
7530                                        BFD_RELOC_X86_64_GOTTPOFF },
7531       OPERAND_TYPE_IMM32_32S_DISP32 },
7532     { STRING_COMMA_LEN ("TPOFF"),    { BFD_RELOC_386_TLS_LE_32,
7533                                        BFD_RELOC_X86_64_TPOFF32  },
7534       OPERAND_TYPE_IMM32_32S_64_DISP32_64 },
7535     { STRING_COMMA_LEN ("NTPOFF"),   { BFD_RELOC_386_TLS_LE,
7536                                        _dummy_first_bfd_reloc_code_real },
7537       OPERAND_TYPE_NONE },
7538     { STRING_COMMA_LEN ("DTPOFF"),   { BFD_RELOC_386_TLS_LDO_32,
7539                                        BFD_RELOC_X86_64_DTPOFF32 },
7540       OPERAND_TYPE_IMM32_32S_64_DISP32_64 },
7541     { STRING_COMMA_LEN ("GOTNTPOFF"),{ BFD_RELOC_386_TLS_GOTIE,
7542                                        _dummy_first_bfd_reloc_code_real },
7543       OPERAND_TYPE_NONE },
7544     { STRING_COMMA_LEN ("INDNTPOFF"),{ BFD_RELOC_386_TLS_IE,
7545                                        _dummy_first_bfd_reloc_code_real },
7546       OPERAND_TYPE_NONE },
7547     { STRING_COMMA_LEN ("GOT"),      { BFD_RELOC_386_GOT32,
7548                                        BFD_RELOC_X86_64_GOT32    },
7549       OPERAND_TYPE_IMM32_32S_64_DISP32 },
7550     { STRING_COMMA_LEN ("TLSDESC"),  { BFD_RELOC_386_TLS_GOTDESC,
7551                                        BFD_RELOC_X86_64_GOTPC32_TLSDESC },
7552       OPERAND_TYPE_IMM32_32S_DISP32 },
7553     { STRING_COMMA_LEN ("TLSCALL"),  { BFD_RELOC_386_TLS_DESC_CALL,
7554                                        BFD_RELOC_X86_64_TLSDESC_CALL },
7555       OPERAND_TYPE_IMM32_32S_DISP32 },
7556   };
7557   char *cp;
7558   unsigned int j;
7559
7560 #if defined (OBJ_MAYBE_ELF)
7561   if (!IS_ELF)
7562     return NULL;
7563 #endif
7564
7565   for (cp = input_line_pointer; *cp != '@'; cp++)
7566     if (is_end_of_line[(unsigned char) *cp] || *cp == ',')
7567       return NULL;
7568
7569   for (j = 0; j < ARRAY_SIZE (gotrel); j++)
7570     {
7571       int len = gotrel[j].len;
7572       if (strncasecmp (cp + 1, gotrel[j].str, len) == 0)
7573         {
7574           if (gotrel[j].rel[object_64bit] != 0)
7575             {
7576               int first, second;
7577               char *tmpbuf, *past_reloc;
7578
7579               *rel = gotrel[j].rel[object_64bit];
7580
7581               if (types)
7582                 {
7583                   if (flag_code != CODE_64BIT)
7584                     {
7585                       types->bitfield.imm32 = 1;
7586                       types->bitfield.disp32 = 1;
7587                     }
7588                   else
7589                     *types = gotrel[j].types64;
7590                 }
7591
7592               if (j != 0 && GOT_symbol == NULL)
7593                 GOT_symbol = symbol_find_or_make (GLOBAL_OFFSET_TABLE_NAME);
7594
7595               /* The length of the first part of our input line.  */
7596               first = cp - input_line_pointer;
7597
7598               /* The second part goes from after the reloc token until
7599                  (and including) an end_of_line char or comma.  */
7600               past_reloc = cp + 1 + len;
7601               cp = past_reloc;
7602               while (!is_end_of_line[(unsigned char) *cp] && *cp != ',')
7603                 ++cp;
7604               second = cp + 1 - past_reloc;
7605
7606               /* Allocate and copy string.  The trailing NUL shouldn't
7607                  be necessary, but be safe.  */
7608               tmpbuf = (char *) xmalloc (first + second + 2);
7609               memcpy (tmpbuf, input_line_pointer, first);
7610               if (second != 0 && *past_reloc != ' ')
7611                 /* Replace the relocation token with ' ', so that
7612                    errors like foo@GOTOFF1 will be detected.  */
7613                 tmpbuf[first++] = ' ';
7614               else
7615                 /* Increment length by 1 if the relocation token is
7616                    removed.  */
7617                 len++;
7618               if (adjust)
7619                 *adjust = len;
7620               memcpy (tmpbuf + first, past_reloc, second);
7621               tmpbuf[first + second] = '\0';
7622               return tmpbuf;
7623             }
7624
7625           as_bad (_("@%s reloc is not supported with %d-bit output format"),
7626                   gotrel[j].str, 1 << (5 + object_64bit));
7627           return NULL;
7628         }
7629     }
7630
7631   /* Might be a symbol version string.  Don't as_bad here.  */
7632   return NULL;
7633 }
7634 #endif
7635
7636 #ifdef TE_PE
7637 #ifdef lex_got
7638 #undef lex_got
7639 #endif
7640 /* Parse operands of the form
7641    <symbol>@SECREL32+<nnn>
7642
7643    If we find one, set up the correct relocation in RELOC and copy the
7644    input string, minus the `@SECREL32' into a malloc'd buffer for
7645    parsing by the calling routine.  Return this buffer, and if ADJUST
7646    is non-null set it to the length of the string we removed from the
7647    input line.  Otherwise return NULL.
7648
7649    This function is copied from the ELF version above adjusted for PE targets.  */
7650
7651 static char *
7652 lex_got (enum bfd_reloc_code_real *rel ATTRIBUTE_UNUSED,
7653          int *adjust ATTRIBUTE_UNUSED,
7654          i386_operand_type *types)
7655 {
7656   static const struct
7657   {
7658     const char *str;
7659     int len;
7660     const enum bfd_reloc_code_real rel[2];
7661     const i386_operand_type types64;
7662   }
7663   gotrel[] =
7664   {
7665     { STRING_COMMA_LEN ("SECREL32"),    { BFD_RELOC_32_SECREL,
7666                                           BFD_RELOC_32_SECREL },
7667       OPERAND_TYPE_IMM32_32S_64_DISP32_64 },
7668   };
7669
7670   char *cp;
7671   unsigned j;
7672
7673   for (cp = input_line_pointer; *cp != '@'; cp++)
7674     if (is_end_of_line[(unsigned char) *cp] || *cp == ',')
7675       return NULL;
7676
7677   for (j = 0; j < ARRAY_SIZE (gotrel); j++)
7678     {
7679       int len = gotrel[j].len;
7680
7681       if (strncasecmp (cp + 1, gotrel[j].str, len) == 0)
7682         {
7683           if (gotrel[j].rel[object_64bit] != 0)
7684             {
7685               int first, second;
7686               char *tmpbuf, *past_reloc;
7687
7688               *rel = gotrel[j].rel[object_64bit];
7689               if (adjust)
7690                 *adjust = len;
7691
7692               if (types)
7693                 {
7694                   if (flag_code != CODE_64BIT)
7695                     {
7696                       types->bitfield.imm32 = 1;
7697                       types->bitfield.disp32 = 1;
7698                     }
7699                   else
7700                     *types = gotrel[j].types64;
7701                 }
7702
7703               /* The length of the first part of our input line.  */
7704               first = cp - input_line_pointer;
7705
7706               /* The second part goes from after the reloc token until
7707                  (and including) an end_of_line char or comma.  */
7708               past_reloc = cp + 1 + len;
7709               cp = past_reloc;
7710               while (!is_end_of_line[(unsigned char) *cp] && *cp != ',')
7711                 ++cp;
7712               second = cp + 1 - past_reloc;
7713
7714               /* Allocate and copy string.  The trailing NUL shouldn't
7715                  be necessary, but be safe.  */
7716               tmpbuf = (char *) xmalloc (first + second + 2);
7717               memcpy (tmpbuf, input_line_pointer, first);
7718               if (second != 0 && *past_reloc != ' ')
7719                 /* Replace the relocation token with ' ', so that
7720                    errors like foo@SECLREL321 will be detected.  */
7721                 tmpbuf[first++] = ' ';
7722               memcpy (tmpbuf + first, past_reloc, second);
7723               tmpbuf[first + second] = '\0';
7724               return tmpbuf;
7725             }
7726
7727           as_bad (_("@%s reloc is not supported with %d-bit output format"),
7728                   gotrel[j].str, 1 << (5 + object_64bit));
7729           return NULL;
7730         }
7731     }
7732
7733   /* Might be a symbol version string.  Don't as_bad here.  */
7734   return NULL;
7735 }
7736
7737 #endif /* TE_PE */
7738
7739 bfd_reloc_code_real_type
7740 x86_cons (expressionS *exp, int size)
7741 {
7742   bfd_reloc_code_real_type got_reloc = NO_RELOC;
7743
7744   intel_syntax = -intel_syntax;
7745
7746   exp->X_md = 0;
7747   if (size == 4 || (object_64bit && size == 8))
7748     {
7749       /* Handle @GOTOFF and the like in an expression.  */
7750       char *save;
7751       char *gotfree_input_line;
7752       int adjust = 0;
7753
7754       save = input_line_pointer;
7755       gotfree_input_line = lex_got (&got_reloc, &adjust, NULL);
7756       if (gotfree_input_line)
7757         input_line_pointer = gotfree_input_line;
7758
7759       expression (exp);
7760
7761       if (gotfree_input_line)
7762         {
7763           /* expression () has merrily parsed up to the end of line,
7764              or a comma - in the wrong buffer.  Transfer how far
7765              input_line_pointer has moved to the right buffer.  */
7766           input_line_pointer = (save
7767                                 + (input_line_pointer - gotfree_input_line)
7768                                 + adjust);
7769           free (gotfree_input_line);
7770           if (exp->X_op == O_constant
7771               || exp->X_op == O_absent
7772               || exp->X_op == O_illegal
7773               || exp->X_op == O_register
7774               || exp->X_op == O_big)
7775             {
7776               char c = *input_line_pointer;
7777               *input_line_pointer = 0;
7778               as_bad (_("missing or invalid expression `%s'"), save);
7779               *input_line_pointer = c;
7780             }
7781         }
7782     }
7783   else
7784     expression (exp);
7785
7786   intel_syntax = -intel_syntax;
7787
7788   if (intel_syntax)
7789     i386_intel_simplify (exp);
7790
7791   return got_reloc;
7792 }
7793
7794 static void
7795 signed_cons (int size)
7796 {
7797   if (flag_code == CODE_64BIT)
7798     cons_sign = 1;
7799   cons (size);
7800   cons_sign = -1;
7801 }
7802
7803 #ifdef TE_PE
7804 static void
7805 pe_directive_secrel (int dummy ATTRIBUTE_UNUSED)
7806 {
7807   expressionS exp;
7808
7809   do
7810     {
7811       expression (&exp);
7812       if (exp.X_op == O_symbol)
7813         exp.X_op = O_secrel;
7814
7815       emit_expr (&exp, 4);
7816     }
7817   while (*input_line_pointer++ == ',');
7818
7819   input_line_pointer--;
7820   demand_empty_rest_of_line ();
7821 }
7822 #endif
7823
7824 /* Handle Vector operations.  */
7825
7826 static char *
7827 check_VecOperations (char *op_string, char *op_end)
7828 {
7829   const reg_entry *mask;
7830   const char *saved;
7831   char *end_op;
7832
7833   while (*op_string
7834          && (op_end == NULL || op_string < op_end))
7835     {
7836       saved = op_string;
7837       if (*op_string == '{')
7838         {
7839           op_string++;
7840
7841           /* Check broadcasts.  */
7842           if (strncmp (op_string, "1to", 3) == 0)
7843             {
7844               int bcst_type;
7845
7846               if (i.broadcast)
7847                 goto duplicated_vec_op;
7848
7849               op_string += 3;
7850               if (*op_string == '8')
7851                 bcst_type = BROADCAST_1TO8;
7852               else if (*op_string == '4')
7853                 bcst_type = BROADCAST_1TO4;
7854               else if (*op_string == '2')
7855                 bcst_type = BROADCAST_1TO2;
7856               else if (*op_string == '1'
7857                        && *(op_string+1) == '6')
7858                 {
7859                   bcst_type = BROADCAST_1TO16;
7860                   op_string++;
7861                 }
7862               else
7863                 {
7864                   as_bad (_("Unsupported broadcast: `%s'"), saved);
7865                   return NULL;
7866                 }
7867               op_string++;
7868
7869               broadcast_op.type = bcst_type;
7870               broadcast_op.operand = this_operand;
7871               i.broadcast = &broadcast_op;
7872             }
7873           /* Check masking operation.  */
7874           else if ((mask = parse_register (op_string, &end_op)) != NULL)
7875             {
7876               /* k0 can't be used for write mask.  */
7877               if (mask->reg_num == 0)
7878                 {
7879                   as_bad (_("`%s' can't be used for write mask"),
7880                           op_string);
7881                   return NULL;
7882                 }
7883
7884               if (!i.mask)
7885                 {
7886                   mask_op.mask = mask;
7887                   mask_op.zeroing = 0;
7888                   mask_op.operand = this_operand;
7889                   i.mask = &mask_op;
7890                 }
7891               else
7892                 {
7893                   if (i.mask->mask)
7894                     goto duplicated_vec_op;
7895
7896                   i.mask->mask = mask;
7897
7898                   /* Only "{z}" is allowed here.  No need to check
7899                      zeroing mask explicitly.  */
7900                   if (i.mask->operand != this_operand)
7901                     {
7902                       as_bad (_("invalid write mask `%s'"), saved);
7903                       return NULL;
7904                     }
7905                 }
7906
7907               op_string = end_op;
7908             }
7909           /* Check zeroing-flag for masking operation.  */
7910           else if (*op_string == 'z')
7911             {
7912               if (!i.mask)
7913                 {
7914                   mask_op.mask = NULL;
7915                   mask_op.zeroing = 1;
7916                   mask_op.operand = this_operand;
7917                   i.mask = &mask_op;
7918                 }
7919               else
7920                 {
7921                   if (i.mask->zeroing)
7922                     {
7923                     duplicated_vec_op:
7924                       as_bad (_("duplicated `%s'"), saved);
7925                       return NULL;
7926                     }
7927
7928                   i.mask->zeroing = 1;
7929
7930                   /* Only "{%k}" is allowed here.  No need to check mask
7931                      register explicitly.  */
7932                   if (i.mask->operand != this_operand)
7933                     {
7934                       as_bad (_("invalid zeroing-masking `%s'"),
7935                               saved);
7936                       return NULL;
7937                     }
7938                 }
7939
7940               op_string++;
7941             }
7942           else
7943             goto unknown_vec_op;
7944
7945           if (*op_string != '}')
7946             {
7947               as_bad (_("missing `}' in `%s'"), saved);
7948               return NULL;
7949             }
7950           op_string++;
7951           continue;
7952         }
7953     unknown_vec_op:
7954       /* We don't know this one.  */
7955       as_bad (_("unknown vector operation: `%s'"), saved);
7956       return NULL;
7957     }
7958
7959   return op_string;
7960 }
7961
7962 static int
7963 i386_immediate (char *imm_start)
7964 {
7965   char *save_input_line_pointer;
7966   char *gotfree_input_line;
7967   segT exp_seg = 0;
7968   expressionS *exp;
7969   i386_operand_type types;
7970
7971   operand_type_set (&types, ~0);
7972
7973   if (i.imm_operands == MAX_IMMEDIATE_OPERANDS)
7974     {
7975       as_bad (_("at most %d immediate operands are allowed"),
7976               MAX_IMMEDIATE_OPERANDS);
7977       return 0;
7978     }
7979
7980   exp = &im_expressions[i.imm_operands++];
7981   i.op[this_operand].imms = exp;
7982
7983   if (is_space_char (*imm_start))
7984     ++imm_start;
7985
7986   save_input_line_pointer = input_line_pointer;
7987   input_line_pointer = imm_start;
7988
7989   gotfree_input_line = lex_got (&i.reloc[this_operand], NULL, &types);
7990   if (gotfree_input_line)
7991     input_line_pointer = gotfree_input_line;
7992
7993   exp_seg = expression (exp);
7994
7995   SKIP_WHITESPACE ();
7996
7997   /* Handle vector operations.  */
7998   if (*input_line_pointer == '{')
7999     {
8000       input_line_pointer = check_VecOperations (input_line_pointer,
8001                                                 NULL);
8002       if (input_line_pointer == NULL)
8003         return 0;
8004     }
8005
8006   if (*input_line_pointer)
8007     as_bad (_("junk `%s' after expression"), input_line_pointer);
8008
8009   input_line_pointer = save_input_line_pointer;
8010   if (gotfree_input_line)
8011     {
8012       free (gotfree_input_line);
8013
8014       if (exp->X_op == O_constant || exp->X_op == O_register)
8015         exp->X_op = O_illegal;
8016     }
8017
8018   return i386_finalize_immediate (exp_seg, exp, types, imm_start);
8019 }
8020
8021 static int
8022 i386_finalize_immediate (segT exp_seg ATTRIBUTE_UNUSED, expressionS *exp,
8023                          i386_operand_type types, const char *imm_start)
8024 {
8025   if (exp->X_op == O_absent || exp->X_op == O_illegal || exp->X_op == O_big)
8026     {
8027       if (imm_start)
8028         as_bad (_("missing or invalid immediate expression `%s'"),
8029                 imm_start);
8030       return 0;
8031     }
8032   else if (exp->X_op == O_constant)
8033     {
8034       /* Size it properly later.  */
8035       i.types[this_operand].bitfield.imm64 = 1;
8036       /* If not 64bit, sign extend val.  */
8037       if (flag_code != CODE_64BIT
8038           && (exp->X_add_number & ~(((addressT) 2 << 31) - 1)) == 0)
8039         exp->X_add_number
8040           = (exp->X_add_number ^ ((addressT) 1 << 31)) - ((addressT) 1 << 31);
8041     }
8042 #if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
8043   else if (OUTPUT_FLAVOR == bfd_target_aout_flavour
8044            && exp_seg != absolute_section
8045            && exp_seg != text_section
8046            && exp_seg != data_section
8047            && exp_seg != bss_section
8048            && exp_seg != undefined_section
8049            && !bfd_is_com_section (exp_seg))
8050     {
8051       as_bad (_("unimplemented segment %s in operand"), exp_seg->name);
8052       return 0;
8053     }
8054 #endif
8055   else if (!intel_syntax && exp_seg == reg_section)
8056     {
8057       if (imm_start)
8058         as_bad (_("illegal immediate register operand %s"), imm_start);
8059       return 0;
8060     }
8061   else
8062     {
8063       /* This is an address.  The size of the address will be
8064          determined later, depending on destination register,
8065          suffix, or the default for the section.  */
8066       i.types[this_operand].bitfield.imm8 = 1;
8067       i.types[this_operand].bitfield.imm16 = 1;
8068       i.types[this_operand].bitfield.imm32 = 1;
8069       i.types[this_operand].bitfield.imm32s = 1;
8070       i.types[this_operand].bitfield.imm64 = 1;
8071       i.types[this_operand] = operand_type_and (i.types[this_operand],
8072                                                 types);
8073     }
8074
8075   return 1;
8076 }
8077
8078 static char *
8079 i386_scale (char *scale)
8080 {
8081   offsetT val;
8082   char *save = input_line_pointer;
8083
8084   input_line_pointer = scale;
8085   val = get_absolute_expression ();
8086
8087   switch (val)
8088     {
8089     case 1:
8090       i.log2_scale_factor = 0;
8091       break;
8092     case 2:
8093       i.log2_scale_factor = 1;
8094       break;
8095     case 4:
8096       i.log2_scale_factor = 2;
8097       break;
8098     case 8:
8099       i.log2_scale_factor = 3;
8100       break;
8101     default:
8102       {
8103         char sep = *input_line_pointer;
8104
8105         *input_line_pointer = '\0';
8106         as_bad (_("expecting scale factor of 1, 2, 4, or 8: got `%s'"),
8107                 scale);
8108         *input_line_pointer = sep;
8109         input_line_pointer = save;
8110         return NULL;
8111       }
8112     }
8113   if (i.log2_scale_factor != 0 && i.index_reg == 0)
8114     {
8115       as_warn (_("scale factor of %d without an index register"),
8116                1 << i.log2_scale_factor);
8117       i.log2_scale_factor = 0;
8118     }
8119   scale = input_line_pointer;
8120   input_line_pointer = save;
8121   return scale;
8122 }
8123
8124 static int
8125 i386_displacement (char *disp_start, char *disp_end)
8126 {
8127   expressionS *exp;
8128   segT exp_seg = 0;
8129   char *save_input_line_pointer;
8130   char *gotfree_input_line;
8131   int override;
8132   i386_operand_type bigdisp, types = anydisp;
8133   int ret;
8134
8135   if (i.disp_operands == MAX_MEMORY_OPERANDS)
8136     {
8137       as_bad (_("at most %d displacement operands are allowed"),
8138               MAX_MEMORY_OPERANDS);
8139       return 0;
8140     }
8141
8142   operand_type_set (&bigdisp, 0);
8143   if ((i.types[this_operand].bitfield.jumpabsolute)
8144       || (!current_templates->start->opcode_modifier.jump
8145           && !current_templates->start->opcode_modifier.jumpdword))
8146     {
8147       bigdisp.bitfield.disp32 = 1;
8148       override = (i.prefix[ADDR_PREFIX] != 0);
8149       if (flag_code == CODE_64BIT)
8150         {
8151           if (!override)
8152             {
8153               bigdisp.bitfield.disp32s = 1;
8154               bigdisp.bitfield.disp64 = 1;
8155             }
8156         }
8157       else if ((flag_code == CODE_16BIT) ^ override)
8158         {
8159           bigdisp.bitfield.disp32 = 0;
8160           bigdisp.bitfield.disp16 = 1;
8161         }
8162     }
8163   else
8164     {
8165       /* For PC-relative branches, the width of the displacement
8166          is dependent upon data size, not address size.  */
8167       override = (i.prefix[DATA_PREFIX] != 0);
8168       if (flag_code == CODE_64BIT)
8169         {
8170           if (override || i.suffix == WORD_MNEM_SUFFIX)
8171             bigdisp.bitfield.disp16 = 1;
8172           else
8173             {
8174               bigdisp.bitfield.disp32 = 1;
8175               bigdisp.bitfield.disp32s = 1;
8176             }
8177         }
8178       else
8179         {
8180           if (!override)
8181             override = (i.suffix == (flag_code != CODE_16BIT
8182                                      ? WORD_MNEM_SUFFIX
8183                                      : LONG_MNEM_SUFFIX));
8184           bigdisp.bitfield.disp32 = 1;
8185           if ((flag_code == CODE_16BIT) ^ override)
8186             {
8187               bigdisp.bitfield.disp32 = 0;
8188               bigdisp.bitfield.disp16 = 1;
8189             }
8190         }
8191     }
8192   i.types[this_operand] = operand_type_or (i.types[this_operand],
8193                                            bigdisp);
8194
8195   exp = &disp_expressions[i.disp_operands];
8196   i.op[this_operand].disps = exp;
8197   i.disp_operands++;
8198   save_input_line_pointer = input_line_pointer;
8199   input_line_pointer = disp_start;
8200   END_STRING_AND_SAVE (disp_end);
8201
8202 #ifndef GCC_ASM_O_HACK
8203 #define GCC_ASM_O_HACK 0
8204 #endif
8205 #if GCC_ASM_O_HACK
8206   END_STRING_AND_SAVE (disp_end + 1);
8207   if (i.types[this_operand].bitfield.baseIndex
8208       && displacement_string_end[-1] == '+')
8209     {
8210       /* This hack is to avoid a warning when using the "o"
8211          constraint within gcc asm statements.
8212          For instance:
8213
8214          #define _set_tssldt_desc(n,addr,limit,type) \
8215          __asm__ __volatile__ ( \
8216          "movw %w2,%0\n\t" \
8217          "movw %w1,2+%0\n\t" \
8218          "rorl $16,%1\n\t" \
8219          "movb %b1,4+%0\n\t" \
8220          "movb %4,5+%0\n\t" \
8221          "movb $0,6+%0\n\t" \
8222          "movb %h1,7+%0\n\t" \
8223          "rorl $16,%1" \
8224          : "=o"(*(n)) : "q" (addr), "ri"(limit), "i"(type))
8225
8226          This works great except that the output assembler ends
8227          up looking a bit weird if it turns out that there is
8228          no offset.  You end up producing code that looks like:
8229
8230          #APP
8231          movw $235,(%eax)
8232          movw %dx,2+(%eax)
8233          rorl $16,%edx
8234          movb %dl,4+(%eax)
8235          movb $137,5+(%eax)
8236          movb $0,6+(%eax)
8237          movb %dh,7+(%eax)
8238          rorl $16,%edx
8239          #NO_APP
8240
8241          So here we provide the missing zero.  */
8242
8243       *displacement_string_end = '0';
8244     }
8245 #endif
8246   gotfree_input_line = lex_got (&i.reloc[this_operand], NULL, &types);
8247   if (gotfree_input_line)
8248     input_line_pointer = gotfree_input_line;
8249
8250   exp_seg = expression (exp);
8251
8252   SKIP_WHITESPACE ();
8253   if (*input_line_pointer)
8254     as_bad (_("junk `%s' after expression"), input_line_pointer);
8255 #if GCC_ASM_O_HACK
8256   RESTORE_END_STRING (disp_end + 1);
8257 #endif
8258   input_line_pointer = save_input_line_pointer;
8259   if (gotfree_input_line)
8260     {
8261       free (gotfree_input_line);
8262
8263       if (exp->X_op == O_constant || exp->X_op == O_register)
8264         exp->X_op = O_illegal;
8265     }
8266
8267   ret = i386_finalize_displacement (exp_seg, exp, types, disp_start);
8268
8269   RESTORE_END_STRING (disp_end);
8270
8271   return ret;
8272 }
8273
8274 static int
8275 i386_finalize_displacement (segT exp_seg ATTRIBUTE_UNUSED, expressionS *exp,
8276                             i386_operand_type types, const char *disp_start)
8277 {
8278   i386_operand_type bigdisp;
8279   int ret = 1;
8280
8281   /* We do this to make sure that the section symbol is in
8282      the symbol table.  We will ultimately change the relocation
8283      to be relative to the beginning of the section.  */
8284   if (i.reloc[this_operand] == BFD_RELOC_386_GOTOFF
8285       || i.reloc[this_operand] == BFD_RELOC_X86_64_GOTPCREL
8286       || i.reloc[this_operand] == BFD_RELOC_X86_64_GOTOFF64)
8287     {
8288       if (exp->X_op != O_symbol)
8289         goto inv_disp;
8290
8291       if (S_IS_LOCAL (exp->X_add_symbol)
8292           && S_GET_SEGMENT (exp->X_add_symbol) != undefined_section
8293           && S_GET_SEGMENT (exp->X_add_symbol) != expr_section)
8294         section_symbol (S_GET_SEGMENT (exp->X_add_symbol));
8295       exp->X_op = O_subtract;
8296       exp->X_op_symbol = GOT_symbol;
8297       if (i.reloc[this_operand] == BFD_RELOC_X86_64_GOTPCREL)
8298         i.reloc[this_operand] = BFD_RELOC_32_PCREL;
8299       else if (i.reloc[this_operand] == BFD_RELOC_X86_64_GOTOFF64)
8300         i.reloc[this_operand] = BFD_RELOC_64;
8301       else
8302         i.reloc[this_operand] = BFD_RELOC_32;
8303     }
8304
8305   else if (exp->X_op == O_absent
8306            || exp->X_op == O_illegal
8307            || exp->X_op == O_big)
8308     {
8309     inv_disp:
8310       as_bad (_("missing or invalid displacement expression `%s'"),
8311               disp_start);
8312       ret = 0;
8313     }
8314
8315   else if (flag_code == CODE_64BIT
8316            && !i.prefix[ADDR_PREFIX]
8317            && exp->X_op == O_constant)
8318     {
8319       /* Since displacement is signed extended to 64bit, don't allow
8320          disp32 and turn off disp32s if they are out of range.  */
8321       i.types[this_operand].bitfield.disp32 = 0;
8322       if (!fits_in_signed_long (exp->X_add_number))
8323         {
8324           i.types[this_operand].bitfield.disp32s = 0;
8325           if (i.types[this_operand].bitfield.baseindex)
8326             {
8327               as_bad (_("0x%lx out range of signed 32bit displacement"),
8328                       (long) exp->X_add_number);
8329               ret = 0;
8330             }
8331         }
8332     }
8333
8334 #if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
8335   else if (exp->X_op != O_constant
8336            && OUTPUT_FLAVOR == bfd_target_aout_flavour
8337            && exp_seg != absolute_section
8338            && exp_seg != text_section
8339            && exp_seg != data_section
8340            && exp_seg != bss_section
8341            && exp_seg != undefined_section
8342            && !bfd_is_com_section (exp_seg))
8343     {
8344       as_bad (_("unimplemented segment %s in operand"), exp_seg->name);
8345       ret = 0;
8346     }
8347 #endif
8348
8349   /* Check if this is a displacement only operand.  */
8350   bigdisp = i.types[this_operand];
8351   bigdisp.bitfield.disp8 = 0;
8352   bigdisp.bitfield.disp16 = 0;
8353   bigdisp.bitfield.disp32 = 0;
8354   bigdisp.bitfield.disp32s = 0;
8355   bigdisp.bitfield.disp64 = 0;
8356   if (operand_type_all_zero (&bigdisp))
8357     i.types[this_operand] = operand_type_and (i.types[this_operand],
8358                                               types);
8359
8360   return ret;
8361 }
8362
8363 /* Make sure the memory operand we've been dealt is valid.
8364    Return 1 on success, 0 on a failure.  */
8365
8366 static int
8367 i386_index_check (const char *operand_string)
8368 {
8369   const char *kind = "base/index";
8370   enum flag_code addr_mode;
8371
8372   if (i.prefix[ADDR_PREFIX])
8373     addr_mode = flag_code == CODE_32BIT ? CODE_16BIT : CODE_32BIT;
8374   else
8375     {
8376       addr_mode = flag_code;
8377
8378 #if INFER_ADDR_PREFIX
8379       if (i.mem_operands == 0)
8380         {
8381           /* Infer address prefix from the first memory operand.  */
8382           const reg_entry *addr_reg = i.base_reg;
8383
8384           if (addr_reg == NULL)
8385             addr_reg = i.index_reg;
8386
8387           if (addr_reg)
8388             {
8389               if (addr_reg->reg_num == RegEip
8390                   || addr_reg->reg_num == RegEiz
8391                   || addr_reg->reg_type.bitfield.reg32)
8392                 addr_mode = CODE_32BIT;
8393               else if (flag_code != CODE_64BIT
8394                        && addr_reg->reg_type.bitfield.reg16)
8395                 addr_mode = CODE_16BIT;
8396
8397               if (addr_mode != flag_code)
8398                 {
8399                   i.prefix[ADDR_PREFIX] = ADDR_PREFIX_OPCODE;
8400                   i.prefixes += 1;
8401                   /* Change the size of any displacement too.  At most one
8402                      of Disp16 or Disp32 is set.
8403                      FIXME.  There doesn't seem to be any real need for
8404                      separate Disp16 and Disp32 flags.  The same goes for
8405                      Imm16 and Imm32.  Removing them would probably clean
8406                      up the code quite a lot.  */
8407                   if (flag_code != CODE_64BIT
8408                       && (i.types[this_operand].bitfield.disp16
8409                           || i.types[this_operand].bitfield.disp32))
8410                     i.types[this_operand]
8411                       = operand_type_xor (i.types[this_operand], disp16_32);
8412                 }
8413             }
8414         }
8415 #endif
8416     }
8417
8418   if (current_templates->start->opcode_modifier.isstring
8419       && !current_templates->start->opcode_modifier.immext
8420       && (current_templates->end[-1].opcode_modifier.isstring
8421           || i.mem_operands))
8422     {
8423       /* Memory operands of string insns are special in that they only allow
8424          a single register (rDI, rSI, or rBX) as their memory address.  */
8425       const reg_entry *expected_reg;
8426       static const char *di_si[][2] =
8427         {
8428           { "esi", "edi" },
8429           { "si", "di" },
8430           { "rsi", "rdi" }
8431         };
8432       static const char *bx[] = { "ebx", "bx", "rbx" };
8433
8434       kind = "string address";
8435
8436       if (current_templates->start->opcode_modifier.w)
8437         {
8438           i386_operand_type type = current_templates->end[-1].operand_types[0];
8439
8440           if (!type.bitfield.baseindex
8441               || ((!i.mem_operands != !intel_syntax)
8442                   && current_templates->end[-1].operand_types[1]
8443                      .bitfield.baseindex))
8444             type = current_templates->end[-1].operand_types[1];
8445           expected_reg = hash_find (reg_hash,
8446                                     di_si[addr_mode][type.bitfield.esseg]);
8447
8448         }
8449       else
8450         expected_reg = hash_find (reg_hash, bx[addr_mode]);
8451
8452       if (i.base_reg != expected_reg
8453           || i.index_reg
8454           || operand_type_check (i.types[this_operand], disp))
8455         {
8456           /* The second memory operand must have the same size as
8457              the first one.  */
8458           if (i.mem_operands
8459               && i.base_reg
8460               && !((addr_mode == CODE_64BIT
8461                     && i.base_reg->reg_type.bitfield.reg64)
8462                    || (addr_mode == CODE_32BIT
8463                        ? i.base_reg->reg_type.bitfield.reg32
8464                        : i.base_reg->reg_type.bitfield.reg16)))
8465             goto bad_address;
8466
8467           as_warn (_("`%s' is not valid here (expected `%c%s%s%c')"),
8468                    operand_string,
8469                    intel_syntax ? '[' : '(',
8470                    register_prefix,
8471                    expected_reg->reg_name,
8472                    intel_syntax ? ']' : ')');
8473           return 1;
8474         }
8475       else
8476         return 1;
8477
8478 bad_address:
8479       as_bad (_("`%s' is not a valid %s expression"),
8480               operand_string, kind);
8481       return 0;
8482     }
8483   else
8484     {
8485       if (addr_mode != CODE_16BIT)
8486         {
8487           /* 32-bit/64-bit checks.  */
8488           if ((i.base_reg
8489                && (addr_mode == CODE_64BIT
8490                    ? !i.base_reg->reg_type.bitfield.reg64
8491                    : !i.base_reg->reg_type.bitfield.reg32)
8492                && (i.index_reg
8493                    || (i.base_reg->reg_num
8494                        != (addr_mode == CODE_64BIT ? RegRip : RegEip))))
8495               || (i.index_reg
8496                   && !i.index_reg->reg_type.bitfield.regxmm
8497                   && !i.index_reg->reg_type.bitfield.regymm
8498                   && !i.index_reg->reg_type.bitfield.regzmm
8499                   && ((addr_mode == CODE_64BIT
8500                        ? !(i.index_reg->reg_type.bitfield.reg64
8501                            || i.index_reg->reg_num == RegRiz)
8502                        : !(i.index_reg->reg_type.bitfield.reg32
8503                            || i.index_reg->reg_num == RegEiz))
8504                       || !i.index_reg->reg_type.bitfield.baseindex)))
8505             goto bad_address;
8506         }
8507       else
8508         {
8509           /* 16-bit checks.  */
8510           if ((i.base_reg
8511                && (!i.base_reg->reg_type.bitfield.reg16
8512                    || !i.base_reg->reg_type.bitfield.baseindex))
8513               || (i.index_reg
8514                   && (!i.index_reg->reg_type.bitfield.reg16
8515                       || !i.index_reg->reg_type.bitfield.baseindex
8516                       || !(i.base_reg
8517                            && i.base_reg->reg_num < 6
8518                            && i.index_reg->reg_num >= 6
8519                            && i.log2_scale_factor == 0))))
8520             goto bad_address;
8521         }
8522     }
8523   return 1;
8524 }
8525
8526 /* Handle vector immediates.  */
8527
8528 static int
8529 RC_SAE_immediate (const char *imm_start)
8530 {
8531   unsigned int match_found, j;
8532   const char *pstr = imm_start;
8533   expressionS *exp;
8534
8535   if (*pstr != '{')
8536     return 0;
8537
8538   pstr++;
8539   match_found = 0;
8540   for (j = 0; j < ARRAY_SIZE (RC_NamesTable); j++)
8541     {
8542       if (!strncmp (pstr, RC_NamesTable[j].name, RC_NamesTable[j].len))
8543         {
8544           if (!i.rounding)
8545             {
8546               rc_op.type = RC_NamesTable[j].type;
8547               rc_op.operand = this_operand;
8548               i.rounding = &rc_op;
8549             }
8550           else
8551             {
8552               as_bad (_("duplicated `%s'"), imm_start);
8553               return 0;
8554             }
8555           pstr += RC_NamesTable[j].len;
8556           match_found = 1;
8557           break;
8558         }
8559     }
8560   if (!match_found)
8561     return 0;
8562
8563   if (*pstr++ != '}')
8564     {
8565       as_bad (_("Missing '}': '%s'"), imm_start);
8566       return 0;
8567     }
8568   /* RC/SAE immediate string should contain nothing more.  */;
8569   if (*pstr != 0)
8570     {
8571       as_bad (_("Junk after '}': '%s'"), imm_start);
8572       return 0;
8573     }
8574
8575   exp = &im_expressions[i.imm_operands++];
8576   i.op[this_operand].imms = exp;
8577
8578   exp->X_op = O_constant;
8579   exp->X_add_number = 0;
8580   exp->X_add_symbol = (symbolS *) 0;
8581   exp->X_op_symbol = (symbolS *) 0;
8582
8583   i.types[this_operand].bitfield.imm8 = 1;
8584   return 1;
8585 }
8586
8587 /* Parse OPERAND_STRING into the i386_insn structure I.  Returns zero
8588    on error.  */
8589
8590 static int
8591 i386_att_operand (char *operand_string)
8592 {
8593   const reg_entry *r;
8594   char *end_op;
8595   char *op_string = operand_string;
8596
8597   if (is_space_char (*op_string))
8598     ++op_string;
8599
8600   /* We check for an absolute prefix (differentiating,
8601      for example, 'jmp pc_relative_label' from 'jmp *absolute_label'.  */
8602   if (*op_string == ABSOLUTE_PREFIX)
8603     {
8604       ++op_string;
8605       if (is_space_char (*op_string))
8606         ++op_string;
8607       i.types[this_operand].bitfield.jumpabsolute = 1;
8608     }
8609
8610   /* Check if operand is a register.  */
8611   if ((r = parse_register (op_string, &end_op)) != NULL)
8612     {
8613       i386_operand_type temp;
8614
8615       /* Check for a segment override by searching for ':' after a
8616          segment register.  */
8617       op_string = end_op;
8618       if (is_space_char (*op_string))
8619         ++op_string;
8620       if (*op_string == ':'
8621           && (r->reg_type.bitfield.sreg2
8622               || r->reg_type.bitfield.sreg3))
8623         {
8624           switch (r->reg_num)
8625             {
8626             case 0:
8627               i.seg[i.mem_operands] = &es;
8628               break;
8629             case 1:
8630               i.seg[i.mem_operands] = &cs;
8631               break;
8632             case 2:
8633               i.seg[i.mem_operands] = &ss;
8634               break;
8635             case 3:
8636               i.seg[i.mem_operands] = &ds;
8637               break;
8638             case 4:
8639               i.seg[i.mem_operands] = &fs;
8640               break;
8641             case 5:
8642               i.seg[i.mem_operands] = &gs;
8643               break;
8644             }
8645
8646           /* Skip the ':' and whitespace.  */
8647           ++op_string;
8648           if (is_space_char (*op_string))
8649             ++op_string;
8650
8651           if (!is_digit_char (*op_string)
8652               && !is_identifier_char (*op_string)
8653               && *op_string != '('
8654               && *op_string != ABSOLUTE_PREFIX)
8655             {
8656               as_bad (_("bad memory operand `%s'"), op_string);
8657               return 0;
8658             }
8659           /* Handle case of %es:*foo.  */
8660           if (*op_string == ABSOLUTE_PREFIX)
8661             {
8662               ++op_string;
8663               if (is_space_char (*op_string))
8664                 ++op_string;
8665               i.types[this_operand].bitfield.jumpabsolute = 1;
8666             }
8667           goto do_memory_reference;
8668         }
8669
8670       /* Handle vector operations.  */
8671       if (*op_string == '{')
8672         {
8673           op_string = check_VecOperations (op_string, NULL);
8674           if (op_string == NULL)
8675             return 0;
8676         }
8677
8678       if (*op_string)
8679         {
8680           as_bad (_("junk `%s' after register"), op_string);
8681           return 0;
8682         }
8683       temp = r->reg_type;
8684       temp.bitfield.baseindex = 0;
8685       i.types[this_operand] = operand_type_or (i.types[this_operand],
8686                                                temp);
8687       i.types[this_operand].bitfield.unspecified = 0;
8688       i.op[this_operand].regs = r;
8689       i.reg_operands++;
8690     }
8691   else if (*op_string == REGISTER_PREFIX)
8692     {
8693       as_bad (_("bad register name `%s'"), op_string);
8694       return 0;
8695     }
8696   else if (*op_string == IMMEDIATE_PREFIX)
8697     {
8698       ++op_string;
8699       if (i.types[this_operand].bitfield.jumpabsolute)
8700         {
8701           as_bad (_("immediate operand illegal with absolute jump"));
8702           return 0;
8703         }
8704       if (!i386_immediate (op_string))
8705         return 0;
8706     }
8707   else if (RC_SAE_immediate (operand_string))
8708     {
8709       /* If it is a RC or SAE immediate, do nothing.  */
8710       ;
8711     }
8712   else if (is_digit_char (*op_string)
8713            || is_identifier_char (*op_string)
8714            || *op_string == '"'
8715            || *op_string == '(')
8716     {
8717       /* This is a memory reference of some sort.  */
8718       char *base_string;
8719
8720       /* Start and end of displacement string expression (if found).  */
8721       char *displacement_string_start;
8722       char *displacement_string_end;
8723       char *vop_start;
8724
8725     do_memory_reference:
8726       if ((i.mem_operands == 1
8727            && !current_templates->start->opcode_modifier.isstring)
8728           || i.mem_operands == 2)
8729         {
8730           as_bad (_("too many memory references for `%s'"),
8731                   current_templates->start->name);
8732           return 0;
8733         }
8734
8735       /* Check for base index form.  We detect the base index form by
8736          looking for an ')' at the end of the operand, searching
8737          for the '(' matching it, and finding a REGISTER_PREFIX or ','
8738          after the '('.  */
8739       base_string = op_string + strlen (op_string);
8740
8741       /* Handle vector operations.  */
8742       vop_start = strchr (op_string, '{');
8743       if (vop_start && vop_start < base_string)
8744         {
8745           if (check_VecOperations (vop_start, base_string) == NULL)
8746             return 0;
8747           base_string = vop_start;
8748         }
8749
8750       --base_string;
8751       if (is_space_char (*base_string))
8752         --base_string;
8753
8754       /* If we only have a displacement, set-up for it to be parsed later.  */
8755       displacement_string_start = op_string;
8756       displacement_string_end = base_string + 1;
8757
8758       if (*base_string == ')')
8759         {
8760           char *temp_string;
8761           unsigned int parens_balanced = 1;
8762           /* We've already checked that the number of left & right ()'s are
8763              equal, so this loop will not be infinite.  */
8764           do
8765             {
8766               base_string--;
8767               if (*base_string == ')')
8768                 parens_balanced++;
8769               if (*base_string == '(')
8770                 parens_balanced--;
8771             }
8772           while (parens_balanced);
8773
8774           temp_string = base_string;
8775
8776           /* Skip past '(' and whitespace.  */
8777           ++base_string;
8778           if (is_space_char (*base_string))
8779             ++base_string;
8780
8781           if (*base_string == ','
8782               || ((i.base_reg = parse_register (base_string, &end_op))
8783                   != NULL))
8784             {
8785               displacement_string_end = temp_string;
8786
8787               i.types[this_operand].bitfield.baseindex = 1;
8788
8789               if (i.base_reg)
8790                 {
8791                   base_string = end_op;
8792                   if (is_space_char (*base_string))
8793                     ++base_string;
8794                 }
8795
8796               /* There may be an index reg or scale factor here.  */
8797               if (*base_string == ',')
8798                 {
8799                   ++base_string;
8800                   if (is_space_char (*base_string))
8801                     ++base_string;
8802
8803                   if ((i.index_reg = parse_register (base_string, &end_op))
8804                       != NULL)
8805                     {
8806                       base_string = end_op;
8807                       if (is_space_char (*base_string))
8808                         ++base_string;
8809                       if (*base_string == ',')
8810                         {
8811                           ++base_string;
8812                           if (is_space_char (*base_string))
8813                             ++base_string;
8814                         }
8815                       else if (*base_string != ')')
8816                         {
8817                           as_bad (_("expecting `,' or `)' "
8818                                     "after index register in `%s'"),
8819                                   operand_string);
8820                           return 0;
8821                         }
8822                     }
8823                   else if (*base_string == REGISTER_PREFIX)
8824                     {
8825                       end_op = strchr (base_string, ',');
8826                       if (end_op)
8827                         *end_op = '\0';
8828                       as_bad (_("bad register name `%s'"), base_string);
8829                       return 0;
8830                     }
8831
8832                   /* Check for scale factor.  */
8833                   if (*base_string != ')')
8834                     {
8835                       char *end_scale = i386_scale (base_string);
8836
8837                       if (!end_scale)
8838                         return 0;
8839
8840                       base_string = end_scale;
8841                       if (is_space_char (*base_string))
8842                         ++base_string;
8843                       if (*base_string != ')')
8844                         {
8845                           as_bad (_("expecting `)' "
8846                                     "after scale factor in `%s'"),
8847                                   operand_string);
8848                           return 0;
8849                         }
8850                     }
8851                   else if (!i.index_reg)
8852                     {
8853                       as_bad (_("expecting index register or scale factor "
8854                                 "after `,'; got '%c'"),
8855                               *base_string);
8856                       return 0;
8857                     }
8858                 }
8859               else if (*base_string != ')')
8860                 {
8861                   as_bad (_("expecting `,' or `)' "
8862                             "after base register in `%s'"),
8863                           operand_string);
8864                   return 0;
8865                 }
8866             }
8867           else if (*base_string == REGISTER_PREFIX)
8868             {
8869               end_op = strchr (base_string, ',');
8870               if (end_op)
8871                 *end_op = '\0';
8872               as_bad (_("bad register name `%s'"), base_string);
8873               return 0;
8874             }
8875         }
8876
8877       /* If there's an expression beginning the operand, parse it,
8878          assuming displacement_string_start and
8879          displacement_string_end are meaningful.  */
8880       if (displacement_string_start != displacement_string_end)
8881         {
8882           if (!i386_displacement (displacement_string_start,
8883                                   displacement_string_end))
8884             return 0;
8885         }
8886
8887       /* Special case for (%dx) while doing input/output op.  */
8888       if (i.base_reg
8889           && operand_type_equal (&i.base_reg->reg_type,
8890                                  &reg16_inoutportreg)
8891           && i.index_reg == 0
8892           && i.log2_scale_factor == 0
8893           && i.seg[i.mem_operands] == 0
8894           && !operand_type_check (i.types[this_operand], disp))
8895         {
8896           i.types[this_operand] = inoutportreg;
8897           return 1;
8898         }
8899
8900       if (i386_index_check (operand_string) == 0)
8901         return 0;
8902       i.types[this_operand].bitfield.mem = 1;
8903       i.mem_operands++;
8904     }
8905   else
8906     {
8907       /* It's not a memory operand; argh!  */
8908       as_bad (_("invalid char %s beginning operand %d `%s'"),
8909               output_invalid (*op_string),
8910               this_operand + 1,
8911               op_string);
8912       return 0;
8913     }
8914   return 1;                     /* Normal return.  */
8915 }
8916 \f
8917 /* Calculate the maximum variable size (i.e., excluding fr_fix)
8918    that an rs_machine_dependent frag may reach.  */
8919
8920 unsigned int
8921 i386_frag_max_var (fragS *frag)
8922 {
8923   /* The only relaxable frags are for jumps.
8924      Unconditional jumps can grow by 4 bytes and others by 5 bytes.  */
8925   gas_assert (frag->fr_type == rs_machine_dependent);
8926   return TYPE_FROM_RELAX_STATE (frag->fr_subtype) == UNCOND_JUMP ? 4 : 5;
8927 }
8928
8929 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
8930 static int
8931 elf_symbol_resolved_in_segment_p (symbolS *fr_symbol, offsetT fr_var)
8932 {
8933   /* STT_GNU_IFUNC symbol must go through PLT.  */
8934   if ((symbol_get_bfdsym (fr_symbol)->flags
8935        & BSF_GNU_INDIRECT_FUNCTION) != 0)
8936     return 0;
8937
8938   if (!S_IS_EXTERNAL (fr_symbol))
8939     /* Symbol may be weak or local.  */
8940     return !S_IS_WEAK (fr_symbol);
8941
8942   /* Global symbols with non-default visibility can't be preempted. */
8943   if (ELF_ST_VISIBILITY (S_GET_OTHER (fr_symbol)) != STV_DEFAULT)
8944     return 1;
8945
8946   if (fr_var != NO_RELOC)
8947     switch ((enum bfd_reloc_code_real) fr_var)
8948       {
8949       case BFD_RELOC_386_PLT32:
8950       case BFD_RELOC_X86_64_PLT32:
8951         /* Symbol with PLT relocatin may be preempted. */
8952         return 0;
8953       default:
8954         abort ();
8955       }
8956
8957   /* Global symbols with default visibility in a shared library may be
8958      preempted by another definition.  */
8959   return !shared;
8960 }
8961 #endif
8962
8963 /* md_estimate_size_before_relax()
8964
8965    Called just before relax() for rs_machine_dependent frags.  The x86
8966    assembler uses these frags to handle variable size jump
8967    instructions.
8968
8969    Any symbol that is now undefined will not become defined.
8970    Return the correct fr_subtype in the frag.
8971    Return the initial "guess for variable size of frag" to caller.
8972    The guess is actually the growth beyond the fixed part.  Whatever
8973    we do to grow the fixed or variable part contributes to our
8974    returned value.  */
8975
8976 int
8977 md_estimate_size_before_relax (fragS *fragP, segT segment)
8978 {
8979   /* We've already got fragP->fr_subtype right;  all we have to do is
8980      check for un-relaxable symbols.  On an ELF system, we can't relax
8981      an externally visible symbol, because it may be overridden by a
8982      shared library.  */
8983   if (S_GET_SEGMENT (fragP->fr_symbol) != segment
8984 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
8985       || (IS_ELF
8986           && !elf_symbol_resolved_in_segment_p (fragP->fr_symbol,
8987                                                 fragP->fr_var))
8988 #endif
8989 #if defined (OBJ_COFF) && defined (TE_PE)
8990       || (OUTPUT_FLAVOR == bfd_target_coff_flavour
8991           && S_IS_WEAK (fragP->fr_symbol))
8992 #endif
8993       )
8994     {
8995       /* Symbol is undefined in this segment, or we need to keep a
8996          reloc so that weak symbols can be overridden.  */
8997       int size = (fragP->fr_subtype & CODE16) ? 2 : 4;
8998       enum bfd_reloc_code_real reloc_type;
8999       unsigned char *opcode;
9000       int old_fr_fix;
9001
9002       if (fragP->fr_var != NO_RELOC)
9003         reloc_type = (enum bfd_reloc_code_real) fragP->fr_var;
9004       else if (size == 2)
9005         reloc_type = BFD_RELOC_16_PCREL;
9006       else
9007         reloc_type = BFD_RELOC_32_PCREL;
9008
9009       old_fr_fix = fragP->fr_fix;
9010       opcode = (unsigned char *) fragP->fr_opcode;
9011
9012       switch (TYPE_FROM_RELAX_STATE (fragP->fr_subtype))
9013         {
9014         case UNCOND_JUMP:
9015           /* Make jmp (0xeb) a (d)word displacement jump.  */
9016           opcode[0] = 0xe9;
9017           fragP->fr_fix += size;
9018           fix_new (fragP, old_fr_fix, size,
9019                    fragP->fr_symbol,
9020                    fragP->fr_offset, 1,
9021                    reloc_type);
9022           break;
9023
9024         case COND_JUMP86:
9025           if (size == 2
9026               && (!no_cond_jump_promotion || fragP->fr_var != NO_RELOC))
9027             {
9028               /* Negate the condition, and branch past an
9029                  unconditional jump.  */
9030               opcode[0] ^= 1;
9031               opcode[1] = 3;
9032               /* Insert an unconditional jump.  */
9033               opcode[2] = 0xe9;
9034               /* We added two extra opcode bytes, and have a two byte
9035                  offset.  */
9036               fragP->fr_fix += 2 + 2;
9037               fix_new (fragP, old_fr_fix + 2, 2,
9038                        fragP->fr_symbol,
9039                        fragP->fr_offset, 1,
9040                        reloc_type);
9041               break;
9042             }
9043           /* Fall through.  */
9044
9045         case COND_JUMP:
9046           if (no_cond_jump_promotion && fragP->fr_var == NO_RELOC)
9047             {
9048               fixS *fixP;
9049
9050               fragP->fr_fix += 1;
9051               fixP = fix_new (fragP, old_fr_fix, 1,
9052                               fragP->fr_symbol,
9053                               fragP->fr_offset, 1,
9054                               BFD_RELOC_8_PCREL);
9055               fixP->fx_signed = 1;
9056               break;
9057             }
9058
9059           /* This changes the byte-displacement jump 0x7N
9060              to the (d)word-displacement jump 0x0f,0x8N.  */
9061           opcode[1] = opcode[0] + 0x10;
9062           opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
9063           /* We've added an opcode byte.  */
9064           fragP->fr_fix += 1 + size;
9065           fix_new (fragP, old_fr_fix + 1, size,
9066                    fragP->fr_symbol,
9067                    fragP->fr_offset, 1,
9068                    reloc_type);
9069           break;
9070
9071         default:
9072           BAD_CASE (fragP->fr_subtype);
9073           break;
9074         }
9075       frag_wane (fragP);
9076       return fragP->fr_fix - old_fr_fix;
9077     }
9078
9079   /* Guess size depending on current relax state.  Initially the relax
9080      state will correspond to a short jump and we return 1, because
9081      the variable part of the frag (the branch offset) is one byte
9082      long.  However, we can relax a section more than once and in that
9083      case we must either set fr_subtype back to the unrelaxed state,
9084      or return the value for the appropriate branch.  */
9085   return md_relax_table[fragP->fr_subtype].rlx_length;
9086 }
9087
9088 /* Called after relax() is finished.
9089
9090    In:  Address of frag.
9091         fr_type == rs_machine_dependent.
9092         fr_subtype is what the address relaxed to.
9093
9094    Out: Any fixSs and constants are set up.
9095         Caller will turn frag into a ".space 0".  */
9096
9097 void
9098 md_convert_frag (bfd *abfd ATTRIBUTE_UNUSED, segT sec ATTRIBUTE_UNUSED,
9099                  fragS *fragP)
9100 {
9101   unsigned char *opcode;
9102   unsigned char *where_to_put_displacement = NULL;
9103   offsetT target_address;
9104   offsetT opcode_address;
9105   unsigned int extension = 0;
9106   offsetT displacement_from_opcode_start;
9107
9108   opcode = (unsigned char *) fragP->fr_opcode;
9109
9110   /* Address we want to reach in file space.  */
9111   target_address = S_GET_VALUE (fragP->fr_symbol) + fragP->fr_offset;
9112
9113   /* Address opcode resides at in file space.  */
9114   opcode_address = fragP->fr_address + fragP->fr_fix;
9115
9116   /* Displacement from opcode start to fill into instruction.  */
9117   displacement_from_opcode_start = target_address - opcode_address;
9118
9119   if ((fragP->fr_subtype & BIG) == 0)
9120     {
9121       /* Don't have to change opcode.  */
9122       extension = 1;            /* 1 opcode + 1 displacement  */
9123       where_to_put_displacement = &opcode[1];
9124     }
9125   else
9126     {
9127       if (no_cond_jump_promotion
9128           && TYPE_FROM_RELAX_STATE (fragP->fr_subtype) != UNCOND_JUMP)
9129         as_warn_where (fragP->fr_file, fragP->fr_line,
9130                        _("long jump required"));
9131
9132       switch (fragP->fr_subtype)
9133         {
9134         case ENCODE_RELAX_STATE (UNCOND_JUMP, BIG):
9135           extension = 4;                /* 1 opcode + 4 displacement  */
9136           opcode[0] = 0xe9;
9137           where_to_put_displacement = &opcode[1];
9138           break;
9139
9140         case ENCODE_RELAX_STATE (UNCOND_JUMP, BIG16):
9141           extension = 2;                /* 1 opcode + 2 displacement  */
9142           opcode[0] = 0xe9;
9143           where_to_put_displacement = &opcode[1];
9144           break;
9145
9146         case ENCODE_RELAX_STATE (COND_JUMP, BIG):
9147         case ENCODE_RELAX_STATE (COND_JUMP86, BIG):
9148           extension = 5;                /* 2 opcode + 4 displacement  */
9149           opcode[1] = opcode[0] + 0x10;
9150           opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
9151           where_to_put_displacement = &opcode[2];
9152           break;
9153
9154         case ENCODE_RELAX_STATE (COND_JUMP, BIG16):
9155           extension = 3;                /* 2 opcode + 2 displacement  */
9156           opcode[1] = opcode[0] + 0x10;
9157           opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
9158           where_to_put_displacement = &opcode[2];
9159           break;
9160
9161         case ENCODE_RELAX_STATE (COND_JUMP86, BIG16):
9162           extension = 4;
9163           opcode[0] ^= 1;
9164           opcode[1] = 3;
9165           opcode[2] = 0xe9;
9166           where_to_put_displacement = &opcode[3];
9167           break;
9168
9169         default:
9170           BAD_CASE (fragP->fr_subtype);
9171           break;
9172         }
9173     }
9174
9175   /* If size if less then four we are sure that the operand fits,
9176      but if it's 4, then it could be that the displacement is larger
9177      then -/+ 2GB.  */
9178   if (DISP_SIZE_FROM_RELAX_STATE (fragP->fr_subtype) == 4
9179       && object_64bit
9180       && ((addressT) (displacement_from_opcode_start - extension
9181                       + ((addressT) 1 << 31))
9182           > (((addressT) 2 << 31) - 1)))
9183     {
9184       as_bad_where (fragP->fr_file, fragP->fr_line,
9185                     _("jump target out of range"));
9186       /* Make us emit 0.  */
9187       displacement_from_opcode_start = extension;
9188     }
9189   /* Now put displacement after opcode.  */
9190   md_number_to_chars ((char *) where_to_put_displacement,
9191                       (valueT) (displacement_from_opcode_start - extension),
9192                       DISP_SIZE_FROM_RELAX_STATE (fragP->fr_subtype));
9193   fragP->fr_fix += extension;
9194 }
9195 \f
9196 /* Apply a fixup (fixP) to segment data, once it has been determined
9197    by our caller that we have all the info we need to fix it up.
9198
9199    Parameter valP is the pointer to the value of the bits.
9200
9201    On the 386, immediates, displacements, and data pointers are all in
9202    the same (little-endian) format, so we don't need to care about which
9203    we are handling.  */
9204
9205 void
9206 md_apply_fix (fixS *fixP, valueT *valP, segT seg ATTRIBUTE_UNUSED)
9207 {
9208   char *p = fixP->fx_where + fixP->fx_frag->fr_literal;
9209   valueT value = *valP;
9210
9211 #if !defined (TE_Mach)
9212   if (fixP->fx_pcrel)
9213     {
9214       switch (fixP->fx_r_type)
9215         {
9216         default:
9217           break;
9218
9219         case BFD_RELOC_64:
9220           fixP->fx_r_type = BFD_RELOC_64_PCREL;
9221           break;
9222         case BFD_RELOC_32:
9223         case BFD_RELOC_X86_64_32S:
9224           fixP->fx_r_type = BFD_RELOC_32_PCREL;
9225           break;
9226         case BFD_RELOC_16:
9227           fixP->fx_r_type = BFD_RELOC_16_PCREL;
9228           break;
9229         case BFD_RELOC_8:
9230           fixP->fx_r_type = BFD_RELOC_8_PCREL;
9231           break;
9232         }
9233     }
9234
9235   if (fixP->fx_addsy != NULL
9236       && (fixP->fx_r_type == BFD_RELOC_32_PCREL
9237           || fixP->fx_r_type == BFD_RELOC_64_PCREL
9238           || fixP->fx_r_type == BFD_RELOC_16_PCREL
9239           || fixP->fx_r_type == BFD_RELOC_8_PCREL)
9240       && !use_rela_relocations)
9241     {
9242       /* This is a hack.  There should be a better way to handle this.
9243          This covers for the fact that bfd_install_relocation will
9244          subtract the current location (for partial_inplace, PC relative
9245          relocations); see more below.  */
9246 #ifndef OBJ_AOUT
9247       if (IS_ELF
9248 #ifdef TE_PE
9249           || OUTPUT_FLAVOR == bfd_target_coff_flavour
9250 #endif
9251           )
9252         value += fixP->fx_where + fixP->fx_frag->fr_address;
9253 #endif
9254 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
9255       if (IS_ELF)
9256         {
9257           segT sym_seg = S_GET_SEGMENT (fixP->fx_addsy);
9258
9259           if ((sym_seg == seg
9260                || (symbol_section_p (fixP->fx_addsy)
9261                    && sym_seg != absolute_section))
9262               && !generic_force_reloc (fixP))
9263             {
9264               /* Yes, we add the values in twice.  This is because
9265                  bfd_install_relocation subtracts them out again.  I think
9266                  bfd_install_relocation is broken, but I don't dare change
9267                  it.  FIXME.  */
9268               value += fixP->fx_where + fixP->fx_frag->fr_address;
9269             }
9270         }
9271 #endif
9272 #if defined (OBJ_COFF) && defined (TE_PE)
9273       /* For some reason, the PE format does not store a
9274          section address offset for a PC relative symbol.  */
9275       if (S_GET_SEGMENT (fixP->fx_addsy) != seg
9276           || S_IS_WEAK (fixP->fx_addsy))
9277         value += md_pcrel_from (fixP);
9278 #endif
9279     }
9280 #if defined (OBJ_COFF) && defined (TE_PE)
9281   if (fixP->fx_addsy != NULL
9282       && S_IS_WEAK (fixP->fx_addsy)
9283       /* PR 16858: Do not modify weak function references.  */
9284       && ! fixP->fx_pcrel)
9285     {
9286 #if !defined (TE_PEP)
9287       /* For x86 PE weak function symbols are neither PC-relative
9288          nor do they set S_IS_FUNCTION.  So the only reliable way
9289          to detect them is to check the flags of their containing
9290          section.  */
9291       if (S_GET_SEGMENT (fixP->fx_addsy) != NULL
9292           && S_GET_SEGMENT (fixP->fx_addsy)->flags & SEC_CODE)
9293         ;
9294       else
9295 #endif
9296       value -= S_GET_VALUE (fixP->fx_addsy);
9297     }
9298 #endif
9299
9300   /* Fix a few things - the dynamic linker expects certain values here,
9301      and we must not disappoint it.  */
9302 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
9303   if (IS_ELF && fixP->fx_addsy)
9304     switch (fixP->fx_r_type)
9305       {
9306       case BFD_RELOC_386_PLT32:
9307       case BFD_RELOC_X86_64_PLT32:
9308         /* Make the jump instruction point to the address of the operand.  At
9309            runtime we merely add the offset to the actual PLT entry.  */
9310         value = -4;
9311         break;
9312
9313       case BFD_RELOC_386_TLS_GD:
9314       case BFD_RELOC_386_TLS_LDM:
9315       case BFD_RELOC_386_TLS_IE_32:
9316       case BFD_RELOC_386_TLS_IE:
9317       case BFD_RELOC_386_TLS_GOTIE:
9318       case BFD_RELOC_386_TLS_GOTDESC:
9319       case BFD_RELOC_X86_64_TLSGD:
9320       case BFD_RELOC_X86_64_TLSLD:
9321       case BFD_RELOC_X86_64_GOTTPOFF:
9322       case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
9323         value = 0; /* Fully resolved at runtime.  No addend.  */
9324         /* Fallthrough */
9325       case BFD_RELOC_386_TLS_LE:
9326       case BFD_RELOC_386_TLS_LDO_32:
9327       case BFD_RELOC_386_TLS_LE_32:
9328       case BFD_RELOC_X86_64_DTPOFF32:
9329       case BFD_RELOC_X86_64_DTPOFF64:
9330       case BFD_RELOC_X86_64_TPOFF32:
9331       case BFD_RELOC_X86_64_TPOFF64:
9332         S_SET_THREAD_LOCAL (fixP->fx_addsy);
9333         break;
9334
9335       case BFD_RELOC_386_TLS_DESC_CALL:
9336       case BFD_RELOC_X86_64_TLSDESC_CALL:
9337         value = 0; /* Fully resolved at runtime.  No addend.  */
9338         S_SET_THREAD_LOCAL (fixP->fx_addsy);
9339         fixP->fx_done = 0;
9340         return;
9341
9342       case BFD_RELOC_386_GOT32:
9343       case BFD_RELOC_X86_64_GOT32:
9344         value = 0; /* Fully resolved at runtime.  No addend.  */
9345         break;
9346
9347       case BFD_RELOC_VTABLE_INHERIT:
9348       case BFD_RELOC_VTABLE_ENTRY:
9349         fixP->fx_done = 0;
9350         return;
9351
9352       default:
9353         break;
9354       }
9355 #endif /* defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)  */
9356   *valP = value;
9357 #endif /* !defined (TE_Mach)  */
9358
9359   /* Are we finished with this relocation now?  */
9360   if (fixP->fx_addsy == NULL)
9361     fixP->fx_done = 1;
9362 #if defined (OBJ_COFF) && defined (TE_PE)
9363   else if (fixP->fx_addsy != NULL && S_IS_WEAK (fixP->fx_addsy))
9364     {
9365       fixP->fx_done = 0;
9366       /* Remember value for tc_gen_reloc.  */
9367       fixP->fx_addnumber = value;
9368       /* Clear out the frag for now.  */
9369       value = 0;
9370     }
9371 #endif
9372   else if (use_rela_relocations)
9373     {
9374       fixP->fx_no_overflow = 1;
9375       /* Remember value for tc_gen_reloc.  */
9376       fixP->fx_addnumber = value;
9377       value = 0;
9378     }
9379
9380   md_number_to_chars (p, value, fixP->fx_size);
9381 }
9382 \f
9383 const char *
9384 md_atof (int type, char *litP, int *sizeP)
9385 {
9386   /* This outputs the LITTLENUMs in REVERSE order;
9387      in accord with the bigendian 386.  */
9388   return ieee_md_atof (type, litP, sizeP, FALSE);
9389 }
9390 \f
9391 static char output_invalid_buf[sizeof (unsigned char) * 2 + 6];
9392
9393 static char *
9394 output_invalid (int c)
9395 {
9396   if (ISPRINT (c))
9397     snprintf (output_invalid_buf, sizeof (output_invalid_buf),
9398               "'%c'", c);
9399   else
9400     snprintf (output_invalid_buf, sizeof (output_invalid_buf),
9401               "(0x%x)", (unsigned char) c);
9402   return output_invalid_buf;
9403 }
9404
9405 /* REG_STRING starts *before* REGISTER_PREFIX.  */
9406
9407 static const reg_entry *
9408 parse_real_register (char *reg_string, char **end_op)
9409 {
9410   char *s = reg_string;
9411   char *p;
9412   char reg_name_given[MAX_REG_NAME_SIZE + 1];
9413   const reg_entry *r;
9414
9415   /* Skip possible REGISTER_PREFIX and possible whitespace.  */
9416   if (*s == REGISTER_PREFIX)
9417     ++s;
9418
9419   if (is_space_char (*s))
9420     ++s;
9421
9422   p = reg_name_given;
9423   while ((*p++ = register_chars[(unsigned char) *s]) != '\0')
9424     {
9425       if (p >= reg_name_given + MAX_REG_NAME_SIZE)
9426         return (const reg_entry *) NULL;
9427       s++;
9428     }
9429
9430   /* For naked regs, make sure that we are not dealing with an identifier.
9431      This prevents confusing an identifier like `eax_var' with register
9432      `eax'.  */
9433   if (allow_naked_reg && identifier_chars[(unsigned char) *s])
9434     return (const reg_entry *) NULL;
9435
9436   *end_op = s;
9437
9438   r = (const reg_entry *) hash_find (reg_hash, reg_name_given);
9439
9440   /* Handle floating point regs, allowing spaces in the (i) part.  */
9441   if (r == i386_regtab /* %st is first entry of table  */)
9442     {
9443       if (is_space_char (*s))
9444         ++s;
9445       if (*s == '(')
9446         {
9447           ++s;
9448           if (is_space_char (*s))
9449             ++s;
9450           if (*s >= '0' && *s <= '7')
9451             {
9452               int fpr = *s - '0';
9453               ++s;
9454               if (is_space_char (*s))
9455                 ++s;
9456               if (*s == ')')
9457                 {
9458                   *end_op = s + 1;
9459                   r = (const reg_entry *) hash_find (reg_hash, "st(0)");
9460                   know (r);
9461                   return r + fpr;
9462                 }
9463             }
9464           /* We have "%st(" then garbage.  */
9465           return (const reg_entry *) NULL;
9466         }
9467     }
9468
9469   if (r == NULL || allow_pseudo_reg)
9470     return r;
9471
9472   if (operand_type_all_zero (&r->reg_type))
9473     return (const reg_entry *) NULL;
9474
9475   if ((r->reg_type.bitfield.reg32
9476        || r->reg_type.bitfield.sreg3
9477        || r->reg_type.bitfield.control
9478        || r->reg_type.bitfield.debug
9479        || r->reg_type.bitfield.test)
9480       && !cpu_arch_flags.bitfield.cpui386)
9481     return (const reg_entry *) NULL;
9482
9483   if (r->reg_type.bitfield.floatreg
9484       && !cpu_arch_flags.bitfield.cpu8087
9485       && !cpu_arch_flags.bitfield.cpu287
9486       && !cpu_arch_flags.bitfield.cpu387)
9487     return (const reg_entry *) NULL;
9488
9489   if (r->reg_type.bitfield.regmmx && !cpu_arch_flags.bitfield.cpummx)
9490     return (const reg_entry *) NULL;
9491
9492   if (r->reg_type.bitfield.regxmm && !cpu_arch_flags.bitfield.cpusse)
9493     return (const reg_entry *) NULL;
9494
9495   if (r->reg_type.bitfield.regymm && !cpu_arch_flags.bitfield.cpuavx)
9496     return (const reg_entry *) NULL;
9497
9498   if ((r->reg_type.bitfield.regzmm || r->reg_type.bitfield.regmask)
9499        && !cpu_arch_flags.bitfield.cpuavx512f)
9500     return (const reg_entry *) NULL;
9501
9502   /* Don't allow fake index register unless allow_index_reg isn't 0. */
9503   if (!allow_index_reg
9504       && (r->reg_num == RegEiz || r->reg_num == RegRiz))
9505     return (const reg_entry *) NULL;
9506
9507   /* Upper 16 vector register is only available with VREX in 64bit
9508      mode.  */
9509   if ((r->reg_flags & RegVRex))
9510     {
9511       if (!cpu_arch_flags.bitfield.cpuvrex
9512           || flag_code != CODE_64BIT)
9513         return (const reg_entry *) NULL;
9514
9515       i.need_vrex = 1;
9516     }
9517
9518   if (((r->reg_flags & (RegRex64 | RegRex))
9519        || r->reg_type.bitfield.reg64)
9520       && (!cpu_arch_flags.bitfield.cpulm
9521           || !operand_type_equal (&r->reg_type, &control))
9522       && flag_code != CODE_64BIT)
9523     return (const reg_entry *) NULL;
9524
9525   if (r->reg_type.bitfield.sreg3 && r->reg_num == RegFlat && !intel_syntax)
9526     return (const reg_entry *) NULL;
9527
9528   return r;
9529 }
9530
9531 /* REG_STRING starts *before* REGISTER_PREFIX.  */
9532
9533 static const reg_entry *
9534 parse_register (char *reg_string, char **end_op)
9535 {
9536   const reg_entry *r;
9537
9538   if (*reg_string == REGISTER_PREFIX || allow_naked_reg)
9539     r = parse_real_register (reg_string, end_op);
9540   else
9541     r = NULL;
9542   if (!r)
9543     {
9544       char *save = input_line_pointer;
9545       char c;
9546       symbolS *symbolP;
9547
9548       input_line_pointer = reg_string;
9549       c = get_symbol_name (&reg_string);
9550       symbolP = symbol_find (reg_string);
9551       if (symbolP && S_GET_SEGMENT (symbolP) == reg_section)
9552         {
9553           const expressionS *e = symbol_get_value_expression (symbolP);
9554
9555           know (e->X_op == O_register);
9556           know (e->X_add_number >= 0
9557                 && (valueT) e->X_add_number < i386_regtab_size);
9558           r = i386_regtab + e->X_add_number;
9559           if ((r->reg_flags & RegVRex))
9560             i.need_vrex = 1;
9561           *end_op = input_line_pointer;
9562         }
9563       *input_line_pointer = c;
9564       input_line_pointer = save;
9565     }
9566   return r;
9567 }
9568
9569 int
9570 i386_parse_name (char *name, expressionS *e, char *nextcharP)
9571 {
9572   const reg_entry *r;
9573   char *end = input_line_pointer;
9574
9575   *end = *nextcharP;
9576   r = parse_register (name, &input_line_pointer);
9577   if (r && end <= input_line_pointer)
9578     {
9579       *nextcharP = *input_line_pointer;
9580       *input_line_pointer = 0;
9581       e->X_op = O_register;
9582       e->X_add_number = r - i386_regtab;
9583       return 1;
9584     }
9585   input_line_pointer = end;
9586   *end = 0;
9587   return intel_syntax ? i386_intel_parse_name (name, e) : 0;
9588 }
9589
9590 void
9591 md_operand (expressionS *e)
9592 {
9593   char *end;
9594   const reg_entry *r;
9595
9596   switch (*input_line_pointer)
9597     {
9598     case REGISTER_PREFIX:
9599       r = parse_real_register (input_line_pointer, &end);
9600       if (r)
9601         {
9602           e->X_op = O_register;
9603           e->X_add_number = r - i386_regtab;
9604           input_line_pointer = end;
9605         }
9606       break;
9607
9608     case '[':
9609       gas_assert (intel_syntax);
9610       end = input_line_pointer++;
9611       expression (e);
9612       if (*input_line_pointer == ']')
9613         {
9614           ++input_line_pointer;
9615           e->X_op_symbol = make_expr_symbol (e);
9616           e->X_add_symbol = NULL;
9617           e->X_add_number = 0;
9618           e->X_op = O_index;
9619         }
9620       else
9621         {
9622           e->X_op = O_absent;
9623           input_line_pointer = end;
9624         }
9625       break;
9626     }
9627 }
9628
9629 \f
9630 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
9631 const char *md_shortopts = "kVQ:sqn";
9632 #else
9633 const char *md_shortopts = "qn";
9634 #endif
9635
9636 #define OPTION_32 (OPTION_MD_BASE + 0)
9637 #define OPTION_64 (OPTION_MD_BASE + 1)
9638 #define OPTION_DIVIDE (OPTION_MD_BASE + 2)
9639 #define OPTION_MARCH (OPTION_MD_BASE + 3)
9640 #define OPTION_MTUNE (OPTION_MD_BASE + 4)
9641 #define OPTION_MMNEMONIC (OPTION_MD_BASE + 5)
9642 #define OPTION_MSYNTAX (OPTION_MD_BASE + 6)
9643 #define OPTION_MINDEX_REG (OPTION_MD_BASE + 7)
9644 #define OPTION_MNAKED_REG (OPTION_MD_BASE + 8)
9645 #define OPTION_MOLD_GCC (OPTION_MD_BASE + 9)
9646 #define OPTION_MSSE2AVX (OPTION_MD_BASE + 10)
9647 #define OPTION_MSSE_CHECK (OPTION_MD_BASE + 11)
9648 #define OPTION_MOPERAND_CHECK (OPTION_MD_BASE + 12)
9649 #define OPTION_MAVXSCALAR (OPTION_MD_BASE + 13)
9650 #define OPTION_X32 (OPTION_MD_BASE + 14)
9651 #define OPTION_MADD_BND_PREFIX (OPTION_MD_BASE + 15)
9652 #define OPTION_MEVEXLIG (OPTION_MD_BASE + 16)
9653 #define OPTION_MEVEXWIG (OPTION_MD_BASE + 17)
9654 #define OPTION_MBIG_OBJ (OPTION_MD_BASE + 18)
9655 #define OPTION_MOMIT_LOCK_PREFIX (OPTION_MD_BASE + 19)
9656 #define OPTION_MEVEXRCIG (OPTION_MD_BASE + 20)
9657 #define OPTION_MSHARED (OPTION_MD_BASE + 21)
9658 #define OPTION_MAMD64 (OPTION_MD_BASE + 22)
9659 #define OPTION_MINTEL64 (OPTION_MD_BASE + 23)
9660 #define OPTION_MFENCE_AS_LOCK_ADD (OPTION_MD_BASE + 24)
9661 #define OPTION_MRELAX_RELOCATIONS (OPTION_MD_BASE + 25)
9662
9663 struct option md_longopts[] =
9664 {
9665   {"32", no_argument, NULL, OPTION_32},
9666 #if (defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
9667      || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
9668   {"64", no_argument, NULL, OPTION_64},
9669 #endif
9670 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
9671   {"x32", no_argument, NULL, OPTION_X32},
9672   {"mshared", no_argument, NULL, OPTION_MSHARED},
9673 #endif
9674   {"divide", no_argument, NULL, OPTION_DIVIDE},
9675   {"march", required_argument, NULL, OPTION_MARCH},
9676   {"mtune", required_argument, NULL, OPTION_MTUNE},
9677   {"mmnemonic", required_argument, NULL, OPTION_MMNEMONIC},
9678   {"msyntax", required_argument, NULL, OPTION_MSYNTAX},
9679   {"mindex-reg", no_argument, NULL, OPTION_MINDEX_REG},
9680   {"mnaked-reg", no_argument, NULL, OPTION_MNAKED_REG},
9681   {"mold-gcc", no_argument, NULL, OPTION_MOLD_GCC},
9682   {"msse2avx", no_argument, NULL, OPTION_MSSE2AVX},
9683   {"msse-check", required_argument, NULL, OPTION_MSSE_CHECK},
9684   {"moperand-check", required_argument, NULL, OPTION_MOPERAND_CHECK},
9685   {"mavxscalar", required_argument, NULL, OPTION_MAVXSCALAR},
9686   {"madd-bnd-prefix", no_argument, NULL, OPTION_MADD_BND_PREFIX},
9687   {"mevexlig", required_argument, NULL, OPTION_MEVEXLIG},
9688   {"mevexwig", required_argument, NULL, OPTION_MEVEXWIG},
9689 # if defined (TE_PE) || defined (TE_PEP)
9690   {"mbig-obj", no_argument, NULL, OPTION_MBIG_OBJ},
9691 #endif
9692   {"momit-lock-prefix", required_argument, NULL, OPTION_MOMIT_LOCK_PREFIX},
9693   {"mfence-as-lock-add", required_argument, NULL, OPTION_MFENCE_AS_LOCK_ADD},
9694   {"mrelax-relocations", required_argument, NULL, OPTION_MRELAX_RELOCATIONS},
9695   {"mevexrcig", required_argument, NULL, OPTION_MEVEXRCIG},
9696   {"mamd64", no_argument, NULL, OPTION_MAMD64},
9697   {"mintel64", no_argument, NULL, OPTION_MINTEL64},
9698   {NULL, no_argument, NULL, 0}
9699 };
9700 size_t md_longopts_size = sizeof (md_longopts);
9701
9702 int
9703 md_parse_option (int c, const char *arg)
9704 {
9705   unsigned int j;
9706   char *arch, *next;
9707
9708   switch (c)
9709     {
9710     case 'n':
9711       optimize_align_code = 0;
9712       break;
9713
9714     case 'q':
9715       quiet_warnings = 1;
9716       break;
9717
9718 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
9719       /* -Qy, -Qn: SVR4 arguments controlling whether a .comment section
9720          should be emitted or not.  FIXME: Not implemented.  */
9721     case 'Q':
9722       break;
9723
9724       /* -V: SVR4 argument to print version ID.  */
9725     case 'V':
9726       print_version_id ();
9727       break;
9728
9729       /* -k: Ignore for FreeBSD compatibility.  */
9730     case 'k':
9731       break;
9732
9733     case 's':
9734       /* -s: On i386 Solaris, this tells the native assembler to use
9735          .stab instead of .stab.excl.  We always use .stab anyhow.  */
9736       break;
9737
9738     case OPTION_MSHARED:
9739       shared = 1;
9740       break;
9741 #endif
9742 #if (defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
9743      || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
9744     case OPTION_64:
9745       {
9746         const char **list, **l;
9747
9748         list = bfd_target_list ();
9749         for (l = list; *l != NULL; l++)
9750           if (CONST_STRNEQ (*l, "elf64-x86-64")
9751               || strcmp (*l, "coff-x86-64") == 0
9752               || strcmp (*l, "pe-x86-64") == 0
9753               || strcmp (*l, "pei-x86-64") == 0
9754               || strcmp (*l, "mach-o-x86-64") == 0)
9755             {
9756               default_arch = "x86_64";
9757               break;
9758             }
9759         if (*l == NULL)
9760           as_fatal (_("no compiled in support for x86_64"));
9761         free (list);
9762       }
9763       break;
9764 #endif
9765
9766 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
9767     case OPTION_X32:
9768       if (IS_ELF)
9769         {
9770           const char **list, **l;
9771
9772           list = bfd_target_list ();
9773           for (l = list; *l != NULL; l++)
9774             if (CONST_STRNEQ (*l, "elf32-x86-64"))
9775               {
9776                 default_arch = "x86_64:32";
9777                 break;
9778               }
9779           if (*l == NULL)
9780             as_fatal (_("no compiled in support for 32bit x86_64"));
9781           free (list);
9782         }
9783       else
9784         as_fatal (_("32bit x86_64 is only supported for ELF"));
9785       break;
9786 #endif
9787
9788     case OPTION_32:
9789       default_arch = "i386";
9790       break;
9791
9792     case OPTION_DIVIDE:
9793 #ifdef SVR4_COMMENT_CHARS
9794       {
9795         char *n, *t;
9796         const char *s;
9797
9798         n = (char *) xmalloc (strlen (i386_comment_chars) + 1);
9799         t = n;
9800         for (s = i386_comment_chars; *s != '\0'; s++)
9801           if (*s != '/')
9802             *t++ = *s;
9803         *t = '\0';
9804         i386_comment_chars = n;
9805       }
9806 #endif
9807       break;
9808
9809     case OPTION_MARCH:
9810       arch = xstrdup (arg);
9811       do
9812         {
9813           if (*arch == '.')
9814             as_fatal (_("invalid -march= option: `%s'"), arg);
9815           next = strchr (arch, '+');
9816           if (next)
9817             *next++ = '\0';
9818           for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
9819             {
9820               if (strcmp (arch, cpu_arch [j].name) == 0)
9821                 {
9822                   /* Processor.  */
9823                   if (! cpu_arch[j].flags.bitfield.cpui386)
9824                     continue;
9825
9826                   cpu_arch_name = cpu_arch[j].name;
9827                   cpu_sub_arch_name = NULL;
9828                   cpu_arch_flags = cpu_arch[j].flags;
9829                   cpu_arch_isa = cpu_arch[j].type;
9830                   cpu_arch_isa_flags = cpu_arch[j].flags;
9831                   if (!cpu_arch_tune_set)
9832                     {
9833                       cpu_arch_tune = cpu_arch_isa;
9834                       cpu_arch_tune_flags = cpu_arch_isa_flags;
9835                     }
9836                   break;
9837                 }
9838               else if (*cpu_arch [j].name == '.'
9839                        && strcmp (arch, cpu_arch [j].name + 1) == 0)
9840                 {
9841                   /* ISA entension.  */
9842                   i386_cpu_flags flags;
9843
9844                   if (!cpu_arch[j].negated)
9845                     flags = cpu_flags_or (cpu_arch_flags,
9846                                           cpu_arch[j].flags);
9847                   else
9848                     flags = cpu_flags_and_not (cpu_arch_flags,
9849                                                cpu_arch[j].flags);
9850
9851                   if (!valid_iamcu_cpu_flags (&flags))
9852                     as_fatal (_("`%s' isn't valid for Intel MCU"), arch);
9853                   else if (!cpu_flags_equal (&flags, &cpu_arch_flags))
9854                     {
9855                       if (cpu_sub_arch_name)
9856                         {
9857                           char *name = cpu_sub_arch_name;
9858                           cpu_sub_arch_name = concat (name,
9859                                                       cpu_arch[j].name,
9860                                                       (const char *) NULL);
9861                           free (name);
9862                         }
9863                       else
9864                         cpu_sub_arch_name = xstrdup (cpu_arch[j].name);
9865                       cpu_arch_flags = flags;
9866                       cpu_arch_isa_flags = flags;
9867                     }
9868                   break;
9869                 }
9870             }
9871
9872           if (j >= ARRAY_SIZE (cpu_arch))
9873             as_fatal (_("invalid -march= option: `%s'"), arg);
9874
9875           arch = next;
9876         }
9877       while (next != NULL );
9878       break;
9879
9880     case OPTION_MTUNE:
9881       if (*arg == '.')
9882         as_fatal (_("invalid -mtune= option: `%s'"), arg);
9883       for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
9884         {
9885           if (strcmp (arg, cpu_arch [j].name) == 0)
9886             {
9887               cpu_arch_tune_set = 1;
9888               cpu_arch_tune = cpu_arch [j].type;
9889               cpu_arch_tune_flags = cpu_arch[j].flags;
9890               break;
9891             }
9892         }
9893       if (j >= ARRAY_SIZE (cpu_arch))
9894         as_fatal (_("invalid -mtune= option: `%s'"), arg);
9895       break;
9896
9897     case OPTION_MMNEMONIC:
9898       if (strcasecmp (arg, "att") == 0)
9899         intel_mnemonic = 0;
9900       else if (strcasecmp (arg, "intel") == 0)
9901         intel_mnemonic = 1;
9902       else
9903         as_fatal (_("invalid -mmnemonic= option: `%s'"), arg);
9904       break;
9905
9906     case OPTION_MSYNTAX:
9907       if (strcasecmp (arg, "att") == 0)
9908         intel_syntax = 0;
9909       else if (strcasecmp (arg, "intel") == 0)
9910         intel_syntax = 1;
9911       else
9912         as_fatal (_("invalid -msyntax= option: `%s'"), arg);
9913       break;
9914
9915     case OPTION_MINDEX_REG:
9916       allow_index_reg = 1;
9917       break;
9918
9919     case OPTION_MNAKED_REG:
9920       allow_naked_reg = 1;
9921       break;
9922
9923     case OPTION_MOLD_GCC:
9924       old_gcc = 1;
9925       break;
9926
9927     case OPTION_MSSE2AVX:
9928       sse2avx = 1;
9929       break;
9930
9931     case OPTION_MSSE_CHECK:
9932       if (strcasecmp (arg, "error") == 0)
9933         sse_check = check_error;
9934       else if (strcasecmp (arg, "warning") == 0)
9935         sse_check = check_warning;
9936       else if (strcasecmp (arg, "none") == 0)
9937         sse_check = check_none;
9938       else
9939         as_fatal (_("invalid -msse-check= option: `%s'"), arg);
9940       break;
9941
9942     case OPTION_MOPERAND_CHECK:
9943       if (strcasecmp (arg, "error") == 0)
9944         operand_check = check_error;
9945       else if (strcasecmp (arg, "warning") == 0)
9946         operand_check = check_warning;
9947       else if (strcasecmp (arg, "none") == 0)
9948         operand_check = check_none;
9949       else
9950         as_fatal (_("invalid -moperand-check= option: `%s'"), arg);
9951       break;
9952
9953     case OPTION_MAVXSCALAR:
9954       if (strcasecmp (arg, "128") == 0)
9955         avxscalar = vex128;
9956       else if (strcasecmp (arg, "256") == 0)
9957         avxscalar = vex256;
9958       else
9959         as_fatal (_("invalid -mavxscalar= option: `%s'"), arg);
9960       break;
9961
9962     case OPTION_MADD_BND_PREFIX:
9963       add_bnd_prefix = 1;
9964       break;
9965
9966     case OPTION_MEVEXLIG:
9967       if (strcmp (arg, "128") == 0)
9968         evexlig = evexl128;
9969       else if (strcmp (arg, "256") == 0)
9970         evexlig = evexl256;
9971       else  if (strcmp (arg, "512") == 0)
9972         evexlig = evexl512;
9973       else
9974         as_fatal (_("invalid -mevexlig= option: `%s'"), arg);
9975       break;
9976
9977     case OPTION_MEVEXRCIG:
9978       if (strcmp (arg, "rne") == 0)
9979         evexrcig = rne;
9980       else if (strcmp (arg, "rd") == 0)
9981         evexrcig = rd;
9982       else if (strcmp (arg, "ru") == 0)
9983         evexrcig = ru;
9984       else if (strcmp (arg, "rz") == 0)
9985         evexrcig = rz;
9986       else
9987         as_fatal (_("invalid -mevexrcig= option: `%s'"), arg);
9988       break;
9989
9990     case OPTION_MEVEXWIG:
9991       if (strcmp (arg, "0") == 0)
9992         evexwig = evexw0;
9993       else if (strcmp (arg, "1") == 0)
9994         evexwig = evexw1;
9995       else
9996         as_fatal (_("invalid -mevexwig= option: `%s'"), arg);
9997       break;
9998
9999 # if defined (TE_PE) || defined (TE_PEP)
10000     case OPTION_MBIG_OBJ:
10001       use_big_obj = 1;
10002       break;
10003 #endif
10004
10005     case OPTION_MOMIT_LOCK_PREFIX:
10006       if (strcasecmp (arg, "yes") == 0)
10007         omit_lock_prefix = 1;
10008       else if (strcasecmp (arg, "no") == 0)
10009         omit_lock_prefix = 0;
10010       else
10011         as_fatal (_("invalid -momit-lock-prefix= option: `%s'"), arg);
10012       break;
10013
10014     case OPTION_MFENCE_AS_LOCK_ADD:
10015       if (strcasecmp (arg, "yes") == 0)
10016         avoid_fence = 1;
10017       else if (strcasecmp (arg, "no") == 0)
10018         avoid_fence = 0;
10019       else
10020         as_fatal (_("invalid -mfence-as-lock-add= option: `%s'"), arg);
10021       break;
10022
10023     case OPTION_MRELAX_RELOCATIONS:
10024       if (strcasecmp (arg, "yes") == 0)
10025         generate_relax_relocations = 1;
10026       else if (strcasecmp (arg, "no") == 0)
10027         generate_relax_relocations = 0;
10028       else
10029         as_fatal (_("invalid -mrelax-relocations= option: `%s'"), arg);
10030       break;
10031
10032     case OPTION_MAMD64:
10033       cpu_arch_flags.bitfield.cpuamd64 = 1;
10034       cpu_arch_flags.bitfield.cpuintel64 = 0;
10035       cpu_arch_isa_flags.bitfield.cpuamd64 = 1;
10036       cpu_arch_isa_flags.bitfield.cpuintel64 = 0;
10037       break;
10038
10039     case OPTION_MINTEL64:
10040       cpu_arch_flags.bitfield.cpuamd64 = 0;
10041       cpu_arch_flags.bitfield.cpuintel64 = 1;
10042       cpu_arch_isa_flags.bitfield.cpuamd64 = 0;
10043       cpu_arch_isa_flags.bitfield.cpuintel64 = 1;
10044       break;
10045
10046     default:
10047       return 0;
10048     }
10049   return 1;
10050 }
10051
10052 #define MESSAGE_TEMPLATE \
10053 "                                                                                "
10054
10055 static void
10056 show_arch (FILE *stream, int ext, int check)
10057 {
10058   static char message[] = MESSAGE_TEMPLATE;
10059   char *start = message + 27;
10060   char *p;
10061   int size = sizeof (MESSAGE_TEMPLATE);
10062   int left;
10063   const char *name;
10064   int len;
10065   unsigned int j;
10066
10067   p = start;
10068   left = size - (start - message);
10069   for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
10070     {
10071       /* Should it be skipped?  */
10072       if (cpu_arch [j].skip)
10073         continue;
10074
10075       name = cpu_arch [j].name;
10076       len = cpu_arch [j].len;
10077       if (*name == '.')
10078         {
10079           /* It is an extension.  Skip if we aren't asked to show it.  */
10080           if (ext)
10081             {
10082               name++;
10083               len--;
10084             }
10085           else
10086             continue;
10087         }
10088       else if (ext)
10089         {
10090           /* It is an processor.  Skip if we show only extension.  */
10091           continue;
10092         }
10093       else if (check && ! cpu_arch[j].flags.bitfield.cpui386)
10094         {
10095           /* It is an impossible processor - skip.  */
10096           continue;
10097         }
10098
10099       /* Reserve 2 spaces for ", " or ",\0" */
10100       left -= len + 2;
10101
10102       /* Check if there is any room.  */
10103       if (left >= 0)
10104         {
10105           if (p != start)
10106             {
10107               *p++ = ',';
10108               *p++ = ' ';
10109             }
10110           p = mempcpy (p, name, len);
10111         }
10112       else
10113         {
10114           /* Output the current message now and start a new one.  */
10115           *p++ = ',';
10116           *p = '\0';
10117           fprintf (stream, "%s\n", message);
10118           p = start;
10119           left = size - (start - message) - len - 2;
10120
10121           gas_assert (left >= 0);
10122
10123           p = mempcpy (p, name, len);
10124         }
10125     }
10126
10127   *p = '\0';
10128   fprintf (stream, "%s\n", message);
10129 }
10130
10131 void
10132 md_show_usage (FILE *stream)
10133 {
10134 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
10135   fprintf (stream, _("\
10136   -Q                      ignored\n\
10137   -V                      print assembler version number\n\
10138   -k                      ignored\n"));
10139 #endif
10140   fprintf (stream, _("\
10141   -n                      Do not optimize code alignment\n\
10142   -q                      quieten some warnings\n"));
10143 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
10144   fprintf (stream, _("\
10145   -s                      ignored\n"));
10146 #endif
10147 #if (defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
10148      || defined (TE_PE) || defined (TE_PEP))
10149   fprintf (stream, _("\
10150   --32/--64/--x32         generate 32bit/64bit/x32 code\n"));
10151 #endif
10152 #ifdef SVR4_COMMENT_CHARS
10153   fprintf (stream, _("\
10154   --divide                do not treat `/' as a comment character\n"));
10155 #else
10156   fprintf (stream, _("\
10157   --divide                ignored\n"));
10158 #endif
10159   fprintf (stream, _("\
10160   -march=CPU[,+EXTENSION...]\n\
10161                           generate code for CPU and EXTENSION, CPU is one of:\n"));
10162   show_arch (stream, 0, 1);
10163   fprintf (stream, _("\
10164                           EXTENSION is combination of:\n"));
10165   show_arch (stream, 1, 0);
10166   fprintf (stream, _("\
10167   -mtune=CPU              optimize for CPU, CPU is one of:\n"));
10168   show_arch (stream, 0, 0);
10169   fprintf (stream, _("\
10170   -msse2avx               encode SSE instructions with VEX prefix\n"));
10171   fprintf (stream, _("\
10172   -msse-check=[none|error|warning]\n\
10173                           check SSE instructions\n"));
10174   fprintf (stream, _("\
10175   -moperand-check=[none|error|warning]\n\
10176                           check operand combinations for validity\n"));
10177   fprintf (stream, _("\
10178   -mavxscalar=[128|256]   encode scalar AVX instructions with specific vector\n\
10179                            length\n"));
10180   fprintf (stream, _("\
10181   -mevexlig=[128|256|512] encode scalar EVEX instructions with specific vector\n\
10182                            length\n"));
10183   fprintf (stream, _("\
10184   -mevexwig=[0|1]         encode EVEX instructions with specific EVEX.W value\n\
10185                            for EVEX.W bit ignored instructions\n"));
10186   fprintf (stream, _("\
10187   -mevexrcig=[rne|rd|ru|rz]\n\
10188                           encode EVEX instructions with specific EVEX.RC value\n\
10189                            for SAE-only ignored instructions\n"));
10190   fprintf (stream, _("\
10191   -mmnemonic=[att|intel]  use AT&T/Intel mnemonic\n"));
10192   fprintf (stream, _("\
10193   -msyntax=[att|intel]    use AT&T/Intel syntax\n"));
10194   fprintf (stream, _("\
10195   -mindex-reg             support pseudo index registers\n"));
10196   fprintf (stream, _("\
10197   -mnaked-reg             don't require `%%' prefix for registers\n"));
10198   fprintf (stream, _("\
10199   -mold-gcc               support old (<= 2.8.1) versions of gcc\n"));
10200   fprintf (stream, _("\
10201   -madd-bnd-prefix        add BND prefix for all valid branches\n"));
10202   fprintf (stream, _("\
10203   -mshared                disable branch optimization for shared code\n"));
10204 # if defined (TE_PE) || defined (TE_PEP)
10205   fprintf (stream, _("\
10206   -mbig-obj               generate big object files\n"));
10207 #endif
10208   fprintf (stream, _("\
10209   -momit-lock-prefix=[no|yes]\n\
10210                           strip all lock prefixes\n"));
10211   fprintf (stream, _("\
10212   -mfence-as-lock-add=[no|yes]\n\
10213                           encode lfence, mfence and sfence as\n\
10214                            lock addl $0x0, (%%{re}sp)\n"));
10215   fprintf (stream, _("\
10216   -mrelax-relocations=[no|yes]\n\
10217                           generate relax relocations\n"));
10218   fprintf (stream, _("\
10219   -mamd64                 accept only AMD64 ISA\n"));
10220   fprintf (stream, _("\
10221   -mintel64               accept only Intel64 ISA\n"));
10222 }
10223
10224 #if ((defined (OBJ_MAYBE_COFF) && defined (OBJ_MAYBE_AOUT)) \
10225      || defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
10226      || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
10227
10228 /* Pick the target format to use.  */
10229
10230 const char *
10231 i386_target_format (void)
10232 {
10233   if (!strncmp (default_arch, "x86_64", 6))
10234     {
10235       update_code_flag (CODE_64BIT, 1);
10236       if (default_arch[6] == '\0')
10237         x86_elf_abi = X86_64_ABI;
10238       else
10239         x86_elf_abi = X86_64_X32_ABI;
10240     }
10241   else if (!strcmp (default_arch, "i386"))
10242     update_code_flag (CODE_32BIT, 1);
10243   else if (!strcmp (default_arch, "iamcu"))
10244     {
10245       update_code_flag (CODE_32BIT, 1);
10246       if (cpu_arch_isa == PROCESSOR_UNKNOWN)
10247         {
10248           static const i386_cpu_flags iamcu_flags = CPU_IAMCU_FLAGS;
10249           cpu_arch_name = "iamcu";
10250           cpu_sub_arch_name = NULL;
10251           cpu_arch_flags = iamcu_flags;
10252           cpu_arch_isa = PROCESSOR_IAMCU;
10253           cpu_arch_isa_flags = iamcu_flags;
10254           if (!cpu_arch_tune_set)
10255             {
10256               cpu_arch_tune = cpu_arch_isa;
10257               cpu_arch_tune_flags = cpu_arch_isa_flags;
10258             }
10259         }
10260       else
10261         as_fatal (_("Intel MCU doesn't support `%s' architecture"),
10262                   cpu_arch_name);
10263     }
10264   else
10265     as_fatal (_("unknown architecture"));
10266
10267   if (cpu_flags_all_zero (&cpu_arch_isa_flags))
10268     cpu_arch_isa_flags = cpu_arch[flag_code == CODE_64BIT].flags;
10269   if (cpu_flags_all_zero (&cpu_arch_tune_flags))
10270     cpu_arch_tune_flags = cpu_arch[flag_code == CODE_64BIT].flags;
10271
10272   switch (OUTPUT_FLAVOR)
10273     {
10274 #if defined (OBJ_MAYBE_AOUT) || defined (OBJ_AOUT)
10275     case bfd_target_aout_flavour:
10276       return AOUT_TARGET_FORMAT;
10277 #endif
10278 #if defined (OBJ_MAYBE_COFF) || defined (OBJ_COFF)
10279 # if defined (TE_PE) || defined (TE_PEP)
10280     case bfd_target_coff_flavour:
10281       if (flag_code == CODE_64BIT)
10282         return use_big_obj ? "pe-bigobj-x86-64" : "pe-x86-64";
10283       else
10284         return "pe-i386";
10285 # elif defined (TE_GO32)
10286     case bfd_target_coff_flavour:
10287       return "coff-go32";
10288 # else
10289     case bfd_target_coff_flavour:
10290       return "coff-i386";
10291 # endif
10292 #endif
10293 #if defined (OBJ_MAYBE_ELF) || defined (OBJ_ELF)
10294     case bfd_target_elf_flavour:
10295       {
10296         const char *format;
10297
10298         switch (x86_elf_abi)
10299           {
10300           default:
10301             format = ELF_TARGET_FORMAT;
10302             break;
10303           case X86_64_ABI:
10304             use_rela_relocations = 1;
10305             object_64bit = 1;
10306             format = ELF_TARGET_FORMAT64;
10307             break;
10308           case X86_64_X32_ABI:
10309             use_rela_relocations = 1;
10310             object_64bit = 1;
10311             disallow_64bit_reloc = 1;
10312             format = ELF_TARGET_FORMAT32;
10313             break;
10314           }
10315         if (cpu_arch_isa == PROCESSOR_L1OM)
10316           {
10317             if (x86_elf_abi != X86_64_ABI)
10318               as_fatal (_("Intel L1OM is 64bit only"));
10319             return ELF_TARGET_L1OM_FORMAT;
10320           }
10321         else if (cpu_arch_isa == PROCESSOR_K1OM)
10322           {
10323             if (x86_elf_abi != X86_64_ABI)
10324               as_fatal (_("Intel K1OM is 64bit only"));
10325             return ELF_TARGET_K1OM_FORMAT;
10326           }
10327         else if (cpu_arch_isa == PROCESSOR_IAMCU)
10328           {
10329             if (x86_elf_abi != I386_ABI)
10330               as_fatal (_("Intel MCU is 32bit only"));
10331             return ELF_TARGET_IAMCU_FORMAT;
10332           }
10333         else
10334           return format;
10335       }
10336 #endif
10337 #if defined (OBJ_MACH_O)
10338     case bfd_target_mach_o_flavour:
10339       if (flag_code == CODE_64BIT)
10340         {
10341           use_rela_relocations = 1;
10342           object_64bit = 1;
10343           return "mach-o-x86-64";
10344         }
10345       else
10346         return "mach-o-i386";
10347 #endif
10348     default:
10349       abort ();
10350       return NULL;
10351     }
10352 }
10353
10354 #endif /* OBJ_MAYBE_ more than one  */
10355 \f
10356 symbolS *
10357 md_undefined_symbol (char *name)
10358 {
10359   if (name[0] == GLOBAL_OFFSET_TABLE_NAME[0]
10360       && name[1] == GLOBAL_OFFSET_TABLE_NAME[1]
10361       && name[2] == GLOBAL_OFFSET_TABLE_NAME[2]
10362       && strcmp (name, GLOBAL_OFFSET_TABLE_NAME) == 0)
10363     {
10364       if (!GOT_symbol)
10365         {
10366           if (symbol_find (name))
10367             as_bad (_("GOT already in symbol table"));
10368           GOT_symbol = symbol_new (name, undefined_section,
10369                                    (valueT) 0, &zero_address_frag);
10370         };
10371       return GOT_symbol;
10372     }
10373   return 0;
10374 }
10375
10376 /* Round up a section size to the appropriate boundary.  */
10377
10378 valueT
10379 md_section_align (segT segment ATTRIBUTE_UNUSED, valueT size)
10380 {
10381 #if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
10382   if (OUTPUT_FLAVOR == bfd_target_aout_flavour)
10383     {
10384       /* For a.out, force the section size to be aligned.  If we don't do
10385          this, BFD will align it for us, but it will not write out the
10386          final bytes of the section.  This may be a bug in BFD, but it is
10387          easier to fix it here since that is how the other a.out targets
10388          work.  */
10389       int align;
10390
10391       align = bfd_get_section_alignment (stdoutput, segment);
10392       size = ((size + (1 << align) - 1) & (-((valueT) 1 << align)));
10393     }
10394 #endif
10395
10396   return size;
10397 }
10398
10399 /* On the i386, PC-relative offsets are relative to the start of the
10400    next instruction.  That is, the address of the offset, plus its
10401    size, since the offset is always the last part of the insn.  */
10402
10403 long
10404 md_pcrel_from (fixS *fixP)
10405 {
10406   return fixP->fx_size + fixP->fx_where + fixP->fx_frag->fr_address;
10407 }
10408
10409 #ifndef I386COFF
10410
10411 static void
10412 s_bss (int ignore ATTRIBUTE_UNUSED)
10413 {
10414   int temp;
10415
10416 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
10417   if (IS_ELF)
10418     obj_elf_section_change_hook ();
10419 #endif
10420   temp = get_absolute_expression ();
10421   subseg_set (bss_section, (subsegT) temp);
10422   demand_empty_rest_of_line ();
10423 }
10424
10425 #endif
10426
10427 void
10428 i386_validate_fix (fixS *fixp)
10429 {
10430   if (fixp->fx_subsy)
10431     {
10432       if (fixp->fx_subsy == GOT_symbol)
10433         {
10434           if (fixp->fx_r_type == BFD_RELOC_32_PCREL)
10435             {
10436               if (!object_64bit)
10437                 abort ();
10438 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
10439               if (fixp->fx_tcbit2)
10440                 fixp->fx_r_type = (fixp->fx_tcbit
10441                                    ? BFD_RELOC_X86_64_REX_GOTPCRELX
10442                                    : BFD_RELOC_X86_64_GOTPCRELX);
10443               else
10444 #endif
10445                 fixp->fx_r_type = BFD_RELOC_X86_64_GOTPCREL;
10446             }
10447           else
10448             {
10449               if (!object_64bit)
10450                 fixp->fx_r_type = BFD_RELOC_386_GOTOFF;
10451               else
10452                 fixp->fx_r_type = BFD_RELOC_X86_64_GOTOFF64;
10453             }
10454           fixp->fx_subsy = 0;
10455         }
10456     }
10457 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
10458   else if (!object_64bit)
10459     {
10460       if (fixp->fx_r_type == BFD_RELOC_386_GOT32
10461           && fixp->fx_tcbit2)
10462         fixp->fx_r_type = BFD_RELOC_386_GOT32X;
10463     }
10464 #endif
10465 }
10466
10467 arelent *
10468 tc_gen_reloc (asection *section ATTRIBUTE_UNUSED, fixS *fixp)
10469 {
10470   arelent *rel;
10471   bfd_reloc_code_real_type code;
10472
10473   switch (fixp->fx_r_type)
10474     {
10475 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
10476     case BFD_RELOC_SIZE32:
10477     case BFD_RELOC_SIZE64:
10478       if (S_IS_DEFINED (fixp->fx_addsy)
10479           && !S_IS_EXTERNAL (fixp->fx_addsy))
10480         {
10481           /* Resolve size relocation against local symbol to size of
10482              the symbol plus addend.  */
10483           valueT value = S_GET_SIZE (fixp->fx_addsy) + fixp->fx_offset;
10484           if (fixp->fx_r_type == BFD_RELOC_SIZE32
10485               && !fits_in_unsigned_long (value))
10486             as_bad_where (fixp->fx_file, fixp->fx_line,
10487                           _("symbol size computation overflow"));
10488           fixp->fx_addsy = NULL;
10489           fixp->fx_subsy = NULL;
10490           md_apply_fix (fixp, (valueT *) &value, NULL);
10491           return NULL;
10492         }
10493 #endif
10494
10495     case BFD_RELOC_X86_64_PLT32:
10496     case BFD_RELOC_X86_64_GOT32:
10497     case BFD_RELOC_X86_64_GOTPCREL:
10498     case BFD_RELOC_X86_64_GOTPCRELX:
10499     case BFD_RELOC_X86_64_REX_GOTPCRELX:
10500     case BFD_RELOC_386_PLT32:
10501     case BFD_RELOC_386_GOT32:
10502     case BFD_RELOC_386_GOT32X:
10503     case BFD_RELOC_386_GOTOFF:
10504     case BFD_RELOC_386_GOTPC:
10505     case BFD_RELOC_386_TLS_GD:
10506     case BFD_RELOC_386_TLS_LDM:
10507     case BFD_RELOC_386_TLS_LDO_32:
10508     case BFD_RELOC_386_TLS_IE_32:
10509     case BFD_RELOC_386_TLS_IE:
10510     case BFD_RELOC_386_TLS_GOTIE:
10511     case BFD_RELOC_386_TLS_LE_32:
10512     case BFD_RELOC_386_TLS_LE:
10513     case BFD_RELOC_386_TLS_GOTDESC:
10514     case BFD_RELOC_386_TLS_DESC_CALL:
10515     case BFD_RELOC_X86_64_TLSGD:
10516     case BFD_RELOC_X86_64_TLSLD:
10517     case BFD_RELOC_X86_64_DTPOFF32:
10518     case BFD_RELOC_X86_64_DTPOFF64:
10519     case BFD_RELOC_X86_64_GOTTPOFF:
10520     case BFD_RELOC_X86_64_TPOFF32:
10521     case BFD_RELOC_X86_64_TPOFF64:
10522     case BFD_RELOC_X86_64_GOTOFF64:
10523     case BFD_RELOC_X86_64_GOTPC32:
10524     case BFD_RELOC_X86_64_GOT64:
10525     case BFD_RELOC_X86_64_GOTPCREL64:
10526     case BFD_RELOC_X86_64_GOTPC64:
10527     case BFD_RELOC_X86_64_GOTPLT64:
10528     case BFD_RELOC_X86_64_PLTOFF64:
10529     case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
10530     case BFD_RELOC_X86_64_TLSDESC_CALL:
10531     case BFD_RELOC_RVA:
10532     case BFD_RELOC_VTABLE_ENTRY:
10533     case BFD_RELOC_VTABLE_INHERIT:
10534 #ifdef TE_PE
10535     case BFD_RELOC_32_SECREL:
10536 #endif
10537       code = fixp->fx_r_type;
10538       break;
10539     case BFD_RELOC_X86_64_32S:
10540       if (!fixp->fx_pcrel)
10541         {
10542           /* Don't turn BFD_RELOC_X86_64_32S into BFD_RELOC_32.  */
10543           code = fixp->fx_r_type;
10544           break;
10545         }
10546     default:
10547       if (fixp->fx_pcrel)
10548         {
10549           switch (fixp->fx_size)
10550             {
10551             default:
10552               as_bad_where (fixp->fx_file, fixp->fx_line,
10553                             _("can not do %d byte pc-relative relocation"),
10554                             fixp->fx_size);
10555               code = BFD_RELOC_32_PCREL;
10556               break;
10557             case 1: code = BFD_RELOC_8_PCREL;  break;
10558             case 2: code = BFD_RELOC_16_PCREL; break;
10559             case 4: code = BFD_RELOC_32_PCREL; break;
10560 #ifdef BFD64
10561             case 8: code = BFD_RELOC_64_PCREL; break;
10562 #endif
10563             }
10564         }
10565       else
10566         {
10567           switch (fixp->fx_size)
10568             {
10569             default:
10570               as_bad_where (fixp->fx_file, fixp->fx_line,
10571                             _("can not do %d byte relocation"),
10572                             fixp->fx_size);
10573               code = BFD_RELOC_32;
10574               break;
10575             case 1: code = BFD_RELOC_8;  break;
10576             case 2: code = BFD_RELOC_16; break;
10577             case 4: code = BFD_RELOC_32; break;
10578 #ifdef BFD64
10579             case 8: code = BFD_RELOC_64; break;
10580 #endif
10581             }
10582         }
10583       break;
10584     }
10585
10586   if ((code == BFD_RELOC_32
10587        || code == BFD_RELOC_32_PCREL
10588        || code == BFD_RELOC_X86_64_32S)
10589       && GOT_symbol
10590       && fixp->fx_addsy == GOT_symbol)
10591     {
10592       if (!object_64bit)
10593         code = BFD_RELOC_386_GOTPC;
10594       else
10595         code = BFD_RELOC_X86_64_GOTPC32;
10596     }
10597   if ((code == BFD_RELOC_64 || code == BFD_RELOC_64_PCREL)
10598       && GOT_symbol
10599       && fixp->fx_addsy == GOT_symbol)
10600     {
10601       code = BFD_RELOC_X86_64_GOTPC64;
10602     }
10603
10604   rel = (arelent *) xmalloc (sizeof (arelent));
10605   rel->sym_ptr_ptr = (asymbol **) xmalloc (sizeof (asymbol *));
10606   *rel->sym_ptr_ptr = symbol_get_bfdsym (fixp->fx_addsy);
10607
10608   rel->address = fixp->fx_frag->fr_address + fixp->fx_where;
10609
10610   if (!use_rela_relocations)
10611     {
10612       /* HACK: Since i386 ELF uses Rel instead of Rela, encode the
10613          vtable entry to be used in the relocation's section offset.  */
10614       if (fixp->fx_r_type == BFD_RELOC_VTABLE_ENTRY)
10615         rel->address = fixp->fx_offset;
10616 #if defined (OBJ_COFF) && defined (TE_PE)
10617       else if (fixp->fx_addsy && S_IS_WEAK (fixp->fx_addsy))
10618         rel->addend = fixp->fx_addnumber - (S_GET_VALUE (fixp->fx_addsy) * 2);
10619       else
10620 #endif
10621       rel->addend = 0;
10622     }
10623   /* Use the rela in 64bit mode.  */
10624   else
10625     {
10626       if (disallow_64bit_reloc)
10627         switch (code)
10628           {
10629           case BFD_RELOC_X86_64_DTPOFF64:
10630           case BFD_RELOC_X86_64_TPOFF64:
10631           case BFD_RELOC_64_PCREL:
10632           case BFD_RELOC_X86_64_GOTOFF64:
10633           case BFD_RELOC_X86_64_GOT64:
10634           case BFD_RELOC_X86_64_GOTPCREL64:
10635           case BFD_RELOC_X86_64_GOTPC64:
10636           case BFD_RELOC_X86_64_GOTPLT64:
10637           case BFD_RELOC_X86_64_PLTOFF64:
10638             as_bad_where (fixp->fx_file, fixp->fx_line,
10639                           _("cannot represent relocation type %s in x32 mode"),
10640                           bfd_get_reloc_code_name (code));
10641             break;
10642           default:
10643             break;
10644           }
10645
10646       if (!fixp->fx_pcrel)
10647         rel->addend = fixp->fx_offset;
10648       else
10649         switch (code)
10650           {
10651           case BFD_RELOC_X86_64_PLT32:
10652           case BFD_RELOC_X86_64_GOT32:
10653           case BFD_RELOC_X86_64_GOTPCREL:
10654           case BFD_RELOC_X86_64_GOTPCRELX:
10655           case BFD_RELOC_X86_64_REX_GOTPCRELX:
10656           case BFD_RELOC_X86_64_TLSGD:
10657           case BFD_RELOC_X86_64_TLSLD:
10658           case BFD_RELOC_X86_64_GOTTPOFF:
10659           case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
10660           case BFD_RELOC_X86_64_TLSDESC_CALL:
10661             rel->addend = fixp->fx_offset - fixp->fx_size;
10662             break;
10663           default:
10664             rel->addend = (section->vma
10665                            - fixp->fx_size
10666                            + fixp->fx_addnumber
10667                            + md_pcrel_from (fixp));
10668             break;
10669           }
10670     }
10671
10672   rel->howto = bfd_reloc_type_lookup (stdoutput, code);
10673   if (rel->howto == NULL)
10674     {
10675       as_bad_where (fixp->fx_file, fixp->fx_line,
10676                     _("cannot represent relocation type %s"),
10677                     bfd_get_reloc_code_name (code));
10678       /* Set howto to a garbage value so that we can keep going.  */
10679       rel->howto = bfd_reloc_type_lookup (stdoutput, BFD_RELOC_32);
10680       gas_assert (rel->howto != NULL);
10681     }
10682
10683   return rel;
10684 }
10685
10686 #include "tc-i386-intel.c"
10687
10688 void
10689 tc_x86_parse_to_dw2regnum (expressionS *exp)
10690 {
10691   int saved_naked_reg;
10692   char saved_register_dot;
10693
10694   saved_naked_reg = allow_naked_reg;
10695   allow_naked_reg = 1;
10696   saved_register_dot = register_chars['.'];
10697   register_chars['.'] = '.';
10698   allow_pseudo_reg = 1;
10699   expression_and_evaluate (exp);
10700   allow_pseudo_reg = 0;
10701   register_chars['.'] = saved_register_dot;
10702   allow_naked_reg = saved_naked_reg;
10703
10704   if (exp->X_op == O_register && exp->X_add_number >= 0)
10705     {
10706       if ((addressT) exp->X_add_number < i386_regtab_size)
10707         {
10708           exp->X_op = O_constant;
10709           exp->X_add_number = i386_regtab[exp->X_add_number]
10710                               .dw2_regnum[flag_code >> 1];
10711         }
10712       else
10713         exp->X_op = O_illegal;
10714     }
10715 }
10716
10717 void
10718 tc_x86_frame_initial_instructions (void)
10719 {
10720   static unsigned int sp_regno[2];
10721
10722   if (!sp_regno[flag_code >> 1])
10723     {
10724       char *saved_input = input_line_pointer;
10725       char sp[][4] = {"esp", "rsp"};
10726       expressionS exp;
10727
10728       input_line_pointer = sp[flag_code >> 1];
10729       tc_x86_parse_to_dw2regnum (&exp);
10730       gas_assert (exp.X_op == O_constant);
10731       sp_regno[flag_code >> 1] = exp.X_add_number;
10732       input_line_pointer = saved_input;
10733     }
10734
10735   cfi_add_CFA_def_cfa (sp_regno[flag_code >> 1], -x86_cie_data_alignment);
10736   cfi_add_CFA_offset (x86_dwarf2_return_column, x86_cie_data_alignment);
10737 }
10738
10739 int
10740 x86_dwarf2_addr_size (void)
10741 {
10742 #if defined (OBJ_MAYBE_ELF) || defined (OBJ_ELF)
10743   if (x86_elf_abi == X86_64_X32_ABI)
10744     return 4;
10745 #endif
10746   return bfd_arch_bits_per_address (stdoutput) / 8;
10747 }
10748
10749 int
10750 i386_elf_section_type (const char *str, size_t len)
10751 {
10752   if (flag_code == CODE_64BIT
10753       && len == sizeof ("unwind") - 1
10754       && strncmp (str, "unwind", 6) == 0)
10755     return SHT_X86_64_UNWIND;
10756
10757   return -1;
10758 }
10759
10760 #ifdef TE_SOLARIS
10761 void
10762 i386_solaris_fix_up_eh_frame (segT sec)
10763 {
10764   if (flag_code == CODE_64BIT)
10765     elf_section_type (sec) = SHT_X86_64_UNWIND;
10766 }
10767 #endif
10768
10769 #ifdef TE_PE
10770 void
10771 tc_pe_dwarf2_emit_offset (symbolS *symbol, unsigned int size)
10772 {
10773   expressionS exp;
10774
10775   exp.X_op = O_secrel;
10776   exp.X_add_symbol = symbol;
10777   exp.X_add_number = 0;
10778   emit_expr (&exp, size);
10779 }
10780 #endif
10781
10782 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
10783 /* For ELF on x86-64, add support for SHF_X86_64_LARGE.  */
10784
10785 bfd_vma
10786 x86_64_section_letter (int letter, const char **ptr_msg)
10787 {
10788   if (flag_code == CODE_64BIT)
10789     {
10790       if (letter == 'l')
10791         return SHF_X86_64_LARGE;
10792
10793       *ptr_msg = _("bad .section directive: want a,l,w,x,M,S,G,T in string");
10794     }
10795   else
10796     *ptr_msg = _("bad .section directive: want a,w,x,M,S,G,T in string");
10797   return -1;
10798 }
10799
10800 bfd_vma
10801 x86_64_section_word (char *str, size_t len)
10802 {
10803   if (len == 5 && flag_code == CODE_64BIT && CONST_STRNEQ (str, "large"))
10804     return SHF_X86_64_LARGE;
10805
10806   return -1;
10807 }
10808
10809 static void
10810 handle_large_common (int small ATTRIBUTE_UNUSED)
10811 {
10812   if (flag_code != CODE_64BIT)
10813     {
10814       s_comm_internal (0, elf_common_parse);
10815       as_warn (_(".largecomm supported only in 64bit mode, producing .comm"));
10816     }
10817   else
10818     {
10819       static segT lbss_section;
10820       asection *saved_com_section_ptr = elf_com_section_ptr;
10821       asection *saved_bss_section = bss_section;
10822
10823       if (lbss_section == NULL)
10824         {
10825           flagword applicable;
10826           segT seg = now_seg;
10827           subsegT subseg = now_subseg;
10828
10829           /* The .lbss section is for local .largecomm symbols.  */
10830           lbss_section = subseg_new (".lbss", 0);
10831           applicable = bfd_applicable_section_flags (stdoutput);
10832           bfd_set_section_flags (stdoutput, lbss_section,
10833                                  applicable & SEC_ALLOC);
10834           seg_info (lbss_section)->bss = 1;
10835
10836           subseg_set (seg, subseg);
10837         }
10838
10839       elf_com_section_ptr = &_bfd_elf_large_com_section;
10840       bss_section = lbss_section;
10841
10842       s_comm_internal (0, elf_common_parse);
10843
10844       elf_com_section_ptr = saved_com_section_ptr;
10845       bss_section = saved_bss_section;
10846     }
10847 }
10848 #endif /* OBJ_ELF || OBJ_MAYBE_ELF */