gas/config/tc-i386.c

   1 /* tc-i386.c -- Assemble code for the Intel 80386
   2    Copyright (C) 1989-2014 Free Software Foundation, Inc.
   3
   4    This file is part of GAS, the GNU Assembler.
   5
   6    GAS is free software; you can redistribute it and/or modify
   7    it under the terms of the GNU General Public License as published by
   8    the Free Software Foundation; either version 3, or (at your option)
   9    any later version.
  10
  11    GAS is distributed in the hope that it will be useful,
  12    but WITHOUT ANY WARRANTY; without even the implied warranty of
  13    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
  14    GNU General Public License for more details.
  15
  16    You should have received a copy of the GNU General Public License
  17    along with GAS; see the file COPYING.  If not, write to the Free
  18    Software Foundation, 51 Franklin Street - Fifth Floor, Boston, MA
  19    02110-1301, USA.  */
  20
  21 /* Intel 80386 machine specific gas.
  22    Written by Eliot Dresselhaus (eliot@mgm.mit.edu).
  23    x86_64 support by Jan Hubicka (jh@suse.cz)
  24    VIA PadLock support by Michal Ludvig (mludvig@suse.cz)
  25    Bugs & suggestions are completely welcome.  This is free software.
  26    Please help us make it better.  */
  27
  28 #include "as.h"
  29 #include "safe-ctype.h"
  30 #include "subsegs.h"
  31 #include "dwarf2dbg.h"
  32 #include "dw2gencfi.h"
  33 #include "elf/x86-64.h"
  34 #include "opcodes/i386-init.h"
  35
  36 #ifndef REGISTER_WARNINGS
  37 #define REGISTER_WARNINGS 1
  38 #endif
  39
  40 #ifndef INFER_ADDR_PREFIX
  41 #define INFER_ADDR_PREFIX 1
  42 #endif
  43
  44 #ifndef DEFAULT_ARCH
  45 #define DEFAULT_ARCH "i386"
  46 #endif
  47
  48 #ifndef INLINE
  49 #if __GNUC__ >= 2
  50 #define INLINE __inline__
  51 #else
  52 #define INLINE
  53 #endif
  54 #endif
  55
  56 /* Prefixes will be emitted in the order defined below.
  57    WAIT_PREFIX must be the first prefix since FWAIT is really is an
  58    instruction, and so must come before any prefixes.
  59    The preferred prefix order is SEG_PREFIX, ADDR_PREFIX, DATA_PREFIX,
  60    REP_PREFIX/HLE_PREFIX, LOCK_PREFIX.  */
  61 #define WAIT_PREFIX     0
  62 #define SEG_PREFIX      1
  63 #define ADDR_PREFIX     2
  64 #define DATA_PREFIX     3
  65 #define REP_PREFIX      4
  66 #define HLE_PREFIX      REP_PREFIX
  67 #define BND_PREFIX      REP_PREFIX
  68 #define LOCK_PREFIX     5
  69 #define REX_PREFIX      6       /* must come last.  */
  70 #define MAX_PREFIXES    7       /* max prefixes per opcode */
  71
  72 /* we define the syntax here (modulo base,index,scale syntax) */
  73 #define REGISTER_PREFIX '%'
  74 #define IMMEDIATE_PREFIX '$'
  75 #define ABSOLUTE_PREFIX '*'
  76
  77 /* these are the instruction mnemonic suffixes in AT&T syntax or
  78    memory operand size in Intel syntax.  */
  79 #define WORD_MNEM_SUFFIX  'w'
  80 #define BYTE_MNEM_SUFFIX  'b'
  81 #define SHORT_MNEM_SUFFIX 's'
  82 #define LONG_MNEM_SUFFIX  'l'
  83 #define QWORD_MNEM_SUFFIX  'q'
  84 #define XMMWORD_MNEM_SUFFIX  'x'
  85 #define YMMWORD_MNEM_SUFFIX 'y'
  86 #define ZMMWORD_MNEM_SUFFIX 'z'
  87 /* Intel Syntax.  Use a non-ascii letter since since it never appears
  88    in instructions.  */
  89 #define LONG_DOUBLE_MNEM_SUFFIX '\1'
  90
  91 #define END_OF_INSN '\0'
  92
  93 /*
  94   'templates' is for grouping together 'template' structures for opcodes
  95   of the same name.  This is only used for storing the insns in the grand
  96   ole hash table of insns.
  97   The templates themselves start at START and range up to (but not including)
  98   END.
  99   */
 100 typedef struct
 101 {
 102   const insn_template *start;
 103   const insn_template *end;
 104 }
 105 templates;
 106
 107 /* 386 operand encoding bytes:  see 386 book for details of this.  */
 108 typedef struct
 109 {
 110   unsigned int regmem;  /* codes register or memory operand */
 111   unsigned int reg;     /* codes register operand (or extended opcode) */
 112   unsigned int mode;    /* how to interpret regmem & reg */
 113 }
 114 modrm_byte;
 115
 116 /* x86-64 extension prefix.  */
 117 typedef int rex_byte;
 118
 119 /* 386 opcode byte to code indirect addressing.  */
 120 typedef struct
 121 {
 122   unsigned base;
 123   unsigned index;
 124   unsigned scale;
 125 }
 126 sib_byte;
 127
 128 /* x86 arch names, types and features */
 129 typedef struct
 130 {
 131   const char *name;             /* arch name */
 132   unsigned int len;             /* arch string length */
 133   enum processor_type type;     /* arch type */
 134   i386_cpu_flags flags;         /* cpu feature flags */
 135   unsigned int skip;            /* show_arch should skip this. */
 136   unsigned int negated;         /* turn off indicated flags.  */
 137 }
 138 arch_entry;
 139
 140 static void update_code_flag (int, int);
 141 static void set_code_flag (int);
 142 static void set_16bit_gcc_code_flag (int);
 143 static void set_intel_syntax (int);
 144 static void set_intel_mnemonic (int);
 145 static void set_allow_index_reg (int);
 146 static void set_check (int);
 147 static void set_cpu_arch (int);
 148 #ifdef TE_PE
 149 static void pe_directive_secrel (int);
 150 #endif
 151 static void signed_cons (int);
 152 static char *output_invalid (int c);
 153 static int i386_finalize_immediate (segT, expressionS *, i386_operand_type,
 154                                     const char *);
 155 static int i386_finalize_displacement (segT, expressionS *, i386_operand_type,
 156                                        const char *);
 157 static int i386_att_operand (char *);
 158 static int i386_intel_operand (char *, int);
 159 static int i386_intel_simplify (expressionS *);
 160 static int i386_intel_parse_name (const char *, expressionS *);
 161 static const reg_entry *parse_register (char *, char **);
 162 static char *parse_insn (char *, char *);
 163 static char *parse_operands (char *, const char *);
 164 static void swap_operands (void);
 165 static void swap_2_operands (int, int);
 166 static void optimize_imm (void);
 167 static void optimize_disp (void);
 168 static const insn_template *match_template (void);
 169 static int check_string (void);
 170 static int process_suffix (void);
 171 static int check_byte_reg (void);
 172 static int check_long_reg (void);
 173 static int check_qword_reg (void);
 174 static int check_word_reg (void);
 175 static int finalize_imm (void);
 176 static int process_operands (void);
 177 static const seg_entry *build_modrm_byte (void);
 178 static void output_insn (void);
 179 static void output_imm (fragS *, offsetT);
 180 static void output_disp (fragS *, offsetT);
 181 #ifndef I386COFF
 182 static void s_bss (int);
 183 #endif
 184 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
 185 static void handle_large_common (int small ATTRIBUTE_UNUSED);
 186 #endif
 187
 188 static const char *default_arch = DEFAULT_ARCH;
 189
 190 /* This struct describes rounding control and SAE in the instruction.  */
 191 struct RC_Operation
 192 {
 193   enum rc_type
 194     {
 195       rne = 0,
 196       rd,
 197       ru,
 198       rz,
 199       saeonly
 200     } type;
 201   int operand;
 202 };
 203
 204 static struct RC_Operation rc_op;
 205
 206 /* The struct describes masking, applied to OPERAND in the instruction.
 207    MASK is a pointer to the corresponding mask register.  ZEROING tells
 208    whether merging or zeroing mask is used.  */
 209 struct Mask_Operation
 210 {
 211   const reg_entry *mask;
 212   unsigned int zeroing;
 213   /* The operand where this operation is associated.  */
 214   int operand;
 215 };
 216
 217 static struct Mask_Operation mask_op;
 218
 219 /* The struct describes broadcasting, applied to OPERAND.  FACTOR is
 220    broadcast factor.  */
 221 struct Broadcast_Operation
 222 {
 223   /* Type of broadcast: no broadcast, {1to8}, or {1to16}.  */
 224   int type;
 225
 226   /* Index of broadcasted operand.  */
 227   int operand;
 228 };
 229
 230 static struct Broadcast_Operation broadcast_op;
 231
 232 /* VEX prefix.  */
 233 typedef struct
 234 {
 235   /* VEX prefix is either 2 byte or 3 byte.  EVEX is 4 byte.  */
 236   unsigned char bytes[4];
 237   unsigned int length;
 238   /* Destination or source register specifier.  */
 239   const reg_entry *register_specifier;
 240 } vex_prefix;
 241
 242 /* 'md_assemble ()' gathers together information and puts it into a
 243    i386_insn.  */
 244
 245 union i386_op
 246   {
 247     expressionS *disps;
 248     expressionS *imms;
 249     const reg_entry *regs;
 250   };
 251
 252 enum i386_error
 253   {
 254     operand_size_mismatch,
 255     operand_type_mismatch,
 256     register_type_mismatch,
 257     number_of_operands_mismatch,
 258     invalid_instruction_suffix,
 259     bad_imm4,
 260     old_gcc_only,
 261     unsupported_with_intel_mnemonic,
 262     unsupported_syntax,
 263     unsupported,
 264     invalid_vsib_address,
 265     invalid_vector_register_set,
 266     unsupported_vector_index_register,
 267     unsupported_broadcast,
 268     broadcast_not_on_src_operand,
 269     broadcast_needed,
 270     unsupported_masking,
 271     mask_not_on_destination,
 272     no_default_mask,
 273     unsupported_rc_sae,
 274     rc_sae_operand_not_last_imm,
 275     invalid_register_operand,
 276     try_vector_disp8
 277   };
 278
 279 struct _i386_insn
 280   {
 281     /* TM holds the template for the insn were currently assembling.  */
 282     insn_template tm;
 283
 284     /* SUFFIX holds the instruction size suffix for byte, word, dword
 285        or qword, if given.  */
 286     char suffix;
 287
 288     /* OPERANDS gives the number of given operands.  */
 289     unsigned int operands;
 290
 291     /* REG_OPERANDS, DISP_OPERANDS, MEM_OPERANDS, IMM_OPERANDS give the number
 292        of given register, displacement, memory operands and immediate
 293        operands.  */
 294     unsigned int reg_operands, disp_operands, mem_operands, imm_operands;
 295
 296     /* TYPES [i] is the type (see above #defines) which tells us how to
 297        use OP[i] for the corresponding operand.  */
 298     i386_operand_type types[MAX_OPERANDS];
 299
 300     /* Displacement expression, immediate expression, or register for each
 301        operand.  */
 302     union i386_op op[MAX_OPERANDS];
 303
 304     /* Flags for operands.  */
 305     unsigned int flags[MAX_OPERANDS];
 306 #define Operand_PCrel 1
 307
 308     /* Relocation type for operand */
 309     enum bfd_reloc_code_real reloc[MAX_OPERANDS];
 310
 311     /* BASE_REG, INDEX_REG, and LOG2_SCALE_FACTOR are used to encode
 312        the base index byte below.  */
 313     const reg_entry *base_reg;
 314     const reg_entry *index_reg;
 315     unsigned int log2_scale_factor;
 316
 317     /* SEG gives the seg_entries of this insn.  They are zero unless
 318        explicit segment overrides are given.  */
 319     const seg_entry *seg[2];
 320
 321     /* PREFIX holds all the given prefix opcodes (usually null).
 322        PREFIXES is the number of prefix opcodes.  */
 323     unsigned int prefixes;
 324     unsigned char prefix[MAX_PREFIXES];
 325
 326     /* RM and SIB are the modrm byte and the sib byte where the
 327        addressing modes of this insn are encoded.  */
 328     modrm_byte rm;
 329     rex_byte rex;
 330     rex_byte vrex;
 331     sib_byte sib;
 332     vex_prefix vex;
 333
 334     /* Masking attributes.  */
 335     struct Mask_Operation *mask;
 336
 337     /* Rounding control and SAE attributes.  */
 338     struct RC_Operation *rounding;
 339
 340     /* Broadcasting attributes.  */
 341     struct Broadcast_Operation *broadcast;
 342
 343     /* Compressed disp8*N attribute.  */
 344     unsigned int memshift;
 345
 346     /* Swap operand in encoding.  */
 347     unsigned int swap_operand;
 348
 349     /* Prefer 8bit or 32bit displacement in encoding.  */
 350     enum
 351       {
 352         disp_encoding_default = 0,
 353         disp_encoding_8bit,
 354         disp_encoding_32bit
 355       } disp_encoding;
 356
 357     /* REP prefix.  */
 358     const char *rep_prefix;
 359
 360     /* HLE prefix.  */
 361     const char *hle_prefix;
 362
 363     /* Have BND prefix.  */
 364     const char *bnd_prefix;
 365
 366     /* Need VREX to support upper 16 registers.  */
 367     int need_vrex;
 368
 369     /* Error message.  */
 370     enum i386_error error;
 371   };
 372
 373 typedef struct _i386_insn i386_insn;
 374
 375 /* Link RC type with corresponding string, that'll be looked for in
 376    asm.  */
 377 struct RC_name
 378 {
 379   enum rc_type type;
 380   const char *name;
 381   unsigned int len;
 382 };
 383
 384 static const struct RC_name RC_NamesTable[] =
 385 {
 386   {  rne, STRING_COMMA_LEN ("rn-sae") },
 387   {  rd,  STRING_COMMA_LEN ("rd-sae") },
 388   {  ru,  STRING_COMMA_LEN ("ru-sae") },
 389   {  rz,  STRING_COMMA_LEN ("rz-sae") },
 390   {  saeonly,  STRING_COMMA_LEN ("sae") },
 391 };
 392
 393 /* List of chars besides those in app.c:symbol_chars that can start an
 394    operand.  Used to prevent the scrubber eating vital white-space.  */
 395 const char extra_symbol_chars[] = "*%-([{"
 396 #ifdef LEX_AT
 397         "@"
 398 #endif
 399 #ifdef LEX_QM
 400         "?"
 401 #endif
 402         ;
 403
 404 #if (defined (TE_I386AIX)                               \
 405      || ((defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)) \
 406          && !defined (TE_GNU)                           \
 407          && !defined (TE_LINUX)                         \
 408          && !defined (TE_NACL)                          \
 409          && !defined (TE_NETWARE)                       \
 410          && !defined (TE_FreeBSD)                       \
 411          && !defined (TE_DragonFly)                     \
 412          && !defined (TE_NetBSD)))
 413 /* This array holds the chars that always start a comment.  If the
 414    pre-processor is disabled, these aren't very useful.  The option
 415    --divide will remove '/' from this list.  */
 416 const char *i386_comment_chars = "#/";
 417 #define SVR4_COMMENT_CHARS 1
 418 #define PREFIX_SEPARATOR '\\'
 419
 420 #else
 421 const char *i386_comment_chars = "#";
 422 #define PREFIX_SEPARATOR '/'
 423 #endif
 424
 425 /* This array holds the chars that only start a comment at the beginning of
 426    a line.  If the line seems to have the form '# 123 filename'
 427    .line and .file directives will appear in the pre-processed output.
 428    Note that input_file.c hand checks for '#' at the beginning of the
 429    first line of the input file.  This is because the compiler outputs
 430    #NO_APP at the beginning of its output.
 431    Also note that comments started like this one will always work if
 432    '/' isn't otherwise defined.  */
 433 const char line_comment_chars[] = "#/";
 434
 435 const char line_separator_chars[] = ";";
 436
 437 /* Chars that can be used to separate mant from exp in floating point
 438    nums.  */
 439 const char EXP_CHARS[] = "eE";
 440
 441 /* Chars that mean this number is a floating point constant
 442    As in 0f12.456
 443    or    0d1.2345e12.  */
 444 const char FLT_CHARS[] = "fFdDxX";
 445
 446 /* Tables for lexical analysis.  */
 447 static char mnemonic_chars[256];
 448 static char register_chars[256];
 449 static char operand_chars[256];
 450 static char identifier_chars[256];
 451 static char digit_chars[256];
 452
 453 /* Lexical macros.  */
 454 #define is_mnemonic_char(x) (mnemonic_chars[(unsigned char) x])
 455 #define is_operand_char(x) (operand_chars[(unsigned char) x])
 456 #define is_register_char(x) (register_chars[(unsigned char) x])
 457 #define is_space_char(x) ((x) == ' ')
 458 #define is_identifier_char(x) (identifier_chars[(unsigned char) x])
 459 #define is_digit_char(x) (digit_chars[(unsigned char) x])
 460
 461 /* All non-digit non-letter characters that may occur in an operand.  */
 462 static char operand_special_chars[] = "%$-+(,)*._~/<>|&^!:[@]";
 463
 464 /* md_assemble() always leaves the strings it's passed unaltered.  To
 465    effect this we maintain a stack of saved characters that we've smashed
 466    with '\0's (indicating end of strings for various sub-fields of the
 467    assembler instruction).  */
 468 static char save_stack[32];
 469 static char *save_stack_p;
 470 #define END_STRING_AND_SAVE(s) \
 471         do { *save_stack_p++ = *(s); *(s) = '\0'; } while (0)
 472 #define RESTORE_END_STRING(s) \
 473         do { *(s) = *--save_stack_p; } while (0)
 474
 475 /* The instruction we're assembling.  */
 476 static i386_insn i;
 477
 478 /* Possible templates for current insn.  */
 479 static const templates *current_templates;
 480
 481 /* Per instruction expressionS buffers: max displacements & immediates.  */
 482 static expressionS disp_expressions[MAX_MEMORY_OPERANDS];
 483 static expressionS im_expressions[MAX_IMMEDIATE_OPERANDS];
 484
 485 /* Current operand we are working on.  */
 486 static int this_operand = -1;
 487
 488 /* We support four different modes.  FLAG_CODE variable is used to distinguish
 489    these.  */
 490
 491 enum flag_code {
 492         CODE_32BIT,
 493         CODE_16BIT,
 494         CODE_64BIT };
 495
 496 static enum flag_code flag_code;
 497 static unsigned int object_64bit;
 498 static unsigned int disallow_64bit_reloc;
 499 static int use_rela_relocations = 0;
 500
 501 #if ((defined (OBJ_MAYBE_COFF) && defined (OBJ_MAYBE_AOUT)) \
 502      || defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
 503      || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
 504
 505 /* The ELF ABI to use.  */
 506 enum x86_elf_abi
 507 {
 508   I386_ABI,
 509   X86_64_ABI,
 510   X86_64_X32_ABI
 511 };
 512
 513 static enum x86_elf_abi x86_elf_abi = I386_ABI;
 514 #endif
 515
 516 #if defined (TE_PE) || defined (TE_PEP)
 517 /* Use big object file format.  */
 518 static int use_big_obj = 0;
 519 #endif
 520
 521 /* 1 for intel syntax,
 522    0 if att syntax.  */
 523 static int intel_syntax = 0;
 524
 525 /* 1 for intel mnemonic,
 526    0 if att mnemonic.  */
 527 static int intel_mnemonic = !SYSV386_COMPAT;
 528
 529 /* 1 if support old (<= 2.8.1) versions of gcc.  */
 530 static int old_gcc = OLDGCC_COMPAT;
 531
 532 /* 1 if pseudo registers are permitted.  */
 533 static int allow_pseudo_reg = 0;
 534
 535 /* 1 if register prefix % not required.  */
 536 static int allow_naked_reg = 0;
 537
 538 /* 1 if the assembler should add BND prefix for all control-tranferring
 539    instructions supporting it, even if this prefix wasn't specified
 540    explicitly.  */
 541 static int add_bnd_prefix = 0;
 542
 543 /* 1 if pseudo index register, eiz/riz, is allowed .  */
 544 static int allow_index_reg = 0;
 545
 546 static enum check_kind
 547   {
 548     check_none = 0,
 549     check_warning,
 550     check_error
 551   }
 552 sse_check, operand_check = check_warning;
 553
 554 /* Register prefix used for error message.  */
 555 static const char *register_prefix = "%";
 556
 557 /* Used in 16 bit gcc mode to add an l suffix to call, ret, enter,
 558    leave, push, and pop instructions so that gcc has the same stack
 559    frame as in 32 bit mode.  */
 560 static char stackop_size = '\0';
 561
 562 /* Non-zero to optimize code alignment.  */
 563 int optimize_align_code = 1;
 564
 565 /* Non-zero to quieten some warnings.  */
 566 static int quiet_warnings = 0;
 567
 568 /* CPU name.  */
 569 static const char *cpu_arch_name = NULL;
 570 static char *cpu_sub_arch_name = NULL;
 571
 572 /* CPU feature flags.  */
 573 static i386_cpu_flags cpu_arch_flags = CPU_UNKNOWN_FLAGS;
 574
 575 /* If we have selected a cpu we are generating instructions for.  */
 576 static int cpu_arch_tune_set = 0;
 577
 578 /* Cpu we are generating instructions for.  */
 579 enum processor_type cpu_arch_tune = PROCESSOR_UNKNOWN;
 580
 581 /* CPU feature flags of cpu we are generating instructions for.  */
 582 static i386_cpu_flags cpu_arch_tune_flags;
 583
 584 /* CPU instruction set architecture used.  */
 585 enum processor_type cpu_arch_isa = PROCESSOR_UNKNOWN;
 586
 587 /* CPU feature flags of instruction set architecture used.  */
 588 i386_cpu_flags cpu_arch_isa_flags;
 589
 590 /* If set, conditional jumps are not automatically promoted to handle
 591    larger than a byte offset.  */
 592 static unsigned int no_cond_jump_promotion = 0;
 593
 594 /* Encode SSE instructions with VEX prefix.  */
 595 static unsigned int sse2avx;
 596
 597 /* Encode scalar AVX instructions with specific vector length.  */
 598 static enum
 599   {
 600     vex128 = 0,
 601     vex256
 602   } avxscalar;
 603
 604 /* Encode scalar EVEX LIG instructions with specific vector length.  */
 605 static enum
 606   {
 607     evexl128 = 0,
 608     evexl256,
 609     evexl512
 610   } evexlig;
 611
 612 /* Encode EVEX WIG instructions with specific evex.w.  */
 613 static enum
 614   {
 615     evexw0 = 0,
 616     evexw1
 617   } evexwig;
 618
 619 /* Pre-defined "_GLOBAL_OFFSET_TABLE_".  */
 620 static symbolS *GOT_symbol;
 621
 622 /* The dwarf2 return column, adjusted for 32 or 64 bit.  */
 623 unsigned int x86_dwarf2_return_column;
 624
 625 /* The dwarf2 data alignment, adjusted for 32 or 64 bit.  */
 626 int x86_cie_data_alignment;
 627
 628 /* Interface to relax_segment.
 629    There are 3 major relax states for 386 jump insns because the
 630    different types of jumps add different sizes to frags when we're
 631    figuring out what sort of jump to choose to reach a given label.  */
 632
 633 /* Types.  */
 634 #define UNCOND_JUMP 0
 635 #define COND_JUMP 1
 636 #define COND_JUMP86 2
 637
 638 /* Sizes.  */
 639 #define CODE16  1
 640 #define SMALL   0
 641 #define SMALL16 (SMALL | CODE16)
 642 #define BIG     2
 643 #define BIG16   (BIG | CODE16)
 644
 645 #ifndef INLINE
 646 #ifdef __GNUC__
 647 #define INLINE __inline__
 648 #else
 649 #define INLINE
 650 #endif
 651 #endif
 652
 653 #define ENCODE_RELAX_STATE(type, size) \
 654   ((relax_substateT) (((type) << 2) | (size)))
 655 #define TYPE_FROM_RELAX_STATE(s) \
 656   ((s) >> 2)
 657 #define DISP_SIZE_FROM_RELAX_STATE(s) \
 658     ((((s) & 3) == BIG ? 4 : (((s) & 3) == BIG16 ? 2 : 1)))
 659
 660 /* This table is used by relax_frag to promote short jumps to long
 661    ones where necessary.  SMALL (short) jumps may be promoted to BIG
 662    (32 bit long) ones, and SMALL16 jumps to BIG16 (16 bit long).  We
 663    don't allow a short jump in a 32 bit code segment to be promoted to
 664    a 16 bit offset jump because it's slower (requires data size
 665    prefix), and doesn't work, unless the destination is in the bottom
 666    64k of the code segment (The top 16 bits of eip are zeroed).  */
 667
 668 const relax_typeS md_relax_table[] =
 669 {
 670   /* The fields are:
 671      1) most positive reach of this state,
 672      2) most negative reach of this state,
 673      3) how many bytes this mode will have in the variable part of the frag
 674      4) which index into the table to try if we can't fit into this one.  */
 675
 676   /* UNCOND_JUMP states.  */
 677   {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (UNCOND_JUMP, BIG)},
 678   {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (UNCOND_JUMP, BIG16)},
 679   /* dword jmp adds 4 bytes to frag:
 680      0 extra opcode bytes, 4 displacement bytes.  */
 681   {0, 0, 4, 0},
 682   /* word jmp adds 2 byte2 to frag:
 683      0 extra opcode bytes, 2 displacement bytes.  */
 684   {0, 0, 2, 0},
 685
 686   /* COND_JUMP states.  */
 687   {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP, BIG)},
 688   {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP, BIG16)},
 689   /* dword conditionals adds 5 bytes to frag:
 690      1 extra opcode byte, 4 displacement bytes.  */
 691   {0, 0, 5, 0},
 692   /* word conditionals add 3 bytes to frag:
 693      1 extra opcode byte, 2 displacement bytes.  */
 694   {0, 0, 3, 0},
 695
 696   /* COND_JUMP86 states.  */
 697   {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP86, BIG)},
 698   {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP86, BIG16)},
 699   /* dword conditionals adds 5 bytes to frag:
 700      1 extra opcode byte, 4 displacement bytes.  */
 701   {0, 0, 5, 0},
 702   /* word conditionals add 4 bytes to frag:
 703      1 displacement byte and a 3 byte long branch insn.  */
 704   {0, 0, 4, 0}
 705 };
 706
 707 static const arch_entry cpu_arch[] =
 708 {
 709   /* Do not replace the first two entries - i386_target_format()
 710      relies on them being there in this order.  */
 711   { STRING_COMMA_LEN ("generic32"), PROCESSOR_GENERIC32,
 712     CPU_GENERIC32_FLAGS, 0, 0 },
 713   { STRING_COMMA_LEN ("generic64"), PROCESSOR_GENERIC64,
 714     CPU_GENERIC64_FLAGS, 0, 0 },
 715   { STRING_COMMA_LEN ("i8086"), PROCESSOR_UNKNOWN,
 716     CPU_NONE_FLAGS, 0, 0 },
 717   { STRING_COMMA_LEN ("i186"), PROCESSOR_UNKNOWN,
 718     CPU_I186_FLAGS, 0, 0 },
 719   { STRING_COMMA_LEN ("i286"), PROCESSOR_UNKNOWN,
 720     CPU_I286_FLAGS, 0, 0 },
 721   { STRING_COMMA_LEN ("i386"), PROCESSOR_I386,
 722     CPU_I386_FLAGS, 0, 0 },
 723   { STRING_COMMA_LEN ("i486"), PROCESSOR_I486,
 724     CPU_I486_FLAGS, 0, 0 },
 725   { STRING_COMMA_LEN ("i586"), PROCESSOR_PENTIUM,
 726     CPU_I586_FLAGS, 0, 0 },
 727   { STRING_COMMA_LEN ("i686"), PROCESSOR_PENTIUMPRO,
 728     CPU_I686_FLAGS, 0, 0 },
 729   { STRING_COMMA_LEN ("pentium"), PROCESSOR_PENTIUM,
 730     CPU_I586_FLAGS, 0, 0 },
 731   { STRING_COMMA_LEN ("pentiumpro"), PROCESSOR_PENTIUMPRO,
 732     CPU_PENTIUMPRO_FLAGS, 0, 0 },
 733   { STRING_COMMA_LEN ("pentiumii"), PROCESSOR_PENTIUMPRO,
 734     CPU_P2_FLAGS, 0, 0 },
 735   { STRING_COMMA_LEN ("pentiumiii"),PROCESSOR_PENTIUMPRO,
 736     CPU_P3_FLAGS, 0, 0 },
 737   { STRING_COMMA_LEN ("pentium4"), PROCESSOR_PENTIUM4,
 738     CPU_P4_FLAGS, 0, 0 },
 739   { STRING_COMMA_LEN ("prescott"), PROCESSOR_NOCONA,
 740     CPU_CORE_FLAGS, 0, 0 },
 741   { STRING_COMMA_LEN ("nocona"), PROCESSOR_NOCONA,
 742     CPU_NOCONA_FLAGS, 0, 0 },
 743   { STRING_COMMA_LEN ("yonah"), PROCESSOR_CORE,
 744     CPU_CORE_FLAGS, 1, 0 },
 745   { STRING_COMMA_LEN ("core"), PROCESSOR_CORE,
 746     CPU_CORE_FLAGS, 0, 0 },
 747   { STRING_COMMA_LEN ("merom"), PROCESSOR_CORE2,
 748     CPU_CORE2_FLAGS, 1, 0 },
 749   { STRING_COMMA_LEN ("core2"), PROCESSOR_CORE2,
 750     CPU_CORE2_FLAGS, 0, 0 },
 751   { STRING_COMMA_LEN ("corei7"), PROCESSOR_COREI7,
 752     CPU_COREI7_FLAGS, 0, 0 },
 753   { STRING_COMMA_LEN ("l1om"), PROCESSOR_L1OM,
 754     CPU_L1OM_FLAGS, 0, 0 },
 755   { STRING_COMMA_LEN ("k1om"), PROCESSOR_K1OM,
 756     CPU_K1OM_FLAGS, 0, 0 },
 757   { STRING_COMMA_LEN ("k6"), PROCESSOR_K6,
 758     CPU_K6_FLAGS, 0, 0 },
 759   { STRING_COMMA_LEN ("k6_2"), PROCESSOR_K6,
 760     CPU_K6_2_FLAGS, 0, 0 },
 761   { STRING_COMMA_LEN ("athlon"), PROCESSOR_ATHLON,
 762     CPU_ATHLON_FLAGS, 0, 0 },
 763   { STRING_COMMA_LEN ("sledgehammer"), PROCESSOR_K8,
 764     CPU_K8_FLAGS, 1, 0 },
 765   { STRING_COMMA_LEN ("opteron"), PROCESSOR_K8,
 766     CPU_K8_FLAGS, 0, 0 },
 767   { STRING_COMMA_LEN ("k8"), PROCESSOR_K8,
 768     CPU_K8_FLAGS, 0, 0 },
 769   { STRING_COMMA_LEN ("amdfam10"), PROCESSOR_AMDFAM10,
 770     CPU_AMDFAM10_FLAGS, 0, 0 },
 771   { STRING_COMMA_LEN ("bdver1"), PROCESSOR_BD,
 772     CPU_BDVER1_FLAGS, 0, 0 },
 773   { STRING_COMMA_LEN ("bdver2"), PROCESSOR_BD,
 774     CPU_BDVER2_FLAGS, 0, 0 },
 775   { STRING_COMMA_LEN ("bdver3"), PROCESSOR_BD,
 776     CPU_BDVER3_FLAGS, 0, 0 },
 777   { STRING_COMMA_LEN ("bdver4"), PROCESSOR_BD,
 778     CPU_BDVER4_FLAGS, 0, 0 },
 779   { STRING_COMMA_LEN ("btver1"), PROCESSOR_BT,
 780     CPU_BTVER1_FLAGS, 0, 0 },
 781   { STRING_COMMA_LEN ("btver2"), PROCESSOR_BT,
 782     CPU_BTVER2_FLAGS, 0, 0 },
 783   { STRING_COMMA_LEN (".8087"), PROCESSOR_UNKNOWN,
 784     CPU_8087_FLAGS, 0, 0 },
 785   { STRING_COMMA_LEN (".287"), PROCESSOR_UNKNOWN,
 786     CPU_287_FLAGS, 0, 0 },
 787   { STRING_COMMA_LEN (".387"), PROCESSOR_UNKNOWN,
 788     CPU_387_FLAGS, 0, 0 },
 789   { STRING_COMMA_LEN (".no87"), PROCESSOR_UNKNOWN,
 790     CPU_ANY87_FLAGS, 0, 1 },
 791   { STRING_COMMA_LEN (".mmx"), PROCESSOR_UNKNOWN,
 792     CPU_MMX_FLAGS, 0, 0 },
 793   { STRING_COMMA_LEN (".nommx"), PROCESSOR_UNKNOWN,
 794     CPU_3DNOWA_FLAGS, 0, 1 },
 795   { STRING_COMMA_LEN (".sse"), PROCESSOR_UNKNOWN,
 796     CPU_SSE_FLAGS, 0, 0 },
 797   { STRING_COMMA_LEN (".sse2"), PROCESSOR_UNKNOWN,
 798     CPU_SSE2_FLAGS, 0, 0 },
 799   { STRING_COMMA_LEN (".sse3"), PROCESSOR_UNKNOWN,
 800     CPU_SSE3_FLAGS, 0, 0 },
 801   { STRING_COMMA_LEN (".ssse3"), PROCESSOR_UNKNOWN,
 802     CPU_SSSE3_FLAGS, 0, 0 },
 803   { STRING_COMMA_LEN (".sse4.1"), PROCESSOR_UNKNOWN,
 804     CPU_SSE4_1_FLAGS, 0, 0 },
 805   { STRING_COMMA_LEN (".sse4.2"), PROCESSOR_UNKNOWN,
 806     CPU_SSE4_2_FLAGS, 0, 0 },
 807   { STRING_COMMA_LEN (".sse4"), PROCESSOR_UNKNOWN,
 808     CPU_SSE4_2_FLAGS, 0, 0 },
 809   { STRING_COMMA_LEN (".nosse"), PROCESSOR_UNKNOWN,
 810     CPU_ANY_SSE_FLAGS, 0, 1 },
 811   { STRING_COMMA_LEN (".avx"), PROCESSOR_UNKNOWN,
 812     CPU_AVX_FLAGS, 0, 0 },
 813   { STRING_COMMA_LEN (".avx2"), PROCESSOR_UNKNOWN,
 814     CPU_AVX2_FLAGS, 0, 0 },
 815   { STRING_COMMA_LEN (".avx512f"), PROCESSOR_UNKNOWN,
 816     CPU_AVX512F_FLAGS, 0, 0 },
 817   { STRING_COMMA_LEN (".avx512cd"), PROCESSOR_UNKNOWN,
 818     CPU_AVX512CD_FLAGS, 0, 0 },
 819   { STRING_COMMA_LEN (".avx512er"), PROCESSOR_UNKNOWN,
 820     CPU_AVX512ER_FLAGS, 0, 0 },
 821   { STRING_COMMA_LEN (".avx512pf"), PROCESSOR_UNKNOWN,
 822     CPU_AVX512PF_FLAGS, 0, 0 },
 823   { STRING_COMMA_LEN (".noavx"), PROCESSOR_UNKNOWN,
 824     CPU_ANY_AVX_FLAGS, 0, 1 },
 825   { STRING_COMMA_LEN (".vmx"), PROCESSOR_UNKNOWN,
 826     CPU_VMX_FLAGS, 0, 0 },
 827   { STRING_COMMA_LEN (".vmfunc"), PROCESSOR_UNKNOWN,
 828     CPU_VMFUNC_FLAGS, 0, 0 },
 829   { STRING_COMMA_LEN (".smx"), PROCESSOR_UNKNOWN,
 830     CPU_SMX_FLAGS, 0, 0 },
 831   { STRING_COMMA_LEN (".xsave"), PROCESSOR_UNKNOWN,
 832     CPU_XSAVE_FLAGS, 0, 0 },
 833   { STRING_COMMA_LEN (".xsaveopt"), PROCESSOR_UNKNOWN,
 834     CPU_XSAVEOPT_FLAGS, 0, 0 },
 835   { STRING_COMMA_LEN (".aes"), PROCESSOR_UNKNOWN,
 836     CPU_AES_FLAGS, 0, 0 },
 837   { STRING_COMMA_LEN (".pclmul"), PROCESSOR_UNKNOWN,
 838     CPU_PCLMUL_FLAGS, 0, 0 },
 839   { STRING_COMMA_LEN (".clmul"), PROCESSOR_UNKNOWN,
 840     CPU_PCLMUL_FLAGS, 1, 0 },
 841   { STRING_COMMA_LEN (".fsgsbase"), PROCESSOR_UNKNOWN,
 842     CPU_FSGSBASE_FLAGS, 0, 0 },
 843   { STRING_COMMA_LEN (".rdrnd"), PROCESSOR_UNKNOWN,
 844     CPU_RDRND_FLAGS, 0, 0 },
 845   { STRING_COMMA_LEN (".f16c"), PROCESSOR_UNKNOWN,
 846     CPU_F16C_FLAGS, 0, 0 },
 847   { STRING_COMMA_LEN (".bmi2"), PROCESSOR_UNKNOWN,
 848     CPU_BMI2_FLAGS, 0, 0 },
 849   { STRING_COMMA_LEN (".fma"), PROCESSOR_UNKNOWN,
 850     CPU_FMA_FLAGS, 0, 0 },
 851   { STRING_COMMA_LEN (".fma4"), PROCESSOR_UNKNOWN,
 852     CPU_FMA4_FLAGS, 0, 0 },
 853   { STRING_COMMA_LEN (".xop"), PROCESSOR_UNKNOWN,
 854     CPU_XOP_FLAGS, 0, 0 },
 855   { STRING_COMMA_LEN (".lwp"), PROCESSOR_UNKNOWN,
 856     CPU_LWP_FLAGS, 0, 0 },
 857   { STRING_COMMA_LEN (".movbe"), PROCESSOR_UNKNOWN,
 858     CPU_MOVBE_FLAGS, 0, 0 },
 859   { STRING_COMMA_LEN (".cx16"), PROCESSOR_UNKNOWN,
 860     CPU_CX16_FLAGS, 0, 0 },
 861   { STRING_COMMA_LEN (".ept"), PROCESSOR_UNKNOWN,
 862     CPU_EPT_FLAGS, 0, 0 },
 863   { STRING_COMMA_LEN (".lzcnt"), PROCESSOR_UNKNOWN,
 864     CPU_LZCNT_FLAGS, 0, 0 },
 865   { STRING_COMMA_LEN (".hle"), PROCESSOR_UNKNOWN,
 866     CPU_HLE_FLAGS, 0, 0 },
 867   { STRING_COMMA_LEN (".rtm"), PROCESSOR_UNKNOWN,
 868     CPU_RTM_FLAGS, 0, 0 },
 869   { STRING_COMMA_LEN (".invpcid"), PROCESSOR_UNKNOWN,
 870     CPU_INVPCID_FLAGS, 0, 0 },
 871   { STRING_COMMA_LEN (".clflush"), PROCESSOR_UNKNOWN,
 872     CPU_CLFLUSH_FLAGS, 0, 0 },
 873   { STRING_COMMA_LEN (".nop"), PROCESSOR_UNKNOWN,
 874     CPU_NOP_FLAGS, 0, 0 },
 875   { STRING_COMMA_LEN (".syscall"), PROCESSOR_UNKNOWN,
 876     CPU_SYSCALL_FLAGS, 0, 0 },
 877   { STRING_COMMA_LEN (".rdtscp"), PROCESSOR_UNKNOWN,
 878     CPU_RDTSCP_FLAGS, 0, 0 },
 879   { STRING_COMMA_LEN (".3dnow"), PROCESSOR_UNKNOWN,
 880     CPU_3DNOW_FLAGS, 0, 0 },
 881   { STRING_COMMA_LEN (".3dnowa"), PROCESSOR_UNKNOWN,
 882     CPU_3DNOWA_FLAGS, 0, 0 },
 883   { STRING_COMMA_LEN (".padlock"), PROCESSOR_UNKNOWN,
 884     CPU_PADLOCK_FLAGS, 0, 0 },
 885   { STRING_COMMA_LEN (".pacifica"), PROCESSOR_UNKNOWN,
 886     CPU_SVME_FLAGS, 1, 0 },
 887   { STRING_COMMA_LEN (".svme"), PROCESSOR_UNKNOWN,
 888     CPU_SVME_FLAGS, 0, 0 },
 889   { STRING_COMMA_LEN (".sse4a"), PROCESSOR_UNKNOWN,
 890     CPU_SSE4A_FLAGS, 0, 0 },
 891   { STRING_COMMA_LEN (".abm"), PROCESSOR_UNKNOWN,
 892     CPU_ABM_FLAGS, 0, 0 },
 893   { STRING_COMMA_LEN (".bmi"), PROCESSOR_UNKNOWN,
 894     CPU_BMI_FLAGS, 0, 0 },
 895   { STRING_COMMA_LEN (".tbm"), PROCESSOR_UNKNOWN,
 896     CPU_TBM_FLAGS, 0, 0 },
 897   { STRING_COMMA_LEN (".adx"), PROCESSOR_UNKNOWN,
 898     CPU_ADX_FLAGS, 0, 0 },
 899   { STRING_COMMA_LEN (".rdseed"), PROCESSOR_UNKNOWN,
 900     CPU_RDSEED_FLAGS, 0, 0 },
 901   { STRING_COMMA_LEN (".prfchw"), PROCESSOR_UNKNOWN,
 902     CPU_PRFCHW_FLAGS, 0, 0 },
 903   { STRING_COMMA_LEN (".smap"), PROCESSOR_UNKNOWN,
 904     CPU_SMAP_FLAGS, 0, 0 },
 905   { STRING_COMMA_LEN (".mpx"), PROCESSOR_UNKNOWN,
 906     CPU_MPX_FLAGS, 0, 0 },
 907   { STRING_COMMA_LEN (".sha"), PROCESSOR_UNKNOWN,
 908     CPU_SHA_FLAGS, 0, 0 },
 909   { STRING_COMMA_LEN (".clflushopt"), PROCESSOR_UNKNOWN,
 910     CPU_CLFLUSHOPT_FLAGS, 0, 0 },
 911   { STRING_COMMA_LEN (".xsavec"), PROCESSOR_UNKNOWN,
 912     CPU_XSAVEC_FLAGS, 0, 0 },
 913   { STRING_COMMA_LEN (".xsaves"), PROCESSOR_UNKNOWN,
 914     CPU_XSAVES_FLAGS, 0, 0 },
 915   { STRING_COMMA_LEN (".prefetchwt1"), PROCESSOR_UNKNOWN,
 916     CPU_PREFETCHWT1_FLAGS, 0, 0 },
 917   { STRING_COMMA_LEN (".se1"), PROCESSOR_UNKNOWN,
 918     CPU_SE1_FLAGS, 0, 0 },
 919   { STRING_COMMA_LEN (".avx512dq"), PROCESSOR_UNKNOWN,
 920     CPU_AVX512DQ_FLAGS, 0, 0 },
 921   { STRING_COMMA_LEN (".avx512bw"), PROCESSOR_UNKNOWN,
 922     CPU_AVX512BW_FLAGS, 0, 0 },
 923   { STRING_COMMA_LEN (".avx512vl"), PROCESSOR_UNKNOWN,
 924     CPU_AVX512VL_FLAGS, 0, 0 },
 925 };
 926
 927 #ifdef I386COFF
 928 /* Like s_lcomm_internal in gas/read.c but the alignment string
 929    is allowed to be optional.  */
 930
 931 static symbolS *
 932 pe_lcomm_internal (int needs_align, symbolS *symbolP, addressT size)
 933 {
 934   addressT align = 0;
 935
 936   SKIP_WHITESPACE ();
 937
 938   if (needs_align
 939       && *input_line_pointer == ',')
 940     {
 941       align = parse_align (needs_align - 1);
 942
 943       if (align == (addressT) -1)
 944         return NULL;
 945     }
 946   else
 947     {
 948       if (size >= 8)
 949         align = 3;
 950       else if (size >= 4)
 951         align = 2;
 952       else if (size >= 2)
 953         align = 1;
 954       else
 955         align = 0;
 956     }
 957
 958   bss_alloc (symbolP, size, align);
 959   return symbolP;
 960 }
 961
 962 static void
 963 pe_lcomm (int needs_align)
 964 {
 965   s_comm_internal (needs_align * 2, pe_lcomm_internal);
 966 }
 967 #endif
 968
 969 const pseudo_typeS md_pseudo_table[] =
 970 {
 971 #if !defined(OBJ_AOUT) && !defined(USE_ALIGN_PTWO)
 972   {"align", s_align_bytes, 0},
 973 #else
 974   {"align", s_align_ptwo, 0},
 975 #endif
 976   {"arch", set_cpu_arch, 0},
 977 #ifndef I386COFF
 978   {"bss", s_bss, 0},
 979 #else
 980   {"lcomm", pe_lcomm, 1},
 981 #endif
 982   {"ffloat", float_cons, 'f'},
 983   {"dfloat", float_cons, 'd'},
 984   {"tfloat", float_cons, 'x'},
 985   {"value", cons, 2},
 986   {"slong", signed_cons, 4},
 987   {"noopt", s_ignore, 0},
 988   {"optim", s_ignore, 0},
 989   {"code16gcc", set_16bit_gcc_code_flag, CODE_16BIT},
 990   {"code16", set_code_flag, CODE_16BIT},
 991   {"code32", set_code_flag, CODE_32BIT},
 992   {"code64", set_code_flag, CODE_64BIT},
 993   {"intel_syntax", set_intel_syntax, 1},
 994   {"att_syntax", set_intel_syntax, 0},
 995   {"intel_mnemonic", set_intel_mnemonic, 1},
 996   {"att_mnemonic", set_intel_mnemonic, 0},
 997   {"allow_index_reg", set_allow_index_reg, 1},
 998   {"disallow_index_reg", set_allow_index_reg, 0},
 999   {"sse_check", set_check, 0},
1000   {"operand_check", set_check, 1},
1001 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
1002   {"largecomm", handle_large_common, 0},
1003 #else
1004   {"file", (void (*) (int)) dwarf2_directive_file, 0},
1005   {"loc", dwarf2_directive_loc, 0},
1006   {"loc_mark_labels", dwarf2_directive_loc_mark_labels, 0},
1007 #endif
1008 #ifdef TE_PE
1009   {"secrel32", pe_directive_secrel, 0},
1010 #endif
1011   {0, 0, 0}
1012 };
1013
1014 /* For interface with expression ().  */
1015 extern char *input_line_pointer;
1016
1017 /* Hash table for instruction mnemonic lookup.  */
1018 static struct hash_control *op_hash;
1019
1020 /* Hash table for register lookup.  */
1021 static struct hash_control *reg_hash;
1022 \f
1023 void
1024 i386_align_code (fragS *fragP, int count)
1025 {
1026   /* Various efficient no-op patterns for aligning code labels.
1027      Note: Don't try to assemble the instructions in the comments.
1028      0L and 0w are not legal.  */
1029   static const char f32_1[] =
1030     {0x90};                                     /* nop                  */
1031   static const char f32_2[] =
1032     {0x66,0x90};                                /* xchg %ax,%ax */
1033   static const char f32_3[] =
1034     {0x8d,0x76,0x00};                           /* leal 0(%esi),%esi    */
1035   static const char f32_4[] =
1036     {0x8d,0x74,0x26,0x00};                      /* leal 0(%esi,1),%esi  */
1037   static const char f32_5[] =
1038     {0x90,                                      /* nop                  */
1039      0x8d,0x74,0x26,0x00};                      /* leal 0(%esi,1),%esi  */
1040   static const char f32_6[] =
1041     {0x8d,0xb6,0x00,0x00,0x00,0x00};            /* leal 0L(%esi),%esi   */
1042   static const char f32_7[] =
1043     {0x8d,0xb4,0x26,0x00,0x00,0x00,0x00};       /* leal 0L(%esi,1),%esi */
1044   static const char f32_8[] =
1045     {0x90,                                      /* nop                  */
1046      0x8d,0xb4,0x26,0x00,0x00,0x00,0x00};       /* leal 0L(%esi,1),%esi */
1047   static const char f32_9[] =
1048     {0x89,0xf6,                                 /* movl %esi,%esi       */
1049      0x8d,0xbc,0x27,0x00,0x00,0x00,0x00};       /* leal 0L(%edi,1),%edi */
1050   static const char f32_10[] =
1051     {0x8d,0x76,0x00,                            /* leal 0(%esi),%esi    */
1052      0x8d,0xbc,0x27,0x00,0x00,0x00,0x00};       /* leal 0L(%edi,1),%edi */
1053   static const char f32_11[] =
1054     {0x8d,0x74,0x26,0x00,                       /* leal 0(%esi,1),%esi  */
1055      0x8d,0xbc,0x27,0x00,0x00,0x00,0x00};       /* leal 0L(%edi,1),%edi */
1056   static const char f32_12[] =
1057     {0x8d,0xb6,0x00,0x00,0x00,0x00,             /* leal 0L(%esi),%esi   */
1058      0x8d,0xbf,0x00,0x00,0x00,0x00};            /* leal 0L(%edi),%edi   */
1059   static const char f32_13[] =
1060     {0x8d,0xb6,0x00,0x00,0x00,0x00,             /* leal 0L(%esi),%esi   */
1061      0x8d,0xbc,0x27,0x00,0x00,0x00,0x00};       /* leal 0L(%edi,1),%edi */
1062   static const char f32_14[] =
1063     {0x8d,0xb4,0x26,0x00,0x00,0x00,0x00,        /* leal 0L(%esi,1),%esi */
1064      0x8d,0xbc,0x27,0x00,0x00,0x00,0x00};       /* leal 0L(%edi,1),%edi */
1065   static const char f16_3[] =
1066     {0x8d,0x74,0x00};                           /* lea 0(%esi),%esi     */
1067   static const char f16_4[] =
1068     {0x8d,0xb4,0x00,0x00};                      /* lea 0w(%si),%si      */
1069   static const char f16_5[] =
1070     {0x90,                                      /* nop                  */
1071      0x8d,0xb4,0x00,0x00};                      /* lea 0w(%si),%si      */
1072   static const char f16_6[] =
1073     {0x89,0xf6,                                 /* mov %si,%si          */
1074      0x8d,0xbd,0x00,0x00};                      /* lea 0w(%di),%di      */
1075   static const char f16_7[] =
1076     {0x8d,0x74,0x00,                            /* lea 0(%si),%si       */
1077      0x8d,0xbd,0x00,0x00};                      /* lea 0w(%di),%di      */
1078   static const char f16_8[] =
1079     {0x8d,0xb4,0x00,0x00,                       /* lea 0w(%si),%si      */
1080      0x8d,0xbd,0x00,0x00};                      /* lea 0w(%di),%di      */
1081   static const char jump_31[] =
1082     {0xeb,0x1d,0x90,0x90,0x90,0x90,0x90,        /* jmp .+31; lotsa nops */
1083      0x90,0x90,0x90,0x90,0x90,0x90,0x90,0x90,
1084      0x90,0x90,0x90,0x90,0x90,0x90,0x90,0x90,
1085      0x90,0x90,0x90,0x90,0x90,0x90,0x90,0x90};
1086   static const char *const f32_patt[] = {
1087     f32_1, f32_2, f32_3, f32_4, f32_5, f32_6, f32_7, f32_8,
1088     f32_9, f32_10, f32_11, f32_12, f32_13, f32_14
1089   };
1090   static const char *const f16_patt[] = {
1091     f32_1, f32_2, f16_3, f16_4, f16_5, f16_6, f16_7, f16_8
1092   };
1093   /* nopl (%[re]ax) */
1094   static const char alt_3[] =
1095     {0x0f,0x1f,0x00};
1096   /* nopl 0(%[re]ax) */
1097   static const char alt_4[] =
1098     {0x0f,0x1f,0x40,0x00};
1099   /* nopl 0(%[re]ax,%[re]ax,1) */
1100   static const char alt_5[] =
1101     {0x0f,0x1f,0x44,0x00,0x00};
1102   /* nopw 0(%[re]ax,%[re]ax,1) */
1103   static const char alt_6[] =
1104     {0x66,0x0f,0x1f,0x44,0x00,0x00};
1105   /* nopl 0L(%[re]ax) */
1106   static const char alt_7[] =
1107     {0x0f,0x1f,0x80,0x00,0x00,0x00,0x00};
1108   /* nopl 0L(%[re]ax,%[re]ax,1) */
1109   static const char alt_8[] =
1110     {0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1111   /* nopw 0L(%[re]ax,%[re]ax,1) */
1112   static const char alt_9[] =
1113     {0x66,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1114   /* nopw %cs:0L(%[re]ax,%[re]ax,1) */
1115   static const char alt_10[] =
1116     {0x66,0x2e,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1117   /* data16
1118      nopw %cs:0L(%[re]ax,%[re]ax,1) */
1119   static const char alt_long_11[] =
1120     {0x66,
1121      0x66,0x2e,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1122   /* data16
1123      data16
1124      nopw %cs:0L(%[re]ax,%[re]ax,1) */
1125   static const char alt_long_12[] =
1126     {0x66,
1127      0x66,
1128      0x66,0x2e,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1129   /* data16
1130      data16
1131      data16
1132      nopw %cs:0L(%[re]ax,%[re]ax,1) */
1133   static const char alt_long_13[] =
1134     {0x66,
1135      0x66,
1136      0x66,
1137      0x66,0x2e,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1138   /* data16
1139      data16
1140      data16
1141      data16
1142      nopw %cs:0L(%[re]ax,%[re]ax,1) */
1143   static const char alt_long_14[] =
1144     {0x66,
1145      0x66,
1146      0x66,
1147      0x66,
1148      0x66,0x2e,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1149   /* data16
1150      data16
1151      data16
1152      data16
1153      data16
1154      nopw %cs:0L(%[re]ax,%[re]ax,1) */
1155   static const char alt_long_15[] =
1156     {0x66,
1157      0x66,
1158      0x66,
1159      0x66,
1160      0x66,
1161      0x66,0x2e,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1162   /* nopl 0(%[re]ax,%[re]ax,1)
1163      nopw 0(%[re]ax,%[re]ax,1) */
1164   static const char alt_short_11[] =
1165     {0x0f,0x1f,0x44,0x00,0x00,
1166      0x66,0x0f,0x1f,0x44,0x00,0x00};
1167   /* nopw 0(%[re]ax,%[re]ax,1)
1168      nopw 0(%[re]ax,%[re]ax,1) */
1169   static const char alt_short_12[] =
1170     {0x66,0x0f,0x1f,0x44,0x00,0x00,
1171      0x66,0x0f,0x1f,0x44,0x00,0x00};
1172   /* nopw 0(%[re]ax,%[re]ax,1)
1173      nopl 0L(%[re]ax) */
1174   static const char alt_short_13[] =
1175     {0x66,0x0f,0x1f,0x44,0x00,0x00,
1176      0x0f,0x1f,0x80,0x00,0x00,0x00,0x00};
1177   /* nopl 0L(%[re]ax)
1178      nopl 0L(%[re]ax) */
1179   static const char alt_short_14[] =
1180     {0x0f,0x1f,0x80,0x00,0x00,0x00,0x00,
1181      0x0f,0x1f,0x80,0x00,0x00,0x00,0x00};
1182   /* nopl 0L(%[re]ax)
1183      nopl 0L(%[re]ax,%[re]ax,1) */
1184   static const char alt_short_15[] =
1185     {0x0f,0x1f,0x80,0x00,0x00,0x00,0x00,
1186      0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1187   static const char *const alt_short_patt[] = {
1188     f32_1, f32_2, alt_3, alt_4, alt_5, alt_6, alt_7, alt_8,
1189     alt_9, alt_10, alt_short_11, alt_short_12, alt_short_13,
1190     alt_short_14, alt_short_15
1191   };
1192   static const char *const alt_long_patt[] = {
1193     f32_1, f32_2, alt_3, alt_4, alt_5, alt_6, alt_7, alt_8,
1194     alt_9, alt_10, alt_long_11, alt_long_12, alt_long_13,
1195     alt_long_14, alt_long_15
1196   };
1197
1198   /* Only align for at least a positive non-zero boundary. */
1199   if (count <= 0 || count > MAX_MEM_FOR_RS_ALIGN_CODE)
1200     return;
1201
1202   /* We need to decide which NOP sequence to use for 32bit and
1203      64bit. When -mtune= is used:
1204
1205      1. For PROCESSOR_I386, PROCESSOR_I486, PROCESSOR_PENTIUM and
1206      PROCESSOR_GENERIC32, f32_patt will be used.
1207      2. For PROCESSOR_PENTIUMPRO, PROCESSOR_PENTIUM4, PROCESSOR_NOCONA,
1208      PROCESSOR_CORE, PROCESSOR_CORE2, PROCESSOR_COREI7, and
1209      PROCESSOR_GENERIC64, alt_long_patt will be used.
1210      3. For PROCESSOR_ATHLON, PROCESSOR_K6, PROCESSOR_K8 and
1211      PROCESSOR_AMDFAM10, PROCESSOR_BD and PROCESSOR_BT, alt_short_patt
1212      will be used.
1213
1214      When -mtune= isn't used, alt_long_patt will be used if
1215      cpu_arch_isa_flags has CpuNop.  Otherwise, f32_patt will
1216      be used.
1217
1218      When -march= or .arch is used, we can't use anything beyond
1219      cpu_arch_isa_flags.   */
1220
1221   if (flag_code == CODE_16BIT)
1222     {
1223       if (count > 8)
1224         {
1225           memcpy (fragP->fr_literal + fragP->fr_fix,
1226                   jump_31, count);
1227           /* Adjust jump offset.  */
1228           fragP->fr_literal[fragP->fr_fix + 1] = count - 2;
1229         }
1230       else
1231         memcpy (fragP->fr_literal + fragP->fr_fix,
1232                 f16_patt[count - 1], count);
1233     }
1234   else
1235     {
1236       const char *const *patt = NULL;
1237
1238       if (fragP->tc_frag_data.isa == PROCESSOR_UNKNOWN)
1239         {
1240           /* PROCESSOR_UNKNOWN means that all ISAs may be used.  */
1241           switch (cpu_arch_tune)
1242             {
1243             case PROCESSOR_UNKNOWN:
1244               /* We use cpu_arch_isa_flags to check if we SHOULD
1245                  optimize with nops.  */
1246               if (fragP->tc_frag_data.isa_flags.bitfield.cpunop)
1247                 patt = alt_long_patt;
1248               else
1249                 patt = f32_patt;
1250               break;
1251             case PROCESSOR_PENTIUM4:
1252             case PROCESSOR_NOCONA:
1253             case PROCESSOR_CORE:
1254             case PROCESSOR_CORE2:
1255             case PROCESSOR_COREI7:
1256             case PROCESSOR_L1OM:
1257             case PROCESSOR_K1OM:
1258             case PROCESSOR_GENERIC64:
1259               patt = alt_long_patt;
1260               break;
1261             case PROCESSOR_K6:
1262             case PROCESSOR_ATHLON:
1263             case PROCESSOR_K8:
1264             case PROCESSOR_AMDFAM10:
1265             case PROCESSOR_BD:
1266             case PROCESSOR_BT:
1267               patt = alt_short_patt;
1268               break;
1269             case PROCESSOR_I386:
1270             case PROCESSOR_I486:
1271             case PROCESSOR_PENTIUM:
1272             case PROCESSOR_PENTIUMPRO:
1273             case PROCESSOR_GENERIC32:
1274               patt = f32_patt;
1275               break;
1276             }
1277         }
1278       else
1279         {
1280           switch (fragP->tc_frag_data.tune)
1281             {
1282             case PROCESSOR_UNKNOWN:
1283               /* When cpu_arch_isa is set, cpu_arch_tune shouldn't be
1284                  PROCESSOR_UNKNOWN.  */
1285               abort ();
1286               break;
1287
1288             case PROCESSOR_I386:
1289             case PROCESSOR_I486:
1290             case PROCESSOR_PENTIUM:
1291             case PROCESSOR_K6:
1292             case PROCESSOR_ATHLON:
1293             case PROCESSOR_K8:
1294             case PROCESSOR_AMDFAM10:
1295             case PROCESSOR_BD:
1296             case PROCESSOR_BT:
1297             case PROCESSOR_GENERIC32:
1298               /* We use cpu_arch_isa_flags to check if we CAN optimize
1299                  with nops.  */
1300               if (fragP->tc_frag_data.isa_flags.bitfield.cpunop)
1301                 patt = alt_short_patt;
1302               else
1303                 patt = f32_patt;
1304               break;
1305             case PROCESSOR_PENTIUMPRO:
1306             case PROCESSOR_PENTIUM4:
1307             case PROCESSOR_NOCONA:
1308             case PROCESSOR_CORE:
1309             case PROCESSOR_CORE2:
1310             case PROCESSOR_COREI7:
1311             case PROCESSOR_L1OM:
1312             case PROCESSOR_K1OM:
1313               if (fragP->tc_frag_data.isa_flags.bitfield.cpunop)
1314                 patt = alt_long_patt;
1315               else
1316                 patt = f32_patt;
1317               break;
1318             case PROCESSOR_GENERIC64:
1319               patt = alt_long_patt;
1320               break;
1321             }
1322         }
1323
1324       if (patt == f32_patt)
1325         {
1326           /* If the padding is less than 15 bytes, we use the normal
1327              ones.  Otherwise, we use a jump instruction and adjust
1328              its offset.   */
1329           int limit;
1330
1331           /* For 64bit, the limit is 3 bytes.  */
1332           if (flag_code == CODE_64BIT
1333               && fragP->tc_frag_data.isa_flags.bitfield.cpulm)
1334             limit = 3;
1335           else
1336             limit = 15;
1337           if (count < limit)
1338             memcpy (fragP->fr_literal + fragP->fr_fix,
1339                     patt[count - 1], count);
1340           else
1341             {
1342               memcpy (fragP->fr_literal + fragP->fr_fix,
1343                       jump_31, count);
1344               /* Adjust jump offset.  */
1345               fragP->fr_literal[fragP->fr_fix + 1] = count - 2;
1346             }
1347         }
1348       else
1349         {
1350           /* Maximum length of an instruction is 15 byte.  If the
1351              padding is greater than 15 bytes and we don't use jump,
1352              we have to break it into smaller pieces.  */
1353           int padding = count;
1354           while (padding > 15)
1355             {
1356               padding -= 15;
1357               memcpy (fragP->fr_literal + fragP->fr_fix + padding,
1358                       patt [14], 15);
1359             }
1360
1361           if (padding)
1362             memcpy (fragP->fr_literal + fragP->fr_fix,
1363                     patt [padding - 1], padding);
1364         }
1365     }
1366   fragP->fr_var = count;
1367 }
1368
1369 static INLINE int
1370 operand_type_all_zero (const union i386_operand_type *x)
1371 {
1372   switch (ARRAY_SIZE(x->array))
1373     {
1374     case 3:
1375       if (x->array[2])
1376         return 0;
1377     case 2:
1378       if (x->array[1])
1379         return 0;
1380     case 1:
1381       return !x->array[0];
1382     default:
1383       abort ();
1384     }
1385 }
1386
1387 static INLINE void
1388 operand_type_set (union i386_operand_type *x, unsigned int v)
1389 {
1390   switch (ARRAY_SIZE(x->array))
1391     {
1392     case 3:
1393       x->array[2] = v;
1394     case 2:
1395       x->array[1] = v;
1396     case 1:
1397       x->array[0] = v;
1398       break;
1399     default:
1400       abort ();
1401     }
1402 }
1403
1404 static INLINE int
1405 operand_type_equal (const union i386_operand_type *x,
1406                     const union i386_operand_type *y)
1407 {
1408   switch (ARRAY_SIZE(x->array))
1409     {
1410     case 3:
1411       if (x->array[2] != y->array[2])
1412         return 0;
1413     case 2:
1414       if (x->array[1] != y->array[1])
1415         return 0;
1416     case 1:
1417       return x->array[0] == y->array[0];
1418       break;
1419     default:
1420       abort ();
1421     }
1422 }
1423
1424 static INLINE int
1425 cpu_flags_all_zero (const union i386_cpu_flags *x)
1426 {
1427   switch (ARRAY_SIZE(x->array))
1428     {
1429     case 3:
1430       if (x->array[2])
1431         return 0;
1432     case 2:
1433       if (x->array[1])
1434         return 0;
1435     case 1:
1436       return !x->array[0];
1437     default:
1438       abort ();
1439     }
1440 }
1441
1442 static INLINE void
1443 cpu_flags_set (union i386_cpu_flags *x, unsigned int v)
1444 {
1445   switch (ARRAY_SIZE(x->array))
1446     {
1447     case 3:
1448       x->array[2] = v;
1449     case 2:
1450       x->array[1] = v;
1451     case 1:
1452       x->array[0] = v;
1453       break;
1454     default:
1455       abort ();
1456     }
1457 }
1458
1459 static INLINE int
1460 cpu_flags_equal (const union i386_cpu_flags *x,
1461                  const union i386_cpu_flags *y)
1462 {
1463   switch (ARRAY_SIZE(x->array))
1464     {
1465     case 3:
1466       if (x->array[2] != y->array[2])
1467         return 0;
1468     case 2:
1469       if (x->array[1] != y->array[1])
1470         return 0;
1471     case 1:
1472       return x->array[0] == y->array[0];
1473       break;
1474     default:
1475       abort ();
1476     }
1477 }
1478
1479 static INLINE int
1480 cpu_flags_check_cpu64 (i386_cpu_flags f)
1481 {
1482   return !((flag_code == CODE_64BIT && f.bitfield.cpuno64)
1483            || (flag_code != CODE_64BIT && f.bitfield.cpu64));
1484 }
1485
1486 static INLINE i386_cpu_flags
1487 cpu_flags_and (i386_cpu_flags x, i386_cpu_flags y)
1488 {
1489   switch (ARRAY_SIZE (x.array))
1490     {
1491     case 3:
1492       x.array [2] &= y.array [2];
1493     case 2:
1494       x.array [1] &= y.array [1];
1495     case 1:
1496       x.array [0] &= y.array [0];
1497       break;
1498     default:
1499       abort ();
1500     }
1501   return x;
1502 }
1503
1504 static INLINE i386_cpu_flags
1505 cpu_flags_or (i386_cpu_flags x, i386_cpu_flags y)
1506 {
1507   switch (ARRAY_SIZE (x.array))
1508     {
1509     case 3:
1510       x.array [2] |= y.array [2];
1511     case 2:
1512       x.array [1] |= y.array [1];
1513     case 1:
1514       x.array [0] |= y.array [0];
1515       break;
1516     default:
1517       abort ();
1518     }
1519   return x;
1520 }
1521
1522 static INLINE i386_cpu_flags
1523 cpu_flags_and_not (i386_cpu_flags x, i386_cpu_flags y)
1524 {
1525   switch (ARRAY_SIZE (x.array))
1526     {
1527     case 3:
1528       x.array [2] &= ~y.array [2];
1529     case 2:
1530       x.array [1] &= ~y.array [1];
1531     case 1:
1532       x.array [0] &= ~y.array [0];
1533       break;
1534     default:
1535       abort ();
1536     }
1537   return x;
1538 }
1539
1540 #define CPU_FLAGS_ARCH_MATCH            0x1
1541 #define CPU_FLAGS_64BIT_MATCH           0x2
1542 #define CPU_FLAGS_AES_MATCH             0x4
1543 #define CPU_FLAGS_PCLMUL_MATCH          0x8
1544 #define CPU_FLAGS_AVX_MATCH            0x10
1545
1546 #define CPU_FLAGS_32BIT_MATCH \
1547   (CPU_FLAGS_ARCH_MATCH | CPU_FLAGS_AES_MATCH \
1548    | CPU_FLAGS_PCLMUL_MATCH | CPU_FLAGS_AVX_MATCH)
1549 #define CPU_FLAGS_PERFECT_MATCH \
1550   (CPU_FLAGS_32BIT_MATCH | CPU_FLAGS_64BIT_MATCH)
1551
1552 /* Return CPU flags match bits. */
1553
1554 static int
1555 cpu_flags_match (const insn_template *t)
1556 {
1557   i386_cpu_flags x = t->cpu_flags;
1558   int match = cpu_flags_check_cpu64 (x) ? CPU_FLAGS_64BIT_MATCH : 0;
1559
1560   x.bitfield.cpu64 = 0;
1561   x.bitfield.cpuno64 = 0;
1562
1563   if (cpu_flags_all_zero (&x))
1564     {
1565       /* This instruction is available on all archs.  */
1566       match |= CPU_FLAGS_32BIT_MATCH;
1567     }
1568   else
1569     {
1570       /* This instruction is available only on some archs.  */
1571       i386_cpu_flags cpu = cpu_arch_flags;
1572
1573       cpu.bitfield.cpu64 = 0;
1574       cpu.bitfield.cpuno64 = 0;
1575       cpu = cpu_flags_and (x, cpu);
1576       if (!cpu_flags_all_zero (&cpu))
1577         {
1578           if (x.bitfield.cpuavx)
1579             {
1580               /* We only need to check AES/PCLMUL/SSE2AVX with AVX.  */
1581               if (cpu.bitfield.cpuavx)
1582                 {
1583                   /* Check SSE2AVX.  */
1584                   if (!t->opcode_modifier.sse2avx|| sse2avx)
1585                     {
1586                       match |= (CPU_FLAGS_ARCH_MATCH
1587                                 | CPU_FLAGS_AVX_MATCH);
1588                       /* Check AES.  */
1589                       if (!x.bitfield.cpuaes || cpu.bitfield.cpuaes)
1590                         match |= CPU_FLAGS_AES_MATCH;
1591                       /* Check PCLMUL.  */
1592                       if (!x.bitfield.cpupclmul
1593                           || cpu.bitfield.cpupclmul)
1594                         match |= CPU_FLAGS_PCLMUL_MATCH;
1595                     }
1596                 }
1597               else
1598                 match |= CPU_FLAGS_ARCH_MATCH;
1599             }
1600           else
1601             match |= CPU_FLAGS_32BIT_MATCH;
1602         }
1603     }
1604   return match;
1605 }
1606
1607 static INLINE i386_operand_type
1608 operand_type_and (i386_operand_type x, i386_operand_type y)
1609 {
1610   switch (ARRAY_SIZE (x.array))
1611     {
1612     case 3:
1613       x.array [2] &= y.array [2];
1614     case 2:
1615       x.array [1] &= y.array [1];
1616     case 1:
1617       x.array [0] &= y.array [0];
1618       break;
1619     default:
1620       abort ();
1621     }
1622   return x;
1623 }
1624
1625 static INLINE i386_operand_type
1626 operand_type_or (i386_operand_type x, i386_operand_type y)
1627 {
1628   switch (ARRAY_SIZE (x.array))
1629     {
1630     case 3:
1631       x.array [2] |= y.array [2];
1632     case 2:
1633       x.array [1] |= y.array [1];
1634     case 1:
1635       x.array [0] |= y.array [0];
1636       break;
1637     default:
1638       abort ();
1639     }
1640   return x;
1641 }
1642
1643 static INLINE i386_operand_type
1644 operand_type_xor (i386_operand_type x, i386_operand_type y)
1645 {
1646   switch (ARRAY_SIZE (x.array))
1647     {
1648     case 3:
1649       x.array [2] ^= y.array [2];
1650     case 2:
1651       x.array [1] ^= y.array [1];
1652     case 1:
1653       x.array [0] ^= y.array [0];
1654       break;
1655     default:
1656       abort ();
1657     }
1658   return x;
1659 }
1660
1661 static const i386_operand_type acc32 = OPERAND_TYPE_ACC32;
1662 static const i386_operand_type acc64 = OPERAND_TYPE_ACC64;
1663 static const i386_operand_type control = OPERAND_TYPE_CONTROL;
1664 static const i386_operand_type inoutportreg
1665   = OPERAND_TYPE_INOUTPORTREG;
1666 static const i386_operand_type reg16_inoutportreg
1667   = OPERAND_TYPE_REG16_INOUTPORTREG;
1668 static const i386_operand_type disp16 = OPERAND_TYPE_DISP16;
1669 static const i386_operand_type disp32 = OPERAND_TYPE_DISP32;
1670 static const i386_operand_type disp32s = OPERAND_TYPE_DISP32S;
1671 static const i386_operand_type disp16_32 = OPERAND_TYPE_DISP16_32;
1672 static const i386_operand_type anydisp
1673   = OPERAND_TYPE_ANYDISP;
1674 static const i386_operand_type regxmm = OPERAND_TYPE_REGXMM;
1675 static const i386_operand_type regymm = OPERAND_TYPE_REGYMM;
1676 static const i386_operand_type regzmm = OPERAND_TYPE_REGZMM;
1677 static const i386_operand_type regmask = OPERAND_TYPE_REGMASK;
1678 static const i386_operand_type imm8 = OPERAND_TYPE_IMM8;
1679 static const i386_operand_type imm8s = OPERAND_TYPE_IMM8S;
1680 static const i386_operand_type imm16 = OPERAND_TYPE_IMM16;
1681 static const i386_operand_type imm32 = OPERAND_TYPE_IMM32;
1682 static const i386_operand_type imm32s = OPERAND_TYPE_IMM32S;
1683 static const i386_operand_type imm64 = OPERAND_TYPE_IMM64;
1684 static const i386_operand_type imm16_32 = OPERAND_TYPE_IMM16_32;
1685 static const i386_operand_type imm16_32s = OPERAND_TYPE_IMM16_32S;
1686 static const i386_operand_type imm16_32_32s = OPERAND_TYPE_IMM16_32_32S;
1687 static const i386_operand_type vec_imm4 = OPERAND_TYPE_VEC_IMM4;
1688
1689 enum operand_type
1690 {
1691   reg,
1692   imm,
1693   disp,
1694   anymem
1695 };
1696
1697 static INLINE int
1698 operand_type_check (i386_operand_type t, enum operand_type c)
1699 {
1700   switch (c)
1701     {
1702     case reg:
1703       return (t.bitfield.reg8
1704               || t.bitfield.reg16
1705               || t.bitfield.reg32
1706               || t.bitfield.reg64);
1707
1708     case imm:
1709       return (t.bitfield.imm8
1710               || t.bitfield.imm8s
1711               || t.bitfield.imm16
1712               || t.bitfield.imm32
1713               || t.bitfield.imm32s
1714               || t.bitfield.imm64);
1715
1716     case disp:
1717       return (t.bitfield.disp8
1718               || t.bitfield.disp16
1719               || t.bitfield.disp32
1720               || t.bitfield.disp32s
1721               || t.bitfield.disp64);
1722
1723     case anymem:
1724       return (t.bitfield.disp8
1725               || t.bitfield.disp16
1726               || t.bitfield.disp32
1727               || t.bitfield.disp32s
1728               || t.bitfield.disp64
1729               || t.bitfield.baseindex);
1730
1731     default:
1732       abort ();
1733     }
1734
1735   return 0;
1736 }
1737
1738 /* Return 1 if there is no conflict in 8bit/16bit/32bit/64bit on
1739    operand J for instruction template T.  */
1740
1741 static INLINE int
1742 match_reg_size (const insn_template *t, unsigned int j)
1743 {
1744   return !((i.types[j].bitfield.byte
1745             && !t->operand_types[j].bitfield.byte)
1746            || (i.types[j].bitfield.word
1747                && !t->operand_types[j].bitfield.word)
1748            || (i.types[j].bitfield.dword
1749                && !t->operand_types[j].bitfield.dword)
1750            || (i.types[j].bitfield.qword
1751                && !t->operand_types[j].bitfield.qword));
1752 }
1753
1754 /* Return 1 if there is no conflict in any size on operand J for
1755    instruction template T.  */
1756
1757 static INLINE int
1758 match_mem_size (const insn_template *t, unsigned int j)
1759 {
1760   return (match_reg_size (t, j)
1761           && !((i.types[j].bitfield.unspecified
1762                 && !t->operand_types[j].bitfield.unspecified)
1763                || (i.types[j].bitfield.fword
1764                    && !t->operand_types[j].bitfield.fword)
1765                || (i.types[j].bitfield.tbyte
1766                    && !t->operand_types[j].bitfield.tbyte)
1767                || (i.types[j].bitfield.xmmword
1768                    && !t->operand_types[j].bitfield.xmmword)
1769                || (i.types[j].bitfield.ymmword
1770                    && !t->operand_types[j].bitfield.ymmword)
1771                || (i.types[j].bitfield.zmmword
1772                    && !t->operand_types[j].bitfield.zmmword)));
1773 }
1774
1775 /* Return 1 if there is no size conflict on any operands for
1776    instruction template T.  */
1777
1778 static INLINE int
1779 operand_size_match (const insn_template *t)
1780 {
1781   unsigned int j;
1782   int match = 1;
1783
1784   /* Don't check jump instructions.  */
1785   if (t->opcode_modifier.jump
1786       || t->opcode_modifier.jumpbyte
1787       || t->opcode_modifier.jumpdword
1788       || t->opcode_modifier.jumpintersegment)
1789     return match;
1790
1791   /* Check memory and accumulator operand size.  */
1792   for (j = 0; j < i.operands; j++)
1793     {
1794       if (t->operand_types[j].bitfield.anysize)
1795         continue;
1796
1797       if (t->operand_types[j].bitfield.acc && !match_reg_size (t, j))
1798         {
1799           match = 0;
1800           break;
1801         }
1802
1803       if (i.types[j].bitfield.mem && !match_mem_size (t, j))
1804         {
1805           match = 0;
1806           break;
1807         }
1808     }
1809
1810   if (match)
1811     return match;
1812   else if (!t->opcode_modifier.d && !t->opcode_modifier.floatd)
1813     {
1814 mismatch:
1815       i.error = operand_size_mismatch;
1816       return 0;
1817     }
1818
1819   /* Check reverse.  */
1820   gas_assert (i.operands == 2);
1821
1822   match = 1;
1823   for (j = 0; j < 2; j++)
1824     {
1825       if (t->operand_types[j].bitfield.acc
1826           && !match_reg_size (t, j ? 0 : 1))
1827         goto mismatch;
1828
1829       if (i.types[j].bitfield.mem
1830           && !match_mem_size (t, j ? 0 : 1))
1831         goto mismatch;
1832     }
1833
1834   return match;
1835 }
1836
1837 static INLINE int
1838 operand_type_match (i386_operand_type overlap,
1839                     i386_operand_type given)
1840 {
1841   i386_operand_type temp = overlap;
1842
1843   temp.bitfield.jumpabsolute = 0;
1844   temp.bitfield.unspecified = 0;
1845   temp.bitfield.byte = 0;
1846   temp.bitfield.word = 0;
1847   temp.bitfield.dword = 0;
1848   temp.bitfield.fword = 0;
1849   temp.bitfield.qword = 0;
1850   temp.bitfield.tbyte = 0;
1851   temp.bitfield.xmmword = 0;
1852   temp.bitfield.ymmword = 0;
1853   temp.bitfield.zmmword = 0;
1854   if (operand_type_all_zero (&temp))
1855     goto mismatch;
1856
1857   if (given.bitfield.baseindex == overlap.bitfield.baseindex
1858       && given.bitfield.jumpabsolute == overlap.bitfield.jumpabsolute)
1859     return 1;
1860
1861 mismatch:
1862   i.error = operand_type_mismatch;
1863   return 0;
1864 }
1865
1866 /* If given types g0 and g1 are registers they must be of the same type
1867    unless the expected operand type register overlap is null.
1868    Note that Acc in a template matches every size of reg.  */
1869
1870 static INLINE int
1871 operand_type_register_match (i386_operand_type m0,
1872                              i386_operand_type g0,
1873                              i386_operand_type t0,
1874                              i386_operand_type m1,
1875                              i386_operand_type g1,
1876                              i386_operand_type t1)
1877 {
1878   if (!operand_type_check (g0, reg))
1879     return 1;
1880
1881   if (!operand_type_check (g1, reg))
1882     return 1;
1883
1884   if (g0.bitfield.reg8 == g1.bitfield.reg8
1885       && g0.bitfield.reg16 == g1.bitfield.reg16
1886       && g0.bitfield.reg32 == g1.bitfield.reg32
1887       && g0.bitfield.reg64 == g1.bitfield.reg64)
1888     return 1;
1889
1890   if (m0.bitfield.acc)
1891     {
1892       t0.bitfield.reg8 = 1;
1893       t0.bitfield.reg16 = 1;
1894       t0.bitfield.reg32 = 1;
1895       t0.bitfield.reg64 = 1;
1896     }
1897
1898   if (m1.bitfield.acc)
1899     {
1900       t1.bitfield.reg8 = 1;
1901       t1.bitfield.reg16 = 1;
1902       t1.bitfield.reg32 = 1;
1903       t1.bitfield.reg64 = 1;
1904     }
1905
1906   if (!(t0.bitfield.reg8 & t1.bitfield.reg8)
1907       && !(t0.bitfield.reg16 & t1.bitfield.reg16)
1908       && !(t0.bitfield.reg32 & t1.bitfield.reg32)
1909       && !(t0.bitfield.reg64 & t1.bitfield.reg64))
1910     return 1;
1911
1912   i.error = register_type_mismatch;
1913
1914   return 0;
1915 }
1916
1917 static INLINE unsigned int
1918 register_number (const reg_entry *r)
1919 {
1920   unsigned int nr = r->reg_num;
1921
1922   if (r->reg_flags & RegRex)
1923     nr += 8;
1924
1925   return nr;
1926 }
1927
1928 static INLINE unsigned int
1929 mode_from_disp_size (i386_operand_type t)
1930 {
1931   if (t.bitfield.disp8 || t.bitfield.vec_disp8)
1932     return 1;
1933   else if (t.bitfield.disp16
1934            || t.bitfield.disp32
1935            || t.bitfield.disp32s)
1936     return 2;
1937   else
1938     return 0;
1939 }
1940
1941 static INLINE int
1942 fits_in_signed_byte (offsetT num)
1943 {
1944   return (num >= -128) && (num <= 127);
1945 }
1946
1947 static INLINE int
1948 fits_in_unsigned_byte (offsetT num)
1949 {
1950   return (num & 0xff) == num;
1951 }
1952
1953 static INLINE int
1954 fits_in_unsigned_word (offsetT num)
1955 {
1956   return (num & 0xffff) == num;
1957 }
1958
1959 static INLINE int
1960 fits_in_signed_word (offsetT num)
1961 {
1962   return (-32768 <= num) && (num <= 32767);
1963 }
1964
1965 static INLINE int
1966 fits_in_signed_long (offsetT num ATTRIBUTE_UNUSED)
1967 {
1968 #ifndef BFD64
1969   return 1;
1970 #else
1971   return (!(((offsetT) -1 << 31) & num)
1972           || (((offsetT) -1 << 31) & num) == ((offsetT) -1 << 31));
1973 #endif
1974 }                               /* fits_in_signed_long() */
1975
1976 static INLINE int
1977 fits_in_unsigned_long (offsetT num ATTRIBUTE_UNUSED)
1978 {
1979 #ifndef BFD64
1980   return 1;
1981 #else
1982   return (num & (((offsetT) 2 << 31) - 1)) == num;
1983 #endif
1984 }                               /* fits_in_unsigned_long() */
1985
1986 static INLINE int
1987 fits_in_vec_disp8 (offsetT num)
1988 {
1989   int shift = i.memshift;
1990   unsigned int mask;
1991
1992   if (shift == -1)
1993     abort ();
1994
1995   mask = (1 << shift) - 1;
1996
1997   /* Return 0 if NUM isn't properly aligned.  */
1998   if ((num & mask))
1999     return 0;
2000
2001   /* Check if NUM will fit in 8bit after shift.  */
2002   return fits_in_signed_byte (num >> shift);
2003 }
2004
2005 static INLINE int
2006 fits_in_imm4 (offsetT num)
2007 {
2008   return (num & 0xf) == num;
2009 }
2010
2011 static i386_operand_type
2012 smallest_imm_type (offsetT num)
2013 {
2014   i386_operand_type t;
2015
2016   operand_type_set (&t, 0);
2017   t.bitfield.imm64 = 1;
2018
2019   if (cpu_arch_tune != PROCESSOR_I486 && num == 1)
2020     {
2021       /* This code is disabled on the 486 because all the Imm1 forms
2022          in the opcode table are slower on the i486.  They're the
2023          versions with the implicitly specified single-position
2024          displacement, which has another syntax if you really want to
2025          use that form.  */
2026       t.bitfield.imm1 = 1;
2027       t.bitfield.imm8 = 1;
2028       t.bitfield.imm8s = 1;
2029       t.bitfield.imm16 = 1;
2030       t.bitfield.imm32 = 1;
2031       t.bitfield.imm32s = 1;
2032     }
2033   else if (fits_in_signed_byte (num))
2034     {
2035       t.bitfield.imm8 = 1;
2036       t.bitfield.imm8s = 1;
2037       t.bitfield.imm16 = 1;
2038       t.bitfield.imm32 = 1;
2039       t.bitfield.imm32s = 1;
2040     }
2041   else if (fits_in_unsigned_byte (num))
2042     {
2043       t.bitfield.imm8 = 1;
2044       t.bitfield.imm16 = 1;
2045       t.bitfield.imm32 = 1;
2046       t.bitfield.imm32s = 1;
2047     }
2048   else if (fits_in_signed_word (num) || fits_in_unsigned_word (num))
2049     {
2050       t.bitfield.imm16 = 1;
2051       t.bitfield.imm32 = 1;
2052       t.bitfield.imm32s = 1;
2053     }
2054   else if (fits_in_signed_long (num))
2055     {
2056       t.bitfield.imm32 = 1;
2057       t.bitfield.imm32s = 1;
2058     }
2059   else if (fits_in_unsigned_long (num))
2060     t.bitfield.imm32 = 1;
2061
2062   return t;
2063 }
2064
2065 static offsetT
2066 offset_in_range (offsetT val, int size)
2067 {
2068   addressT mask;
2069
2070   switch (size)
2071     {
2072     case 1: mask = ((addressT) 1 <<  8) - 1; break;
2073     case 2: mask = ((addressT) 1 << 16) - 1; break;
2074     case 4: mask = ((addressT) 2 << 31) - 1; break;
2075 #ifdef BFD64
2076     case 8: mask = ((addressT) 2 << 63) - 1; break;
2077 #endif
2078     default: abort ();
2079     }
2080
2081 #ifdef BFD64
2082   /* If BFD64, sign extend val for 32bit address mode.  */
2083   if (flag_code != CODE_64BIT
2084       || i.prefix[ADDR_PREFIX])
2085     if ((val & ~(((addressT) 2 << 31) - 1)) == 0)
2086       val = (val ^ ((addressT) 1 << 31)) - ((addressT) 1 << 31);
2087 #endif
2088
2089   if ((val & ~mask) != 0 && (val & ~mask) != ~mask)
2090     {
2091       char buf1[40], buf2[40];
2092
2093       sprint_value (buf1, val);
2094       sprint_value (buf2, val & mask);
2095       as_warn (_("%s shortened to %s"), buf1, buf2);
2096     }
2097   return val & mask;
2098 }
2099
2100 enum PREFIX_GROUP
2101 {
2102   PREFIX_EXIST = 0,
2103   PREFIX_LOCK,
2104   PREFIX_REP,
2105   PREFIX_OTHER
2106 };
2107
2108 /* Returns
2109    a. PREFIX_EXIST if attempting to add a prefix where one from the
2110    same class already exists.
2111    b. PREFIX_LOCK if lock prefix is added.
2112    c. PREFIX_REP if rep/repne prefix is added.
2113    d. PREFIX_OTHER if other prefix is added.
2114  */
2115
2116 static enum PREFIX_GROUP
2117 add_prefix (unsigned int prefix)
2118 {
2119   enum PREFIX_GROUP ret = PREFIX_OTHER;
2120   unsigned int q;
2121
2122   if (prefix >= REX_OPCODE && prefix < REX_OPCODE + 16
2123       && flag_code == CODE_64BIT)
2124     {
2125       if ((i.prefix[REX_PREFIX] & prefix & REX_W)
2126           || ((i.prefix[REX_PREFIX] & (REX_R | REX_X | REX_B))
2127               && (prefix & (REX_R | REX_X | REX_B))))
2128         ret = PREFIX_EXIST;
2129       q = REX_PREFIX;
2130     }
2131   else
2132     {
2133       switch (prefix)
2134         {
2135         default:
2136           abort ();
2137
2138         case CS_PREFIX_OPCODE:
2139         case DS_PREFIX_OPCODE:
2140         case ES_PREFIX_OPCODE:
2141         case FS_PREFIX_OPCODE:
2142         case GS_PREFIX_OPCODE:
2143         case SS_PREFIX_OPCODE:
2144           q = SEG_PREFIX;
2145           break;
2146
2147         case REPNE_PREFIX_OPCODE:
2148         case REPE_PREFIX_OPCODE:
2149           q = REP_PREFIX;
2150           ret = PREFIX_REP;
2151           break;
2152
2153         case LOCK_PREFIX_OPCODE:
2154           q = LOCK_PREFIX;
2155           ret = PREFIX_LOCK;
2156           break;
2157
2158         case FWAIT_OPCODE:
2159           q = WAIT_PREFIX;
2160           break;
2161
2162         case ADDR_PREFIX_OPCODE:
2163           q = ADDR_PREFIX;
2164           break;
2165
2166         case DATA_PREFIX_OPCODE:
2167           q = DATA_PREFIX;
2168           break;
2169         }
2170       if (i.prefix[q] != 0)
2171         ret = PREFIX_EXIST;
2172     }
2173
2174   if (ret)
2175     {
2176       if (!i.prefix[q])
2177         ++i.prefixes;
2178       i.prefix[q] |= prefix;
2179     }
2180   else
2181     as_bad (_("same type of prefix used twice"));
2182
2183   return ret;
2184 }
2185
2186 static void
2187 update_code_flag (int value, int check)
2188 {
2189   PRINTF_LIKE ((*as_error));
2190
2191   flag_code = (enum flag_code) value;
2192   if (flag_code == CODE_64BIT)
2193     {
2194       cpu_arch_flags.bitfield.cpu64 = 1;
2195       cpu_arch_flags.bitfield.cpuno64 = 0;
2196     }
2197   else
2198     {
2199       cpu_arch_flags.bitfield.cpu64 = 0;
2200       cpu_arch_flags.bitfield.cpuno64 = 1;
2201     }
2202   if (value == CODE_64BIT && !cpu_arch_flags.bitfield.cpulm )
2203     {
2204       if (check)
2205         as_error = as_fatal;
2206       else
2207         as_error = as_bad;
2208       (*as_error) (_("64bit mode not supported on `%s'."),
2209                    cpu_arch_name ? cpu_arch_name : default_arch);
2210     }
2211   if (value == CODE_32BIT && !cpu_arch_flags.bitfield.cpui386)
2212     {
2213       if (check)
2214         as_error = as_fatal;
2215       else
2216         as_error = as_bad;
2217       (*as_error) (_("32bit mode not supported on `%s'."),
2218                    cpu_arch_name ? cpu_arch_name : default_arch);
2219     }
2220   stackop_size = '\0';
2221 }
2222
2223 static void
2224 set_code_flag (int value)
2225 {
2226   update_code_flag (value, 0);
2227 }
2228
2229 static void
2230 set_16bit_gcc_code_flag (int new_code_flag)
2231 {
2232   flag_code = (enum flag_code) new_code_flag;
2233   if (flag_code != CODE_16BIT)
2234     abort ();
2235   cpu_arch_flags.bitfield.cpu64 = 0;
2236   cpu_arch_flags.bitfield.cpuno64 = 1;
2237   stackop_size = LONG_MNEM_SUFFIX;
2238 }
2239
2240 static void
2241 set_intel_syntax (int syntax_flag)
2242 {
2243   /* Find out if register prefixing is specified.  */
2244   int ask_naked_reg = 0;
2245
2246   SKIP_WHITESPACE ();
2247   if (!is_end_of_line[(unsigned char) *input_line_pointer])
2248     {
2249       char *string = input_line_pointer;
2250       int e = get_symbol_end ();
2251
2252       if (strcmp (string, "prefix") == 0)
2253         ask_naked_reg = 1;
2254       else if (strcmp (string, "noprefix") == 0)
2255         ask_naked_reg = -1;
2256       else
2257         as_bad (_("bad argument to syntax directive."));
2258       *input_line_pointer = e;
2259     }
2260   demand_empty_rest_of_line ();
2261
2262   intel_syntax = syntax_flag;
2263
2264   if (ask_naked_reg == 0)
2265     allow_naked_reg = (intel_syntax
2266                        && (bfd_get_symbol_leading_char (stdoutput) != '\0'));
2267   else
2268     allow_naked_reg = (ask_naked_reg < 0);
2269
2270   expr_set_rank (O_full_ptr, syntax_flag ? 10 : 0);
2271
2272   identifier_chars['%'] = intel_syntax && allow_naked_reg ? '%' : 0;
2273   identifier_chars['$'] = intel_syntax ? '$' : 0;
2274   register_prefix = allow_naked_reg ? "" : "%";
2275 }
2276
2277 static void
2278 set_intel_mnemonic (int mnemonic_flag)
2279 {
2280   intel_mnemonic = mnemonic_flag;
2281 }
2282
2283 static void
2284 set_allow_index_reg (int flag)
2285 {
2286   allow_index_reg = flag;
2287 }
2288
2289 static void
2290 set_check (int what)
2291 {
2292   enum check_kind *kind;
2293   const char *str;
2294
2295   if (what)
2296     {
2297       kind = &operand_check;
2298       str = "operand";
2299     }
2300   else
2301     {
2302       kind = &sse_check;
2303       str = "sse";
2304     }
2305
2306   SKIP_WHITESPACE ();
2307
2308   if (!is_end_of_line[(unsigned char) *input_line_pointer])
2309     {
2310       char *string = input_line_pointer;
2311       int e = get_symbol_end ();
2312
2313       if (strcmp (string, "none") == 0)
2314         *kind = check_none;
2315       else if (strcmp (string, "warning") == 0)
2316         *kind = check_warning;
2317       else if (strcmp (string, "error") == 0)
2318         *kind = check_error;
2319       else
2320         as_bad (_("bad argument to %s_check directive."), str);
2321       *input_line_pointer = e;
2322     }
2323   else
2324     as_bad (_("missing argument for %s_check directive"), str);
2325
2326   demand_empty_rest_of_line ();
2327 }
2328
2329 static void
2330 check_cpu_arch_compatible (const char *name ATTRIBUTE_UNUSED,
2331                            i386_cpu_flags new_flag ATTRIBUTE_UNUSED)
2332 {
2333 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
2334   static const char *arch;
2335
2336   /* Intel LIOM is only supported on ELF.  */
2337   if (!IS_ELF)
2338     return;
2339
2340   if (!arch)
2341     {
2342       /* Use cpu_arch_name if it is set in md_parse_option.  Otherwise
2343          use default_arch.  */
2344       arch = cpu_arch_name;
2345       if (!arch)
2346         arch = default_arch;
2347     }
2348
2349   /* If we are targeting Intel L1OM, we must enable it.  */
2350   if (get_elf_backend_data (stdoutput)->elf_machine_code != EM_L1OM
2351       || new_flag.bitfield.cpul1om)
2352     return;
2353
2354   /* If we are targeting Intel K1OM, we must enable it.  */
2355   if (get_elf_backend_data (stdoutput)->elf_machine_code != EM_K1OM
2356       || new_flag.bitfield.cpuk1om)
2357     return;
2358
2359   as_bad (_("`%s' is not supported on `%s'"), name, arch);
2360 #endif
2361 }
2362
2363 static void
2364 set_cpu_arch (int dummy ATTRIBUTE_UNUSED)
2365 {
2366   SKIP_WHITESPACE ();
2367
2368   if (!is_end_of_line[(unsigned char) *input_line_pointer])
2369     {
2370       char *string = input_line_pointer;
2371       int e = get_symbol_end ();
2372       unsigned int j;
2373       i386_cpu_flags flags;
2374
2375       for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
2376         {
2377           if (strcmp (string, cpu_arch[j].name) == 0)
2378             {
2379               check_cpu_arch_compatible (string, cpu_arch[j].flags);
2380
2381               if (*string != '.')
2382                 {
2383                   cpu_arch_name = cpu_arch[j].name;
2384                   cpu_sub_arch_name = NULL;
2385                   cpu_arch_flags = cpu_arch[j].flags;
2386                   if (flag_code == CODE_64BIT)
2387                     {
2388                       cpu_arch_flags.bitfield.cpu64 = 1;
2389                       cpu_arch_flags.bitfield.cpuno64 = 0;
2390                     }
2391                   else
2392                     {
2393                       cpu_arch_flags.bitfield.cpu64 = 0;
2394                       cpu_arch_flags.bitfield.cpuno64 = 1;
2395                     }
2396                   cpu_arch_isa = cpu_arch[j].type;
2397                   cpu_arch_isa_flags = cpu_arch[j].flags;
2398                   if (!cpu_arch_tune_set)
2399                     {
2400                       cpu_arch_tune = cpu_arch_isa;
2401                       cpu_arch_tune_flags = cpu_arch_isa_flags;
2402                     }
2403                   break;
2404                 }
2405
2406               if (!cpu_arch[j].negated)
2407                 flags = cpu_flags_or (cpu_arch_flags,
2408                                       cpu_arch[j].flags);
2409               else
2410                 flags = cpu_flags_and_not (cpu_arch_flags,
2411                                            cpu_arch[j].flags);
2412               if (!cpu_flags_equal (&flags, &cpu_arch_flags))
2413                 {
2414                   if (cpu_sub_arch_name)
2415                     {
2416                       char *name = cpu_sub_arch_name;
2417                       cpu_sub_arch_name = concat (name,
2418                                                   cpu_arch[j].name,
2419                                                   (const char *) NULL);
2420                       free (name);
2421                     }
2422                   else
2423                     cpu_sub_arch_name = xstrdup (cpu_arch[j].name);
2424                   cpu_arch_flags = flags;
2425                   cpu_arch_isa_flags = flags;
2426                 }
2427               *input_line_pointer = e;
2428               demand_empty_rest_of_line ();
2429               return;
2430             }
2431         }
2432       if (j >= ARRAY_SIZE (cpu_arch))
2433         as_bad (_("no such architecture: `%s'"), string);
2434
2435       *input_line_pointer = e;
2436     }
2437   else
2438     as_bad (_("missing cpu architecture"));
2439
2440   no_cond_jump_promotion = 0;
2441   if (*input_line_pointer == ','
2442       && !is_end_of_line[(unsigned char) input_line_pointer[1]])
2443     {
2444       char *string = ++input_line_pointer;
2445       int e = get_symbol_end ();
2446
2447       if (strcmp (string, "nojumps") == 0)
2448         no_cond_jump_promotion = 1;
2449       else if (strcmp (string, "jumps") == 0)
2450         ;
2451       else
2452         as_bad (_("no such architecture modifier: `%s'"), string);
2453
2454       *input_line_pointer = e;
2455     }
2456
2457   demand_empty_rest_of_line ();
2458 }
2459
2460 enum bfd_architecture
2461 i386_arch (void)
2462 {
2463   if (cpu_arch_isa == PROCESSOR_L1OM)
2464     {
2465       if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2466           || flag_code != CODE_64BIT)
2467         as_fatal (_("Intel L1OM is 64bit ELF only"));
2468       return bfd_arch_l1om;
2469     }
2470   else if (cpu_arch_isa == PROCESSOR_K1OM)
2471     {
2472       if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2473           || flag_code != CODE_64BIT)
2474         as_fatal (_("Intel K1OM is 64bit ELF only"));
2475       return bfd_arch_k1om;
2476     }
2477   else
2478     return bfd_arch_i386;
2479 }
2480
2481 unsigned long
2482 i386_mach (void)
2483 {
2484   if (!strncmp (default_arch, "x86_64", 6))
2485     {
2486       if (cpu_arch_isa == PROCESSOR_L1OM)
2487         {
2488           if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2489               || default_arch[6] != '\0')
2490             as_fatal (_("Intel L1OM is 64bit ELF only"));
2491           return bfd_mach_l1om;
2492         }
2493       else if (cpu_arch_isa == PROCESSOR_K1OM)
2494         {
2495           if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2496               || default_arch[6] != '\0')
2497             as_fatal (_("Intel K1OM is 64bit ELF only"));
2498           return bfd_mach_k1om;
2499         }
2500       else if (default_arch[6] == '\0')
2501         return bfd_mach_x86_64;
2502       else
2503         return bfd_mach_x64_32;
2504     }
2505   else if (!strcmp (default_arch, "i386"))
2506     return bfd_mach_i386_i386;
2507   else
2508     as_fatal (_("unknown architecture"));
2509 }
2510 \f
2511 void
2512 md_begin (void)
2513 {
2514   const char *hash_err;
2515
2516   /* Initialize op_hash hash table.  */
2517   op_hash = hash_new ();
2518
2519   {
2520     const insn_template *optab;
2521     templates *core_optab;
2522
2523     /* Setup for loop.  */
2524     optab = i386_optab;
2525     core_optab = (templates *) xmalloc (sizeof (templates));
2526     core_optab->start = optab;
2527
2528     while (1)
2529       {
2530         ++optab;
2531         if (optab->name == NULL
2532             || strcmp (optab->name, (optab - 1)->name) != 0)
2533           {
2534             /* different name --> ship out current template list;
2535                add to hash table; & begin anew.  */
2536             core_optab->end = optab;
2537             hash_err = hash_insert (op_hash,
2538                                     (optab - 1)->name,
2539                                     (void *) core_optab);
2540             if (hash_err)
2541               {
2542                 as_fatal (_("can't hash %s: %s"),
2543                           (optab - 1)->name,
2544                           hash_err);
2545               }
2546             if (optab->name == NULL)
2547               break;
2548             core_optab = (templates *) xmalloc (sizeof (templates));
2549             core_optab->start = optab;
2550           }
2551       }
2552   }
2553
2554   /* Initialize reg_hash hash table.  */
2555   reg_hash = hash_new ();
2556   {
2557     const reg_entry *regtab;
2558     unsigned int regtab_size = i386_regtab_size;
2559
2560     for (regtab = i386_regtab; regtab_size--; regtab++)
2561       {
2562         hash_err = hash_insert (reg_hash, regtab->reg_name, (void *) regtab);
2563         if (hash_err)
2564           as_fatal (_("can't hash %s: %s"),
2565                     regtab->reg_name,
2566                     hash_err);
2567       }
2568   }
2569
2570   /* Fill in lexical tables:  mnemonic_chars, operand_chars.  */
2571   {
2572     int c;
2573     char *p;
2574
2575     for (c = 0; c < 256; c++)
2576       {
2577         if (ISDIGIT (c))
2578           {
2579             digit_chars[c] = c;
2580             mnemonic_chars[c] = c;
2581             register_chars[c] = c;
2582             operand_chars[c] = c;
2583           }
2584         else if (ISLOWER (c))
2585           {
2586             mnemonic_chars[c] = c;
2587             register_chars[c] = c;
2588             operand_chars[c] = c;
2589           }
2590         else if (ISUPPER (c))
2591           {
2592             mnemonic_chars[c] = TOLOWER (c);
2593             register_chars[c] = mnemonic_chars[c];
2594             operand_chars[c] = c;
2595           }
2596         else if (c == '{' || c == '}')
2597           operand_chars[c] = c;
2598
2599         if (ISALPHA (c) || ISDIGIT (c))
2600           identifier_chars[c] = c;
2601         else if (c >= 128)
2602           {
2603             identifier_chars[c] = c;
2604             operand_chars[c] = c;
2605           }
2606       }
2607
2608 #ifdef LEX_AT
2609     identifier_chars['@'] = '@';
2610 #endif
2611 #ifdef LEX_QM
2612     identifier_chars['?'] = '?';
2613     operand_chars['?'] = '?';
2614 #endif
2615     digit_chars['-'] = '-';
2616     mnemonic_chars['_'] = '_';
2617     mnemonic_chars['-'] = '-';
2618     mnemonic_chars['.'] = '.';
2619     identifier_chars['_'] = '_';
2620     identifier_chars['.'] = '.';
2621
2622     for (p = operand_special_chars; *p != '\0'; p++)
2623       operand_chars[(unsigned char) *p] = *p;
2624   }
2625
2626   if (flag_code == CODE_64BIT)
2627     {
2628 #if defined (OBJ_COFF) && defined (TE_PE)
2629       x86_dwarf2_return_column = (OUTPUT_FLAVOR == bfd_target_coff_flavour
2630                                   ? 32 : 16);
2631 #else
2632       x86_dwarf2_return_column = 16;
2633 #endif
2634       x86_cie_data_alignment = -8;
2635     }
2636   else
2637     {
2638       x86_dwarf2_return_column = 8;
2639       x86_cie_data_alignment = -4;
2640     }
2641 }
2642
2643 void
2644 i386_print_statistics (FILE *file)
2645 {
2646   hash_print_statistics (file, "i386 opcode", op_hash);
2647   hash_print_statistics (file, "i386 register", reg_hash);
2648 }
2649 \f
2650 #ifdef DEBUG386
2651
2652 /* Debugging routines for md_assemble.  */
2653 static void pte (insn_template *);
2654 static void pt (i386_operand_type);
2655 static void pe (expressionS *);
2656 static void ps (symbolS *);
2657
2658 static void
2659 pi (char *line, i386_insn *x)
2660 {
2661   unsigned int j;
2662
2663   fprintf (stdout, "%s: template ", line);
2664   pte (&x->tm);
2665   fprintf (stdout, "  address: base %s  index %s  scale %x\n",
2666            x->base_reg ? x->base_reg->reg_name : "none",
2667            x->index_reg ? x->index_reg->reg_name : "none",
2668            x->log2_scale_factor);
2669   fprintf (stdout, "  modrm:  mode %x  reg %x  reg/mem %x\n",
2670            x->rm.mode, x->rm.reg, x->rm.regmem);
2671   fprintf (stdout, "  sib:  base %x  index %x  scale %x\n",
2672            x->sib.base, x->sib.index, x->sib.scale);
2673   fprintf (stdout, "  rex: 64bit %x  extX %x  extY %x  extZ %x\n",
2674            (x->rex & REX_W) != 0,
2675            (x->rex & REX_R) != 0,
2676            (x->rex & REX_X) != 0,
2677            (x->rex & REX_B) != 0);
2678   for (j = 0; j < x->operands; j++)
2679     {
2680       fprintf (stdout, "    #%d:  ", j + 1);
2681       pt (x->types[j]);
2682       fprintf (stdout, "\n");
2683       if (x->types[j].bitfield.reg8
2684           || x->types[j].bitfield.reg16
2685           || x->types[j].bitfield.reg32
2686           || x->types[j].bitfield.reg64
2687           || x->types[j].bitfield.regmmx
2688           || x->types[j].bitfield.regxmm
2689           || x->types[j].bitfield.regymm
2690           || x->types[j].bitfield.regzmm
2691           || x->types[j].bitfield.sreg2
2692           || x->types[j].bitfield.sreg3
2693           || x->types[j].bitfield.control
2694           || x->types[j].bitfield.debug
2695           || x->types[j].bitfield.test)
2696         fprintf (stdout, "%s\n", x->op[j].regs->reg_name);
2697       if (operand_type_check (x->types[j], imm))
2698         pe (x->op[j].imms);
2699       if (operand_type_check (x->types[j], disp))
2700         pe (x->op[j].disps);
2701     }
2702 }
2703
2704 static void
2705 pte (insn_template *t)
2706 {
2707   unsigned int j;
2708   fprintf (stdout, " %d operands ", t->operands);
2709   fprintf (stdout, "opcode %x ", t->base_opcode);
2710   if (t->extension_opcode != None)
2711     fprintf (stdout, "ext %x ", t->extension_opcode);
2712   if (t->opcode_modifier.d)
2713     fprintf (stdout, "D");
2714   if (t->opcode_modifier.w)
2715     fprintf (stdout, "W");
2716   fprintf (stdout, "\n");
2717   for (j = 0; j < t->operands; j++)
2718     {
2719       fprintf (stdout, "    #%d type ", j + 1);
2720       pt (t->operand_types[j]);
2721       fprintf (stdout, "\n");
2722     }
2723 }
2724
2725 static void
2726 pe (expressionS *e)
2727 {
2728   fprintf (stdout, "    operation     %d\n", e->X_op);
2729   fprintf (stdout, "    add_number    %ld (%lx)\n",
2730            (long) e->X_add_number, (long) e->X_add_number);
2731   if (e->X_add_symbol)
2732     {
2733       fprintf (stdout, "    add_symbol    ");
2734       ps (e->X_add_symbol);
2735       fprintf (stdout, "\n");
2736     }
2737   if (e->X_op_symbol)
2738     {
2739       fprintf (stdout, "    op_symbol    ");
2740       ps (e->X_op_symbol);
2741       fprintf (stdout, "\n");
2742     }
2743 }
2744
2745 static void
2746 ps (symbolS *s)
2747 {
2748   fprintf (stdout, "%s type %s%s",
2749            S_GET_NAME (s),
2750            S_IS_EXTERNAL (s) ? "EXTERNAL " : "",
2751            segment_name (S_GET_SEGMENT (s)));
2752 }
2753
2754 static struct type_name
2755   {
2756     i386_operand_type mask;
2757     const char *name;
2758   }
2759 const type_names[] =
2760 {
2761   { OPERAND_TYPE_REG8, "r8" },
2762   { OPERAND_TYPE_REG16, "r16" },
2763   { OPERAND_TYPE_REG32, "r32" },
2764   { OPERAND_TYPE_REG64, "r64" },
2765   { OPERAND_TYPE_IMM8, "i8" },
2766   { OPERAND_TYPE_IMM8, "i8s" },
2767   { OPERAND_TYPE_IMM16, "i16" },
2768   { OPERAND_TYPE_IMM32, "i32" },
2769   { OPERAND_TYPE_IMM32S, "i32s" },
2770   { OPERAND_TYPE_IMM64, "i64" },
2771   { OPERAND_TYPE_IMM1, "i1" },
2772   { OPERAND_TYPE_BASEINDEX, "BaseIndex" },
2773   { OPERAND_TYPE_DISP8, "d8" },
2774   { OPERAND_TYPE_DISP16, "d16" },
2775   { OPERAND_TYPE_DISP32, "d32" },
2776   { OPERAND_TYPE_DISP32S, "d32s" },
2777   { OPERAND_TYPE_DISP64, "d64" },
2778   { OPERAND_TYPE_VEC_DISP8, "Vector d8" },
2779   { OPERAND_TYPE_INOUTPORTREG, "InOutPortReg" },
2780   { OPERAND_TYPE_SHIFTCOUNT, "ShiftCount" },
2781   { OPERAND_TYPE_CONTROL, "control reg" },
2782   { OPERAND_TYPE_TEST, "test reg" },
2783   { OPERAND_TYPE_DEBUG, "debug reg" },
2784   { OPERAND_TYPE_FLOATREG, "FReg" },
2785   { OPERAND_TYPE_FLOATACC, "FAcc" },
2786   { OPERAND_TYPE_SREG2, "SReg2" },
2787   { OPERAND_TYPE_SREG3, "SReg3" },
2788   { OPERAND_TYPE_ACC, "Acc" },
2789   { OPERAND_TYPE_JUMPABSOLUTE, "Jump Absolute" },
2790   { OPERAND_TYPE_REGMMX, "rMMX" },
2791   { OPERAND_TYPE_REGXMM, "rXMM" },
2792   { OPERAND_TYPE_REGYMM, "rYMM" },
2793   { OPERAND_TYPE_REGZMM, "rZMM" },
2794   { OPERAND_TYPE_REGMASK, "Mask reg" },
2795   { OPERAND_TYPE_ESSEG, "es" },
2796 };
2797
2798 static void
2799 pt (i386_operand_type t)
2800 {
2801   unsigned int j;
2802   i386_operand_type a;
2803
2804   for (j = 0; j < ARRAY_SIZE (type_names); j++)
2805     {
2806       a = operand_type_and (t, type_names[j].mask);
2807       if (!operand_type_all_zero (&a))
2808         fprintf (stdout, "%s, ",  type_names[j].name);
2809     }
2810   fflush (stdout);
2811 }
2812
2813 #endif /* DEBUG386 */
2814 \f
2815 static bfd_reloc_code_real_type
2816 reloc (unsigned int size,
2817        int pcrel,
2818        int sign,
2819        int bnd_prefix,
2820        bfd_reloc_code_real_type other)
2821 {
2822   if (other != NO_RELOC)
2823     {
2824       reloc_howto_type *rel;
2825
2826       if (size == 8)
2827         switch (other)
2828           {
2829           case BFD_RELOC_X86_64_GOT32:
2830             return BFD_RELOC_X86_64_GOT64;
2831             break;
2832           case BFD_RELOC_X86_64_PLTOFF64:
2833             return BFD_RELOC_X86_64_PLTOFF64;
2834             break;
2835           case BFD_RELOC_X86_64_GOTPC32:
2836             other = BFD_RELOC_X86_64_GOTPC64;
2837             break;
2838           case BFD_RELOC_X86_64_GOTPCREL:
2839             other = BFD_RELOC_X86_64_GOTPCREL64;
2840             break;
2841           case BFD_RELOC_X86_64_TPOFF32:
2842             other = BFD_RELOC_X86_64_TPOFF64;
2843             break;
2844           case BFD_RELOC_X86_64_DTPOFF32:
2845             other = BFD_RELOC_X86_64_DTPOFF64;
2846             break;
2847           default:
2848             break;
2849           }
2850
2851 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
2852       if (other == BFD_RELOC_SIZE32)
2853         {
2854           if (size == 8)
2855             other = BFD_RELOC_SIZE64;
2856           if (pcrel)
2857             {
2858               as_bad (_("there are no pc-relative size relocations"));
2859               return NO_RELOC;
2860             }
2861         }
2862 #endif
2863
2864       /* Sign-checking 4-byte relocations in 16-/32-bit code is pointless.  */
2865       if (size == 4 && (flag_code != CODE_64BIT || disallow_64bit_reloc))
2866         sign = -1;
2867
2868       rel = bfd_reloc_type_lookup (stdoutput, other);
2869       if (!rel)
2870         as_bad (_("unknown relocation (%u)"), other);
2871       else if (size != bfd_get_reloc_size (rel))
2872         as_bad (_("%u-byte relocation cannot be applied to %u-byte field"),
2873                 bfd_get_reloc_size (rel),
2874                 size);
2875       else if (pcrel && !rel->pc_relative)
2876         as_bad (_("non-pc-relative relocation for pc-relative field"));
2877       else if ((rel->complain_on_overflow == complain_overflow_signed
2878                 && !sign)
2879                || (rel->complain_on_overflow == complain_overflow_unsigned
2880                    && sign > 0))
2881         as_bad (_("relocated field and relocation type differ in signedness"));
2882       else
2883         return other;
2884       return NO_RELOC;
2885     }
2886
2887   if (pcrel)
2888     {
2889       if (!sign)
2890         as_bad (_("there are no unsigned pc-relative relocations"));
2891       switch (size)
2892         {
2893         case 1: return BFD_RELOC_8_PCREL;
2894         case 2: return BFD_RELOC_16_PCREL;
2895         case 4: return (bnd_prefix && object_64bit
2896                         ? BFD_RELOC_X86_64_PC32_BND
2897                         : BFD_RELOC_32_PCREL);
2898         case 8: return BFD_RELOC_64_PCREL;
2899         }
2900       as_bad (_("cannot do %u byte pc-relative relocation"), size);
2901     }
2902   else
2903     {
2904       if (sign > 0)
2905         switch (size)
2906           {
2907           case 4: return BFD_RELOC_X86_64_32S;
2908           }
2909       else
2910         switch (size)
2911           {
2912           case 1: return BFD_RELOC_8;
2913           case 2: return BFD_RELOC_16;
2914           case 4: return BFD_RELOC_32;
2915           case 8: return BFD_RELOC_64;
2916           }
2917       as_bad (_("cannot do %s %u byte relocation"),
2918               sign > 0 ? "signed" : "unsigned", size);
2919     }
2920
2921   return NO_RELOC;
2922 }
2923
2924 /* Here we decide which fixups can be adjusted to make them relative to
2925    the beginning of the section instead of the symbol.  Basically we need
2926    to make sure that the dynamic relocations are done correctly, so in
2927    some cases we force the original symbol to be used.  */
2928
2929 int
2930 tc_i386_fix_adjustable (fixS *fixP ATTRIBUTE_UNUSED)
2931 {
2932 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
2933   if (!IS_ELF)
2934     return 1;
2935
2936   /* Don't adjust pc-relative references to merge sections in 64-bit
2937      mode.  */
2938   if (use_rela_relocations
2939       && (S_GET_SEGMENT (fixP->fx_addsy)->flags & SEC_MERGE) != 0
2940       && fixP->fx_pcrel)
2941     return 0;
2942
2943   /* The x86_64 GOTPCREL are represented as 32bit PCrel relocations
2944      and changed later by validate_fix.  */
2945   if (GOT_symbol && fixP->fx_subsy == GOT_symbol
2946       && fixP->fx_r_type == BFD_RELOC_32_PCREL)
2947     return 0;
2948
2949   /* Adjust_reloc_syms doesn't know about the GOT.  Need to keep symbol
2950      for size relocations.  */
2951   if (fixP->fx_r_type == BFD_RELOC_SIZE32
2952       || fixP->fx_r_type == BFD_RELOC_SIZE64
2953       || fixP->fx_r_type == BFD_RELOC_386_GOTOFF
2954       || fixP->fx_r_type == BFD_RELOC_386_PLT32
2955       || fixP->fx_r_type == BFD_RELOC_386_GOT32
2956       || fixP->fx_r_type == BFD_RELOC_386_TLS_GD
2957       || fixP->fx_r_type == BFD_RELOC_386_TLS_LDM
2958       || fixP->fx_r_type == BFD_RELOC_386_TLS_LDO_32
2959       || fixP->fx_r_type == BFD_RELOC_386_TLS_IE_32
2960       || fixP->fx_r_type == BFD_RELOC_386_TLS_IE
2961       || fixP->fx_r_type == BFD_RELOC_386_TLS_GOTIE
2962       || fixP->fx_r_type == BFD_RELOC_386_TLS_LE_32
2963       || fixP->fx_r_type == BFD_RELOC_386_TLS_LE
2964       || fixP->fx_r_type == BFD_RELOC_386_TLS_GOTDESC
2965       || fixP->fx_r_type == BFD_RELOC_386_TLS_DESC_CALL
2966       || fixP->fx_r_type == BFD_RELOC_X86_64_PLT32
2967       || fixP->fx_r_type == BFD_RELOC_X86_64_GOT32
2968       || fixP->fx_r_type == BFD_RELOC_X86_64_GOTPCREL
2969       || fixP->fx_r_type == BFD_RELOC_X86_64_TLSGD
2970       || fixP->fx_r_type == BFD_RELOC_X86_64_TLSLD
2971       || fixP->fx_r_type == BFD_RELOC_X86_64_DTPOFF32
2972       || fixP->fx_r_type == BFD_RELOC_X86_64_DTPOFF64
2973       || fixP->fx_r_type == BFD_RELOC_X86_64_GOTTPOFF
2974       || fixP->fx_r_type == BFD_RELOC_X86_64_TPOFF32
2975       || fixP->fx_r_type == BFD_RELOC_X86_64_TPOFF64
2976       || fixP->fx_r_type == BFD_RELOC_X86_64_GOTOFF64
2977       || fixP->fx_r_type == BFD_RELOC_X86_64_GOTPC32_TLSDESC
2978       || fixP->fx_r_type == BFD_RELOC_X86_64_TLSDESC_CALL
2979       || fixP->fx_r_type == BFD_RELOC_VTABLE_INHERIT
2980       || fixP->fx_r_type == BFD_RELOC_VTABLE_ENTRY)
2981     return 0;
2982 #endif
2983   return 1;
2984 }
2985
2986 static int
2987 intel_float_operand (const char *mnemonic)
2988 {
2989   /* Note that the value returned is meaningful only for opcodes with (memory)
2990      operands, hence the code here is free to improperly handle opcodes that
2991      have no operands (for better performance and smaller code). */
2992
2993   if (mnemonic[0] != 'f')
2994     return 0; /* non-math */
2995
2996   switch (mnemonic[1])
2997     {
2998     /* fclex, fdecstp, fdisi, femms, feni, fincstp, finit, fsetpm, and
2999        the fs segment override prefix not currently handled because no
3000        call path can make opcodes without operands get here */
3001     case 'i':
3002       return 2 /* integer op */;
3003     case 'l':
3004       if (mnemonic[2] == 'd' && (mnemonic[3] == 'c' || mnemonic[3] == 'e'))
3005         return 3; /* fldcw/fldenv */
3006       break;
3007     case 'n':
3008       if (mnemonic[2] != 'o' /* fnop */)
3009         return 3; /* non-waiting control op */
3010       break;
3011     case 'r':
3012       if (mnemonic[2] == 's')
3013         return 3; /* frstor/frstpm */
3014       break;
3015     case 's':
3016       if (mnemonic[2] == 'a')
3017         return 3; /* fsave */
3018       if (mnemonic[2] == 't')
3019         {
3020           switch (mnemonic[3])
3021             {
3022             case 'c': /* fstcw */
3023             case 'd': /* fstdw */
3024             case 'e': /* fstenv */
3025             case 's': /* fsts[gw] */
3026               return 3;
3027             }
3028         }
3029       break;
3030     case 'x':
3031       if (mnemonic[2] == 'r' || mnemonic[2] == 's')
3032         return 0; /* fxsave/fxrstor are not really math ops */
3033       break;
3034     }
3035
3036   return 1;
3037 }
3038
3039 /* Build the VEX prefix.  */
3040
3041 static void
3042 build_vex_prefix (const insn_template *t)
3043 {
3044   unsigned int register_specifier;
3045   unsigned int implied_prefix;
3046   unsigned int vector_length;
3047
3048   /* Check register specifier.  */
3049   if (i.vex.register_specifier)
3050     {
3051       register_specifier =
3052         ~register_number (i.vex.register_specifier) & 0xf;
3053       gas_assert ((i.vex.register_specifier->reg_flags & RegVRex) == 0);
3054     }
3055   else
3056     register_specifier = 0xf;
3057
3058   /* Use 2-byte VEX prefix by swappping destination and source
3059      operand.  */
3060   if (!i.swap_operand
3061       && i.operands == i.reg_operands
3062       && i.tm.opcode_modifier.vexopcode == VEX0F
3063       && i.tm.opcode_modifier.s
3064       && i.rex == REX_B)
3065     {
3066       unsigned int xchg = i.operands - 1;
3067       union i386_op temp_op;
3068       i386_operand_type temp_type;
3069
3070       temp_type = i.types[xchg];
3071       i.types[xchg] = i.types[0];
3072       i.types[0] = temp_type;
3073       temp_op = i.op[xchg];
3074       i.op[xchg] = i.op[0];
3075       i.op[0] = temp_op;
3076
3077       gas_assert (i.rm.mode == 3);
3078
3079       i.rex = REX_R;
3080       xchg = i.rm.regmem;
3081       i.rm.regmem = i.rm.reg;
3082       i.rm.reg = xchg;
3083
3084       /* Use the next insn.  */
3085       i.tm = t[1];
3086     }
3087
3088   if (i.tm.opcode_modifier.vex == VEXScalar)
3089     vector_length = avxscalar;
3090   else
3091     vector_length = i.tm.opcode_modifier.vex == VEX256 ? 1 : 0;
3092
3093   switch ((i.tm.base_opcode >> 8) & 0xff)
3094     {
3095     case 0:
3096       implied_prefix = 0;
3097       break;
3098     case DATA_PREFIX_OPCODE:
3099       implied_prefix = 1;
3100       break;
3101     case REPE_PREFIX_OPCODE:
3102       implied_prefix = 2;
3103       break;
3104     case REPNE_PREFIX_OPCODE:
3105       implied_prefix = 3;
3106       break;
3107     default:
3108       abort ();
3109     }
3110
3111   /* Use 2-byte VEX prefix if possible.  */
3112   if (i.tm.opcode_modifier.vexopcode == VEX0F
3113       && i.tm.opcode_modifier.vexw != VEXW1
3114       && (i.rex & (REX_W | REX_X | REX_B)) == 0)
3115     {
3116       /* 2-byte VEX prefix.  */
3117       unsigned int r;
3118
3119       i.vex.length = 2;
3120       i.vex.bytes[0] = 0xc5;
3121
3122       /* Check the REX.R bit.  */
3123       r = (i.rex & REX_R) ? 0 : 1;
3124       i.vex.bytes[1] = (r << 7
3125                         | register_specifier << 3
3126                         | vector_length << 2
3127                         | implied_prefix);
3128     }
3129   else
3130     {
3131       /* 3-byte VEX prefix.  */
3132       unsigned int m, w;
3133
3134       i.vex.length = 3;
3135
3136       switch (i.tm.opcode_modifier.vexopcode)
3137         {
3138         case VEX0F:
3139           m = 0x1;
3140           i.vex.bytes[0] = 0xc4;
3141           break;
3142         case VEX0F38:
3143           m = 0x2;
3144           i.vex.bytes[0] = 0xc4;
3145           break;
3146         case VEX0F3A:
3147           m = 0x3;
3148           i.vex.bytes[0] = 0xc4;
3149           break;
3150         case XOP08:
3151           m = 0x8;
3152           i.vex.bytes[0] = 0x8f;
3153           break;
3154         case XOP09:
3155           m = 0x9;
3156           i.vex.bytes[0] = 0x8f;
3157           break;
3158         case XOP0A:
3159           m = 0xa;
3160           i.vex.bytes[0] = 0x8f;
3161           break;
3162         default:
3163           abort ();
3164         }
3165
3166       /* The high 3 bits of the second VEX byte are 1's compliment
3167          of RXB bits from REX.  */
3168       i.vex.bytes[1] = (~i.rex & 0x7) << 5 | m;
3169
3170       /* Check the REX.W bit.  */
3171       w = (i.rex & REX_W) ? 1 : 0;
3172       if (i.tm.opcode_modifier.vexw == VEXW1)
3173         w = 1;
3174
3175       i.vex.bytes[2] = (w << 7
3176                         | register_specifier << 3
3177                         | vector_length << 2
3178                         | implied_prefix);
3179     }
3180 }
3181
3182 /* Build the EVEX prefix.  */
3183
3184 static void
3185 build_evex_prefix (void)
3186 {
3187   unsigned int register_specifier;
3188   unsigned int implied_prefix;
3189   unsigned int m, w;
3190   rex_byte vrex_used = 0;
3191
3192   /* Check register specifier.  */
3193   if (i.vex.register_specifier)
3194     {
3195       gas_assert ((i.vrex & REX_X) == 0);
3196
3197       register_specifier = i.vex.register_specifier->reg_num;
3198       if ((i.vex.register_specifier->reg_flags & RegRex))
3199         register_specifier += 8;
3200       /* The upper 16 registers are encoded in the fourth byte of the
3201          EVEX prefix.  */
3202       if (!(i.vex.register_specifier->reg_flags & RegVRex))
3203         i.vex.bytes[3] = 0x8;
3204       register_specifier = ~register_specifier & 0xf;
3205     }
3206   else
3207     {
3208       register_specifier = 0xf;
3209
3210       /* Encode upper 16 vector index register in the fourth byte of
3211          the EVEX prefix.  */
3212       if (!(i.vrex & REX_X))
3213         i.vex.bytes[3] = 0x8;
3214       else
3215         vrex_used |= REX_X;
3216     }
3217
3218   switch ((i.tm.base_opcode >> 8) & 0xff)
3219     {
3220     case 0:
3221       implied_prefix = 0;
3222       break;
3223     case DATA_PREFIX_OPCODE:
3224       implied_prefix = 1;
3225       break;
3226     case REPE_PREFIX_OPCODE:
3227       implied_prefix = 2;
3228       break;
3229     case REPNE_PREFIX_OPCODE:
3230       implied_prefix = 3;
3231       break;
3232     default:
3233       abort ();
3234     }
3235
3236   /* 4 byte EVEX prefix.  */
3237   i.vex.length = 4;
3238   i.vex.bytes[0] = 0x62;
3239
3240   /* mmmm bits.  */
3241   switch (i.tm.opcode_modifier.vexopcode)
3242     {
3243     case VEX0F:
3244       m = 1;
3245       break;
3246     case VEX0F38:
3247       m = 2;
3248       break;
3249     case VEX0F3A:
3250       m = 3;
3251       break;
3252     default:
3253       abort ();
3254       break;
3255     }
3256
3257   /* The high 3 bits of the second EVEX byte are 1's compliment of RXB
3258      bits from REX.  */
3259   i.vex.bytes[1] = (~i.rex & 0x7) << 5 | m;
3260
3261   /* The fifth bit of the second EVEX byte is 1's compliment of the
3262      REX_R bit in VREX.  */
3263   if (!(i.vrex & REX_R))
3264     i.vex.bytes[1] |= 0x10;
3265   else
3266     vrex_used |= REX_R;
3267
3268   if ((i.reg_operands + i.imm_operands) == i.operands)
3269     {
3270       /* When all operands are registers, the REX_X bit in REX is not
3271          used.  We reuse it to encode the upper 16 registers, which is
3272          indicated by the REX_B bit in VREX.  The REX_X bit is encoded
3273          as 1's compliment.  */
3274       if ((i.vrex & REX_B))
3275         {
3276           vrex_used |= REX_B;
3277           i.vex.bytes[1] &= ~0x40;
3278         }
3279     }
3280
3281   /* EVEX instructions shouldn't need the REX prefix.  */
3282   i.vrex &= ~vrex_used;
3283   gas_assert (i.vrex == 0);
3284
3285   /* Check the REX.W bit.  */
3286   w = (i.rex & REX_W) ? 1 : 0;
3287   if (i.tm.opcode_modifier.vexw)
3288     {
3289       if (i.tm.opcode_modifier.vexw == VEXW1)
3290         w = 1;
3291     }
3292   /* If w is not set it means we are dealing with WIG instruction.  */
3293   else if (!w)
3294     {
3295       if (evexwig == evexw1)
3296         w = 1;
3297     }
3298
3299   /* Encode the U bit.  */
3300   implied_prefix |= 0x4;
3301
3302   /* The third byte of the EVEX prefix.  */
3303   i.vex.bytes[2] = (w << 7 | register_specifier << 3 | implied_prefix);
3304
3305   /* The fourth byte of the EVEX prefix.  */
3306   /* The zeroing-masking bit.  */
3307   if (i.mask && i.mask->zeroing)
3308     i.vex.bytes[3] |= 0x80;
3309
3310   /* Don't always set the broadcast bit if there is no RC.  */
3311   if (!i.rounding)
3312     {
3313       /* Encode the vector length.  */
3314       unsigned int vec_length;
3315
3316       switch (i.tm.opcode_modifier.evex)
3317         {
3318         case EVEXLIG: /* LL' is ignored */
3319           vec_length = evexlig << 5;
3320           break;
3321         case EVEX128:
3322           vec_length = 0 << 5;
3323           break;
3324         case EVEX256:
3325           vec_length = 1 << 5;
3326           break;
3327         case EVEX512:
3328           vec_length = 2 << 5;
3329           break;
3330         default:
3331           abort ();
3332           break;
3333         }
3334       i.vex.bytes[3] |= vec_length;
3335       /* Encode the broadcast bit.  */
3336       if (i.broadcast)
3337         i.vex.bytes[3] |= 0x10;
3338     }
3339   else
3340     {
3341       if (i.rounding->type != saeonly)
3342         i.vex.bytes[3] |= 0x10 | (i.rounding->type << 5);
3343       else
3344         i.vex.bytes[3] |= 0x10;
3345     }
3346
3347   if (i.mask && i.mask->mask)
3348     i.vex.bytes[3] |= i.mask->mask->reg_num;
3349 }
3350
3351 static void
3352 process_immext (void)
3353 {
3354   expressionS *exp;
3355
3356   if ((i.tm.cpu_flags.bitfield.cpusse3 || i.tm.cpu_flags.bitfield.cpusvme)
3357       && i.operands > 0)
3358     {
3359       /* MONITOR/MWAIT as well as SVME instructions have fixed operands
3360          with an opcode suffix which is coded in the same place as an
3361          8-bit immediate field would be.
3362          Here we check those operands and remove them afterwards.  */
3363       unsigned int x;
3364
3365       for (x = 0; x < i.operands; x++)
3366         if (register_number (i.op[x].regs) != x)
3367           as_bad (_("can't use register '%s%s' as operand %d in '%s'."),
3368                   register_prefix, i.op[x].regs->reg_name, x + 1,
3369                   i.tm.name);
3370
3371       i.operands = 0;
3372     }
3373
3374   /* These AMD 3DNow! and SSE2 instructions have an opcode suffix
3375      which is coded in the same place as an 8-bit immediate field
3376      would be.  Here we fake an 8-bit immediate operand from the
3377      opcode suffix stored in tm.extension_opcode.
3378
3379      AVX instructions also use this encoding, for some of
3380      3 argument instructions.  */
3381
3382   gas_assert (i.imm_operands <= 1
3383               && (i.operands <= 2
3384                   || ((i.tm.opcode_modifier.vex
3385                        || i.tm.opcode_modifier.evex)
3386                       && i.operands <= 4)));
3387
3388   exp = &im_expressions[i.imm_operands++];
3389   i.op[i.operands].imms = exp;
3390   i.types[i.operands] = imm8;
3391   i.operands++;
3392   exp->X_op = O_constant;
3393   exp->X_add_number = i.tm.extension_opcode;
3394   i.tm.extension_opcode = None;
3395 }
3396
3397
3398 static int
3399 check_hle (void)
3400 {
3401   switch (i.tm.opcode_modifier.hleprefixok)
3402     {
3403     default:
3404       abort ();
3405     case HLEPrefixNone:
3406       as_bad (_("invalid instruction `%s' after `%s'"),
3407               i.tm.name, i.hle_prefix);
3408       return 0;
3409     case HLEPrefixLock:
3410       if (i.prefix[LOCK_PREFIX])
3411         return 1;
3412       as_bad (_("missing `lock' with `%s'"), i.hle_prefix);
3413       return 0;
3414     case HLEPrefixAny:
3415       return 1;
3416     case HLEPrefixRelease:
3417       if (i.prefix[HLE_PREFIX] != XRELEASE_PREFIX_OPCODE)
3418         {
3419           as_bad (_("instruction `%s' after `xacquire' not allowed"),
3420                   i.tm.name);
3421           return 0;
3422         }
3423       if (i.mem_operands == 0
3424           || !operand_type_check (i.types[i.operands - 1], anymem))
3425         {
3426           as_bad (_("memory destination needed for instruction `%s'"
3427                     " after `xrelease'"), i.tm.name);
3428           return 0;
3429         }
3430       return 1;
3431     }
3432 }
3433
3434 /* This is the guts of the machine-dependent assembler.  LINE points to a
3435    machine dependent instruction.  This function is supposed to emit
3436    the frags/bytes it assembles to.  */
3437
3438 void
3439 md_assemble (char *line)
3440 {
3441   unsigned int j;
3442   char mnemonic[MAX_MNEM_SIZE];
3443   const insn_template *t;
3444
3445   /* Initialize globals.  */
3446   memset (&i, '\0', sizeof (i));
3447   for (j = 0; j < MAX_OPERANDS; j++)
3448     i.reloc[j] = NO_RELOC;
3449   memset (disp_expressions, '\0', sizeof (disp_expressions));
3450   memset (im_expressions, '\0', sizeof (im_expressions));
3451   save_stack_p = save_stack;
3452
3453   /* First parse an instruction mnemonic & call i386_operand for the operands.
3454      We assume that the scrubber has arranged it so that line[0] is the valid
3455      start of a (possibly prefixed) mnemonic.  */
3456
3457   line = parse_insn (line, mnemonic);
3458   if (line == NULL)
3459     return;
3460
3461   line = parse_operands (line, mnemonic);
3462   this_operand = -1;
3463   if (line == NULL)
3464     return;
3465
3466   /* Now we've parsed the mnemonic into a set of templates, and have the
3467      operands at hand.  */
3468
3469   /* All intel opcodes have reversed operands except for "bound" and
3470      "enter".  We also don't reverse intersegment "jmp" and "call"
3471      instructions with 2 immediate operands so that the immediate segment
3472      precedes the offset, as it does when in AT&T mode. */
3473   if (intel_syntax
3474       && i.operands > 1
3475       && (strcmp (mnemonic, "bound") != 0)
3476       && (strcmp (mnemonic, "invlpga") != 0)
3477       && !(operand_type_check (i.types[0], imm)
3478            && operand_type_check (i.types[1], imm)))
3479     swap_operands ();
3480
3481   /* The order of the immediates should be reversed
3482      for 2 immediates extrq and insertq instructions */
3483   if (i.imm_operands == 2
3484       && (strcmp (mnemonic, "extrq") == 0
3485           || strcmp (mnemonic, "insertq") == 0))
3486       swap_2_operands (0, 1);
3487
3488   if (i.imm_operands)
3489     optimize_imm ();
3490
3491   /* Don't optimize displacement for movabs since it only takes 64bit
3492      displacement.  */
3493   if (i.disp_operands
3494       && i.disp_encoding != disp_encoding_32bit
3495       && (flag_code != CODE_64BIT
3496           || strcmp (mnemonic, "movabs") != 0))
3497     optimize_disp ();
3498
3499   /* Next, we find a template that matches the given insn,
3500      making sure the overlap of the given operands types is consistent
3501      with the template operand types.  */
3502
3503   if (!(t = match_template ()))
3504     return;
3505
3506   if (sse_check != check_none
3507       && !i.tm.opcode_modifier.noavx
3508       && (i.tm.cpu_flags.bitfield.cpusse
3509           || i.tm.cpu_flags.bitfield.cpusse2
3510           || i.tm.cpu_flags.bitfield.cpusse3
3511           || i.tm.cpu_flags.bitfield.cpussse3
3512           || i.tm.cpu_flags.bitfield.cpusse4_1
3513           || i.tm.cpu_flags.bitfield.cpusse4_2))
3514     {
3515       (sse_check == check_warning
3516        ? as_warn
3517        : as_bad) (_("SSE instruction `%s' is used"), i.tm.name);
3518     }
3519
3520   /* Zap movzx and movsx suffix.  The suffix has been set from
3521      "word ptr" or "byte ptr" on the source operand in Intel syntax
3522      or extracted from mnemonic in AT&T syntax.  But we'll use
3523      the destination register to choose the suffix for encoding.  */
3524   if ((i.tm.base_opcode & ~9) == 0x0fb6)
3525     {
3526       /* In Intel syntax, there must be a suffix.  In AT&T syntax, if
3527          there is no suffix, the default will be byte extension.  */
3528       if (i.reg_operands != 2
3529           && !i.suffix
3530           && intel_syntax)
3531         as_bad (_("ambiguous operand size for `%s'"), i.tm.name);
3532
3533       i.suffix = 0;
3534     }
3535
3536   if (i.tm.opcode_modifier.fwait)
3537     if (!add_prefix (FWAIT_OPCODE))
3538       return;
3539
3540   /* Check if REP prefix is OK.  */
3541   if (i.rep_prefix && !i.tm.opcode_modifier.repprefixok)
3542     {
3543       as_bad (_("invalid instruction `%s' after `%s'"),
3544                 i.tm.name, i.rep_prefix);
3545       return;
3546     }
3547
3548   /* Check for lock without a lockable instruction.  Destination operand
3549      must be memory unless it is xchg (0x86).  */
3550   if (i.prefix[LOCK_PREFIX]
3551       && (!i.tm.opcode_modifier.islockable
3552           || i.mem_operands == 0
3553           || (i.tm.base_opcode != 0x86
3554               && !operand_type_check (i.types[i.operands - 1], anymem))))
3555     {
3556       as_bad (_("expecting lockable instruction after `lock'"));
3557       return;
3558     }
3559
3560   /* Check if HLE prefix is OK.  */
3561   if (i.hle_prefix && !check_hle ())
3562     return;
3563
3564   /* Check BND prefix.  */
3565   if (i.bnd_prefix && !i.tm.opcode_modifier.bndprefixok)
3566     as_bad (_("expecting valid branch instruction after `bnd'"));
3567
3568   if (i.tm.cpu_flags.bitfield.cpumpx
3569       && flag_code == CODE_64BIT
3570       && i.prefix[ADDR_PREFIX])
3571     as_bad (_("32-bit address isn't allowed in 64-bit MPX instructions."));
3572
3573   /* Insert BND prefix.  */
3574   if (add_bnd_prefix
3575       && i.tm.opcode_modifier.bndprefixok
3576       && !i.prefix[BND_PREFIX])
3577     add_prefix (BND_PREFIX_OPCODE);
3578
3579   /* Check string instruction segment overrides.  */
3580   if (i.tm.opcode_modifier.isstring && i.mem_operands != 0)
3581     {
3582       if (!check_string ())
3583         return;
3584       i.disp_operands = 0;
3585     }
3586
3587   if (!process_suffix ())
3588     return;
3589
3590   /* Update operand types.  */
3591   for (j = 0; j < i.operands; j++)
3592     i.types[j] = operand_type_and (i.types[j], i.tm.operand_types[j]);
3593
3594   /* Make still unresolved immediate matches conform to size of immediate
3595      given in i.suffix.  */
3596   if (!finalize_imm ())
3597     return;
3598
3599   if (i.types[0].bitfield.imm1)
3600     i.imm_operands = 0; /* kludge for shift insns.  */
3601
3602   /* We only need to check those implicit registers for instructions
3603      with 3 operands or less.  */
3604   if (i.operands <= 3)
3605     for (j = 0; j < i.operands; j++)
3606       if (i.types[j].bitfield.inoutportreg
3607           || i.types[j].bitfield.shiftcount
3608           || i.types[j].bitfield.acc
3609           || i.types[j].bitfield.floatacc)
3610         i.reg_operands--;
3611
3612   /* ImmExt should be processed after SSE2AVX.  */
3613   if (!i.tm.opcode_modifier.sse2avx
3614       && i.tm.opcode_modifier.immext)
3615     process_immext ();
3616
3617   /* For insns with operands there are more diddles to do to the opcode.  */
3618   if (i.operands)
3619     {
3620       if (!process_operands ())
3621         return;
3622     }
3623   else if (!quiet_warnings && i.tm.opcode_modifier.ugh)
3624     {
3625       /* UnixWare fsub no args is alias for fsubp, fadd -> faddp, etc.  */
3626       as_warn (_("translating to `%sp'"), i.tm.name);
3627     }
3628
3629   if (i.tm.opcode_modifier.vex)
3630     build_vex_prefix (t);
3631
3632   if (i.tm.opcode_modifier.evex)
3633     build_evex_prefix ();
3634
3635   /* Handle conversion of 'int $3' --> special int3 insn.  XOP or FMA4
3636      instructions may define INT_OPCODE as well, so avoid this corner
3637      case for those instructions that use MODRM.  */
3638   if (i.tm.base_opcode == INT_OPCODE
3639       && !i.tm.opcode_modifier.modrm
3640       && i.op[0].imms->X_add_number == 3)
3641     {
3642       i.tm.base_opcode = INT3_OPCODE;
3643       i.imm_operands = 0;
3644     }
3645
3646   if ((i.tm.opcode_modifier.jump
3647        || i.tm.opcode_modifier.jumpbyte
3648        || i.tm.opcode_modifier.jumpdword)
3649       && i.op[0].disps->X_op == O_constant)
3650     {
3651       /* Convert "jmp constant" (and "call constant") to a jump (call) to
3652          the absolute address given by the constant.  Since ix86 jumps and
3653          calls are pc relative, we need to generate a reloc.  */
3654       i.op[0].disps->X_add_symbol = &abs_symbol;
3655       i.op[0].disps->X_op = O_symbol;
3656     }
3657
3658   if (i.tm.opcode_modifier.rex64)
3659     i.rex |= REX_W;
3660
3661   /* For 8 bit registers we need an empty rex prefix.  Also if the
3662      instruction already has a prefix, we need to convert old
3663      registers to new ones.  */
3664
3665   if ((i.types[0].bitfield.reg8
3666        && (i.op[0].regs->reg_flags & RegRex64) != 0)
3667       || (i.types[1].bitfield.reg8
3668           && (i.op[1].regs->reg_flags & RegRex64) != 0)
3669       || ((i.types[0].bitfield.reg8
3670            || i.types[1].bitfield.reg8)
3671           && i.rex != 0))
3672     {
3673       int x;
3674
3675       i.rex |= REX_OPCODE;
3676       for (x = 0; x < 2; x++)
3677         {
3678           /* Look for 8 bit operand that uses old registers.  */
3679           if (i.types[x].bitfield.reg8
3680               && (i.op[x].regs->reg_flags & RegRex64) == 0)
3681             {
3682               /* In case it is "hi" register, give up.  */
3683               if (i.op[x].regs->reg_num > 3)
3684                 as_bad (_("can't encode register '%s%s' in an "
3685                           "instruction requiring REX prefix."),
3686                         register_prefix, i.op[x].regs->reg_name);
3687
3688               /* Otherwise it is equivalent to the extended register.
3689                  Since the encoding doesn't change this is merely
3690                  cosmetic cleanup for debug output.  */
3691
3692               i.op[x].regs = i.op[x].regs + 8;
3693             }
3694         }
3695     }
3696
3697   if (i.rex != 0)
3698     add_prefix (REX_OPCODE | i.rex);
3699
3700   /* We are ready to output the insn.  */
3701   output_insn ();
3702 }
3703
3704 static char *
3705 parse_insn (char *line, char *mnemonic)
3706 {
3707   char *l = line;
3708   char *token_start = l;
3709   char *mnem_p;
3710   int supported;
3711   const insn_template *t;
3712   char *dot_p = NULL;
3713
3714   while (1)
3715     {
3716       mnem_p = mnemonic;
3717       while ((*mnem_p = mnemonic_chars[(unsigned char) *l]) != 0)
3718         {
3719           if (*mnem_p == '.')
3720             dot_p = mnem_p;
3721           mnem_p++;
3722           if (mnem_p >= mnemonic + MAX_MNEM_SIZE)
3723             {
3724               as_bad (_("no such instruction: `%s'"), token_start);
3725               return NULL;
3726             }
3727           l++;
3728         }
3729       if (!is_space_char (*l)
3730           && *l != END_OF_INSN
3731           && (intel_syntax
3732               || (*l != PREFIX_SEPARATOR
3733                   && *l != ',')))
3734         {
3735           as_bad (_("invalid character %s in mnemonic"),
3736                   output_invalid (*l));
3737           return NULL;
3738         }
3739       if (token_start == l)
3740         {
3741           if (!intel_syntax && *l == PREFIX_SEPARATOR)
3742             as_bad (_("expecting prefix; got nothing"));
3743           else
3744             as_bad (_("expecting mnemonic; got nothing"));
3745           return NULL;
3746         }
3747
3748       /* Look up instruction (or prefix) via hash table.  */
3749       current_templates = (const templates *) hash_find (op_hash, mnemonic);
3750
3751       if (*l != END_OF_INSN
3752           && (!is_space_char (*l) || l[1] != END_OF_INSN)
3753           && current_templates
3754           && current_templates->start->opcode_modifier.isprefix)
3755         {
3756           if (!cpu_flags_check_cpu64 (current_templates->start->cpu_flags))
3757             {
3758               as_bad ((flag_code != CODE_64BIT
3759                        ? _("`%s' is only supported in 64-bit mode")
3760                        : _("`%s' is not supported in 64-bit mode")),
3761                       current_templates->start->name);
3762               return NULL;
3763             }
3764           /* If we are in 16-bit mode, do not allow addr16 or data16.
3765              Similarly, in 32-bit mode, do not allow addr32 or data32.  */
3766           if ((current_templates->start->opcode_modifier.size16
3767                || current_templates->start->opcode_modifier.size32)
3768               && flag_code != CODE_64BIT
3769               && (current_templates->start->opcode_modifier.size32
3770                   ^ (flag_code == CODE_16BIT)))
3771             {
3772               as_bad (_("redundant %s prefix"),
3773                       current_templates->start->name);
3774               return NULL;
3775             }
3776           /* Add prefix, checking for repeated prefixes.  */
3777           switch (add_prefix (current_templates->start->base_opcode))
3778             {
3779             case PREFIX_EXIST:
3780               return NULL;
3781             case PREFIX_REP:
3782               if (current_templates->start->cpu_flags.bitfield.cpuhle)
3783                 i.hle_prefix = current_templates->start->name;
3784               else if (current_templates->start->cpu_flags.bitfield.cpumpx)
3785                 i.bnd_prefix = current_templates->start->name;
3786               else
3787                 i.rep_prefix = current_templates->start->name;
3788               break;
3789             default:
3790               break;
3791             }
3792           /* Skip past PREFIX_SEPARATOR and reset token_start.  */
3793           token_start = ++l;
3794         }
3795       else
3796         break;
3797     }
3798
3799   if (!current_templates)
3800     {
3801       /* Check if we should swap operand or force 32bit displacement in
3802          encoding.  */
3803       if (mnem_p - 2 == dot_p && dot_p[1] == 's')
3804         i.swap_operand = 1;
3805       else if (mnem_p - 3 == dot_p
3806                && dot_p[1] == 'd'
3807                && dot_p[2] == '8')
3808         i.disp_encoding = disp_encoding_8bit;
3809       else if (mnem_p - 4 == dot_p
3810                && dot_p[1] == 'd'
3811                && dot_p[2] == '3'
3812                && dot_p[3] == '2')
3813         i.disp_encoding = disp_encoding_32bit;
3814       else
3815         goto check_suffix;
3816       mnem_p = dot_p;
3817       *dot_p = '\0';
3818       current_templates = (const templates *) hash_find (op_hash, mnemonic);
3819     }
3820
3821   if (!current_templates)
3822     {
3823 check_suffix:
3824       /* See if we can get a match by trimming off a suffix.  */
3825       switch (mnem_p[-1])
3826         {
3827         case WORD_MNEM_SUFFIX:
3828           if (intel_syntax && (intel_float_operand (mnemonic) & 2))
3829             i.suffix = SHORT_MNEM_SUFFIX;
3830           else
3831         case BYTE_MNEM_SUFFIX:
3832         case QWORD_MNEM_SUFFIX:
3833           i.suffix = mnem_p[-1];
3834           mnem_p[-1] = '\0';
3835           current_templates = (const templates *) hash_find (op_hash,
3836                                                              mnemonic);
3837           break;
3838         case SHORT_MNEM_SUFFIX:
3839         case LONG_MNEM_SUFFIX:
3840           if (!intel_syntax)
3841             {
3842               i.suffix = mnem_p[-1];
3843               mnem_p[-1] = '\0';
3844               current_templates = (const templates *) hash_find (op_hash,
3845                                                                  mnemonic);
3846             }
3847           break;
3848
3849           /* Intel Syntax.  */
3850         case 'd':
3851           if (intel_syntax)
3852             {
3853               if (intel_float_operand (mnemonic) == 1)
3854                 i.suffix = SHORT_MNEM_SUFFIX;
3855               else
3856                 i.suffix = LONG_MNEM_SUFFIX;
3857               mnem_p[-1] = '\0';
3858               current_templates = (const templates *) hash_find (op_hash,
3859                                                                  mnemonic);
3860             }
3861           break;
3862         }
3863       if (!current_templates)
3864         {
3865           as_bad (_("no such instruction: `%s'"), token_start);
3866           return NULL;
3867         }
3868     }
3869
3870   if (current_templates->start->opcode_modifier.jump
3871       || current_templates->start->opcode_modifier.jumpbyte)
3872     {
3873       /* Check for a branch hint.  We allow ",pt" and ",pn" for
3874          predict taken and predict not taken respectively.
3875          I'm not sure that branch hints actually do anything on loop
3876          and jcxz insns (JumpByte) for current Pentium4 chips.  They
3877          may work in the future and it doesn't hurt to accept them
3878          now.  */
3879       if (l[0] == ',' && l[1] == 'p')
3880         {
3881           if (l[2] == 't')
3882             {
3883               if (!add_prefix (DS_PREFIX_OPCODE))
3884                 return NULL;
3885               l += 3;
3886             }
3887           else if (l[2] == 'n')
3888             {
3889               if (!add_prefix (CS_PREFIX_OPCODE))
3890                 return NULL;
3891               l += 3;
3892             }
3893         }
3894     }
3895   /* Any other comma loses.  */
3896   if (*l == ',')
3897     {
3898       as_bad (_("invalid character %s in mnemonic"),
3899               output_invalid (*l));
3900       return NULL;
3901     }
3902
3903   /* Check if instruction is supported on specified architecture.  */
3904   supported = 0;
3905   for (t = current_templates->start; t < current_templates->end; ++t)
3906     {
3907       supported |= cpu_flags_match (t);
3908       if (supported == CPU_FLAGS_PERFECT_MATCH)
3909         goto skip;
3910     }
3911
3912   if (!(supported & CPU_FLAGS_64BIT_MATCH))
3913     {
3914       as_bad (flag_code == CODE_64BIT
3915               ? _("`%s' is not supported in 64-bit mode")
3916               : _("`%s' is only supported in 64-bit mode"),
3917               current_templates->start->name);
3918       return NULL;
3919     }
3920   if (supported != CPU_FLAGS_PERFECT_MATCH)
3921     {
3922       as_bad (_("`%s' is not supported on `%s%s'"),
3923               current_templates->start->name,
3924               cpu_arch_name ? cpu_arch_name : default_arch,
3925               cpu_sub_arch_name ? cpu_sub_arch_name : "");
3926       return NULL;
3927     }
3928
3929 skip:
3930   if (!cpu_arch_flags.bitfield.cpui386
3931            && (flag_code != CODE_16BIT))
3932     {
3933       as_warn (_("use .code16 to ensure correct addressing mode"));
3934     }
3935
3936   return l;
3937 }
3938
3939 static char *
3940 parse_operands (char *l, const char *mnemonic)
3941 {
3942   char *token_start;
3943
3944   /* 1 if operand is pending after ','.  */
3945   unsigned int expecting_operand = 0;
3946
3947   /* Non-zero if operand parens not balanced.  */
3948   unsigned int paren_not_balanced;
3949
3950   while (*l != END_OF_INSN)
3951     {
3952       /* Skip optional white space before operand.  */
3953       if (is_space_char (*l))
3954         ++l;
3955       if (!is_operand_char (*l) && *l != END_OF_INSN)
3956         {
3957           as_bad (_("invalid character %s before operand %d"),
3958                   output_invalid (*l),
3959                   i.operands + 1);
3960           return NULL;
3961         }
3962       token_start = l;  /* after white space */
3963       paren_not_balanced = 0;
3964       while (paren_not_balanced || *l != ',')
3965         {
3966           if (*l == END_OF_INSN)
3967             {
3968               if (paren_not_balanced)
3969                 {
3970                   if (!intel_syntax)
3971                     as_bad (_("unbalanced parenthesis in operand %d."),
3972                             i.operands + 1);
3973                   else
3974                     as_bad (_("unbalanced brackets in operand %d."),
3975                             i.operands + 1);
3976                   return NULL;
3977                 }
3978               else
3979                 break;  /* we are done */
3980             }
3981           else if (!is_operand_char (*l) && !is_space_char (*l))
3982             {
3983               as_bad (_("invalid character %s in operand %d"),
3984                       output_invalid (*l),
3985                       i.operands + 1);
3986               return NULL;
3987             }
3988           if (!intel_syntax)
3989             {
3990               if (*l == '(')
3991                 ++paren_not_balanced;
3992               if (*l == ')')
3993                 --paren_not_balanced;
3994             }
3995           else
3996             {
3997               if (*l == '[')
3998                 ++paren_not_balanced;
3999               if (*l == ']')
4000                 --paren_not_balanced;
4001             }
4002           l++;
4003         }
4004       if (l != token_start)
4005         {                       /* Yes, we've read in another operand.  */
4006           unsigned int operand_ok;
4007           this_operand = i.operands++;
4008           i.types[this_operand].bitfield.unspecified = 1;
4009           if (i.operands > MAX_OPERANDS)
4010             {
4011               as_bad (_("spurious operands; (%d operands/instruction max)"),
4012                       MAX_OPERANDS);
4013               return NULL;
4014             }
4015           /* Now parse operand adding info to 'i' as we go along.  */
4016           END_STRING_AND_SAVE (l);
4017
4018           if (intel_syntax)
4019             operand_ok =
4020               i386_intel_operand (token_start,
4021                                   intel_float_operand (mnemonic));
4022           else
4023             operand_ok = i386_att_operand (token_start);
4024
4025           RESTORE_END_STRING (l);
4026           if (!operand_ok)
4027             return NULL;
4028         }
4029       else
4030         {
4031           if (expecting_operand)
4032             {
4033             expecting_operand_after_comma:
4034               as_bad (_("expecting operand after ','; got nothing"));
4035               return NULL;
4036             }
4037           if (*l == ',')
4038             {
4039               as_bad (_("expecting operand before ','; got nothing"));
4040               return NULL;
4041             }
4042         }
4043
4044       /* Now *l must be either ',' or END_OF_INSN.  */
4045       if (*l == ',')
4046         {
4047           if (*++l == END_OF_INSN)
4048             {
4049               /* Just skip it, if it's \n complain.  */
4050               goto expecting_operand_after_comma;
4051             }
4052           expecting_operand = 1;
4053         }
4054     }
4055   return l;
4056 }
4057
4058 static void
4059 swap_2_operands (int xchg1, int xchg2)
4060 {
4061   union i386_op temp_op;
4062   i386_operand_type temp_type;
4063   enum bfd_reloc_code_real temp_reloc;
4064
4065   temp_type = i.types[xchg2];
4066   i.types[xchg2] = i.types[xchg1];
4067   i.types[xchg1] = temp_type;
4068   temp_op = i.op[xchg2];
4069   i.op[xchg2] = i.op[xchg1];
4070   i.op[xchg1] = temp_op;
4071   temp_reloc = i.reloc[xchg2];
4072   i.reloc[xchg2] = i.reloc[xchg1];
4073   i.reloc[xchg1] = temp_reloc;
4074
4075   if (i.mask)
4076     {
4077       if (i.mask->operand == xchg1)
4078         i.mask->operand = xchg2;
4079       else if (i.mask->operand == xchg2)
4080         i.mask->operand = xchg1;
4081     }
4082   if (i.broadcast)
4083     {
4084       if (i.broadcast->operand == xchg1)
4085         i.broadcast->operand = xchg2;
4086       else if (i.broadcast->operand == xchg2)
4087         i.broadcast->operand = xchg1;
4088     }
4089   if (i.rounding)
4090     {
4091       if (i.rounding->operand == xchg1)
4092         i.rounding->operand = xchg2;
4093       else if (i.rounding->operand == xchg2)
4094         i.rounding->operand = xchg1;
4095     }
4096 }
4097
4098 static void
4099 swap_operands (void)
4100 {
4101   switch (i.operands)
4102     {
4103     case 5:
4104     case 4:
4105       swap_2_operands (1, i.operands - 2);
4106     case 3:
4107     case 2:
4108       swap_2_operands (0, i.operands - 1);
4109       break;
4110     default:
4111       abort ();
4112     }
4113
4114   if (i.mem_operands == 2)
4115     {
4116       const seg_entry *temp_seg;
4117       temp_seg = i.seg[0];
4118       i.seg[0] = i.seg[1];
4119       i.seg[1] = temp_seg;
4120     }
4121 }
4122
4123 /* Try to ensure constant immediates are represented in the smallest
4124    opcode possible.  */
4125 static void
4126 optimize_imm (void)
4127 {
4128   char guess_suffix = 0;
4129   int op;
4130
4131   if (i.suffix)
4132     guess_suffix = i.suffix;
4133   else if (i.reg_operands)
4134     {
4135       /* Figure out a suffix from the last register operand specified.
4136          We can't do this properly yet, ie. excluding InOutPortReg,
4137          but the following works for instructions with immediates.
4138          In any case, we can't set i.suffix yet.  */
4139       for (op = i.operands; --op >= 0;)
4140         if (i.types[op].bitfield.reg8)
4141           {
4142             guess_suffix = BYTE_MNEM_SUFFIX;
4143             break;
4144           }
4145         else if (i.types[op].bitfield.reg16)
4146           {
4147             guess_suffix = WORD_MNEM_SUFFIX;
4148             break;
4149           }
4150         else if (i.types[op].bitfield.reg32)
4151           {
4152             guess_suffix = LONG_MNEM_SUFFIX;
4153             break;
4154           }
4155         else if (i.types[op].bitfield.reg64)
4156           {
4157             guess_suffix = QWORD_MNEM_SUFFIX;
4158             break;
4159           }
4160     }
4161   else if ((flag_code == CODE_16BIT) ^ (i.prefix[DATA_PREFIX] != 0))
4162     guess_suffix = WORD_MNEM_SUFFIX;
4163
4164   for (op = i.operands; --op >= 0;)
4165     if (operand_type_check (i.types[op], imm))
4166       {
4167         switch (i.op[op].imms->X_op)
4168           {
4169           case O_constant:
4170             /* If a suffix is given, this operand may be shortened.  */
4171             switch (guess_suffix)
4172               {
4173               case LONG_MNEM_SUFFIX:
4174                 i.types[op].bitfield.imm32 = 1;
4175                 i.types[op].bitfield.imm64 = 1;
4176                 break;
4177               case WORD_MNEM_SUFFIX:
4178                 i.types[op].bitfield.imm16 = 1;
4179                 i.types[op].bitfield.imm32 = 1;
4180                 i.types[op].bitfield.imm32s = 1;
4181                 i.types[op].bitfield.imm64 = 1;
4182                 break;
4183               case BYTE_MNEM_SUFFIX:
4184                 i.types[op].bitfield.imm8 = 1;
4185                 i.types[op].bitfield.imm8s = 1;
4186                 i.types[op].bitfield.imm16 = 1;
4187                 i.types[op].bitfield.imm32 = 1;
4188                 i.types[op].bitfield.imm32s = 1;
4189                 i.types[op].bitfield.imm64 = 1;
4190                 break;
4191               }
4192
4193             /* If this operand is at most 16 bits, convert it
4194                to a signed 16 bit number before trying to see
4195                whether it will fit in an even smaller size.
4196                This allows a 16-bit operand such as $0xffe0 to
4197                be recognised as within Imm8S range.  */
4198             if ((i.types[op].bitfield.imm16)
4199                 && (i.op[op].imms->X_add_number & ~(offsetT) 0xffff) == 0)
4200               {
4201                 i.op[op].imms->X_add_number =
4202                   (((i.op[op].imms->X_add_number & 0xffff) ^ 0x8000) - 0x8000);
4203               }
4204             if ((i.types[op].bitfield.imm32)
4205                 && ((i.op[op].imms->X_add_number & ~(((offsetT) 2 << 31) - 1))
4206                     == 0))
4207               {
4208                 i.op[op].imms->X_add_number = ((i.op[op].imms->X_add_number
4209                                                 ^ ((offsetT) 1 << 31))
4210                                                - ((offsetT) 1 << 31));
4211               }
4212             i.types[op]
4213               = operand_type_or (i.types[op],
4214                                  smallest_imm_type (i.op[op].imms->X_add_number));
4215
4216             /* We must avoid matching of Imm32 templates when 64bit
4217                only immediate is available.  */
4218             if (guess_suffix == QWORD_MNEM_SUFFIX)
4219               i.types[op].bitfield.imm32 = 0;
4220             break;
4221
4222           case O_absent:
4223           case O_register:
4224             abort ();
4225
4226             /* Symbols and expressions.  */
4227           default:
4228             /* Convert symbolic operand to proper sizes for matching, but don't
4229                prevent matching a set of insns that only supports sizes other
4230                than those matching the insn suffix.  */
4231             {
4232               i386_operand_type mask, allowed;
4233               const insn_template *t;
4234
4235               operand_type_set (&mask, 0);
4236               operand_type_set (&allowed, 0);
4237
4238               for (t = current_templates->start;
4239                    t < current_templates->end;
4240                    ++t)
4241                 allowed = operand_type_or (allowed,
4242                                            t->operand_types[op]);
4243               switch (guess_suffix)
4244                 {
4245                 case QWORD_MNEM_SUFFIX:
4246                   mask.bitfield.imm64 = 1;
4247                   mask.bitfield.imm32s = 1;
4248                   break;
4249                 case LONG_MNEM_SUFFIX:
4250                   mask.bitfield.imm32 = 1;
4251                   break;
4252                 case WORD_MNEM_SUFFIX:
4253                   mask.bitfield.imm16 = 1;
4254                   break;
4255                 case BYTE_MNEM_SUFFIX:
4256                   mask.bitfield.imm8 = 1;
4257                   break;
4258                 default:
4259                   break;
4260                 }
4261               allowed = operand_type_and (mask, allowed);
4262               if (!operand_type_all_zero (&allowed))
4263                 i.types[op] = operand_type_and (i.types[op], mask);
4264             }
4265             break;
4266           }
4267       }
4268 }
4269
4270 /* Try to use the smallest displacement type too.  */
4271 static void
4272 optimize_disp (void)
4273 {
4274   int op;
4275
4276   for (op = i.operands; --op >= 0;)
4277     if (operand_type_check (i.types[op], disp))
4278       {
4279         if (i.op[op].disps->X_op == O_constant)
4280           {
4281             offsetT op_disp = i.op[op].disps->X_add_number;
4282
4283             if (i.types[op].bitfield.disp16
4284                 && (op_disp & ~(offsetT) 0xffff) == 0)
4285               {
4286                 /* If this operand is at most 16 bits, convert
4287                    to a signed 16 bit number and don't use 64bit
4288                    displacement.  */
4289                 op_disp = (((op_disp & 0xffff) ^ 0x8000) - 0x8000);
4290                 i.types[op].bitfield.disp64 = 0;
4291               }
4292             if (i.types[op].bitfield.disp32
4293                 && (op_disp & ~(((offsetT) 2 << 31) - 1)) == 0)
4294               {
4295                 /* If this operand is at most 32 bits, convert
4296                    to a signed 32 bit number and don't use 64bit
4297                    displacement.  */
4298                 op_disp &= (((offsetT) 2 << 31) - 1);
4299                 op_disp = (op_disp ^ ((offsetT) 1 << 31)) - ((addressT) 1 << 31);
4300                 i.types[op].bitfield.disp64 = 0;
4301               }
4302             if (!op_disp && i.types[op].bitfield.baseindex)
4303               {
4304                 i.types[op].bitfield.disp8 = 0;
4305                 i.types[op].bitfield.disp16 = 0;
4306                 i.types[op].bitfield.disp32 = 0;
4307                 i.types[op].bitfield.disp32s = 0;
4308                 i.types[op].bitfield.disp64 = 0;
4309                 i.op[op].disps = 0;
4310                 i.disp_operands--;
4311               }
4312             else if (flag_code == CODE_64BIT)
4313               {
4314                 if (fits_in_signed_long (op_disp))
4315                   {
4316                     i.types[op].bitfield.disp64 = 0;
4317                     i.types[op].bitfield.disp32s = 1;
4318                   }
4319                 if (i.prefix[ADDR_PREFIX]
4320                     && fits_in_unsigned_long (op_disp))
4321                   i.types[op].bitfield.disp32 = 1;
4322               }
4323             if ((i.types[op].bitfield.disp32
4324                  || i.types[op].bitfield.disp32s
4325                  || i.types[op].bitfield.disp16)
4326                 && fits_in_signed_byte (op_disp))
4327               i.types[op].bitfield.disp8 = 1;
4328           }
4329         else if (i.reloc[op] == BFD_RELOC_386_TLS_DESC_CALL
4330                  || i.reloc[op] == BFD_RELOC_X86_64_TLSDESC_CALL)
4331           {
4332             fix_new_exp (frag_now, frag_more (0) - frag_now->fr_literal, 0,
4333                          i.op[op].disps, 0, i.reloc[op]);
4334             i.types[op].bitfield.disp8 = 0;
4335             i.types[op].bitfield.disp16 = 0;
4336             i.types[op].bitfield.disp32 = 0;
4337             i.types[op].bitfield.disp32s = 0;
4338             i.types[op].bitfield.disp64 = 0;
4339           }
4340         else
4341           /* We only support 64bit displacement on constants.  */
4342           i.types[op].bitfield.disp64 = 0;
4343       }
4344 }
4345
4346 /* Check if operands are valid for the instruction.  */
4347
4348 static int
4349 check_VecOperands (const insn_template *t)
4350 {
4351   unsigned int op;
4352
4353   /* Without VSIB byte, we can't have a vector register for index.  */
4354   if (!t->opcode_modifier.vecsib
4355       && i.index_reg
4356       && (i.index_reg->reg_type.bitfield.regxmm
4357           || i.index_reg->reg_type.bitfield.regymm
4358           || i.index_reg->reg_type.bitfield.regzmm))
4359     {
4360       i.error = unsupported_vector_index_register;
4361       return 1;
4362     }
4363
4364   /* Check if default mask is allowed.  */
4365   if (t->opcode_modifier.nodefmask
4366       && (!i.mask || i.mask->mask->reg_num == 0))
4367     {
4368       i.error = no_default_mask;
4369       return 1;
4370     }
4371
4372   /* For VSIB byte, we need a vector register for index, and all vector
4373      registers must be distinct.  */
4374   if (t->opcode_modifier.vecsib)
4375     {
4376       if (!i.index_reg
4377           || !((t->opcode_modifier.vecsib == VecSIB128
4378                 && i.index_reg->reg_type.bitfield.regxmm)
4379                || (t->opcode_modifier.vecsib == VecSIB256
4380                    && i.index_reg->reg_type.bitfield.regymm)
4381                || (t->opcode_modifier.vecsib == VecSIB512
4382                    && i.index_reg->reg_type.bitfield.regzmm)))
4383       {
4384         i.error = invalid_vsib_address;
4385         return 1;
4386       }
4387
4388       gas_assert (i.reg_operands == 2 || i.mask);
4389       if (i.reg_operands == 2 && !i.mask)
4390         {
4391           gas_assert (i.types[0].bitfield.regxmm
4392                       || i.types[0].bitfield.regymm);
4393           gas_assert (i.types[2].bitfield.regxmm
4394                       || i.types[2].bitfield.regymm);
4395           if (operand_check == check_none)
4396             return 0;
4397           if (register_number (i.op[0].regs)
4398               != register_number (i.index_reg)
4399               && register_number (i.op[2].regs)
4400                  != register_number (i.index_reg)
4401               && register_number (i.op[0].regs)
4402                  != register_number (i.op[2].regs))
4403             return 0;
4404           if (operand_check == check_error)
4405             {
4406               i.error = invalid_vector_register_set;
4407               return 1;
4408             }
4409           as_warn (_("mask, index, and destination registers should be distinct"));
4410         }
4411       else if (i.reg_operands == 1 && i.mask)
4412         {
4413           if ((i.types[1].bitfield.regymm
4414                || i.types[1].bitfield.regzmm)
4415               && (register_number (i.op[1].regs)
4416                   == register_number (i.index_reg)))
4417             {
4418               if (operand_check == check_error)
4419                 {
4420                   i.error = invalid_vector_register_set;
4421                   return 1;
4422                 }
4423               if (operand_check != check_none)
4424                 as_warn (_("index and destination registers should be distinct"));
4425             }
4426         }
4427     }
4428
4429   /* Check if broadcast is supported by the instruction and is applied
4430      to the memory operand.  */
4431   if (i.broadcast)
4432     {
4433       int broadcasted_opnd_size;
4434
4435       /* Check if specified broadcast is supported in this instruction,
4436          and it's applied to memory operand of DWORD or QWORD type,
4437          depending on VecESize.  */
4438       if (i.broadcast->type != t->opcode_modifier.broadcast
4439           || !i.types[i.broadcast->operand].bitfield.mem
4440           || (t->opcode_modifier.vecesize == 0
4441               && !i.types[i.broadcast->operand].bitfield.dword
4442               && !i.types[i.broadcast->operand].bitfield.unspecified)
4443           || (t->opcode_modifier.vecesize == 1
4444               && !i.types[i.broadcast->operand].bitfield.qword
4445               && !i.types[i.broadcast->operand].bitfield.unspecified))
4446         goto bad_broadcast;
4447
4448       broadcasted_opnd_size = t->opcode_modifier.vecesize ? 64 : 32;
4449       if (i.broadcast->type == BROADCAST_1TO16)
4450         broadcasted_opnd_size <<= 4; /* Broadcast 1to16.  */
4451       else if (i.broadcast->type == BROADCAST_1TO8)
4452         broadcasted_opnd_size <<= 3; /* Broadcast 1to8.  */
4453       else if (i.broadcast->type == BROADCAST_1TO4)
4454         broadcasted_opnd_size <<= 2; /* Broadcast 1to4.  */
4455       else if (i.broadcast->type == BROADCAST_1TO2)
4456         broadcasted_opnd_size <<= 1; /* Broadcast 1to2.  */
4457       else
4458         goto bad_broadcast;
4459
4460       if ((broadcasted_opnd_size == 256
4461            && !t->operand_types[i.broadcast->operand].bitfield.ymmword)
4462           || (broadcasted_opnd_size == 512
4463               && !t->operand_types[i.broadcast->operand].bitfield.zmmword))
4464         {
4465         bad_broadcast:
4466           i.error = unsupported_broadcast;
4467           return 1;
4468         }
4469     }
4470   /* If broadcast is supported in this instruction, we need to check if
4471      operand of one-element size isn't specified without broadcast.  */
4472   else if (t->opcode_modifier.broadcast && i.mem_operands)
4473     {
4474       /* Find memory operand.  */
4475       for (op = 0; op < i.operands; op++)
4476         if (operand_type_check (i.types[op], anymem))
4477           break;
4478       gas_assert (op < i.operands);
4479       /* Check size of the memory operand.  */
4480       if ((t->opcode_modifier.vecesize == 0
4481            && i.types[op].bitfield.dword)
4482           || (t->opcode_modifier.vecesize == 1
4483               && i.types[op].bitfield.qword))
4484         {
4485           i.error = broadcast_needed;
4486           return 1;
4487         }
4488     }
4489
4490   /* Check if requested masking is supported.  */
4491   if (i.mask
4492       && (!t->opcode_modifier.masking
4493           || (i.mask->zeroing
4494               && t->opcode_modifier.masking == MERGING_MASKING)))
4495     {
4496       i.error = unsupported_masking;
4497       return 1;
4498     }
4499
4500   /* Check if masking is applied to dest operand.  */
4501   if (i.mask && (i.mask->operand != (int) (i.operands - 1)))
4502     {
4503       i.error = mask_not_on_destination;
4504       return 1;
4505     }
4506
4507   /* Check RC/SAE.  */
4508   if (i.rounding)
4509     {
4510       if ((i.rounding->type != saeonly
4511            && !t->opcode_modifier.staticrounding)
4512           || (i.rounding->type == saeonly
4513               && (t->opcode_modifier.staticrounding
4514                   || !t->opcode_modifier.sae)))
4515         {
4516           i.error = unsupported_rc_sae;
4517           return 1;
4518         }
4519       /* If the instruction has several immediate operands and one of
4520          them is rounding, the rounding operand should be the last
4521          immediate operand.  */
4522       if (i.imm_operands > 1
4523           && i.rounding->operand != (int) (i.imm_operands - 1))
4524         {
4525           i.error = rc_sae_operand_not_last_imm;
4526           return 1;
4527         }
4528     }
4529
4530   /* Check vector Disp8 operand.  */
4531   if (t->opcode_modifier.disp8memshift)
4532     {
4533       if (i.broadcast)
4534         i.memshift = t->opcode_modifier.vecesize ? 3 : 2;
4535       else
4536         i.memshift = t->opcode_modifier.disp8memshift;
4537
4538       for (op = 0; op < i.operands; op++)
4539         if (operand_type_check (i.types[op], disp)
4540             && i.op[op].disps->X_op == O_constant)
4541           {
4542             offsetT value = i.op[op].disps->X_add_number;
4543             int vec_disp8_ok = fits_in_vec_disp8 (value);
4544             if (t->operand_types [op].bitfield.vec_disp8)
4545               {
4546                 if (vec_disp8_ok)
4547                   i.types[op].bitfield.vec_disp8 = 1;
4548                 else
4549                   {
4550                     /* Vector insn can only have Vec_Disp8/Disp32 in
4551                        32/64bit modes, and Vec_Disp8/Disp16 in 16bit
4552                        mode.  */
4553                     i.types[op].bitfield.disp8 = 0;
4554                     if (flag_code != CODE_16BIT)
4555                       i.types[op].bitfield.disp16 = 0;
4556                   }
4557               }
4558             else if (flag_code != CODE_16BIT)
4559               {
4560                 /* One form of this instruction supports vector Disp8.
4561                    Try vector Disp8 if we need to use Disp32.  */
4562                 if (vec_disp8_ok && !fits_in_signed_byte (value))
4563                   {
4564                     i.error = try_vector_disp8;
4565                     return 1;
4566                   }
4567               }
4568           }
4569     }
4570   else
4571     i.memshift = -1;
4572
4573   return 0;
4574 }
4575
4576 /* Check if operands are valid for the instruction.  Update VEX
4577    operand types.  */
4578
4579 static int
4580 VEX_check_operands (const insn_template *t)
4581 {
4582   /* VREX is only valid with EVEX prefix.  */
4583   if (i.need_vrex && !t->opcode_modifier.evex)
4584     {
4585       i.error = invalid_register_operand;
4586       return 1;
4587     }
4588
4589   if (!t->opcode_modifier.vex)
4590     return 0;
4591
4592   /* Only check VEX_Imm4, which must be the first operand.  */
4593   if (t->operand_types[0].bitfield.vec_imm4)
4594     {
4595       if (i.op[0].imms->X_op != O_constant
4596           || !fits_in_imm4 (i.op[0].imms->X_add_number))
4597         {
4598           i.error = bad_imm4;
4599           return 1;
4600         }
4601
4602       /* Turn off Imm8 so that update_imm won't complain.  */
4603       i.types[0] = vec_imm4;
4604     }
4605
4606   return 0;
4607 }
4608
4609 static const insn_template *
4610 match_template (void)
4611 {
4612   /* Points to template once we've found it.  */
4613   const insn_template *t;
4614   i386_operand_type overlap0, overlap1, overlap2, overlap3;
4615   i386_operand_type overlap4;
4616   unsigned int found_reverse_match;
4617   i386_opcode_modifier suffix_check;
4618   i386_operand_type operand_types [MAX_OPERANDS];
4619   int addr_prefix_disp;
4620   unsigned int j;
4621   unsigned int found_cpu_match;
4622   unsigned int check_register;
4623   enum i386_error specific_error = 0;
4624
4625 #if MAX_OPERANDS != 5
4626 # error "MAX_OPERANDS must be 5."
4627 #endif
4628
4629   found_reverse_match = 0;
4630   addr_prefix_disp = -1;
4631
4632   memset (&suffix_check, 0, sizeof (suffix_check));
4633   if (i.suffix == BYTE_MNEM_SUFFIX)
4634     suffix_check.no_bsuf = 1;
4635   else if (i.suffix == WORD_MNEM_SUFFIX)
4636     suffix_check.no_wsuf = 1;
4637   else if (i.suffix == SHORT_MNEM_SUFFIX)
4638     suffix_check.no_ssuf = 1;
4639   else if (i.suffix == LONG_MNEM_SUFFIX)
4640     suffix_check.no_lsuf = 1;
4641   else if (i.suffix == QWORD_MNEM_SUFFIX)
4642     suffix_check.no_qsuf = 1;
4643   else if (i.suffix == LONG_DOUBLE_MNEM_SUFFIX)
4644     suffix_check.no_ldsuf = 1;
4645
4646   /* Must have right number of operands.  */
4647   i.error = number_of_operands_mismatch;
4648
4649   for (t = current_templates->start; t < current_templates->end; t++)
4650     {
4651       addr_prefix_disp = -1;
4652
4653       if (i.operands != t->operands)
4654         continue;
4655
4656       /* Check processor support.  */
4657       i.error = unsupported;
4658       found_cpu_match = (cpu_flags_match (t)
4659                          == CPU_FLAGS_PERFECT_MATCH);
4660       if (!found_cpu_match)
4661         continue;
4662
4663       /* Check old gcc support. */
4664       i.error = old_gcc_only;
4665       if (!old_gcc && t->opcode_modifier.oldgcc)
4666         continue;
4667
4668       /* Check AT&T mnemonic.   */
4669       i.error = unsupported_with_intel_mnemonic;
4670       if (intel_mnemonic && t->opcode_modifier.attmnemonic)
4671         continue;
4672
4673       /* Check AT&T/Intel syntax.   */
4674       i.error = unsupported_syntax;
4675       if ((intel_syntax && t->opcode_modifier.attsyntax)
4676           || (!intel_syntax && t->opcode_modifier.intelsyntax))
4677         continue;
4678
4679       /* Check the suffix, except for some instructions in intel mode.  */
4680       i.error = invalid_instruction_suffix;
4681       if ((!intel_syntax || !t->opcode_modifier.ignoresize)
4682           && ((t->opcode_modifier.no_bsuf && suffix_check.no_bsuf)
4683               || (t->opcode_modifier.no_wsuf && suffix_check.no_wsuf)
4684               || (t->opcode_modifier.no_lsuf && suffix_check.no_lsuf)
4685               || (t->opcode_modifier.no_ssuf && suffix_check.no_ssuf)
4686               || (t->opcode_modifier.no_qsuf && suffix_check.no_qsuf)
4687               || (t->opcode_modifier.no_ldsuf && suffix_check.no_ldsuf)))
4688         continue;
4689
4690       if (!operand_size_match (t))
4691         continue;
4692
4693       for (j = 0; j < MAX_OPERANDS; j++)
4694         operand_types[j] = t->operand_types[j];
4695
4696       /* In general, don't allow 64-bit operands in 32-bit mode.  */
4697       if (i.suffix == QWORD_MNEM_SUFFIX
4698           && flag_code != CODE_64BIT
4699           && (intel_syntax
4700               ? (!t->opcode_modifier.ignoresize
4701                  && !intel_float_operand (t->name))
4702               : intel_float_operand (t->name) != 2)
4703           && ((!operand_types[0].bitfield.regmmx
4704                && !operand_types[0].bitfield.regxmm
4705                && !operand_types[0].bitfield.regymm
4706                && !operand_types[0].bitfield.regzmm)
4707               || (!operand_types[t->operands > 1].bitfield.regmmx
4708                   && !!operand_types[t->operands > 1].bitfield.regxmm
4709                   && !!operand_types[t->operands > 1].bitfield.regymm
4710                   && !!operand_types[t->operands > 1].bitfield.regzmm))
4711           && (t->base_opcode != 0x0fc7
4712               || t->extension_opcode != 1 /* cmpxchg8b */))
4713         continue;
4714
4715       /* In general, don't allow 32-bit operands on pre-386.  */
4716       else if (i.suffix == LONG_MNEM_SUFFIX
4717                && !cpu_arch_flags.bitfield.cpui386
4718                && (intel_syntax
4719                    ? (!t->opcode_modifier.ignoresize
4720                       && !intel_float_operand (t->name))
4721                    : intel_float_operand (t->name) != 2)
4722                && ((!operand_types[0].bitfield.regmmx
4723                     && !operand_types[0].bitfield.regxmm)
4724                    || (!operand_types[t->operands > 1].bitfield.regmmx
4725                        && !!operand_types[t->operands > 1].bitfield.regxmm)))
4726         continue;
4727
4728       /* Do not verify operands when there are none.  */
4729       else
4730         {
4731           if (!t->operands)
4732             /* We've found a match; break out of loop.  */
4733             break;
4734         }
4735
4736       /* Address size prefix will turn Disp64/Disp32/Disp16 operand
4737          into Disp32/Disp16/Disp32 operand.  */
4738       if (i.prefix[ADDR_PREFIX] != 0)
4739           {
4740             /* There should be only one Disp operand.  */
4741             switch (flag_code)
4742             {
4743             case CODE_16BIT:
4744               for (j = 0; j < MAX_OPERANDS; j++)
4745                 {
4746                   if (operand_types[j].bitfield.disp16)
4747                     {
4748                       addr_prefix_disp = j;
4749                       operand_types[j].bitfield.disp32 = 1;
4750                       operand_types[j].bitfield.disp16 = 0;
4751                       break;
4752                     }
4753                 }
4754               break;
4755             case CODE_32BIT:
4756               for (j = 0; j < MAX_OPERANDS; j++)
4757                 {
4758                   if (operand_types[j].bitfield.disp32)
4759                     {
4760                       addr_prefix_disp = j;
4761                       operand_types[j].bitfield.disp32 = 0;
4762                       operand_types[j].bitfield.disp16 = 1;
4763                       break;
4764                     }
4765                 }
4766               break;
4767             case CODE_64BIT:
4768               for (j = 0; j < MAX_OPERANDS; j++)
4769                 {
4770                   if (operand_types[j].bitfield.disp64)
4771                     {
4772                       addr_prefix_disp = j;
4773                       operand_types[j].bitfield.disp64 = 0;
4774                       operand_types[j].bitfield.disp32 = 1;
4775                       break;
4776                     }
4777                 }
4778               break;
4779             }
4780           }
4781
4782       /* We check register size if needed.  */
4783       check_register = t->opcode_modifier.checkregsize;
4784       overlap0 = operand_type_and (i.types[0], operand_types[0]);
4785       switch (t->operands)
4786         {
4787         case 1:
4788           if (!operand_type_match (overlap0, i.types[0]))
4789             continue;
4790           break;
4791         case 2:
4792           /* xchg %eax, %eax is a special case. It is an aliase for nop
4793              only in 32bit mode and we can use opcode 0x90.  In 64bit
4794              mode, we can't use 0x90 for xchg %eax, %eax since it should
4795              zero-extend %eax to %rax.  */
4796           if (flag_code == CODE_64BIT
4797               && t->base_opcode == 0x90
4798               && operand_type_equal (&i.types [0], &acc32)
4799               && operand_type_equal (&i.types [1], &acc32))
4800             continue;
4801           if (i.swap_operand)
4802             {
4803               /* If we swap operand in encoding, we either match
4804                  the next one or reverse direction of operands.  */
4805               if (t->opcode_modifier.s)
4806                 continue;
4807               else if (t->opcode_modifier.d)
4808                 goto check_reverse;
4809             }
4810
4811         case 3:
4812           /* If we swap operand in encoding, we match the next one.  */
4813           if (i.swap_operand && t->opcode_modifier.s)
4814             continue;
4815         case 4:
4816         case 5:
4817           overlap1 = operand_type_and (i.types[1], operand_types[1]);
4818           if (!operand_type_match (overlap0, i.types[0])
4819               || !operand_type_match (overlap1, i.types[1])
4820               || (check_register
4821                   && !operand_type_register_match (overlap0, i.types[0],
4822                                                    operand_types[0],
4823                                                    overlap1, i.types[1],
4824                                                    operand_types[1])))
4825             {
4826               /* Check if other direction is valid ...  */
4827               if (!t->opcode_modifier.d && !t->opcode_modifier.floatd)
4828                 continue;
4829
4830 check_reverse:
4831               /* Try reversing direction of operands.  */
4832               overlap0 = operand_type_and (i.types[0], operand_types[1]);
4833               overlap1 = operand_type_and (i.types[1], operand_types[0]);
4834               if (!operand_type_match (overlap0, i.types[0])
4835                   || !operand_type_match (overlap1, i.types[1])
4836                   || (check_register
4837                       && !operand_type_register_match (overlap0,
4838                                                        i.types[0],
4839                                                        operand_types[1],
4840                                                        overlap1,
4841                                                        i.types[1],
4842                                                        operand_types[0])))
4843                 {
4844                   /* Does not match either direction.  */
4845                   continue;
4846                 }
4847               /* found_reverse_match holds which of D or FloatDR
4848                  we've found.  */
4849               if (t->opcode_modifier.d)
4850                 found_reverse_match = Opcode_D;
4851               else if (t->opcode_modifier.floatd)
4852                 found_reverse_match = Opcode_FloatD;
4853               else
4854                 found_reverse_match = 0;
4855               if (t->opcode_modifier.floatr)
4856                 found_reverse_match |= Opcode_FloatR;
4857             }
4858           else
4859             {
4860               /* Found a forward 2 operand match here.  */
4861               switch (t->operands)
4862                 {
4863                 case 5:
4864                   overlap4 = operand_type_and (i.types[4],
4865                                                operand_types[4]);
4866                 case 4:
4867                   overlap3 = operand_type_and (i.types[3],
4868                                                operand_types[3]);
4869                 case 3:
4870                   overlap2 = operand_type_and (i.types[2],
4871                                                operand_types[2]);
4872                   break;
4873                 }
4874
4875               switch (t->operands)
4876                 {
4877                 case 5:
4878                   if (!operand_type_match (overlap4, i.types[4])
4879                       || !operand_type_register_match (overlap3,
4880                                                        i.types[3],
4881                                                        operand_types[3],
4882                                                        overlap4,
4883                                                        i.types[4],
4884                                                        operand_types[4]))
4885                     continue;
4886                 case 4:
4887                   if (!operand_type_match (overlap3, i.types[3])
4888                       || (check_register
4889                           && !operand_type_register_match (overlap2,
4890                                                            i.types[2],
4891                                                            operand_types[2],
4892                                                            overlap3,
4893                                                            i.types[3],
4894                                                            operand_types[3])))
4895                     continue;
4896                 case 3:
4897                   /* Here we make use of the fact that there are no
4898                      reverse match 3 operand instructions, and all 3
4899                      operand instructions only need to be checked for
4900                      register consistency between operands 2 and 3.  */
4901                   if (!operand_type_match (overlap2, i.types[2])
4902                       || (check_register
4903                           && !operand_type_register_match (overlap1,
4904                                                            i.types[1],
4905                                                            operand_types[1],
4906                                                            overlap2,
4907                                                            i.types[2],
4908                                                            operand_types[2])))
4909                     continue;
4910                   break;
4911                 }
4912             }
4913           /* Found either forward/reverse 2, 3 or 4 operand match here:
4914              slip through to break.  */
4915         }
4916       if (!found_cpu_match)
4917         {
4918           found_reverse_match = 0;
4919           continue;
4920         }
4921
4922       /* Check if vector and VEX operands are valid.  */
4923       if (check_VecOperands (t) || VEX_check_operands (t))
4924         {
4925           specific_error = i.error;
4926           continue;
4927         }
4928
4929       /* We've found a match; break out of loop.  */
4930       break;
4931     }
4932
4933   if (t == current_templates->end)
4934     {
4935       /* We found no match.  */
4936       const char *err_msg;
4937       switch (specific_error ? specific_error : i.error)
4938         {
4939         default:
4940           abort ();
4941         case operand_size_mismatch:
4942           err_msg = _("operand size mismatch");
4943           break;
4944         case operand_type_mismatch:
4945           err_msg = _("operand type mismatch");
4946           break;
4947         case register_type_mismatch:
4948           err_msg = _("register type mismatch");
4949           break;
4950         case number_of_operands_mismatch:
4951           err_msg = _("number of operands mismatch");
4952           break;
4953         case invalid_instruction_suffix:
4954           err_msg = _("invalid instruction suffix");
4955           break;
4956         case bad_imm4:
4957           err_msg = _("constant doesn't fit in 4 bits");
4958           break;
4959         case old_gcc_only:
4960           err_msg = _("only supported with old gcc");
4961           break;
4962         case unsupported_with_intel_mnemonic:
4963           err_msg = _("unsupported with Intel mnemonic");
4964           break;
4965         case unsupported_syntax:
4966           err_msg = _("unsupported syntax");
4967           break;
4968         case unsupported:
4969           as_bad (_("unsupported instruction `%s'"),
4970                   current_templates->start->name);
4971           return NULL;
4972         case invalid_vsib_address:
4973           err_msg = _("invalid VSIB address");
4974           break;
4975         case invalid_vector_register_set:
4976           err_msg = _("mask, index, and destination registers must be distinct");
4977           break;
4978         case unsupported_vector_index_register:
4979           err_msg = _("unsupported vector index register");
4980           break;
4981         case unsupported_broadcast:
4982           err_msg = _("unsupported broadcast");
4983           break;
4984         case broadcast_not_on_src_operand:
4985           err_msg = _("broadcast not on source memory operand");
4986           break;
4987         case broadcast_needed:
4988           err_msg = _("broadcast is needed for operand of such type");
4989           break;
4990         case unsupported_masking:
4991           err_msg = _("unsupported masking");
4992           break;
4993         case mask_not_on_destination:
4994           err_msg = _("mask not on destination operand");
4995           break;
4996         case no_default_mask:
4997           err_msg = _("default mask isn't allowed");
4998           break;
4999         case unsupported_rc_sae:
5000           err_msg = _("unsupported static rounding/sae");
5001           break;
5002         case rc_sae_operand_not_last_imm:
5003           if (intel_syntax)
5004             err_msg = _("RC/SAE operand must precede immediate operands");
5005           else
5006             err_msg = _("RC/SAE operand must follow immediate operands");
5007           break;
5008         case invalid_register_operand:
5009           err_msg = _("invalid register operand");
5010           break;
5011         }
5012       as_bad (_("%s for `%s'"), err_msg,
5013               current_templates->start->name);
5014       return NULL;
5015     }
5016
5017   if (!quiet_warnings)
5018     {
5019       if (!intel_syntax
5020           && (i.types[0].bitfield.jumpabsolute
5021               != operand_types[0].bitfield.jumpabsolute))
5022         {
5023           as_warn (_("indirect %s without `*'"), t->name);
5024         }
5025
5026       if (t->opcode_modifier.isprefix
5027           && t->opcode_modifier.ignoresize)
5028         {
5029           /* Warn them that a data or address size prefix doesn't
5030              affect assembly of the next line of code.  */
5031           as_warn (_("stand-alone `%s' prefix"), t->name);
5032         }
5033     }
5034
5035   /* Copy the template we found.  */
5036   i.tm = *t;
5037
5038   if (addr_prefix_disp != -1)
5039     i.tm.operand_types[addr_prefix_disp]
5040       = operand_types[addr_prefix_disp];
5041
5042   if (found_reverse_match)
5043     {
5044       /* If we found a reverse match we must alter the opcode
5045          direction bit.  found_reverse_match holds bits to change
5046          (different for int & float insns).  */
5047
5048       i.tm.base_opcode ^= found_reverse_match;
5049
5050       i.tm.operand_types[0] = operand_types[1];
5051       i.tm.operand_types[1] = operand_types[0];
5052     }
5053
5054   return t;
5055 }
5056
5057 static int
5058 check_string (void)
5059 {
5060   int mem_op = operand_type_check (i.types[0], anymem) ? 0 : 1;
5061   if (i.tm.operand_types[mem_op].bitfield.esseg)
5062     {
5063       if (i.seg[0] != NULL && i.seg[0] != &es)
5064         {
5065           as_bad (_("`%s' operand %d must use `%ses' segment"),
5066                   i.tm.name,
5067                   mem_op + 1,
5068                   register_prefix);
5069           return 0;
5070         }
5071       /* There's only ever one segment override allowed per instruction.
5072          This instruction possibly has a legal segment override on the
5073          second operand, so copy the segment to where non-string
5074          instructions store it, allowing common code.  */
5075       i.seg[0] = i.seg[1];
5076     }
5077   else if (i.tm.operand_types[mem_op + 1].bitfield.esseg)
5078     {
5079       if (i.seg[1] != NULL && i.seg[1] != &es)
5080         {
5081           as_bad (_("`%s' operand %d must use `%ses' segment"),
5082                   i.tm.name,
5083                   mem_op + 2,
5084                   register_prefix);
5085           return 0;
5086         }
5087     }
5088   return 1;
5089 }
5090
5091 static int
5092 process_suffix (void)
5093 {
5094   /* If matched instruction specifies an explicit instruction mnemonic
5095      suffix, use it.  */
5096   if (i.tm.opcode_modifier.size16)
5097     i.suffix = WORD_MNEM_SUFFIX;
5098   else if (i.tm.opcode_modifier.size32)
5099     i.suffix = LONG_MNEM_SUFFIX;
5100   else if (i.tm.opcode_modifier.size64)
5101     i.suffix = QWORD_MNEM_SUFFIX;
5102   else if (i.reg_operands)
5103     {
5104       /* If there's no instruction mnemonic suffix we try to invent one
5105          based on register operands.  */
5106       if (!i.suffix)
5107         {
5108           /* We take i.suffix from the last register operand specified,
5109              Destination register type is more significant than source
5110              register type.  crc32 in SSE4.2 prefers source register
5111              type. */
5112           if (i.tm.base_opcode == 0xf20f38f1)
5113             {
5114               if (i.types[0].bitfield.reg16)
5115                 i.suffix = WORD_MNEM_SUFFIX;
5116               else if (i.types[0].bitfield.reg32)
5117                 i.suffix = LONG_MNEM_SUFFIX;
5118               else if (i.types[0].bitfield.reg64)
5119                 i.suffix = QWORD_MNEM_SUFFIX;
5120             }
5121           else if (i.tm.base_opcode == 0xf20f38f0)
5122             {
5123               if (i.types[0].bitfield.reg8)
5124                 i.suffix = BYTE_MNEM_SUFFIX;
5125             }
5126
5127           if (!i.suffix)
5128             {
5129               int op;
5130
5131               if (i.tm.base_opcode == 0xf20f38f1
5132                   || i.tm.base_opcode == 0xf20f38f0)
5133                 {
5134                   /* We have to know the operand size for crc32.  */
5135                   as_bad (_("ambiguous memory operand size for `%s`"),
5136                           i.tm.name);
5137                   return 0;
5138                 }
5139
5140               for (op = i.operands; --op >= 0;)
5141                 if (!i.tm.operand_types[op].bitfield.inoutportreg)
5142                   {
5143                     if (i.types[op].bitfield.reg8)
5144                       {
5145                         i.suffix = BYTE_MNEM_SUFFIX;
5146                         break;
5147                       }
5148                     else if (i.types[op].bitfield.reg16)
5149                       {
5150                         i.suffix = WORD_MNEM_SUFFIX;
5151                         break;
5152                       }
5153                     else if (i.types[op].bitfield.reg32)
5154                       {
5155                         i.suffix = LONG_MNEM_SUFFIX;
5156                         break;
5157                       }
5158                     else if (i.types[op].bitfield.reg64)
5159                       {
5160                         i.suffix = QWORD_MNEM_SUFFIX;
5161                         break;
5162                       }
5163                   }
5164             }
5165         }
5166       else if (i.suffix == BYTE_MNEM_SUFFIX)
5167         {
5168           if (intel_syntax
5169               && i.tm.opcode_modifier.ignoresize
5170               && i.tm.opcode_modifier.no_bsuf)
5171             i.suffix = 0;
5172           else if (!check_byte_reg ())
5173             return 0;
5174         }
5175       else if (i.suffix == LONG_MNEM_SUFFIX)
5176         {
5177           if (intel_syntax
5178               && i.tm.opcode_modifier.ignoresize
5179               && i.tm.opcode_modifier.no_lsuf)
5180             i.suffix = 0;
5181           else if (!check_long_reg ())
5182             return 0;
5183         }
5184       else if (i.suffix == QWORD_MNEM_SUFFIX)
5185         {
5186           if (intel_syntax
5187               && i.tm.opcode_modifier.ignoresize
5188               && i.tm.opcode_modifier.no_qsuf)
5189             i.suffix = 0;
5190           else if (!check_qword_reg ())
5191             return 0;
5192         }
5193       else if (i.suffix == WORD_MNEM_SUFFIX)
5194         {
5195           if (intel_syntax
5196               && i.tm.opcode_modifier.ignoresize
5197               && i.tm.opcode_modifier.no_wsuf)
5198             i.suffix = 0;
5199           else if (!check_word_reg ())
5200             return 0;
5201         }
5202       else if (i.suffix == XMMWORD_MNEM_SUFFIX
5203                || i.suffix == YMMWORD_MNEM_SUFFIX
5204                || i.suffix == ZMMWORD_MNEM_SUFFIX)
5205         {
5206           /* Skip if the instruction has x/y/z suffix.  match_template
5207              should check if it is a valid suffix.  */
5208         }
5209       else if (intel_syntax && i.tm.opcode_modifier.ignoresize)
5210         /* Do nothing if the instruction is going to ignore the prefix.  */
5211         ;
5212       else
5213         abort ();
5214     }
5215   else if (i.tm.opcode_modifier.defaultsize
5216            && !i.suffix
5217            /* exclude fldenv/frstor/fsave/fstenv */
5218            && i.tm.opcode_modifier.no_ssuf)
5219     {
5220       i.suffix = stackop_size;
5221     }
5222   else if (intel_syntax
5223            && !i.suffix
5224            && (i.tm.operand_types[0].bitfield.jumpabsolute
5225                || i.tm.opcode_modifier.jumpbyte
5226                || i.tm.opcode_modifier.jumpintersegment
5227                || (i.tm.base_opcode == 0x0f01 /* [ls][gi]dt */
5228                    && i.tm.extension_opcode <= 3)))
5229     {
5230       switch (flag_code)
5231         {
5232         case CODE_64BIT:
5233           if (!i.tm.opcode_modifier.no_qsuf)
5234             {
5235               i.suffix = QWORD_MNEM_SUFFIX;
5236               break;
5237             }
5238         case CODE_32BIT:
5239           if (!i.tm.opcode_modifier.no_lsuf)
5240             i.suffix = LONG_MNEM_SUFFIX;
5241           break;
5242         case CODE_16BIT:
5243           if (!i.tm.opcode_modifier.no_wsuf)
5244             i.suffix = WORD_MNEM_SUFFIX;
5245           break;
5246         }
5247     }
5248
5249   if (!i.suffix)
5250     {
5251       if (!intel_syntax)
5252         {
5253           if (i.tm.opcode_modifier.w)
5254             {
5255               as_bad (_("no instruction mnemonic suffix given and "
5256                         "no register operands; can't size instruction"));
5257               return 0;
5258             }
5259         }
5260       else
5261         {
5262           unsigned int suffixes;
5263
5264           suffixes = !i.tm.opcode_modifier.no_bsuf;
5265           if (!i.tm.opcode_modifier.no_wsuf)
5266             suffixes |= 1 << 1;
5267           if (!i.tm.opcode_modifier.no_lsuf)
5268             suffixes |= 1 << 2;
5269           if (!i.tm.opcode_modifier.no_ldsuf)
5270             suffixes |= 1 << 3;
5271           if (!i.tm.opcode_modifier.no_ssuf)
5272             suffixes |= 1 << 4;
5273           if (!i.tm.opcode_modifier.no_qsuf)
5274             suffixes |= 1 << 5;
5275
5276           /* There are more than suffix matches.  */
5277           if (i.tm.opcode_modifier.w
5278               || ((suffixes & (suffixes - 1))
5279                   && !i.tm.opcode_modifier.defaultsize
5280                   && !i.tm.opcode_modifier.ignoresize))
5281             {
5282               as_bad (_("ambiguous operand size for `%s'"), i.tm.name);
5283               return 0;
5284             }
5285         }
5286     }
5287
5288   /* Change the opcode based on the operand size given by i.suffix;
5289      We don't need to change things for byte insns.  */
5290
5291   if (i.suffix
5292       && i.suffix != BYTE_MNEM_SUFFIX
5293       && i.suffix != XMMWORD_MNEM_SUFFIX
5294       && i.suffix != YMMWORD_MNEM_SUFFIX
5295       && i.suffix != ZMMWORD_MNEM_SUFFIX)
5296     {
5297       /* It's not a byte, select word/dword operation.  */
5298       if (i.tm.opcode_modifier.w)
5299         {
5300           if (i.tm.opcode_modifier.shortform)
5301             i.tm.base_opcode |= 8;
5302           else
5303             i.tm.base_opcode |= 1;
5304         }
5305
5306       /* Now select between word & dword operations via the operand
5307          size prefix, except for instructions that will ignore this
5308          prefix anyway.  */
5309       if (i.tm.opcode_modifier.addrprefixop0)
5310         {
5311           /* The address size override prefix changes the size of the
5312              first operand.  */
5313           if ((flag_code == CODE_32BIT
5314                && i.op->regs[0].reg_type.bitfield.reg16)
5315               || (flag_code != CODE_32BIT
5316                   && i.op->regs[0].reg_type.bitfield.reg32))
5317             if (!add_prefix (ADDR_PREFIX_OPCODE))
5318               return 0;
5319         }
5320       else if (i.suffix != QWORD_MNEM_SUFFIX
5321                && i.suffix != LONG_DOUBLE_MNEM_SUFFIX
5322                && !i.tm.opcode_modifier.ignoresize
5323                && !i.tm.opcode_modifier.floatmf
5324                && ((i.suffix == LONG_MNEM_SUFFIX) == (flag_code == CODE_16BIT)
5325                    || (flag_code == CODE_64BIT
5326                        && i.tm.opcode_modifier.jumpbyte)))
5327         {
5328           unsigned int prefix = DATA_PREFIX_OPCODE;
5329
5330           if (i.tm.opcode_modifier.jumpbyte) /* jcxz, loop */
5331             prefix = ADDR_PREFIX_OPCODE;
5332
5333           if (!add_prefix (prefix))
5334             return 0;
5335         }
5336
5337       /* Set mode64 for an operand.  */
5338       if (i.suffix == QWORD_MNEM_SUFFIX
5339           && flag_code == CODE_64BIT
5340           && !i.tm.opcode_modifier.norex64)
5341         {
5342           /* Special case for xchg %rax,%rax.  It is NOP and doesn't
5343              need rex64.  cmpxchg8b is also a special case. */
5344           if (! (i.operands == 2
5345                  && i.tm.base_opcode == 0x90
5346                  && i.tm.extension_opcode == None
5347                  && operand_type_equal (&i.types [0], &acc64)
5348                  && operand_type_equal (&i.types [1], &acc64))
5349               && ! (i.operands == 1
5350                     && i.tm.base_opcode == 0xfc7
5351                     && i.tm.extension_opcode == 1
5352                     && !operand_type_check (i.types [0], reg)
5353                     && operand_type_check (i.types [0], anymem)))
5354             i.rex |= REX_W;
5355         }
5356
5357       /* Size floating point instruction.  */
5358       if (i.suffix == LONG_MNEM_SUFFIX)
5359         if (i.tm.opcode_modifier.floatmf)
5360           i.tm.base_opcode ^= 4;
5361     }
5362
5363   return 1;
5364 }
5365
5366 static int
5367 check_byte_reg (void)
5368 {
5369   int op;
5370
5371   for (op = i.operands; --op >= 0;)
5372     {
5373       /* If this is an eight bit register, it's OK.  If it's the 16 or
5374          32 bit version of an eight bit register, we will just use the
5375          low portion, and that's OK too.  */
5376       if (i.types[op].bitfield.reg8)
5377         continue;
5378
5379       /* I/O port address operands are OK too.  */
5380       if (i.tm.operand_types[op].bitfield.inoutportreg)
5381         continue;
5382
5383       /* crc32 doesn't generate this warning.  */
5384       if (i.tm.base_opcode == 0xf20f38f0)
5385         continue;
5386
5387       if ((i.types[op].bitfield.reg16
5388            || i.types[op].bitfield.reg32
5389            || i.types[op].bitfield.reg64)
5390           && i.op[op].regs->reg_num < 4
5391           /* Prohibit these changes in 64bit mode, since the lowering
5392              would be more complicated.  */
5393           && flag_code != CODE_64BIT)
5394         {
5395 #if REGISTER_WARNINGS
5396           if (!quiet_warnings)
5397             as_warn (_("using `%s%s' instead of `%s%s' due to `%c' suffix"),
5398                      register_prefix,
5399                      (i.op[op].regs + (i.types[op].bitfield.reg16
5400                                        ? REGNAM_AL - REGNAM_AX
5401                                        : REGNAM_AL - REGNAM_EAX))->reg_name,
5402                      register_prefix,
5403                      i.op[op].regs->reg_name,
5404                      i.suffix);
5405 #endif
5406           continue;
5407         }
5408       /* Any other register is bad.  */
5409       if (i.types[op].bitfield.reg16
5410           || i.types[op].bitfield.reg32
5411           || i.types[op].bitfield.reg64
5412           || i.types[op].bitfield.regmmx
5413           || i.types[op].bitfield.regxmm
5414           || i.types[op].bitfield.regymm
5415           || i.types[op].bitfield.regzmm
5416           || i.types[op].bitfield.sreg2
5417           || i.types[op].bitfield.sreg3
5418           || i.types[op].bitfield.control
5419           || i.types[op].bitfield.debug
5420           || i.types[op].bitfield.test
5421           || i.types[op].bitfield.floatreg
5422           || i.types[op].bitfield.floatacc)
5423         {
5424           as_bad (_("`%s%s' not allowed with `%s%c'"),
5425                   register_prefix,
5426                   i.op[op].regs->reg_name,
5427                   i.tm.name,
5428                   i.suffix);
5429           return 0;
5430         }
5431     }
5432   return 1;
5433 }
5434
5435 static int
5436 check_long_reg (void)
5437 {
5438   int op;
5439
5440   for (op = i.operands; --op >= 0;)
5441     /* Reject eight bit registers, except where the template requires
5442        them. (eg. movzb)  */
5443     if (i.types[op].bitfield.reg8
5444         && (i.tm.operand_types[op].bitfield.reg16
5445             || i.tm.operand_types[op].bitfield.reg32
5446             || i.tm.operand_types[op].bitfield.acc))
5447       {
5448         as_bad (_("`%s%s' not allowed with `%s%c'"),
5449                 register_prefix,
5450                 i.op[op].regs->reg_name,
5451                 i.tm.name,
5452                 i.suffix);
5453         return 0;
5454       }
5455     /* Warn if the e prefix on a general reg is missing.  */
5456     else if ((!quiet_warnings || flag_code == CODE_64BIT)
5457              && i.types[op].bitfield.reg16
5458              && (i.tm.operand_types[op].bitfield.reg32
5459                  || i.tm.operand_types[op].bitfield.acc))
5460       {
5461         /* Prohibit these changes in the 64bit mode, since the
5462            lowering is more complicated.  */
5463         if (flag_code == CODE_64BIT)
5464           {
5465             as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
5466                     register_prefix, i.op[op].regs->reg_name,
5467                     i.suffix);
5468             return 0;
5469           }
5470 #if REGISTER_WARNINGS
5471         as_warn (_("using `%s%s' instead of `%s%s' due to `%c' suffix"),
5472                  register_prefix,
5473                  (i.op[op].regs + REGNAM_EAX - REGNAM_AX)->reg_name,
5474                  register_prefix, i.op[op].regs->reg_name, i.suffix);
5475 #endif
5476       }
5477     /* Warn if the r prefix on a general reg is present.  */
5478     else if (i.types[op].bitfield.reg64
5479              && (i.tm.operand_types[op].bitfield.reg32
5480                  || i.tm.operand_types[op].bitfield.acc))
5481       {
5482         if (intel_syntax
5483             && i.tm.opcode_modifier.toqword
5484             && !i.types[0].bitfield.regxmm)
5485           {
5486             /* Convert to QWORD.  We want REX byte. */
5487             i.suffix = QWORD_MNEM_SUFFIX;
5488           }
5489         else
5490           {
5491             as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
5492                     register_prefix, i.op[op].regs->reg_name,
5493                     i.suffix);
5494             return 0;
5495           }
5496       }
5497   return 1;
5498 }
5499
5500 static int
5501 check_qword_reg (void)
5502 {
5503   int op;
5504
5505   for (op = i.operands; --op >= 0; )
5506     /* Reject eight bit registers, except where the template requires
5507        them. (eg. movzb)  */
5508     if (i.types[op].bitfield.reg8
5509         && (i.tm.operand_types[op].bitfield.reg16
5510             || i.tm.operand_types[op].bitfield.reg32
5511             || i.tm.operand_types[op].bitfield.acc))
5512       {
5513         as_bad (_("`%s%s' not allowed with `%s%c'"),
5514                 register_prefix,
5515                 i.op[op].regs->reg_name,
5516                 i.tm.name,
5517                 i.suffix);
5518         return 0;
5519       }
5520     /* Warn if the r prefix on a general reg is missing.  */
5521     else if ((i.types[op].bitfield.reg16
5522               || i.types[op].bitfield.reg32)
5523              && (i.tm.operand_types[op].bitfield.reg32
5524                  || i.tm.operand_types[op].bitfield.acc))
5525       {
5526         /* Prohibit these changes in the 64bit mode, since the
5527            lowering is more complicated.  */
5528         if (intel_syntax
5529             && i.tm.opcode_modifier.todword
5530             && !i.types[0].bitfield.regxmm)
5531           {
5532             /* Convert to DWORD.  We don't want REX byte. */
5533             i.suffix = LONG_MNEM_SUFFIX;
5534           }
5535         else
5536           {
5537             as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
5538                     register_prefix, i.op[op].regs->reg_name,
5539                     i.suffix);
5540             return 0;
5541           }
5542       }
5543   return 1;
5544 }
5545
5546 static int
5547 check_word_reg (void)
5548 {
5549   int op;
5550   for (op = i.operands; --op >= 0;)
5551     /* Reject eight bit registers, except where the template requires
5552        them. (eg. movzb)  */
5553     if (i.types[op].bitfield.reg8
5554         && (i.tm.operand_types[op].bitfield.reg16
5555             || i.tm.operand_types[op].bitfield.reg32
5556             || i.tm.operand_types[op].bitfield.acc))
5557       {
5558         as_bad (_("`%s%s' not allowed with `%s%c'"),
5559                 register_prefix,
5560                 i.op[op].regs->reg_name,
5561                 i.tm.name,
5562                 i.suffix);
5563         return 0;
5564       }
5565     /* Warn if the e or r prefix on a general reg is present.  */
5566     else if ((!quiet_warnings || flag_code == CODE_64BIT)
5567              && (i.types[op].bitfield.reg32
5568                  || i.types[op].bitfield.reg64)
5569              && (i.tm.operand_types[op].bitfield.reg16
5570                  || i.tm.operand_types[op].bitfield.acc))
5571       {
5572         /* Prohibit these changes in the 64bit mode, since the
5573            lowering is more complicated.  */
5574         if (flag_code == CODE_64BIT)
5575           {
5576             as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
5577                     register_prefix, i.op[op].regs->reg_name,
5578                     i.suffix);
5579             return 0;
5580           }
5581 #if REGISTER_WARNINGS
5582         as_warn (_("using `%s%s' instead of `%s%s' due to `%c' suffix"),
5583                  register_prefix,
5584                  (i.op[op].regs + REGNAM_AX - REGNAM_EAX)->reg_name,
5585                  register_prefix, i.op[op].regs->reg_name, i.suffix);
5586 #endif
5587       }
5588   return 1;
5589 }
5590
5591 static int
5592 update_imm (unsigned int j)
5593 {
5594   i386_operand_type overlap = i.types[j];
5595   if ((overlap.bitfield.imm8
5596        || overlap.bitfield.imm8s
5597        || overlap.bitfield.imm16
5598        || overlap.bitfield.imm32
5599        || overlap.bitfield.imm32s
5600        || overlap.bitfield.imm64)
5601       && !operand_type_equal (&overlap, &imm8)
5602       && !operand_type_equal (&overlap, &imm8s)
5603       && !operand_type_equal (&overlap, &imm16)
5604       && !operand_type_equal (&overlap, &imm32)
5605       && !operand_type_equal (&overlap, &imm32s)
5606       && !operand_type_equal (&overlap, &imm64))
5607     {
5608       if (i.suffix)
5609         {
5610           i386_operand_type temp;
5611
5612           operand_type_set (&temp, 0);
5613           if (i.suffix == BYTE_MNEM_SUFFIX)
5614             {
5615               temp.bitfield.imm8 = overlap.bitfield.imm8;
5616               temp.bitfield.imm8s = overlap.bitfield.imm8s;
5617             }
5618           else if (i.suffix == WORD_MNEM_SUFFIX)
5619             temp.bitfield.imm16 = overlap.bitfield.imm16;
5620           else if (i.suffix == QWORD_MNEM_SUFFIX)
5621             {
5622               temp.bitfield.imm64 = overlap.bitfield.imm64;
5623               temp.bitfield.imm32s = overlap.bitfield.imm32s;
5624             }
5625           else
5626             temp.bitfield.imm32 = overlap.bitfield.imm32;
5627           overlap = temp;
5628         }
5629       else if (operand_type_equal (&overlap, &imm16_32_32s)
5630                || operand_type_equal (&overlap, &imm16_32)
5631                || operand_type_equal (&overlap, &imm16_32s))
5632         {
5633           if ((flag_code == CODE_16BIT) ^ (i.prefix[DATA_PREFIX] != 0))
5634             overlap = imm16;
5635           else
5636             overlap = imm32s;
5637         }
5638       if (!operand_type_equal (&overlap, &imm8)
5639           && !operand_type_equal (&overlap, &imm8s)
5640           && !operand_type_equal (&overlap, &imm16)
5641           && !operand_type_equal (&overlap, &imm32)
5642           && !operand_type_equal (&overlap, &imm32s)
5643           && !operand_type_equal (&overlap, &imm64))
5644         {
5645           as_bad (_("no instruction mnemonic suffix given; "
5646                     "can't determine immediate size"));
5647           return 0;
5648         }
5649     }
5650   i.types[j] = overlap;
5651
5652   return 1;
5653 }
5654
5655 static int
5656 finalize_imm (void)
5657 {
5658   unsigned int j, n;
5659
5660   /* Update the first 2 immediate operands.  */
5661   n = i.operands > 2 ? 2 : i.operands;
5662   if (n)
5663     {
5664       for (j = 0; j < n; j++)
5665         if (update_imm (j) == 0)
5666           return 0;
5667
5668       /* The 3rd operand can't be immediate operand.  */
5669       gas_assert (operand_type_check (i.types[2], imm) == 0);
5670     }
5671
5672   return 1;
5673 }
5674
5675 static int
5676 bad_implicit_operand (int xmm)
5677 {
5678   const char *ireg = xmm ? "xmm0" : "ymm0";
5679
5680   if (intel_syntax)
5681     as_bad (_("the last operand of `%s' must be `%s%s'"),
5682             i.tm.name, register_prefix, ireg);
5683   else
5684     as_bad (_("the first operand of `%s' must be `%s%s'"),
5685             i.tm.name, register_prefix, ireg);
5686   return 0;
5687 }
5688
5689 static int
5690 process_operands (void)
5691 {
5692   /* Default segment register this instruction will use for memory
5693      accesses.  0 means unknown.  This is only for optimizing out
5694      unnecessary segment overrides.  */
5695   const seg_entry *default_seg = 0;
5696
5697   if (i.tm.opcode_modifier.sse2avx && i.tm.opcode_modifier.vexvvvv)
5698     {
5699       unsigned int dupl = i.operands;
5700       unsigned int dest = dupl - 1;
5701       unsigned int j;
5702
5703       /* The destination must be an xmm register.  */
5704       gas_assert (i.reg_operands
5705                   && MAX_OPERANDS > dupl
5706                   && operand_type_equal (&i.types[dest], &regxmm));
5707
5708       if (i.tm.opcode_modifier.firstxmm0)
5709         {
5710           /* The first operand is implicit and must be xmm0.  */
5711           gas_assert (operand_type_equal (&i.types[0], &regxmm));
5712           if (register_number (i.op[0].regs) != 0)
5713             return bad_implicit_operand (1);
5714
5715           if (i.tm.opcode_modifier.vexsources == VEX3SOURCES)
5716             {
5717               /* Keep xmm0 for instructions with VEX prefix and 3
5718                  sources.  */
5719               goto duplicate;
5720             }
5721           else
5722             {
5723               /* We remove the first xmm0 and keep the number of
5724                  operands unchanged, which in fact duplicates the
5725                  destination.  */
5726               for (j = 1; j < i.operands; j++)
5727                 {
5728                   i.op[j - 1] = i.op[j];
5729                   i.types[j - 1] = i.types[j];
5730                   i.tm.operand_types[j - 1] = i.tm.operand_types[j];
5731                 }
5732             }
5733         }
5734       else if (i.tm.opcode_modifier.implicit1stxmm0)
5735         {
5736           gas_assert ((MAX_OPERANDS - 1) > dupl
5737                       && (i.tm.opcode_modifier.vexsources
5738                           == VEX3SOURCES));
5739
5740           /* Add the implicit xmm0 for instructions with VEX prefix
5741              and 3 sources.  */
5742           for (j = i.operands; j > 0; j--)
5743             {
5744               i.op[j] = i.op[j - 1];
5745               i.types[j] = i.types[j - 1];
5746               i.tm.operand_types[j] = i.tm.operand_types[j - 1];
5747             }
5748           i.op[0].regs
5749             = (const reg_entry *) hash_find (reg_hash, "xmm0");
5750           i.types[0] = regxmm;
5751           i.tm.operand_types[0] = regxmm;
5752
5753           i.operands += 2;
5754           i.reg_operands += 2;
5755           i.tm.operands += 2;
5756
5757           dupl++;
5758           dest++;
5759           i.op[dupl] = i.op[dest];
5760           i.types[dupl] = i.types[dest];
5761           i.tm.operand_types[dupl] = i.tm.operand_types[dest];
5762         }
5763       else
5764         {
5765 duplicate:
5766           i.operands++;
5767           i.reg_operands++;
5768           i.tm.operands++;
5769
5770           i.op[dupl] = i.op[dest];
5771           i.types[dupl] = i.types[dest];
5772           i.tm.operand_types[dupl] = i.tm.operand_types[dest];
5773         }
5774
5775        if (i.tm.opcode_modifier.immext)
5776          process_immext ();
5777     }
5778   else if (i.tm.opcode_modifier.firstxmm0)
5779     {
5780       unsigned int j;
5781
5782       /* The first operand is implicit and must be xmm0/ymm0/zmm0.  */
5783       gas_assert (i.reg_operands
5784                   && (operand_type_equal (&i.types[0], &regxmm)
5785                       || operand_type_equal (&i.types[0], &regymm)
5786                       || operand_type_equal (&i.types[0], &regzmm)));
5787       if (register_number (i.op[0].regs) != 0)
5788         return bad_implicit_operand (i.types[0].bitfield.regxmm);
5789
5790       for (j = 1; j < i.operands; j++)
5791         {
5792           i.op[j - 1] = i.op[j];
5793           i.types[j - 1] = i.types[j];
5794
5795           /* We need to adjust fields in i.tm since they are used by
5796              build_modrm_byte.  */
5797           i.tm.operand_types [j - 1] = i.tm.operand_types [j];
5798         }
5799
5800       i.operands--;
5801       i.reg_operands--;
5802       i.tm.operands--;
5803     }
5804   else if (i.tm.opcode_modifier.regkludge)
5805     {
5806       /* The imul $imm, %reg instruction is converted into
5807          imul $imm, %reg, %reg, and the clr %reg instruction
5808          is converted into xor %reg, %reg.  */
5809
5810       unsigned int first_reg_op;
5811
5812       if (operand_type_check (i.types[0], reg))
5813         first_reg_op = 0;
5814       else
5815         first_reg_op = 1;
5816       /* Pretend we saw the extra register operand.  */
5817       gas_assert (i.reg_operands == 1
5818                   && i.op[first_reg_op + 1].regs == 0);
5819       i.op[first_reg_op + 1].regs = i.op[first_reg_op].regs;
5820       i.types[first_reg_op + 1] = i.types[first_reg_op];
5821       i.operands++;
5822       i.reg_operands++;
5823     }
5824
5825   if (i.tm.opcode_modifier.shortform)
5826     {
5827       if (i.types[0].bitfield.sreg2
5828           || i.types[0].bitfield.sreg3)
5829         {
5830           if (i.tm.base_opcode == POP_SEG_SHORT
5831               && i.op[0].regs->reg_num == 1)
5832             {
5833               as_bad (_("you can't `pop %scs'"), register_prefix);
5834               return 0;
5835             }
5836           i.tm.base_opcode |= (i.op[0].regs->reg_num << 3);
5837           if ((i.op[0].regs->reg_flags & RegRex) != 0)
5838             i.rex |= REX_B;
5839         }
5840       else
5841         {
5842           /* The register or float register operand is in operand
5843              0 or 1.  */
5844           unsigned int op;
5845
5846           if (i.types[0].bitfield.floatreg
5847               || operand_type_check (i.types[0], reg))
5848             op = 0;
5849           else
5850             op = 1;
5851           /* Register goes in low 3 bits of opcode.  */
5852           i.tm.base_opcode |= i.op[op].regs->reg_num;
5853           if ((i.op[op].regs->reg_flags & RegRex) != 0)
5854             i.rex |= REX_B;
5855           if (!quiet_warnings && i.tm.opcode_modifier.ugh)
5856             {
5857               /* Warn about some common errors, but press on regardless.
5858                  The first case can be generated by gcc (<= 2.8.1).  */
5859               if (i.operands == 2)
5860                 {
5861                   /* Reversed arguments on faddp, fsubp, etc.  */
5862                   as_warn (_("translating to `%s %s%s,%s%s'"), i.tm.name,
5863                            register_prefix, i.op[!intel_syntax].regs->reg_name,
5864                            register_prefix, i.op[intel_syntax].regs->reg_name);
5865                 }
5866               else
5867                 {
5868                   /* Extraneous `l' suffix on fp insn.  */
5869                   as_warn (_("translating to `%s %s%s'"), i.tm.name,
5870                            register_prefix, i.op[0].regs->reg_name);
5871                 }
5872             }
5873         }
5874     }
5875   else if (i.tm.opcode_modifier.modrm)
5876     {
5877       /* The opcode is completed (modulo i.tm.extension_opcode which
5878          must be put into the modrm byte).  Now, we make the modrm and
5879          index base bytes based on all the info we've collected.  */
5880
5881       default_seg = build_modrm_byte ();
5882     }
5883   else if ((i.tm.base_opcode & ~0x3) == MOV_AX_DISP32)
5884     {
5885       default_seg = &ds;
5886     }
5887   else if (i.tm.opcode_modifier.isstring)
5888     {
5889       /* For the string instructions that allow a segment override
5890          on one of their operands, the default segment is ds.  */
5891       default_seg = &ds;
5892     }
5893
5894   if (i.tm.base_opcode == 0x8d /* lea */
5895       && i.seg[0]
5896       && !quiet_warnings)
5897     as_warn (_("segment override on `%s' is ineffectual"), i.tm.name);
5898
5899   /* If a segment was explicitly specified, and the specified segment
5900      is not the default, use an opcode prefix to select it.  If we
5901      never figured out what the default segment is, then default_seg
5902      will be zero at this point, and the specified segment prefix will
5903      always be used.  */
5904   if ((i.seg[0]) && (i.seg[0] != default_seg))
5905     {
5906       if (!add_prefix (i.seg[0]->seg_prefix))
5907         return 0;
5908     }
5909   return 1;
5910 }
5911
5912 static const seg_entry *
5913 build_modrm_byte (void)
5914 {
5915   const seg_entry *default_seg = 0;
5916   unsigned int source, dest;
5917   int vex_3_sources;
5918
5919   /* The first operand of instructions with VEX prefix and 3 sources
5920      must be VEX_Imm4.  */
5921   vex_3_sources = i.tm.opcode_modifier.vexsources == VEX3SOURCES;
5922   if (vex_3_sources)
5923     {
5924       unsigned int nds, reg_slot;
5925       expressionS *exp;
5926
5927       if (i.tm.opcode_modifier.veximmext
5928           && i.tm.opcode_modifier.immext)
5929         {
5930           dest = i.operands - 2;
5931           gas_assert (dest == 3);
5932         }
5933       else
5934         dest = i.operands - 1;
5935       nds = dest - 1;
5936
5937       /* There are 2 kinds of instructions:
5938          1. 5 operands: 4 register operands or 3 register operands
5939          plus 1 memory operand plus one Vec_Imm4 operand, VexXDS, and
5940          VexW0 or VexW1.  The destination must be either XMM, YMM or
5941          ZMM register.
5942          2. 4 operands: 4 register operands or 3 register operands
5943          plus 1 memory operand, VexXDS, and VexImmExt  */
5944       gas_assert ((i.reg_operands == 4
5945                    || (i.reg_operands == 3 && i.mem_operands == 1))
5946                   && i.tm.opcode_modifier.vexvvvv == VEXXDS
5947                   && (i.tm.opcode_modifier.veximmext
5948                       || (i.imm_operands == 1
5949                           && i.types[0].bitfield.vec_imm4
5950                           && (i.tm.opcode_modifier.vexw == VEXW0
5951                               || i.tm.opcode_modifier.vexw == VEXW1)
5952                           && (operand_type_equal (&i.tm.operand_types[dest], &regxmm)
5953                               || operand_type_equal (&i.tm.operand_types[dest], &regymm)
5954                               || operand_type_equal (&i.tm.operand_types[dest], &regzmm)))));
5955
5956       if (i.imm_operands == 0)
5957         {
5958           /* When there is no immediate operand, generate an 8bit
5959              immediate operand to encode the first operand.  */
5960           exp = &im_expressions[i.imm_operands++];
5961           i.op[i.operands].imms = exp;
5962           i.types[i.operands] = imm8;
5963           i.operands++;
5964           /* If VexW1 is set, the first operand is the source and
5965              the second operand is encoded in the immediate operand.  */
5966           if (i.tm.opcode_modifier.vexw == VEXW1)
5967             {
5968               source = 0;
5969               reg_slot = 1;
5970             }
5971           else
5972             {
5973               source = 1;
5974               reg_slot = 0;
5975             }
5976
5977           /* FMA swaps REG and NDS.  */
5978           if (i.tm.cpu_flags.bitfield.cpufma)
5979             {
5980               unsigned int tmp;
5981               tmp = reg_slot;
5982               reg_slot = nds;
5983               nds = tmp;
5984             }
5985
5986           gas_assert (operand_type_equal (&i.tm.operand_types[reg_slot],
5987                                           &regxmm)
5988                       || operand_type_equal (&i.tm.operand_types[reg_slot],
5989                                              &regymm)
5990                       || operand_type_equal (&i.tm.operand_types[reg_slot],
5991                                              &regzmm));
5992           exp->X_op = O_constant;
5993           exp->X_add_number = register_number (i.op[reg_slot].regs) << 4;
5994           gas_assert ((i.op[reg_slot].regs->reg_flags & RegVRex) == 0);
5995         }
5996       else
5997         {
5998           unsigned int imm_slot;
5999
6000           if (i.tm.opcode_modifier.vexw == VEXW0)
6001             {
6002               /* If VexW0 is set, the third operand is the source and
6003                  the second operand is encoded in the immediate
6004                  operand.  */
6005               source = 2;
6006               reg_slot = 1;
6007             }
6008           else
6009             {
6010               /* VexW1 is set, the second operand is the source and
6011                  the third operand is encoded in the immediate
6012                  operand.  */
6013               source = 1;
6014               reg_slot = 2;
6015             }
6016
6017           if (i.tm.opcode_modifier.immext)
6018             {
6019               /* When ImmExt is set, the immdiate byte is the last
6020                  operand.  */
6021               imm_slot = i.operands - 1;
6022               source--;
6023               reg_slot--;
6024             }
6025           else
6026             {
6027               imm_slot = 0;
6028
6029               /* Turn on Imm8 so that output_imm will generate it.  */
6030               i.types[imm_slot].bitfield.imm8 = 1;
6031             }
6032
6033           gas_assert (operand_type_equal (&i.tm.operand_types[reg_slot],
6034                                           &regxmm)
6035                       || operand_type_equal (&i.tm.operand_types[reg_slot],
6036                                              &regymm)
6037                       || operand_type_equal (&i.tm.operand_types[reg_slot],
6038                                              &regzmm));
6039           i.op[imm_slot].imms->X_add_number
6040               |= register_number (i.op[reg_slot].regs) << 4;
6041           gas_assert ((i.op[reg_slot].regs->reg_flags & RegVRex) == 0);
6042         }
6043
6044       gas_assert (operand_type_equal (&i.tm.operand_types[nds], &regxmm)
6045                   || operand_type_equal (&i.tm.operand_types[nds],
6046                                          &regymm)
6047                   || operand_type_equal (&i.tm.operand_types[nds],
6048                                          &regzmm));
6049       i.vex.register_specifier = i.op[nds].regs;
6050     }
6051   else
6052     source = dest = 0;
6053
6054   /* i.reg_operands MUST be the number of real register operands;
6055      implicit registers do not count.  If there are 3 register
6056      operands, it must be a instruction with VexNDS.  For a
6057      instruction with VexNDD, the destination register is encoded
6058      in VEX prefix.  If there are 4 register operands, it must be
6059      a instruction with VEX prefix and 3 sources.  */
6060   if (i.mem_operands == 0
6061       && ((i.reg_operands == 2
6062            && i.tm.opcode_modifier.vexvvvv <= VEXXDS)
6063           || (i.reg_operands == 3
6064               && i.tm.opcode_modifier.vexvvvv == VEXXDS)
6065           || (i.reg_operands == 4 && vex_3_sources)))
6066     {
6067       switch (i.operands)
6068         {
6069         case 2:
6070           source = 0;
6071           break;
6072         case 3:
6073           /* When there are 3 operands, one of them may be immediate,
6074              which may be the first or the last operand.  Otherwise,
6075              the first operand must be shift count register (cl) or it
6076              is an instruction with VexNDS. */
6077           gas_assert (i.imm_operands == 1
6078                       || (i.imm_operands == 0
6079                           && (i.tm.opcode_modifier.vexvvvv == VEXXDS
6080                               || i.types[0].bitfield.shiftcount)));
6081           if (operand_type_check (i.types[0], imm)
6082               || i.types[0].bitfield.shiftcount)
6083             source = 1;
6084           else
6085             source = 0;
6086           break;
6087         case 4:
6088           /* When there are 4 operands, the first two must be 8bit
6089              immediate operands. The source operand will be the 3rd
6090              one.
6091
6092              For instructions with VexNDS, if the first operand
6093              an imm8, the source operand is the 2nd one.  If the last
6094              operand is imm8, the source operand is the first one.  */
6095           gas_assert ((i.imm_operands == 2
6096                        && i.types[0].bitfield.imm8
6097                        && i.types[1].bitfield.imm8)
6098                       || (i.tm.opcode_modifier.vexvvvv == VEXXDS
6099                           && i.imm_operands == 1
6100                           && (i.types[0].bitfield.imm8
6101                               || i.types[i.operands - 1].bitfield.imm8
6102                               || i.rounding)));
6103           if (i.imm_operands == 2)
6104             source = 2;
6105           else
6106             {
6107               if (i.types[0].bitfield.imm8)
6108                 source = 1;
6109               else
6110                 source = 0;
6111             }
6112           break;
6113         case 5:
6114           if (i.tm.opcode_modifier.evex)
6115             {
6116               /* For EVEX instructions, when there are 5 operands, the
6117                  first one must be immediate operand.  If the second one
6118                  is immediate operand, the source operand is the 3th
6119                  one.  If the last one is immediate operand, the source
6120                  operand is the 2nd one.  */
6121               gas_assert (i.imm_operands == 2
6122                           && i.tm.opcode_modifier.sae
6123                           && operand_type_check (i.types[0], imm));
6124               if (operand_type_check (i.types[1], imm))
6125                 source = 2;
6126               else if (operand_type_check (i.types[4], imm))
6127                 source = 1;
6128               else
6129                 abort ();
6130             }
6131           break;
6132         default:
6133           abort ();
6134         }
6135
6136       if (!vex_3_sources)
6137         {
6138           dest = source + 1;
6139
6140           /* RC/SAE operand could be between DEST and SRC.  That happens
6141              when one operand is GPR and the other one is XMM/YMM/ZMM
6142              register.  */
6143           if (i.rounding && i.rounding->operand == (int) dest)
6144             dest++;
6145
6146           if (i.tm.opcode_modifier.vexvvvv == VEXXDS)
6147             {
6148               /* For instructions with VexNDS, the register-only source
6149                  operand must be 32/64bit integer, XMM, YMM or ZMM
6150                  register.  It is encoded in VEX prefix.  We need to
6151                  clear RegMem bit before calling operand_type_equal.  */
6152
6153               i386_operand_type op;
6154               unsigned int vvvv;
6155
6156               /* Check register-only source operand when two source
6157                  operands are swapped.  */
6158               if (!i.tm.operand_types[source].bitfield.baseindex
6159                   && i.tm.operand_types[dest].bitfield.baseindex)
6160                 {
6161                   vvvv = source;
6162                   source = dest;
6163                 }
6164               else
6165                 vvvv = dest;
6166
6167               op = i.tm.operand_types[vvvv];
6168               op.bitfield.regmem = 0;
6169               if ((dest + 1) >= i.operands
6170                   || (op.bitfield.reg32 != 1
6171                       && !op.bitfield.reg64 != 1
6172                       && !operand_type_equal (&op, &regxmm)
6173                       && !operand_type_equal (&op, &regymm)
6174                       && !operand_type_equal (&op, &regzmm)
6175                       && !operand_type_equal (&op, &regmask)))
6176                 abort ();
6177               i.vex.register_specifier = i.op[vvvv].regs;
6178               dest++;
6179             }
6180         }
6181
6182       i.rm.mode = 3;
6183       /* One of the register operands will be encoded in the i.tm.reg
6184          field, the other in the combined i.tm.mode and i.tm.regmem
6185          fields.  If no form of this instruction supports a memory
6186          destination operand, then we assume the source operand may
6187          sometimes be a memory operand and so we need to store the
6188          destination in the i.rm.reg field.  */
6189       if (!i.tm.operand_types[dest].bitfield.regmem
6190           && operand_type_check (i.tm.operand_types[dest], anymem) == 0)
6191         {
6192           i.rm.reg = i.op[dest].regs->reg_num;
6193           i.rm.regmem = i.op[source].regs->reg_num;
6194           if ((i.op[dest].regs->reg_flags & RegRex) != 0)
6195             i.rex |= REX_R;
6196           if ((i.op[dest].regs->reg_flags & RegVRex) != 0)
6197             i.vrex |= REX_R;
6198           if ((i.op[source].regs->reg_flags & RegRex) != 0)
6199             i.rex |= REX_B;
6200           if ((i.op[source].regs->reg_flags & RegVRex) != 0)
6201             i.vrex |= REX_B;
6202         }
6203       else
6204         {
6205           i.rm.reg = i.op[source].regs->reg_num;
6206           i.rm.regmem = i.op[dest].regs->reg_num;
6207           if ((i.op[dest].regs->reg_flags & RegRex) != 0)
6208             i.rex |= REX_B;
6209           if ((i.op[dest].regs->reg_flags & RegVRex) != 0)
6210             i.vrex |= REX_B;
6211           if ((i.op[source].regs->reg_flags & RegRex) != 0)
6212             i.rex |= REX_R;
6213           if ((i.op[source].regs->reg_flags & RegVRex) != 0)
6214             i.vrex |= REX_R;
6215         }
6216       if (flag_code != CODE_64BIT && (i.rex & (REX_R | REX_B)))
6217         {
6218           if (!i.types[0].bitfield.control
6219               && !i.types[1].bitfield.control)
6220             abort ();
6221           i.rex &= ~(REX_R | REX_B);
6222           add_prefix (LOCK_PREFIX_OPCODE);
6223         }
6224     }
6225   else
6226     {                   /* If it's not 2 reg operands...  */
6227       unsigned int mem;
6228
6229       if (i.mem_operands)
6230         {
6231           unsigned int fake_zero_displacement = 0;
6232           unsigned int op;
6233
6234           for (op = 0; op < i.operands; op++)
6235             if (operand_type_check (i.types[op], anymem))
6236               break;
6237           gas_assert (op < i.operands);
6238
6239           if (i.tm.opcode_modifier.vecsib)
6240             {
6241               if (i.index_reg->reg_num == RegEiz
6242                   || i.index_reg->reg_num == RegRiz)
6243                 abort ();
6244
6245               i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
6246               if (!i.base_reg)
6247                 {
6248                   i.sib.base = NO_BASE_REGISTER;
6249                   i.sib.scale = i.log2_scale_factor;
6250                   /* No Vec_Disp8 if there is no base.  */
6251                   i.types[op].bitfield.vec_disp8 = 0;
6252                   i.types[op].bitfield.disp8 = 0;
6253                   i.types[op].bitfield.disp16 = 0;
6254                   i.types[op].bitfield.disp64 = 0;
6255                   if (flag_code != CODE_64BIT)
6256                     {
6257                       /* Must be 32 bit */
6258                       i.types[op].bitfield.disp32 = 1;
6259                       i.types[op].bitfield.disp32s = 0;
6260                     }
6261                   else
6262                     {
6263                       i.types[op].bitfield.disp32 = 0;
6264                       i.types[op].bitfield.disp32s = 1;
6265                     }
6266                 }
6267               i.sib.index = i.index_reg->reg_num;
6268               if ((i.index_reg->reg_flags & RegRex) != 0)
6269                 i.rex |= REX_X;
6270               if ((i.index_reg->reg_flags & RegVRex) != 0)
6271                 i.vrex |= REX_X;
6272             }
6273
6274           default_seg = &ds;
6275
6276           if (i.base_reg == 0)
6277             {
6278               i.rm.mode = 0;
6279               if (!i.disp_operands)
6280                 {
6281                   fake_zero_displacement = 1;
6282                   /* Instructions with VSIB byte need 32bit displacement
6283                      if there is no base register.  */
6284                   if (i.tm.opcode_modifier.vecsib)
6285                     i.types[op].bitfield.disp32 = 1;
6286                 }
6287               if (i.index_reg == 0)
6288                 {
6289                   gas_assert (!i.tm.opcode_modifier.vecsib);
6290                   /* Operand is just <disp>  */
6291                   if (flag_code == CODE_64BIT)
6292                     {
6293                       /* 64bit mode overwrites the 32bit absolute
6294                          addressing by RIP relative addressing and
6295                          absolute addressing is encoded by one of the
6296                          redundant SIB forms.  */
6297                       i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
6298                       i.sib.base = NO_BASE_REGISTER;
6299                       i.sib.index = NO_INDEX_REGISTER;
6300                       i.types[op] = ((i.prefix[ADDR_PREFIX] == 0)
6301                                      ? disp32s : disp32);
6302                     }
6303                   else if ((flag_code == CODE_16BIT)
6304                            ^ (i.prefix[ADDR_PREFIX] != 0))
6305                     {
6306                       i.rm.regmem = NO_BASE_REGISTER_16;
6307                       i.types[op] = disp16;
6308                     }
6309                   else
6310                     {
6311                       i.rm.regmem = NO_BASE_REGISTER;
6312                       i.types[op] = disp32;
6313                     }
6314                 }
6315               else if (!i.tm.opcode_modifier.vecsib)
6316                 {
6317                   /* !i.base_reg && i.index_reg  */
6318                   if (i.index_reg->reg_num == RegEiz
6319                       || i.index_reg->reg_num == RegRiz)
6320                     i.sib.index = NO_INDEX_REGISTER;
6321                   else
6322                     i.sib.index = i.index_reg->reg_num;
6323                   i.sib.base = NO_BASE_REGISTER;
6324                   i.sib.scale = i.log2_scale_factor;
6325                   i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
6326                   /* No Vec_Disp8 if there is no base.  */
6327                   i.types[op].bitfield.vec_disp8 = 0;
6328                   i.types[op].bitfield.disp8 = 0;
6329                   i.types[op].bitfield.disp16 = 0;
6330                   i.types[op].bitfield.disp64 = 0;
6331                   if (flag_code != CODE_64BIT)
6332                     {
6333                       /* Must be 32 bit */
6334                       i.types[op].bitfield.disp32 = 1;
6335                       i.types[op].bitfield.disp32s = 0;
6336                     }
6337                   else
6338                     {
6339                       i.types[op].bitfield.disp32 = 0;
6340                       i.types[op].bitfield.disp32s = 1;
6341                     }
6342                   if ((i.index_reg->reg_flags & RegRex) != 0)
6343                     i.rex |= REX_X;
6344                 }
6345             }
6346           /* RIP addressing for 64bit mode.  */
6347           else if (i.base_reg->reg_num == RegRip ||
6348                    i.base_reg->reg_num == RegEip)
6349             {
6350               gas_assert (!i.tm.opcode_modifier.vecsib);
6351               i.rm.regmem = NO_BASE_REGISTER;
6352               i.types[op].bitfield.disp8 = 0;
6353               i.types[op].bitfield.disp16 = 0;
6354               i.types[op].bitfield.disp32 = 0;
6355               i.types[op].bitfield.disp32s = 1;
6356               i.types[op].bitfield.disp64 = 0;
6357               i.types[op].bitfield.vec_disp8 = 0;
6358               i.flags[op] |= Operand_PCrel;
6359               if (! i.disp_operands)
6360                 fake_zero_displacement = 1;
6361             }
6362           else if (i.base_reg->reg_type.bitfield.reg16)
6363             {
6364               gas_assert (!i.tm.opcode_modifier.vecsib);
6365               switch (i.base_reg->reg_num)
6366                 {
6367                 case 3: /* (%bx)  */
6368                   if (i.index_reg == 0)
6369                     i.rm.regmem = 7;
6370                   else /* (%bx,%si) -> 0, or (%bx,%di) -> 1  */
6371                     i.rm.regmem = i.index_reg->reg_num - 6;
6372                   break;
6373                 case 5: /* (%bp)  */
6374                   default_seg = &ss;
6375                   if (i.index_reg == 0)
6376                     {
6377                       i.rm.regmem = 6;
6378                       if (operand_type_check (i.types[op], disp) == 0)
6379                         {
6380                           /* fake (%bp) into 0(%bp)  */
6381                           if (i.tm.operand_types[op].bitfield.vec_disp8)
6382                             i.types[op].bitfield.vec_disp8 = 1;
6383                           else
6384                             i.types[op].bitfield.disp8 = 1;
6385                           fake_zero_displacement = 1;
6386                         }
6387                     }
6388                   else /* (%bp,%si) -> 2, or (%bp,%di) -> 3  */
6389                     i.rm.regmem = i.index_reg->reg_num - 6 + 2;
6390                   break;
6391                 default: /* (%si) -> 4 or (%di) -> 5  */
6392                   i.rm.regmem = i.base_reg->reg_num - 6 + 4;
6393                 }
6394               i.rm.mode = mode_from_disp_size (i.types[op]);
6395             }
6396           else /* i.base_reg and 32/64 bit mode  */
6397             {
6398               if (flag_code == CODE_64BIT
6399                   && operand_type_check (i.types[op], disp))
6400                 {
6401                   i386_operand_type temp;
6402                   operand_type_set (&temp, 0);
6403                   temp.bitfield.disp8 = i.types[op].bitfield.disp8;
6404                   temp.bitfield.vec_disp8
6405                     = i.types[op].bitfield.vec_disp8;
6406                   i.types[op] = temp;
6407                   if (i.prefix[ADDR_PREFIX] == 0)
6408                     i.types[op].bitfield.disp32s = 1;
6409                   else
6410                     i.types[op].bitfield.disp32 = 1;
6411                 }
6412
6413               if (!i.tm.opcode_modifier.vecsib)
6414                 i.rm.regmem = i.base_reg->reg_num;
6415               if ((i.base_reg->reg_flags & RegRex) != 0)
6416                 i.rex |= REX_B;
6417               i.sib.base = i.base_reg->reg_num;
6418               /* x86-64 ignores REX prefix bit here to avoid decoder
6419                  complications.  */
6420               if (!(i.base_reg->reg_flags & RegRex)
6421                   && (i.base_reg->reg_num == EBP_REG_NUM
6422                    || i.base_reg->reg_num == ESP_REG_NUM))
6423                   default_seg = &ss;
6424               if (i.base_reg->reg_num == 5 && i.disp_operands == 0)
6425                 {
6426                   fake_zero_displacement = 1;
6427                   if (i.tm.operand_types [op].bitfield.vec_disp8)
6428                     i.types[op].bitfield.vec_disp8 = 1;
6429                   else
6430                     i.types[op].bitfield.disp8 = 1;
6431                 }
6432               i.sib.scale = i.log2_scale_factor;
6433               if (i.index_reg == 0)
6434                 {
6435                   gas_assert (!i.tm.opcode_modifier.vecsib);
6436                   /* <disp>(%esp) becomes two byte modrm with no index
6437                      register.  We've already stored the code for esp
6438                      in i.rm.regmem ie. ESCAPE_TO_TWO_BYTE_ADDRESSING.
6439                      Any base register besides %esp will not use the
6440                      extra modrm byte.  */
6441                   i.sib.index = NO_INDEX_REGISTER;
6442                 }
6443               else if (!i.tm.opcode_modifier.vecsib)
6444                 {
6445                   if (i.index_reg->reg_num == RegEiz
6446                       || i.index_reg->reg_num == RegRiz)
6447                     i.sib.index = NO_INDEX_REGISTER;
6448                   else
6449                     i.sib.index = i.index_reg->reg_num;
6450                   i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
6451                   if ((i.index_reg->reg_flags & RegRex) != 0)
6452                     i.rex |= REX_X;
6453                 }
6454
6455               if (i.disp_operands
6456                   && (i.reloc[op] == BFD_RELOC_386_TLS_DESC_CALL
6457                       || i.reloc[op] == BFD_RELOC_X86_64_TLSDESC_CALL))
6458                 i.rm.mode = 0;
6459               else
6460                 {
6461                   if (!fake_zero_displacement
6462                       && !i.disp_operands
6463                       && i.disp_encoding)
6464                     {
6465                       fake_zero_displacement = 1;
6466                       if (i.disp_encoding == disp_encoding_8bit)
6467                         i.types[op].bitfield.disp8 = 1;
6468                       else
6469                         i.types[op].bitfield.disp32 = 1;
6470                     }
6471                   i.rm.mode = mode_from_disp_size (i.types[op]);
6472                 }
6473             }
6474
6475           if (fake_zero_displacement)
6476             {
6477               /* Fakes a zero displacement assuming that i.types[op]
6478                  holds the correct displacement size.  */
6479               expressionS *exp;
6480
6481               gas_assert (i.op[op].disps == 0);
6482               exp = &disp_expressions[i.disp_operands++];
6483               i.op[op].disps = exp;
6484               exp->X_op = O_constant;
6485               exp->X_add_number = 0;
6486               exp->X_add_symbol = (symbolS *) 0;
6487               exp->X_op_symbol = (symbolS *) 0;
6488             }
6489
6490           mem = op;
6491         }
6492       else
6493         mem = ~0;
6494
6495       if (i.tm.opcode_modifier.vexsources == XOP2SOURCES)
6496         {
6497           if (operand_type_check (i.types[0], imm))
6498             i.vex.register_specifier = NULL;
6499           else
6500             {
6501               /* VEX.vvvv encodes one of the sources when the first
6502                  operand is not an immediate.  */
6503               if (i.tm.opcode_modifier.vexw == VEXW0)
6504                 i.vex.register_specifier = i.op[0].regs;
6505               else
6506                 i.vex.register_specifier = i.op[1].regs;
6507             }
6508
6509           /* Destination is a XMM register encoded in the ModRM.reg
6510              and VEX.R bit.  */
6511           i.rm.reg = i.op[2].regs->reg_num;
6512           if ((i.op[2].regs->reg_flags & RegRex) != 0)
6513             i.rex |= REX_R;
6514
6515           /* ModRM.rm and VEX.B encodes the other source.  */
6516           if (!i.mem_operands)
6517             {
6518               i.rm.mode = 3;
6519
6520               if (i.tm.opcode_modifier.vexw == VEXW0)
6521                 i.rm.regmem = i.op[1].regs->reg_num;
6522               else
6523                 i.rm.regmem = i.op[0].regs->reg_num;
6524
6525               if ((i.op[1].regs->reg_flags & RegRex) != 0)
6526                 i.rex |= REX_B;
6527             }
6528         }
6529       else if (i.tm.opcode_modifier.vexvvvv == VEXLWP)
6530         {
6531           i.vex.register_specifier = i.op[2].regs;
6532           if (!i.mem_operands)
6533             {
6534               i.rm.mode = 3;
6535               i.rm.regmem = i.op[1].regs->reg_num;
6536               if ((i.op[1].regs->reg_flags & RegRex) != 0)
6537                 i.rex |= REX_B;
6538             }
6539         }
6540       /* Fill in i.rm.reg or i.rm.regmem field with register operand
6541          (if any) based on i.tm.extension_opcode.  Again, we must be
6542          careful to make sure that segment/control/debug/test/MMX
6543          registers are coded into the i.rm.reg field.  */
6544       else if (i.reg_operands)
6545         {
6546           unsigned int op;
6547           unsigned int vex_reg = ~0;
6548
6549           for (op = 0; op < i.operands; op++)
6550             if (i.types[op].bitfield.reg8
6551                 || i.types[op].bitfield.reg16
6552                 || i.types[op].bitfield.reg32
6553                 || i.types[op].bitfield.reg64
6554                 || i.types[op].bitfield.regmmx
6555                 || i.types[op].bitfield.regxmm
6556                 || i.types[op].bitfield.regymm
6557                 || i.types[op].bitfield.regbnd
6558                 || i.types[op].bitfield.regzmm
6559                 || i.types[op].bitfield.regmask
6560                 || i.types[op].bitfield.sreg2
6561                 || i.types[op].bitfield.sreg3
6562                 || i.types[op].bitfield.control
6563                 || i.types[op].bitfield.debug
6564                 || i.types[op].bitfield.test)
6565               break;
6566
6567           if (vex_3_sources)
6568             op = dest;
6569           else if (i.tm.opcode_modifier.vexvvvv == VEXXDS)
6570             {
6571               /* For instructions with VexNDS, the register-only
6572                  source operand is encoded in VEX prefix. */
6573               gas_assert (mem != (unsigned int) ~0);
6574
6575               if (op > mem)
6576                 {
6577                   vex_reg = op++;
6578                   gas_assert (op < i.operands);
6579                 }
6580               else
6581                 {
6582                   /* Check register-only source operand when two source
6583                      operands are swapped.  */
6584                   if (!i.tm.operand_types[op].bitfield.baseindex
6585                       && i.tm.operand_types[op + 1].bitfield.baseindex)
6586                     {
6587                       vex_reg = op;
6588                       op += 2;
6589                       gas_assert (mem == (vex_reg + 1)
6590                                   && op < i.operands);
6591                     }
6592                   else
6593                     {
6594                       vex_reg = op + 1;
6595                       gas_assert (vex_reg < i.operands);
6596                     }
6597                 }
6598             }
6599           else if (i.tm.opcode_modifier.vexvvvv == VEXNDD)
6600             {
6601               /* For instructions with VexNDD, the register destination
6602                  is encoded in VEX prefix.  */
6603               if (i.mem_operands == 0)
6604                 {
6605                   /* There is no memory operand.  */
6606                   gas_assert ((op + 2) == i.operands);
6607                   vex_reg = op + 1;
6608                 }
6609               else
6610                 {
6611                   /* There are only 2 operands.  */
6612                   gas_assert (op < 2 && i.operands == 2);
6613                   vex_reg = 1;
6614                 }
6615             }
6616           else
6617             gas_assert (op < i.operands);
6618
6619           if (vex_reg != (unsigned int) ~0)
6620             {
6621               i386_operand_type *type = &i.tm.operand_types[vex_reg];
6622
6623               if (type->bitfield.reg32 != 1
6624                   && type->bitfield.reg64 != 1
6625                   && !operand_type_equal (type, &regxmm)
6626                   && !operand_type_equal (type, &regymm)
6627                   && !operand_type_equal (type, &regzmm)
6628                   && !operand_type_equal (type, &regmask))
6629                 abort ();
6630
6631               i.vex.register_specifier = i.op[vex_reg].regs;
6632             }
6633
6634           /* Don't set OP operand twice.  */
6635           if (vex_reg != op)
6636             {
6637               /* If there is an extension opcode to put here, the
6638                  register number must be put into the regmem field.  */
6639               if (i.tm.extension_opcode != None)
6640                 {
6641                   i.rm.regmem = i.op[op].regs->reg_num;
6642                   if ((i.op[op].regs->reg_flags & RegRex) != 0)
6643                     i.rex |= REX_B;
6644                   if ((i.op[op].regs->reg_flags & RegVRex) != 0)
6645                     i.vrex |= REX_B;
6646                 }
6647               else
6648                 {
6649                   i.rm.reg = i.op[op].regs->reg_num;
6650                   if ((i.op[op].regs->reg_flags & RegRex) != 0)
6651                     i.rex |= REX_R;
6652                   if ((i.op[op].regs->reg_flags & RegVRex) != 0)
6653                     i.vrex |= REX_R;
6654                 }
6655             }
6656
6657           /* Now, if no memory operand has set i.rm.mode = 0, 1, 2 we
6658              must set it to 3 to indicate this is a register operand
6659              in the regmem field.  */
6660           if (!i.mem_operands)
6661             i.rm.mode = 3;
6662         }
6663
6664       /* Fill in i.rm.reg field with extension opcode (if any).  */
6665       if (i.tm.extension_opcode != None)
6666         i.rm.reg = i.tm.extension_opcode;
6667     }
6668   return default_seg;
6669 }
6670
6671 static void
6672 output_branch (void)
6673 {
6674   char *p;
6675   int size;
6676   int code16;
6677   int prefix;
6678   relax_substateT subtype;
6679   symbolS *sym;
6680   offsetT off;
6681
6682   code16 = flag_code == CODE_16BIT ? CODE16 : 0;
6683   size = i.disp_encoding == disp_encoding_32bit ? BIG : SMALL;
6684
6685   prefix = 0;
6686   if (i.prefix[DATA_PREFIX] != 0)
6687     {
6688       prefix = 1;
6689       i.prefixes -= 1;
6690       code16 ^= CODE16;
6691     }
6692   /* Pentium4 branch hints.  */
6693   if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE /* not taken */
6694       || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE /* taken */)
6695     {
6696       prefix++;
6697       i.prefixes--;
6698     }
6699   if (i.prefix[REX_PREFIX] != 0)
6700     {
6701       prefix++;
6702       i.prefixes--;
6703     }
6704
6705   /* BND prefixed jump.  */
6706   if (i.prefix[BND_PREFIX] != 0)
6707     {
6708       FRAG_APPEND_1_CHAR (i.prefix[BND_PREFIX]);
6709       i.prefixes -= 1;
6710     }
6711
6712   if (i.prefixes != 0 && !intel_syntax)
6713     as_warn (_("skipping prefixes on this instruction"));
6714
6715   /* It's always a symbol;  End frag & setup for relax.
6716      Make sure there is enough room in this frag for the largest
6717      instruction we may generate in md_convert_frag.  This is 2
6718      bytes for the opcode and room for the prefix and largest
6719      displacement.  */
6720   frag_grow (prefix + 2 + 4);
6721   /* Prefix and 1 opcode byte go in fr_fix.  */
6722   p = frag_more (prefix + 1);
6723   if (i.prefix[DATA_PREFIX] != 0)
6724     *p++ = DATA_PREFIX_OPCODE;
6725   if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE
6726       || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE)
6727     *p++ = i.prefix[SEG_PREFIX];
6728   if (i.prefix[REX_PREFIX] != 0)
6729     *p++ = i.prefix[REX_PREFIX];
6730   *p = i.tm.base_opcode;
6731
6732   if ((unsigned char) *p == JUMP_PC_RELATIVE)
6733     subtype = ENCODE_RELAX_STATE (UNCOND_JUMP, size);
6734   else if (cpu_arch_flags.bitfield.cpui386)
6735     subtype = ENCODE_RELAX_STATE (COND_JUMP, size);
6736   else
6737     subtype = ENCODE_RELAX_STATE (COND_JUMP86, size);
6738   subtype |= code16;
6739
6740   sym = i.op[0].disps->X_add_symbol;
6741   off = i.op[0].disps->X_add_number;
6742
6743   if (i.op[0].disps->X_op != O_constant
6744       && i.op[0].disps->X_op != O_symbol)
6745     {
6746       /* Handle complex expressions.  */
6747       sym = make_expr_symbol (i.op[0].disps);
6748       off = 0;
6749     }
6750
6751   /* 1 possible extra opcode + 4 byte displacement go in var part.
6752      Pass reloc in fr_var.  */
6753   frag_var (rs_machine_dependent, 5,
6754             ((!object_64bit
6755               || i.reloc[0] != NO_RELOC
6756               || (i.bnd_prefix == NULL && !add_bnd_prefix))
6757              ? i.reloc[0]
6758              : BFD_RELOC_X86_64_PC32_BND),
6759             subtype, sym, off, p);
6760 }
6761
6762 static void
6763 output_jump (void)
6764 {
6765   char *p;
6766   int size;
6767   fixS *fixP;
6768
6769   if (i.tm.opcode_modifier.jumpbyte)
6770     {
6771       /* This is a loop or jecxz type instruction.  */
6772       size = 1;
6773       if (i.prefix[ADDR_PREFIX] != 0)
6774         {
6775           FRAG_APPEND_1_CHAR (ADDR_PREFIX_OPCODE);
6776           i.prefixes -= 1;
6777         }
6778       /* Pentium4 branch hints.  */
6779       if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE /* not taken */
6780           || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE /* taken */)
6781         {
6782           FRAG_APPEND_1_CHAR (i.prefix[SEG_PREFIX]);
6783           i.prefixes--;
6784         }
6785     }
6786   else
6787     {
6788       int code16;
6789
6790       code16 = 0;
6791       if (flag_code == CODE_16BIT)
6792         code16 = CODE16;
6793
6794       if (i.prefix[DATA_PREFIX] != 0)
6795         {
6796           FRAG_APPEND_1_CHAR (DATA_PREFIX_OPCODE);
6797           i.prefixes -= 1;
6798           code16 ^= CODE16;
6799         }
6800
6801       size = 4;
6802       if (code16)
6803         size = 2;
6804     }
6805
6806   if (i.prefix[REX_PREFIX] != 0)
6807     {
6808       FRAG_APPEND_1_CHAR (i.prefix[REX_PREFIX]);
6809       i.prefixes -= 1;
6810     }
6811
6812   /* BND prefixed jump.  */
6813   if (i.prefix[BND_PREFIX] != 0)
6814     {
6815       FRAG_APPEND_1_CHAR (i.prefix[BND_PREFIX]);
6816       i.prefixes -= 1;
6817     }
6818
6819   if (i.prefixes != 0 && !intel_syntax)
6820     as_warn (_("skipping prefixes on this instruction"));
6821
6822   p = frag_more (i.tm.opcode_length + size);
6823   switch (i.tm.opcode_length)
6824     {
6825     case 2:
6826       *p++ = i.tm.base_opcode >> 8;
6827     case 1:
6828       *p++ = i.tm.base_opcode;
6829       break;
6830     default:
6831       abort ();
6832     }
6833
6834   fixP = fix_new_exp (frag_now, p - frag_now->fr_literal, size,
6835                       i.op[0].disps, 1, reloc (size, 1, 1,
6836                                                (i.bnd_prefix != NULL
6837                                                 || add_bnd_prefix),
6838                                                i.reloc[0]));
6839
6840   /* All jumps handled here are signed, but don't use a signed limit
6841      check for 32 and 16 bit jumps as we want to allow wrap around at
6842      4G and 64k respectively.  */
6843   if (size == 1)
6844     fixP->fx_signed = 1;
6845 }
6846
6847 static void
6848 output_interseg_jump (void)
6849 {
6850   char *p;
6851   int size;
6852   int prefix;
6853   int code16;
6854
6855   code16 = 0;
6856   if (flag_code == CODE_16BIT)
6857     code16 = CODE16;
6858
6859   prefix = 0;
6860   if (i.prefix[DATA_PREFIX] != 0)
6861     {
6862       prefix = 1;
6863       i.prefixes -= 1;
6864       code16 ^= CODE16;
6865     }
6866   if (i.prefix[REX_PREFIX] != 0)
6867     {
6868       prefix++;
6869       i.prefixes -= 1;
6870     }
6871
6872   size = 4;
6873   if (code16)
6874     size = 2;
6875
6876   if (i.prefixes != 0 && !intel_syntax)
6877     as_warn (_("skipping prefixes on this instruction"));
6878
6879   /* 1 opcode; 2 segment; offset  */
6880   p = frag_more (prefix + 1 + 2 + size);
6881
6882   if (i.prefix[DATA_PREFIX] != 0)
6883     *p++ = DATA_PREFIX_OPCODE;
6884
6885   if (i.prefix[REX_PREFIX] != 0)
6886     *p++ = i.prefix[REX_PREFIX];
6887
6888   *p++ = i.tm.base_opcode;
6889   if (i.op[1].imms->X_op == O_constant)
6890     {
6891       offsetT n = i.op[1].imms->X_add_number;
6892
6893       if (size == 2
6894           && !fits_in_unsigned_word (n)
6895           && !fits_in_signed_word (n))
6896         {
6897           as_bad (_("16-bit jump out of range"));
6898           return;
6899         }
6900       md_number_to_chars (p, n, size);
6901     }
6902   else
6903     fix_new_exp (frag_now, p - frag_now->fr_literal, size,
6904                  i.op[1].imms, 0, reloc (size, 0, 0, 0, i.reloc[1]));
6905   if (i.op[0].imms->X_op != O_constant)
6906     as_bad (_("can't handle non absolute segment in `%s'"),
6907             i.tm.name);
6908   md_number_to_chars (p + size, (valueT) i.op[0].imms->X_add_number, 2);
6909 }
6910
6911 static void
6912 output_insn (void)
6913 {
6914   fragS *insn_start_frag;
6915   offsetT insn_start_off;
6916
6917   /* Tie dwarf2 debug info to the address at the start of the insn.
6918      We can't do this after the insn has been output as the current
6919      frag may have been closed off.  eg. by frag_var.  */
6920   dwarf2_emit_insn (0);
6921
6922   insn_start_frag = frag_now;
6923   insn_start_off = frag_now_fix ();
6924
6925   /* Output jumps.  */
6926   if (i.tm.opcode_modifier.jump)
6927     output_branch ();
6928   else if (i.tm.opcode_modifier.jumpbyte
6929            || i.tm.opcode_modifier.jumpdword)
6930     output_jump ();
6931   else if (i.tm.opcode_modifier.jumpintersegment)
6932     output_interseg_jump ();
6933   else
6934     {
6935       /* Output normal instructions here.  */
6936       char *p;
6937       unsigned char *q;
6938       unsigned int j;
6939       unsigned int prefix;
6940
6941       /* Since the VEX/EVEX prefix contains the implicit prefix, we
6942          don't need the explicit prefix.  */
6943       if (!i.tm.opcode_modifier.vex && !i.tm.opcode_modifier.evex)
6944         {
6945           switch (i.tm.opcode_length)
6946             {
6947             case 3:
6948               if (i.tm.base_opcode & 0xff000000)
6949                 {
6950                   prefix = (i.tm.base_opcode >> 24) & 0xff;
6951                   goto check_prefix;
6952                 }
6953               break;
6954             case 2:
6955               if ((i.tm.base_opcode & 0xff0000) != 0)
6956                 {
6957                   prefix = (i.tm.base_opcode >> 16) & 0xff;
6958                   if (i.tm.cpu_flags.bitfield.cpupadlock)
6959                     {
6960 check_prefix:
6961                       if (prefix != REPE_PREFIX_OPCODE
6962                           || (i.prefix[REP_PREFIX]
6963                               != REPE_PREFIX_OPCODE))
6964                         add_prefix (prefix);
6965                     }
6966                   else
6967                     add_prefix (prefix);
6968                 }
6969               break;
6970             case 1:
6971               break;
6972             default:
6973               abort ();
6974             }
6975
6976           /* The prefix bytes.  */
6977           for (j = ARRAY_SIZE (i.prefix), q = i.prefix; j > 0; j--, q++)
6978             if (*q)
6979               FRAG_APPEND_1_CHAR (*q);
6980         }
6981       else
6982         {
6983           for (j = 0, q = i.prefix; j < ARRAY_SIZE (i.prefix); j++, q++)
6984             if (*q)
6985               switch (j)
6986                 {
6987                 case REX_PREFIX:
6988                   /* REX byte is encoded in VEX prefix.  */
6989                   break;
6990                 case SEG_PREFIX:
6991                 case ADDR_PREFIX:
6992                   FRAG_APPEND_1_CHAR (*q);
6993                   break;
6994                 default:
6995                   /* There should be no other prefixes for instructions
6996                      with VEX prefix.  */
6997                   abort ();
6998                 }
6999
7000           /* For EVEX instructions i.vrex should become 0 after
7001              build_evex_prefix.  For VEX instructions upper 16 registers
7002              aren't available, so VREX should be 0.  */
7003           if (i.vrex)
7004             abort ();
7005           /* Now the VEX prefix.  */
7006           p = frag_more (i.vex.length);
7007           for (j = 0; j < i.vex.length; j++)
7008             p[j] = i.vex.bytes[j];
7009         }
7010
7011       /* Now the opcode; be careful about word order here!  */
7012       if (i.tm.opcode_length == 1)
7013         {
7014           FRAG_APPEND_1_CHAR (i.tm.base_opcode);
7015         }
7016       else
7017         {
7018           switch (i.tm.opcode_length)
7019             {
7020             case 4:
7021               p = frag_more (4);
7022               *p++ = (i.tm.base_opcode >> 24) & 0xff;
7023               *p++ = (i.tm.base_opcode >> 16) & 0xff;
7024               break;
7025             case 3:
7026               p = frag_more (3);
7027               *p++ = (i.tm.base_opcode >> 16) & 0xff;
7028               break;
7029             case 2:
7030               p = frag_more (2);
7031               break;
7032             default:
7033               abort ();
7034               break;
7035             }
7036
7037           /* Put out high byte first: can't use md_number_to_chars!  */
7038           *p++ = (i.tm.base_opcode >> 8) & 0xff;
7039           *p = i.tm.base_opcode & 0xff;
7040         }
7041
7042       /* Now the modrm byte and sib byte (if present).  */
7043       if (i.tm.opcode_modifier.modrm)
7044         {
7045           FRAG_APPEND_1_CHAR ((i.rm.regmem << 0
7046                                | i.rm.reg << 3
7047                                | i.rm.mode << 6));
7048           /* If i.rm.regmem == ESP (4)
7049              && i.rm.mode != (Register mode)
7050              && not 16 bit
7051              ==> need second modrm byte.  */
7052           if (i.rm.regmem == ESCAPE_TO_TWO_BYTE_ADDRESSING
7053               && i.rm.mode != 3
7054               && !(i.base_reg && i.base_reg->reg_type.bitfield.reg16))
7055             FRAG_APPEND_1_CHAR ((i.sib.base << 0
7056                                  | i.sib.index << 3
7057                                  | i.sib.scale << 6));
7058         }
7059
7060       if (i.disp_operands)
7061         output_disp (insn_start_frag, insn_start_off);
7062
7063       if (i.imm_operands)
7064         output_imm (insn_start_frag, insn_start_off);
7065     }
7066
7067 #ifdef DEBUG386
7068   if (flag_debug)
7069     {
7070       pi ("" /*line*/, &i);
7071     }
7072 #endif /* DEBUG386  */
7073 }
7074
7075 /* Return the size of the displacement operand N.  */
7076
7077 static int
7078 disp_size (unsigned int n)
7079 {
7080   int size = 4;
7081
7082   /* Vec_Disp8 has to be 8bit.  */
7083   if (i.types[n].bitfield.vec_disp8)
7084     size = 1;
7085   else if (i.types[n].bitfield.disp64)
7086     size = 8;
7087   else if (i.types[n].bitfield.disp8)
7088     size = 1;
7089   else if (i.types[n].bitfield.disp16)
7090     size = 2;
7091   return size;
7092 }
7093
7094 /* Return the size of the immediate operand N.  */
7095
7096 static int
7097 imm_size (unsigned int n)
7098 {
7099   int size = 4;
7100   if (i.types[n].bitfield.imm64)
7101     size = 8;
7102   else if (i.types[n].bitfield.imm8 || i.types[n].bitfield.imm8s)
7103     size = 1;
7104   else if (i.types[n].bitfield.imm16)
7105     size = 2;
7106   return size;
7107 }
7108
7109 static void
7110 output_disp (fragS *insn_start_frag, offsetT insn_start_off)
7111 {
7112   char *p;
7113   unsigned int n;
7114
7115   for (n = 0; n < i.operands; n++)
7116     {
7117       if (i.types[n].bitfield.vec_disp8
7118           || operand_type_check (i.types[n], disp))
7119         {
7120           if (i.op[n].disps->X_op == O_constant)
7121             {
7122               int size = disp_size (n);
7123               offsetT val = i.op[n].disps->X_add_number;
7124
7125               if (i.types[n].bitfield.vec_disp8)
7126                 val >>= i.memshift;
7127               val = offset_in_range (val, size);
7128               p = frag_more (size);
7129               md_number_to_chars (p, val, size);
7130             }
7131           else
7132             {
7133               enum bfd_reloc_code_real reloc_type;
7134               int size = disp_size (n);
7135               int sign = i.types[n].bitfield.disp32s;
7136               int pcrel = (i.flags[n] & Operand_PCrel) != 0;
7137
7138               /* We can't have 8 bit displacement here.  */
7139               gas_assert (!i.types[n].bitfield.disp8);
7140
7141               /* The PC relative address is computed relative
7142                  to the instruction boundary, so in case immediate
7143                  fields follows, we need to adjust the value.  */
7144               if (pcrel && i.imm_operands)
7145                 {
7146                   unsigned int n1;
7147                   int sz = 0;
7148
7149                   for (n1 = 0; n1 < i.operands; n1++)
7150                     if (operand_type_check (i.types[n1], imm))
7151                       {
7152                         /* Only one immediate is allowed for PC
7153                            relative address.  */
7154                         gas_assert (sz == 0);
7155                         sz = imm_size (n1);
7156                         i.op[n].disps->X_add_number -= sz;
7157                       }
7158                   /* We should find the immediate.  */
7159                   gas_assert (sz != 0);
7160                 }
7161
7162               p = frag_more (size);
7163               reloc_type = reloc (size, pcrel, sign,
7164                                   (i.bnd_prefix != NULL
7165                                    || add_bnd_prefix),
7166                                   i.reloc[n]);
7167               if (GOT_symbol
7168                   && GOT_symbol == i.op[n].disps->X_add_symbol
7169                   && (((reloc_type == BFD_RELOC_32
7170                         || reloc_type == BFD_RELOC_X86_64_32S
7171                         || (reloc_type == BFD_RELOC_64
7172                             && object_64bit))
7173                        && (i.op[n].disps->X_op == O_symbol
7174                            || (i.op[n].disps->X_op == O_add
7175                                && ((symbol_get_value_expression
7176                                     (i.op[n].disps->X_op_symbol)->X_op)
7177                                    == O_subtract))))
7178                       || reloc_type == BFD_RELOC_32_PCREL))
7179                 {
7180                   offsetT add;
7181
7182                   if (insn_start_frag == frag_now)
7183                     add = (p - frag_now->fr_literal) - insn_start_off;
7184                   else
7185                     {
7186                       fragS *fr;
7187
7188                       add = insn_start_frag->fr_fix - insn_start_off;
7189                       for (fr = insn_start_frag->fr_next;
7190                            fr && fr != frag_now; fr = fr->fr_next)
7191                         add += fr->fr_fix;
7192                       add += p - frag_now->fr_literal;
7193                     }
7194
7195                   if (!object_64bit)
7196                     {
7197                       reloc_type = BFD_RELOC_386_GOTPC;
7198                       i.op[n].imms->X_add_number += add;
7199                     }
7200                   else if (reloc_type == BFD_RELOC_64)
7201                     reloc_type = BFD_RELOC_X86_64_GOTPC64;
7202                   else
7203                     /* Don't do the adjustment for x86-64, as there
7204                        the pcrel addressing is relative to the _next_
7205                        insn, and that is taken care of in other code.  */
7206                     reloc_type = BFD_RELOC_X86_64_GOTPC32;
7207                 }
7208               fix_new_exp (frag_now, p - frag_now->fr_literal, size,
7209                            i.op[n].disps, pcrel, reloc_type);
7210             }
7211         }
7212     }
7213 }
7214
7215 static void
7216 output_imm (fragS *insn_start_frag, offsetT insn_start_off)
7217 {
7218   char *p;
7219   unsigned int n;
7220
7221   for (n = 0; n < i.operands; n++)
7222     {
7223       /* Skip SAE/RC Imm operand in EVEX.  They are already handled.  */
7224       if (i.rounding && (int) n == i.rounding->operand)
7225         continue;
7226
7227       if (operand_type_check (i.types[n], imm))
7228         {
7229           if (i.op[n].imms->X_op == O_constant)
7230             {
7231               int size = imm_size (n);
7232               offsetT val;
7233
7234               val = offset_in_range (i.op[n].imms->X_add_number,
7235                                      size);
7236               p = frag_more (size);
7237               md_number_to_chars (p, val, size);
7238             }
7239           else
7240             {
7241               /* Not absolute_section.
7242                  Need a 32-bit fixup (don't support 8bit
7243                  non-absolute imms).  Try to support other
7244                  sizes ...  */
7245               enum bfd_reloc_code_real reloc_type;
7246               int size = imm_size (n);
7247               int sign;
7248
7249               if (i.types[n].bitfield.imm32s
7250                   && (i.suffix == QWORD_MNEM_SUFFIX
7251                       || (!i.suffix && i.tm.opcode_modifier.no_lsuf)))
7252                 sign = 1;
7253               else
7254                 sign = 0;
7255
7256               p = frag_more (size);
7257               reloc_type = reloc (size, 0, sign, 0, i.reloc[n]);
7258
7259               /*   This is tough to explain.  We end up with this one if we
7260                * have operands that look like
7261                * "_GLOBAL_OFFSET_TABLE_+[.-.L284]".  The goal here is to
7262                * obtain the absolute address of the GOT, and it is strongly
7263                * preferable from a performance point of view to avoid using
7264                * a runtime relocation for this.  The actual sequence of
7265                * instructions often look something like:
7266                *
7267                *        call    .L66
7268                * .L66:
7269                *        popl    %ebx
7270                *        addl    $_GLOBAL_OFFSET_TABLE_+[.-.L66],%ebx
7271                *
7272                *   The call and pop essentially return the absolute address
7273                * of the label .L66 and store it in %ebx.  The linker itself
7274                * will ultimately change the first operand of the addl so
7275                * that %ebx points to the GOT, but to keep things simple, the
7276                * .o file must have this operand set so that it generates not
7277                * the absolute address of .L66, but the absolute address of
7278                * itself.  This allows the linker itself simply treat a GOTPC
7279                * relocation as asking for a pcrel offset to the GOT to be
7280                * added in, and the addend of the relocation is stored in the
7281                * operand field for the instruction itself.
7282                *
7283                *   Our job here is to fix the operand so that it would add
7284                * the correct offset so that %ebx would point to itself.  The
7285                * thing that is tricky is that .-.L66 will point to the
7286                * beginning of the instruction, so we need to further modify
7287                * the operand so that it will point to itself.  There are
7288                * other cases where you have something like:
7289                *
7290                *        .long   $_GLOBAL_OFFSET_TABLE_+[.-.L66]
7291                *
7292                * and here no correction would be required.  Internally in
7293                * the assembler we treat operands of this form as not being
7294                * pcrel since the '.' is explicitly mentioned, and I wonder
7295                * whether it would simplify matters to do it this way.  Who
7296                * knows.  In earlier versions of the PIC patches, the
7297                * pcrel_adjust field was used to store the correction, but
7298                * since the expression is not pcrel, I felt it would be
7299                * confusing to do it this way.  */
7300
7301               if ((reloc_type == BFD_RELOC_32
7302                    || reloc_type == BFD_RELOC_X86_64_32S
7303                    || reloc_type == BFD_RELOC_64)
7304                   && GOT_symbol
7305                   && GOT_symbol == i.op[n].imms->X_add_symbol
7306                   && (i.op[n].imms->X_op == O_symbol
7307                       || (i.op[n].imms->X_op == O_add
7308                           && ((symbol_get_value_expression
7309                                (i.op[n].imms->X_op_symbol)->X_op)
7310                               == O_subtract))))
7311                 {
7312                   offsetT add;
7313
7314                   if (insn_start_frag == frag_now)
7315                     add = (p - frag_now->fr_literal) - insn_start_off;
7316                   else
7317                     {
7318                       fragS *fr;
7319
7320                       add = insn_start_frag->fr_fix - insn_start_off;
7321                       for (fr = insn_start_frag->fr_next;
7322                            fr && fr != frag_now; fr = fr->fr_next)
7323                         add += fr->fr_fix;
7324                       add += p - frag_now->fr_literal;
7325                     }
7326
7327                   if (!object_64bit)
7328                     reloc_type = BFD_RELOC_386_GOTPC;
7329                   else if (size == 4)
7330                     reloc_type = BFD_RELOC_X86_64_GOTPC32;
7331                   else if (size == 8)
7332                     reloc_type = BFD_RELOC_X86_64_GOTPC64;
7333                   i.op[n].imms->X_add_number += add;
7334                 }
7335               fix_new_exp (frag_now, p - frag_now->fr_literal, size,
7336                            i.op[n].imms, 0, reloc_type);
7337             }
7338         }
7339     }
7340 }
7341 \f
7342 /* x86_cons_fix_new is called via the expression parsing code when a
7343    reloc is needed.  We use this hook to get the correct .got reloc.  */
7344 static int cons_sign = -1;
7345
7346 void
7347 x86_cons_fix_new (fragS *frag, unsigned int off, unsigned int len,
7348                   expressionS *exp, bfd_reloc_code_real_type r)
7349 {
7350   r = reloc (len, 0, cons_sign, 0, r);
7351
7352 #ifdef TE_PE
7353   if (exp->X_op == O_secrel)
7354     {
7355       exp->X_op = O_symbol;
7356       r = BFD_RELOC_32_SECREL;
7357     }
7358 #endif
7359
7360   fix_new_exp (frag, off, len, exp, 0, r);
7361 }
7362
7363 /* Export the ABI address size for use by TC_ADDRESS_BYTES for the
7364    purpose of the `.dc.a' internal pseudo-op.  */
7365
7366 int
7367 x86_address_bytes (void)
7368 {
7369   if ((stdoutput->arch_info->mach & bfd_mach_x64_32))
7370     return 4;
7371   return stdoutput->arch_info->bits_per_address / 8;
7372 }
7373
7374 #if !(defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) || defined (OBJ_MACH_O)) \
7375     || defined (LEX_AT)
7376 # define lex_got(reloc, adjust, types, bnd_prefix) NULL
7377 #else
7378 /* Parse operands of the form
7379    <symbol>@GOTOFF+<nnn>
7380    and similar .plt or .got references.
7381
7382    If we find one, set up the correct relocation in RELOC and copy the
7383    input string, minus the `@GOTOFF' into a malloc'd buffer for
7384    parsing by the calling routine.  Return this buffer, and if ADJUST
7385    is non-null set it to the length of the string we removed from the
7386    input line.  Otherwise return NULL.  */
7387 static char *
7388 lex_got (enum bfd_reloc_code_real *rel,
7389          int *adjust,
7390          i386_operand_type *types,
7391          int bnd_prefix)
7392 {
7393   /* Some of the relocations depend on the size of what field is to
7394      be relocated.  But in our callers i386_immediate and i386_displacement
7395      we don't yet know the operand size (this will be set by insn
7396      matching).  Hence we record the word32 relocation here,
7397      and adjust the reloc according to the real size in reloc().  */
7398   static const struct {
7399     const char *str;
7400     int len;
7401     const enum bfd_reloc_code_real rel[2];
7402     const i386_operand_type types64;
7403   } gotrel[] = {
7404 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
7405     { STRING_COMMA_LEN ("SIZE"),      { BFD_RELOC_SIZE32,
7406                                         BFD_RELOC_SIZE32 },
7407       OPERAND_TYPE_IMM32_64 },
7408 #endif
7409     { STRING_COMMA_LEN ("PLTOFF"),   { _dummy_first_bfd_reloc_code_real,
7410                                        BFD_RELOC_X86_64_PLTOFF64 },
7411       OPERAND_TYPE_IMM64 },
7412     { STRING_COMMA_LEN ("PLT"),      { BFD_RELOC_386_PLT32,
7413                                        BFD_RELOC_X86_64_PLT32    },
7414       OPERAND_TYPE_IMM32_32S_DISP32 },
7415     { STRING_COMMA_LEN ("GOTPLT"),   { _dummy_first_bfd_reloc_code_real,
7416                                        BFD_RELOC_X86_64_GOTPLT64 },
7417       OPERAND_TYPE_IMM64_DISP64 },
7418     { STRING_COMMA_LEN ("GOTOFF"),   { BFD_RELOC_386_GOTOFF,
7419                                        BFD_RELOC_X86_64_GOTOFF64 },
7420       OPERAND_TYPE_IMM64_DISP64 },
7421     { STRING_COMMA_LEN ("GOTPCREL"), { _dummy_first_bfd_reloc_code_real,
7422                                        BFD_RELOC_X86_64_GOTPCREL },
7423       OPERAND_TYPE_IMM32_32S_DISP32 },
7424     { STRING_COMMA_LEN ("TLSGD"),    { BFD_RELOC_386_TLS_GD,
7425                                        BFD_RELOC_X86_64_TLSGD    },
7426       OPERAND_TYPE_IMM32_32S_DISP32 },
7427     { STRING_COMMA_LEN ("TLSLDM"),   { BFD_RELOC_386_TLS_LDM,
7428                                        _dummy_first_bfd_reloc_code_real },
7429       OPERAND_TYPE_NONE },
7430     { STRING_COMMA_LEN ("TLSLD"),    { _dummy_first_bfd_reloc_code_real,
7431                                        BFD_RELOC_X86_64_TLSLD    },
7432       OPERAND_TYPE_IMM32_32S_DISP32 },
7433     { STRING_COMMA_LEN ("GOTTPOFF"), { BFD_RELOC_386_TLS_IE_32,
7434                                        BFD_RELOC_X86_64_GOTTPOFF },
7435       OPERAND_TYPE_IMM32_32S_DISP32 },
7436     { STRING_COMMA_LEN ("TPOFF"),    { BFD_RELOC_386_TLS_LE_32,
7437                                        BFD_RELOC_X86_64_TPOFF32  },
7438       OPERAND_TYPE_IMM32_32S_64_DISP32_64 },
7439     { STRING_COMMA_LEN ("NTPOFF"),   { BFD_RELOC_386_TLS_LE,
7440                                        _dummy_first_bfd_reloc_code_real },
7441       OPERAND_TYPE_NONE },
7442     { STRING_COMMA_LEN ("DTPOFF"),   { BFD_RELOC_386_TLS_LDO_32,
7443                                        BFD_RELOC_X86_64_DTPOFF32 },
7444       OPERAND_TYPE_IMM32_32S_64_DISP32_64 },
7445     { STRING_COMMA_LEN ("GOTNTPOFF"),{ BFD_RELOC_386_TLS_GOTIE,
7446                                        _dummy_first_bfd_reloc_code_real },
7447       OPERAND_TYPE_NONE },
7448     { STRING_COMMA_LEN ("INDNTPOFF"),{ BFD_RELOC_386_TLS_IE,
7449                                        _dummy_first_bfd_reloc_code_real },
7450       OPERAND_TYPE_NONE },
7451     { STRING_COMMA_LEN ("GOT"),      { BFD_RELOC_386_GOT32,
7452                                        BFD_RELOC_X86_64_GOT32    },
7453       OPERAND_TYPE_IMM32_32S_64_DISP32 },
7454     { STRING_COMMA_LEN ("TLSDESC"),  { BFD_RELOC_386_TLS_GOTDESC,
7455                                        BFD_RELOC_X86_64_GOTPC32_TLSDESC },
7456       OPERAND_TYPE_IMM32_32S_DISP32 },
7457     { STRING_COMMA_LEN ("TLSCALL"),  { BFD_RELOC_386_TLS_DESC_CALL,
7458                                        BFD_RELOC_X86_64_TLSDESC_CALL },
7459       OPERAND_TYPE_IMM32_32S_DISP32 },
7460   };
7461   char *cp;
7462   unsigned int j;
7463
7464 #if defined (OBJ_MAYBE_ELF)
7465   if (!IS_ELF)
7466     return NULL;
7467 #endif
7468
7469   for (cp = input_line_pointer; *cp != '@'; cp++)
7470     if (is_end_of_line[(unsigned char) *cp] || *cp == ',')
7471       return NULL;
7472
7473   for (j = 0; j < ARRAY_SIZE (gotrel); j++)
7474     {
7475       int len = gotrel[j].len;
7476       if (strncasecmp (cp + 1, gotrel[j].str, len) == 0)
7477         {
7478           if (gotrel[j].rel[object_64bit] != 0)
7479             {
7480               int first, second;
7481               char *tmpbuf, *past_reloc;
7482
7483               *rel = gotrel[j].rel[object_64bit];
7484
7485               if (types)
7486                 {
7487                   if (flag_code != CODE_64BIT)
7488                     {
7489                       types->bitfield.imm32 = 1;
7490                       types->bitfield.disp32 = 1;
7491                     }
7492                   else
7493                     *types = gotrel[j].types64;
7494                 }
7495
7496               if (j != 0 && GOT_symbol == NULL)
7497                 GOT_symbol = symbol_find_or_make (GLOBAL_OFFSET_TABLE_NAME);
7498
7499               /* The length of the first part of our input line.  */
7500               first = cp - input_line_pointer;
7501
7502               /* The second part goes from after the reloc token until
7503                  (and including) an end_of_line char or comma.  */
7504               past_reloc = cp + 1 + len;
7505               cp = past_reloc;
7506               while (!is_end_of_line[(unsigned char) *cp] && *cp != ',')
7507                 ++cp;
7508               second = cp + 1 - past_reloc;
7509
7510               /* Allocate and copy string.  The trailing NUL shouldn't
7511                  be necessary, but be safe.  */
7512               tmpbuf = (char *) xmalloc (first + second + 2);
7513               memcpy (tmpbuf, input_line_pointer, first);
7514               if (second != 0 && *past_reloc != ' ')
7515                 /* Replace the relocation token with ' ', so that
7516                    errors like foo@GOTOFF1 will be detected.  */
7517                 tmpbuf[first++] = ' ';
7518               else
7519                 /* Increment length by 1 if the relocation token is
7520                    removed.  */
7521                 len++;
7522               if (adjust)
7523                 *adjust = len;
7524               memcpy (tmpbuf + first, past_reloc, second);
7525               tmpbuf[first + second] = '\0';
7526               if (bnd_prefix && *rel == BFD_RELOC_X86_64_PLT32)
7527                 *rel = BFD_RELOC_X86_64_PLT32_BND;
7528               return tmpbuf;
7529             }
7530
7531           as_bad (_("@%s reloc is not supported with %d-bit output format"),
7532                   gotrel[j].str, 1 << (5 + object_64bit));
7533           return NULL;
7534         }
7535     }
7536
7537   /* Might be a symbol version string.  Don't as_bad here.  */
7538   return NULL;
7539 }
7540 #endif
7541
7542 #ifdef TE_PE
7543 #ifdef lex_got
7544 #undef lex_got
7545 #endif
7546 /* Parse operands of the form
7547    <symbol>@SECREL32+<nnn>
7548
7549    If we find one, set up the correct relocation in RELOC and copy the
7550    input string, minus the `@SECREL32' into a malloc'd buffer for
7551    parsing by the calling routine.  Return this buffer, and if ADJUST
7552    is non-null set it to the length of the string we removed from the
7553    input line.  Otherwise return NULL.
7554
7555    This function is copied from the ELF version above adjusted for PE targets.  */
7556
7557 static char *
7558 lex_got (enum bfd_reloc_code_real *rel ATTRIBUTE_UNUSED,
7559          int *adjust ATTRIBUTE_UNUSED,
7560          i386_operand_type *types,
7561          int bnd_prefix ATTRIBUTE_UNUSED)
7562 {
7563   static const struct
7564   {
7565     const char *str;
7566     int len;
7567     const enum bfd_reloc_code_real rel[2];
7568     const i386_operand_type types64;
7569   }
7570   gotrel[] =
7571   {
7572     { STRING_COMMA_LEN ("SECREL32"),    { BFD_RELOC_32_SECREL,
7573                                           BFD_RELOC_32_SECREL },
7574       OPERAND_TYPE_IMM32_32S_64_DISP32_64 },
7575   };
7576
7577   char *cp;
7578   unsigned j;
7579
7580   for (cp = input_line_pointer; *cp != '@'; cp++)
7581     if (is_end_of_line[(unsigned char) *cp] || *cp == ',')
7582       return NULL;
7583
7584   for (j = 0; j < ARRAY_SIZE (gotrel); j++)
7585     {
7586       int len = gotrel[j].len;
7587
7588       if (strncasecmp (cp + 1, gotrel[j].str, len) == 0)
7589         {
7590           if (gotrel[j].rel[object_64bit] != 0)
7591             {
7592               int first, second;
7593               char *tmpbuf, *past_reloc;
7594
7595               *rel = gotrel[j].rel[object_64bit];
7596               if (adjust)
7597                 *adjust = len;
7598
7599               if (types)
7600                 {
7601                   if (flag_code != CODE_64BIT)
7602                     {
7603                       types->bitfield.imm32 = 1;
7604                       types->bitfield.disp32 = 1;
7605                     }
7606                   else
7607                     *types = gotrel[j].types64;
7608                 }
7609
7610               /* The length of the first part of our input line.  */
7611               first = cp - input_line_pointer;
7612
7613               /* The second part goes from after the reloc token until
7614                  (and including) an end_of_line char or comma.  */
7615               past_reloc = cp + 1 + len;
7616               cp = past_reloc;
7617               while (!is_end_of_line[(unsigned char) *cp] && *cp != ',')
7618                 ++cp;
7619               second = cp + 1 - past_reloc;
7620
7621               /* Allocate and copy string.  The trailing NUL shouldn't
7622                  be necessary, but be safe.  */
7623               tmpbuf = (char *) xmalloc (first + second + 2);
7624               memcpy (tmpbuf, input_line_pointer, first);
7625               if (second != 0 && *past_reloc != ' ')
7626                 /* Replace the relocation token with ' ', so that
7627                    errors like foo@SECLREL321 will be detected.  */
7628                 tmpbuf[first++] = ' ';
7629               memcpy (tmpbuf + first, past_reloc, second);
7630               tmpbuf[first + second] = '\0';
7631               return tmpbuf;
7632             }
7633
7634           as_bad (_("@%s reloc is not supported with %d-bit output format"),
7635                   gotrel[j].str, 1 << (5 + object_64bit));
7636           return NULL;
7637         }
7638     }
7639
7640   /* Might be a symbol version string.  Don't as_bad here.  */
7641   return NULL;
7642 }
7643
7644 #endif /* TE_PE */
7645
7646 bfd_reloc_code_real_type
7647 x86_cons (expressionS *exp, int size)
7648 {
7649   bfd_reloc_code_real_type got_reloc = NO_RELOC;
7650
7651   intel_syntax = -intel_syntax;
7652
7653   exp->X_md = 0;
7654   if (size == 4 || (object_64bit && size == 8))
7655     {
7656       /* Handle @GOTOFF and the like in an expression.  */
7657       char *save;
7658       char *gotfree_input_line;
7659       int adjust = 0;
7660
7661       save = input_line_pointer;
7662       gotfree_input_line = lex_got (&got_reloc, &adjust, NULL, 0);
7663       if (gotfree_input_line)
7664         input_line_pointer = gotfree_input_line;
7665
7666       expression (exp);
7667
7668       if (gotfree_input_line)
7669         {
7670           /* expression () has merrily parsed up to the end of line,
7671              or a comma - in the wrong buffer.  Transfer how far
7672              input_line_pointer has moved to the right buffer.  */
7673           input_line_pointer = (save
7674                                 + (input_line_pointer - gotfree_input_line)
7675                                 + adjust);
7676           free (gotfree_input_line);
7677           if (exp->X_op == O_constant
7678               || exp->X_op == O_absent
7679               || exp->X_op == O_illegal
7680               || exp->X_op == O_register
7681               || exp->X_op == O_big)
7682             {
7683               char c = *input_line_pointer;
7684               *input_line_pointer = 0;
7685               as_bad (_("missing or invalid expression `%s'"), save);
7686               *input_line_pointer = c;
7687             }
7688         }
7689     }
7690   else
7691     expression (exp);
7692
7693   intel_syntax = -intel_syntax;
7694
7695   if (intel_syntax)
7696     i386_intel_simplify (exp);
7697
7698   return got_reloc;
7699 }
7700
7701 static void
7702 signed_cons (int size)
7703 {
7704   if (flag_code == CODE_64BIT)
7705     cons_sign = 1;
7706   cons (size);
7707   cons_sign = -1;
7708 }
7709
7710 #ifdef TE_PE
7711 static void
7712 pe_directive_secrel (int dummy ATTRIBUTE_UNUSED)
7713 {
7714   expressionS exp;
7715
7716   do
7717     {
7718       expression (&exp);
7719       if (exp.X_op == O_symbol)
7720         exp.X_op = O_secrel;
7721
7722       emit_expr (&exp, 4);
7723     }
7724   while (*input_line_pointer++ == ',');
7725
7726   input_line_pointer--;
7727   demand_empty_rest_of_line ();
7728 }
7729 #endif
7730
7731 /* Handle Vector operations.  */
7732
7733 static char *
7734 check_VecOperations (char *op_string, char *op_end)
7735 {
7736   const reg_entry *mask;
7737   const char *saved;
7738   char *end_op;
7739
7740   while (*op_string
7741          && (op_end == NULL || op_string < op_end))
7742     {
7743       saved = op_string;
7744       if (*op_string == '{')
7745         {
7746           op_string++;
7747
7748           /* Check broadcasts.  */
7749           if (strncmp (op_string, "1to", 3) == 0)
7750             {
7751               int bcst_type;
7752
7753               if (i.broadcast)
7754                 goto duplicated_vec_op;
7755
7756               op_string += 3;
7757               if (*op_string == '8')
7758                 bcst_type = BROADCAST_1TO8;
7759               else if (*op_string == '4')
7760                 bcst_type = BROADCAST_1TO4;
7761               else if (*op_string == '2')
7762                 bcst_type = BROADCAST_1TO2;
7763               else if (*op_string == '1'
7764                        && *(op_string+1) == '6')
7765                 {
7766                   bcst_type = BROADCAST_1TO16;
7767                   op_string++;
7768                 }
7769               else
7770                 {
7771                   as_bad (_("Unsupported broadcast: `%s'"), saved);
7772                   return NULL;
7773                 }
7774               op_string++;
7775
7776               broadcast_op.type = bcst_type;
7777               broadcast_op.operand = this_operand;
7778               i.broadcast = &broadcast_op;
7779             }
7780           /* Check masking operation.  */
7781           else if ((mask = parse_register (op_string, &end_op)) != NULL)
7782             {
7783               /* k0 can't be used for write mask.  */
7784               if (mask->reg_num == 0)
7785                 {
7786                   as_bad (_("`%s' can't be used for write mask"),
7787                           op_string);
7788                   return NULL;
7789                 }
7790
7791               if (!i.mask)
7792                 {
7793                   mask_op.mask = mask;
7794                   mask_op.zeroing = 0;
7795                   mask_op.operand = this_operand;
7796                   i.mask = &mask_op;
7797                 }
7798               else
7799                 {
7800                   if (i.mask->mask)
7801                     goto duplicated_vec_op;
7802
7803                   i.mask->mask = mask;
7804
7805                   /* Only "{z}" is allowed here.  No need to check
7806                      zeroing mask explicitly.  */
7807                   if (i.mask->operand != this_operand)
7808                     {
7809                       as_bad (_("invalid write mask `%s'"), saved);
7810                       return NULL;
7811                     }
7812                 }
7813
7814               op_string = end_op;
7815             }
7816           /* Check zeroing-flag for masking operation.  */
7817           else if (*op_string == 'z')
7818             {
7819               if (!i.mask)
7820                 {
7821                   mask_op.mask = NULL;
7822                   mask_op.zeroing = 1;
7823                   mask_op.operand = this_operand;
7824                   i.mask = &mask_op;
7825                 }
7826               else
7827                 {
7828                   if (i.mask->zeroing)
7829                     {
7830                     duplicated_vec_op:
7831                       as_bad (_("duplicated `%s'"), saved);
7832                       return NULL;
7833                     }
7834
7835                   i.mask->zeroing = 1;
7836
7837                   /* Only "{%k}" is allowed here.  No need to check mask
7838                      register explicitly.  */
7839                   if (i.mask->operand != this_operand)
7840                     {
7841                       as_bad (_("invalid zeroing-masking `%s'"),
7842                               saved);
7843                       return NULL;
7844                     }
7845                 }
7846
7847               op_string++;
7848             }
7849           else
7850             goto unknown_vec_op;
7851
7852           if (*op_string != '}')
7853             {
7854               as_bad (_("missing `}' in `%s'"), saved);
7855               return NULL;
7856             }
7857           op_string++;
7858           continue;
7859         }
7860     unknown_vec_op:
7861       /* We don't know this one.  */
7862       as_bad (_("unknown vector operation: `%s'"), saved);
7863       return NULL;
7864     }
7865
7866   return op_string;
7867 }
7868
7869 static int
7870 i386_immediate (char *imm_start)
7871 {
7872   char *save_input_line_pointer;
7873   char *gotfree_input_line;
7874   segT exp_seg = 0;
7875   expressionS *exp;
7876   i386_operand_type types;
7877
7878   operand_type_set (&types, ~0);
7879
7880   if (i.imm_operands == MAX_IMMEDIATE_OPERANDS)
7881     {
7882       as_bad (_("at most %d immediate operands are allowed"),
7883               MAX_IMMEDIATE_OPERANDS);
7884       return 0;
7885     }
7886
7887   exp = &im_expressions[i.imm_operands++];
7888   i.op[this_operand].imms = exp;
7889
7890   if (is_space_char (*imm_start))
7891     ++imm_start;
7892
7893   save_input_line_pointer = input_line_pointer;
7894   input_line_pointer = imm_start;
7895
7896   gotfree_input_line = lex_got (&i.reloc[this_operand], NULL, &types,
7897                                 (i.bnd_prefix != NULL
7898                                  || add_bnd_prefix));
7899   if (gotfree_input_line)
7900     input_line_pointer = gotfree_input_line;
7901
7902   exp_seg = expression (exp);
7903
7904   SKIP_WHITESPACE ();
7905
7906   /* Handle vector operations.  */
7907   if (*input_line_pointer == '{')
7908     {
7909       input_line_pointer = check_VecOperations (input_line_pointer,
7910                                                 NULL);
7911       if (input_line_pointer == NULL)
7912         return 0;
7913     }
7914
7915   if (*input_line_pointer)
7916     as_bad (_("junk `%s' after expression"), input_line_pointer);
7917
7918   input_line_pointer = save_input_line_pointer;
7919   if (gotfree_input_line)
7920     {
7921       free (gotfree_input_line);
7922
7923       if (exp->X_op == O_constant || exp->X_op == O_register)
7924         exp->X_op = O_illegal;
7925     }
7926
7927   return i386_finalize_immediate (exp_seg, exp, types, imm_start);
7928 }
7929
7930 static int
7931 i386_finalize_immediate (segT exp_seg ATTRIBUTE_UNUSED, expressionS *exp,
7932                          i386_operand_type types, const char *imm_start)
7933 {
7934   if (exp->X_op == O_absent || exp->X_op == O_illegal || exp->X_op == O_big)
7935     {
7936       if (imm_start)
7937         as_bad (_("missing or invalid immediate expression `%s'"),
7938                 imm_start);
7939       return 0;
7940     }
7941   else if (exp->X_op == O_constant)
7942     {
7943       /* Size it properly later.  */
7944       i.types[this_operand].bitfield.imm64 = 1;
7945       /* If not 64bit, sign extend val.  */
7946       if (flag_code != CODE_64BIT
7947           && (exp->X_add_number & ~(((addressT) 2 << 31) - 1)) == 0)
7948         exp->X_add_number
7949           = (exp->X_add_number ^ ((addressT) 1 << 31)) - ((addressT) 1 << 31);
7950     }
7951 #if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
7952   else if (OUTPUT_FLAVOR == bfd_target_aout_flavour
7953            && exp_seg != absolute_section
7954            && exp_seg != text_section
7955            && exp_seg != data_section
7956            && exp_seg != bss_section
7957            && exp_seg != undefined_section
7958            && !bfd_is_com_section (exp_seg))
7959     {
7960       as_bad (_("unimplemented segment %s in operand"), exp_seg->name);
7961       return 0;
7962     }
7963 #endif
7964   else if (!intel_syntax && exp->X_op == O_register)
7965     {
7966       if (imm_start)
7967         as_bad (_("illegal immediate register operand %s"), imm_start);
7968       return 0;
7969     }
7970   else
7971     {
7972       /* This is an address.  The size of the address will be
7973          determined later, depending on destination register,
7974          suffix, or the default for the section.  */
7975       i.types[this_operand].bitfield.imm8 = 1;
7976       i.types[this_operand].bitfield.imm16 = 1;
7977       i.types[this_operand].bitfield.imm32 = 1;
7978       i.types[this_operand].bitfield.imm32s = 1;
7979       i.types[this_operand].bitfield.imm64 = 1;
7980       i.types[this_operand] = operand_type_and (i.types[this_operand],
7981                                                 types);
7982     }
7983
7984   return 1;
7985 }
7986
7987 static char *
7988 i386_scale (char *scale)
7989 {
7990   offsetT val;
7991   char *save = input_line_pointer;
7992
7993   input_line_pointer = scale;
7994   val = get_absolute_expression ();
7995
7996   switch (val)
7997     {
7998     case 1:
7999       i.log2_scale_factor = 0;
8000       break;
8001     case 2:
8002       i.log2_scale_factor = 1;
8003       break;
8004     case 4:
8005       i.log2_scale_factor = 2;
8006       break;
8007     case 8:
8008       i.log2_scale_factor = 3;
8009       break;
8010     default:
8011       {
8012         char sep = *input_line_pointer;
8013
8014         *input_line_pointer = '\0';
8015         as_bad (_("expecting scale factor of 1, 2, 4, or 8: got `%s'"),
8016                 scale);
8017         *input_line_pointer = sep;
8018         input_line_pointer = save;
8019         return NULL;
8020       }
8021     }
8022   if (i.log2_scale_factor != 0 && i.index_reg == 0)
8023     {
8024       as_warn (_("scale factor of %d without an index register"),
8025                1 << i.log2_scale_factor);
8026       i.log2_scale_factor = 0;
8027     }
8028   scale = input_line_pointer;
8029   input_line_pointer = save;
8030   return scale;
8031 }
8032
8033 static int
8034 i386_displacement (char *disp_start, char *disp_end)
8035 {
8036   expressionS *exp;
8037   segT exp_seg = 0;
8038   char *save_input_line_pointer;
8039   char *gotfree_input_line;
8040   int override;
8041   i386_operand_type bigdisp, types = anydisp;
8042   int ret;
8043
8044   if (i.disp_operands == MAX_MEMORY_OPERANDS)
8045     {
8046       as_bad (_("at most %d displacement operands are allowed"),
8047               MAX_MEMORY_OPERANDS);
8048       return 0;
8049     }
8050
8051   operand_type_set (&bigdisp, 0);
8052   if ((i.types[this_operand].bitfield.jumpabsolute)
8053       || (!current_templates->start->opcode_modifier.jump
8054           && !current_templates->start->opcode_modifier.jumpdword))
8055     {
8056       bigdisp.bitfield.disp32 = 1;
8057       override = (i.prefix[ADDR_PREFIX] != 0);
8058       if (flag_code == CODE_64BIT)
8059         {
8060           if (!override)
8061             {
8062               bigdisp.bitfield.disp32s = 1;
8063               bigdisp.bitfield.disp64 = 1;
8064             }
8065         }
8066       else if ((flag_code == CODE_16BIT) ^ override)
8067         {
8068           bigdisp.bitfield.disp32 = 0;
8069           bigdisp.bitfield.disp16 = 1;
8070         }
8071     }
8072   else
8073     {
8074       /* For PC-relative branches, the width of the displacement
8075          is dependent upon data size, not address size.  */
8076       override = (i.prefix[DATA_PREFIX] != 0);
8077       if (flag_code == CODE_64BIT)
8078         {
8079           if (override || i.suffix == WORD_MNEM_SUFFIX)
8080             bigdisp.bitfield.disp16 = 1;
8081           else
8082             {
8083               bigdisp.bitfield.disp32 = 1;
8084               bigdisp.bitfield.disp32s = 1;
8085             }
8086         }
8087       else
8088         {
8089           if (!override)
8090             override = (i.suffix == (flag_code != CODE_16BIT
8091                                      ? WORD_MNEM_SUFFIX
8092                                      : LONG_MNEM_SUFFIX));
8093           bigdisp.bitfield.disp32 = 1;
8094           if ((flag_code == CODE_16BIT) ^ override)
8095             {
8096               bigdisp.bitfield.disp32 = 0;
8097               bigdisp.bitfield.disp16 = 1;
8098             }
8099         }
8100     }
8101   i.types[this_operand] = operand_type_or (i.types[this_operand],
8102                                            bigdisp);
8103
8104   exp = &disp_expressions[i.disp_operands];
8105   i.op[this_operand].disps = exp;
8106   i.disp_operands++;
8107   save_input_line_pointer = input_line_pointer;
8108   input_line_pointer = disp_start;
8109   END_STRING_AND_SAVE (disp_end);
8110
8111 #ifndef GCC_ASM_O_HACK
8112 #define GCC_ASM_O_HACK 0
8113 #endif
8114 #if GCC_ASM_O_HACK
8115   END_STRING_AND_SAVE (disp_end + 1);
8116   if (i.types[this_operand].bitfield.baseIndex
8117       && displacement_string_end[-1] == '+')
8118     {
8119       /* This hack is to avoid a warning when using the "o"
8120          constraint within gcc asm statements.
8121          For instance:
8122
8123          #define _set_tssldt_desc(n,addr,limit,type) \
8124          __asm__ __volatile__ ( \
8125          "movw %w2,%0\n\t" \
8126          "movw %w1,2+%0\n\t" \
8127          "rorl $16,%1\n\t" \
8128          "movb %b1,4+%0\n\t" \
8129          "movb %4,5+%0\n\t" \
8130          "movb $0,6+%0\n\t" \
8131          "movb %h1,7+%0\n\t" \
8132          "rorl $16,%1" \
8133          : "=o"(*(n)) : "q" (addr), "ri"(limit), "i"(type))
8134
8135          This works great except that the output assembler ends
8136          up looking a bit weird if it turns out that there is
8137          no offset.  You end up producing code that looks like:
8138
8139          #APP
8140          movw $235,(%eax)
8141          movw %dx,2+(%eax)
8142          rorl $16,%edx
8143          movb %dl,4+(%eax)
8144          movb $137,5+(%eax)
8145          movb $0,6+(%eax)
8146          movb %dh,7+(%eax)
8147          rorl $16,%edx
8148          #NO_APP
8149
8150          So here we provide the missing zero.  */
8151
8152       *displacement_string_end = '0';
8153     }
8154 #endif
8155   gotfree_input_line = lex_got (&i.reloc[this_operand], NULL, &types,
8156                                 (i.bnd_prefix != NULL
8157                                  || add_bnd_prefix));
8158   if (gotfree_input_line)
8159     input_line_pointer = gotfree_input_line;
8160
8161   exp_seg = expression (exp);
8162
8163   SKIP_WHITESPACE ();
8164   if (*input_line_pointer)
8165     as_bad (_("junk `%s' after expression"), input_line_pointer);
8166 #if GCC_ASM_O_HACK
8167   RESTORE_END_STRING (disp_end + 1);
8168 #endif
8169   input_line_pointer = save_input_line_pointer;
8170   if (gotfree_input_line)
8171     {
8172       free (gotfree_input_line);
8173
8174       if (exp->X_op == O_constant || exp->X_op == O_register)
8175         exp->X_op = O_illegal;
8176     }
8177
8178   ret = i386_finalize_displacement (exp_seg, exp, types, disp_start);
8179
8180   RESTORE_END_STRING (disp_end);
8181
8182   return ret;
8183 }
8184
8185 static int
8186 i386_finalize_displacement (segT exp_seg ATTRIBUTE_UNUSED, expressionS *exp,
8187                             i386_operand_type types, const char *disp_start)
8188 {
8189   i386_operand_type bigdisp;
8190   int ret = 1;
8191
8192   /* We do this to make sure that the section symbol is in
8193      the symbol table.  We will ultimately change the relocation
8194      to be relative to the beginning of the section.  */
8195   if (i.reloc[this_operand] == BFD_RELOC_386_GOTOFF
8196       || i.reloc[this_operand] == BFD_RELOC_X86_64_GOTPCREL
8197       || i.reloc[this_operand] == BFD_RELOC_X86_64_GOTOFF64)
8198     {
8199       if (exp->X_op != O_symbol)
8200         goto inv_disp;
8201
8202       if (S_IS_LOCAL (exp->X_add_symbol)
8203           && S_GET_SEGMENT (exp->X_add_symbol) != undefined_section
8204           && S_GET_SEGMENT (exp->X_add_symbol) != expr_section)
8205         section_symbol (S_GET_SEGMENT (exp->X_add_symbol));
8206       exp->X_op = O_subtract;
8207       exp->X_op_symbol = GOT_symbol;
8208       if (i.reloc[this_operand] == BFD_RELOC_X86_64_GOTPCREL)
8209         i.reloc[this_operand] = BFD_RELOC_32_PCREL;
8210       else if (i.reloc[this_operand] == BFD_RELOC_X86_64_GOTOFF64)
8211         i.reloc[this_operand] = BFD_RELOC_64;
8212       else
8213         i.reloc[this_operand] = BFD_RELOC_32;
8214     }
8215
8216   else if (exp->X_op == O_absent
8217            || exp->X_op == O_illegal
8218            || exp->X_op == O_big)
8219     {
8220     inv_disp:
8221       as_bad (_("missing or invalid displacement expression `%s'"),
8222               disp_start);
8223       ret = 0;
8224     }
8225
8226   else if (flag_code == CODE_64BIT
8227            && !i.prefix[ADDR_PREFIX]
8228            && exp->X_op == O_constant)
8229     {
8230       /* Since displacement is signed extended to 64bit, don't allow
8231          disp32 and turn off disp32s if they are out of range.  */
8232       i.types[this_operand].bitfield.disp32 = 0;
8233       if (!fits_in_signed_long (exp->X_add_number))
8234         {
8235           i.types[this_operand].bitfield.disp32s = 0;
8236           if (i.types[this_operand].bitfield.baseindex)
8237             {
8238               as_bad (_("0x%lx out range of signed 32bit displacement"),
8239                       (long) exp->X_add_number);
8240               ret = 0;
8241             }
8242         }
8243     }
8244
8245 #if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
8246   else if (exp->X_op != O_constant
8247            && OUTPUT_FLAVOR == bfd_target_aout_flavour
8248            && exp_seg != absolute_section
8249            && exp_seg != text_section
8250            && exp_seg != data_section
8251            && exp_seg != bss_section
8252            && exp_seg != undefined_section
8253            && !bfd_is_com_section (exp_seg))
8254     {
8255       as_bad (_("unimplemented segment %s in operand"), exp_seg->name);
8256       ret = 0;
8257     }
8258 #endif
8259
8260   /* Check if this is a displacement only operand.  */
8261   bigdisp = i.types[this_operand];
8262   bigdisp.bitfield.disp8 = 0;
8263   bigdisp.bitfield.disp16 = 0;
8264   bigdisp.bitfield.disp32 = 0;
8265   bigdisp.bitfield.disp32s = 0;
8266   bigdisp.bitfield.disp64 = 0;
8267   if (operand_type_all_zero (&bigdisp))
8268     i.types[this_operand] = operand_type_and (i.types[this_operand],
8269                                               types);
8270
8271   return ret;
8272 }
8273
8274 /* Make sure the memory operand we've been dealt is valid.
8275    Return 1 on success, 0 on a failure.  */
8276
8277 static int
8278 i386_index_check (const char *operand_string)
8279 {
8280   const char *kind = "base/index";
8281   enum flag_code addr_mode;
8282
8283   if (i.prefix[ADDR_PREFIX])
8284     addr_mode = flag_code == CODE_32BIT ? CODE_16BIT : CODE_32BIT;
8285   else
8286     {
8287       addr_mode = flag_code;
8288
8289 #if INFER_ADDR_PREFIX
8290       if (i.mem_operands == 0)
8291         {
8292           /* Infer address prefix from the first memory operand.  */
8293           const reg_entry *addr_reg = i.base_reg;
8294
8295           if (addr_reg == NULL)
8296             addr_reg = i.index_reg;
8297
8298           if (addr_reg)
8299             {
8300               if (addr_reg->reg_num == RegEip
8301                   || addr_reg->reg_num == RegEiz
8302                   || addr_reg->reg_type.bitfield.reg32)
8303                 addr_mode = CODE_32BIT;
8304               else if (flag_code != CODE_64BIT
8305                        && addr_reg->reg_type.bitfield.reg16)
8306                 addr_mode = CODE_16BIT;
8307
8308               if (addr_mode != flag_code)
8309                 {
8310                   i.prefix[ADDR_PREFIX] = ADDR_PREFIX_OPCODE;
8311                   i.prefixes += 1;
8312                   /* Change the size of any displacement too.  At most one
8313                      of Disp16 or Disp32 is set.
8314                      FIXME.  There doesn't seem to be any real need for
8315                      separate Disp16 and Disp32 flags.  The same goes for
8316                      Imm16 and Imm32.  Removing them would probably clean
8317                      up the code quite a lot.  */
8318                   if (flag_code != CODE_64BIT
8319                       && (i.types[this_operand].bitfield.disp16
8320                           || i.types[this_operand].bitfield.disp32))
8321                     i.types[this_operand]
8322                       = operand_type_xor (i.types[this_operand], disp16_32);
8323                 }
8324             }
8325         }
8326 #endif
8327     }
8328
8329   if (current_templates->start->opcode_modifier.isstring
8330       && !current_templates->start->opcode_modifier.immext
8331       && (current_templates->end[-1].opcode_modifier.isstring
8332           || i.mem_operands))
8333     {
8334       /* Memory operands of string insns are special in that they only allow
8335          a single register (rDI, rSI, or rBX) as their memory address.  */
8336       const reg_entry *expected_reg;
8337       static const char *di_si[][2] =
8338         {
8339           { "esi", "edi" },
8340           { "si", "di" },
8341           { "rsi", "rdi" }
8342         };
8343       static const char *bx[] = { "ebx", "bx", "rbx" };
8344
8345       kind = "string address";
8346
8347       if (current_templates->start->opcode_modifier.w)
8348         {
8349           i386_operand_type type = current_templates->end[-1].operand_types[0];
8350
8351           if (!type.bitfield.baseindex
8352               || ((!i.mem_operands != !intel_syntax)
8353                   && current_templates->end[-1].operand_types[1]
8354                      .bitfield.baseindex))
8355             type = current_templates->end[-1].operand_types[1];
8356           expected_reg = hash_find (reg_hash,
8357                                     di_si[addr_mode][type.bitfield.esseg]);
8358
8359         }
8360       else
8361         expected_reg = hash_find (reg_hash, bx[addr_mode]);
8362
8363       if (i.base_reg != expected_reg
8364           || i.index_reg
8365           || operand_type_check (i.types[this_operand], disp))
8366         {
8367           /* The second memory operand must have the same size as
8368              the first one.  */
8369           if (i.mem_operands
8370               && i.base_reg
8371               && !((addr_mode == CODE_64BIT
8372                     && i.base_reg->reg_type.bitfield.reg64)
8373                    || (addr_mode == CODE_32BIT
8374                        ? i.base_reg->reg_type.bitfield.reg32
8375                        : i.base_reg->reg_type.bitfield.reg16)))
8376             goto bad_address;
8377
8378           as_warn (_("`%s' is not valid here (expected `%c%s%s%c')"),
8379                    operand_string,
8380                    intel_syntax ? '[' : '(',
8381                    register_prefix,
8382                    expected_reg->reg_name,
8383                    intel_syntax ? ']' : ')');
8384           return 1;
8385         }
8386       else
8387         return 1;
8388
8389 bad_address:
8390       as_bad (_("`%s' is not a valid %s expression"),
8391               operand_string, kind);
8392       return 0;
8393     }
8394   else
8395     {
8396       if (addr_mode != CODE_16BIT)
8397         {
8398           /* 32-bit/64-bit checks.  */
8399           if ((i.base_reg
8400                && (addr_mode == CODE_64BIT
8401                    ? !i.base_reg->reg_type.bitfield.reg64
8402                    : !i.base_reg->reg_type.bitfield.reg32)
8403                && (i.index_reg
8404                    || (i.base_reg->reg_num
8405                        != (addr_mode == CODE_64BIT ? RegRip : RegEip))))
8406               || (i.index_reg
8407                   && !i.index_reg->reg_type.bitfield.regxmm
8408                   && !i.index_reg->reg_type.bitfield.regymm
8409                   && !i.index_reg->reg_type.bitfield.regzmm
8410                   && ((addr_mode == CODE_64BIT
8411                        ? !(i.index_reg->reg_type.bitfield.reg64
8412                            || i.index_reg->reg_num == RegRiz)
8413                        : !(i.index_reg->reg_type.bitfield.reg32
8414                            || i.index_reg->reg_num == RegEiz))
8415                       || !i.index_reg->reg_type.bitfield.baseindex)))
8416             goto bad_address;
8417         }
8418       else
8419         {
8420           /* 16-bit checks.  */
8421           if ((i.base_reg
8422                && (!i.base_reg->reg_type.bitfield.reg16
8423                    || !i.base_reg->reg_type.bitfield.baseindex))
8424               || (i.index_reg
8425                   && (!i.index_reg->reg_type.bitfield.reg16
8426                       || !i.index_reg->reg_type.bitfield.baseindex
8427                       || !(i.base_reg
8428                            && i.base_reg->reg_num < 6
8429                            && i.index_reg->reg_num >= 6
8430                            && i.log2_scale_factor == 0))))
8431             goto bad_address;
8432         }
8433     }
8434   return 1;
8435 }
8436
8437 /* Handle vector immediates.  */
8438
8439 static int
8440 RC_SAE_immediate (const char *imm_start)
8441 {
8442   unsigned int match_found, j;
8443   const char *pstr = imm_start;
8444   expressionS *exp;
8445
8446   if (*pstr != '{')
8447     return 0;
8448
8449   pstr++;
8450   match_found = 0;
8451   for (j = 0; j < ARRAY_SIZE (RC_NamesTable); j++)
8452     {
8453       if (!strncmp (pstr, RC_NamesTable[j].name, RC_NamesTable[j].len))
8454         {
8455           if (!i.rounding)
8456             {
8457               rc_op.type = RC_NamesTable[j].type;
8458               rc_op.operand = this_operand;
8459               i.rounding = &rc_op;
8460             }
8461           else
8462             {
8463               as_bad (_("duplicated `%s'"), imm_start);
8464               return 0;
8465             }
8466           pstr += RC_NamesTable[j].len;
8467           match_found = 1;
8468           break;
8469         }
8470     }
8471   if (!match_found)
8472     return 0;
8473
8474   if (*pstr++ != '}')
8475     {
8476       as_bad (_("Missing '}': '%s'"), imm_start);
8477       return 0;
8478     }
8479   /* RC/SAE immediate string should contain nothing more.  */;
8480   if (*pstr != 0)
8481     {
8482       as_bad (_("Junk after '}': '%s'"), imm_start);
8483       return 0;
8484     }
8485
8486   exp = &im_expressions[i.imm_operands++];
8487   i.op[this_operand].imms = exp;
8488
8489   exp->X_op = O_constant;
8490   exp->X_add_number = 0;
8491   exp->X_add_symbol = (symbolS *) 0;
8492   exp->X_op_symbol = (symbolS *) 0;
8493
8494   i.types[this_operand].bitfield.imm8 = 1;
8495   return 1;
8496 }
8497
8498 /* Parse OPERAND_STRING into the i386_insn structure I.  Returns zero
8499    on error.  */
8500
8501 static int
8502 i386_att_operand (char *operand_string)
8503 {
8504   const reg_entry *r;
8505   char *end_op;
8506   char *op_string = operand_string;
8507
8508   if (is_space_char (*op_string))
8509     ++op_string;
8510
8511   /* We check for an absolute prefix (differentiating,
8512      for example, 'jmp pc_relative_label' from 'jmp *absolute_label'.  */
8513   if (*op_string == ABSOLUTE_PREFIX)
8514     {
8515       ++op_string;
8516       if (is_space_char (*op_string))
8517         ++op_string;
8518       i.types[this_operand].bitfield.jumpabsolute = 1;
8519     }
8520
8521   /* Check if operand is a register.  */
8522   if ((r = parse_register (op_string, &end_op)) != NULL)
8523     {
8524       i386_operand_type temp;
8525
8526       /* Check for a segment override by searching for ':' after a
8527          segment register.  */
8528       op_string = end_op;
8529       if (is_space_char (*op_string))
8530         ++op_string;
8531       if (*op_string == ':'
8532           && (r->reg_type.bitfield.sreg2
8533               || r->reg_type.bitfield.sreg3))
8534         {
8535           switch (r->reg_num)
8536             {
8537             case 0:
8538               i.seg[i.mem_operands] = &es;
8539               break;
8540             case 1:
8541               i.seg[i.mem_operands] = &cs;
8542               break;
8543             case 2:
8544               i.seg[i.mem_operands] = &ss;
8545               break;
8546             case 3:
8547               i.seg[i.mem_operands] = &ds;
8548               break;
8549             case 4:
8550               i.seg[i.mem_operands] = &fs;
8551               break;
8552             case 5:
8553               i.seg[i.mem_operands] = &gs;
8554               break;
8555             }
8556
8557           /* Skip the ':' and whitespace.  */
8558           ++op_string;
8559           if (is_space_char (*op_string))
8560             ++op_string;
8561
8562           if (!is_digit_char (*op_string)
8563               && !is_identifier_char (*op_string)
8564               && *op_string != '('
8565               && *op_string != ABSOLUTE_PREFIX)
8566             {
8567               as_bad (_("bad memory operand `%s'"), op_string);
8568               return 0;
8569             }
8570           /* Handle case of %es:*foo.  */
8571           if (*op_string == ABSOLUTE_PREFIX)
8572             {
8573               ++op_string;
8574               if (is_space_char (*op_string))
8575                 ++op_string;
8576               i.types[this_operand].bitfield.jumpabsolute = 1;
8577             }
8578           goto do_memory_reference;
8579         }
8580
8581       /* Handle vector operations.  */
8582       if (*op_string == '{')
8583         {
8584           op_string = check_VecOperations (op_string, NULL);
8585           if (op_string == NULL)
8586             return 0;
8587         }
8588
8589       if (*op_string)
8590         {
8591           as_bad (_("junk `%s' after register"), op_string);
8592           return 0;
8593         }
8594       temp = r->reg_type;
8595       temp.bitfield.baseindex = 0;
8596       i.types[this_operand] = operand_type_or (i.types[this_operand],
8597                                                temp);
8598       i.types[this_operand].bitfield.unspecified = 0;
8599       i.op[this_operand].regs = r;
8600       i.reg_operands++;
8601     }
8602   else if (*op_string == REGISTER_PREFIX)
8603     {
8604       as_bad (_("bad register name `%s'"), op_string);
8605       return 0;
8606     }
8607   else if (*op_string == IMMEDIATE_PREFIX)
8608     {
8609       ++op_string;
8610       if (i.types[this_operand].bitfield.jumpabsolute)
8611         {
8612           as_bad (_("immediate operand illegal with absolute jump"));
8613           return 0;
8614         }
8615       if (!i386_immediate (op_string))
8616         return 0;
8617     }
8618   else if (RC_SAE_immediate (operand_string))
8619     {
8620       /* If it is a RC or SAE immediate, do nothing.  */
8621       ;
8622     }
8623   else if (is_digit_char (*op_string)
8624            || is_identifier_char (*op_string)
8625            || *op_string == '(')
8626     {
8627       /* This is a memory reference of some sort.  */
8628       char *base_string;
8629
8630       /* Start and end of displacement string expression (if found).  */
8631       char *displacement_string_start;
8632       char *displacement_string_end;
8633       char *vop_start;
8634
8635     do_memory_reference:
8636       if ((i.mem_operands == 1
8637            && !current_templates->start->opcode_modifier.isstring)
8638           || i.mem_operands == 2)
8639         {
8640           as_bad (_("too many memory references for `%s'"),
8641                   current_templates->start->name);
8642           return 0;
8643         }
8644
8645       /* Check for base index form.  We detect the base index form by
8646          looking for an ')' at the end of the operand, searching
8647          for the '(' matching it, and finding a REGISTER_PREFIX or ','
8648          after the '('.  */
8649       base_string = op_string + strlen (op_string);
8650
8651       /* Handle vector operations.  */
8652       vop_start = strchr (op_string, '{');
8653       if (vop_start && vop_start < base_string)
8654         {
8655           if (check_VecOperations (vop_start, base_string) == NULL)
8656             return 0;
8657           base_string = vop_start;
8658         }
8659
8660       --base_string;
8661       if (is_space_char (*base_string))
8662         --base_string;
8663
8664       /* If we only have a displacement, set-up for it to be parsed later.  */
8665       displacement_string_start = op_string;
8666       displacement_string_end = base_string + 1;
8667
8668       if (*base_string == ')')
8669         {
8670           char *temp_string;
8671           unsigned int parens_balanced = 1;
8672           /* We've already checked that the number of left & right ()'s are
8673              equal, so this loop will not be infinite.  */
8674           do
8675             {
8676               base_string--;
8677               if (*base_string == ')')
8678                 parens_balanced++;
8679               if (*base_string == '(')
8680                 parens_balanced--;
8681             }
8682           while (parens_balanced);
8683
8684           temp_string = base_string;
8685
8686           /* Skip past '(' and whitespace.  */
8687           ++base_string;
8688           if (is_space_char (*base_string))
8689             ++base_string;
8690
8691           if (*base_string == ','
8692               || ((i.base_reg = parse_register (base_string, &end_op))
8693                   != NULL))
8694             {
8695               displacement_string_end = temp_string;
8696
8697               i.types[this_operand].bitfield.baseindex = 1;
8698
8699               if (i.base_reg)
8700                 {
8701                   base_string = end_op;
8702                   if (is_space_char (*base_string))
8703                     ++base_string;
8704                 }
8705
8706               /* There may be an index reg or scale factor here.  */
8707               if (*base_string == ',')
8708                 {
8709                   ++base_string;
8710                   if (is_space_char (*base_string))
8711                     ++base_string;
8712
8713                   if ((i.index_reg = parse_register (base_string, &end_op))
8714                       != NULL)
8715                     {
8716                       base_string = end_op;
8717                       if (is_space_char (*base_string))
8718                         ++base_string;
8719                       if (*base_string == ',')
8720                         {
8721                           ++base_string;
8722                           if (is_space_char (*base_string))
8723                             ++base_string;
8724                         }
8725                       else if (*base_string != ')')
8726                         {
8727                           as_bad (_("expecting `,' or `)' "
8728                                     "after index register in `%s'"),
8729                                   operand_string);
8730                           return 0;
8731                         }
8732                     }
8733                   else if (*base_string == REGISTER_PREFIX)
8734                     {
8735                       end_op = strchr (base_string, ',');
8736                       if (end_op)
8737                         *end_op = '\0';
8738                       as_bad (_("bad register name `%s'"), base_string);
8739                       return 0;
8740                     }
8741
8742                   /* Check for scale factor.  */
8743                   if (*base_string != ')')
8744                     {
8745                       char *end_scale = i386_scale (base_string);
8746
8747                       if (!end_scale)
8748                         return 0;
8749
8750                       base_string = end_scale;
8751                       if (is_space_char (*base_string))
8752                         ++base_string;
8753                       if (*base_string != ')')
8754                         {
8755                           as_bad (_("expecting `)' "
8756                                     "after scale factor in `%s'"),
8757                                   operand_string);
8758                           return 0;
8759                         }
8760                     }
8761                   else if (!i.index_reg)
8762                     {
8763                       as_bad (_("expecting index register or scale factor "
8764                                 "after `,'; got '%c'"),
8765                               *base_string);
8766                       return 0;
8767                     }
8768                 }
8769               else if (*base_string != ')')
8770                 {
8771                   as_bad (_("expecting `,' or `)' "
8772                             "after base register in `%s'"),
8773                           operand_string);
8774                   return 0;
8775                 }
8776             }
8777           else if (*base_string == REGISTER_PREFIX)
8778             {
8779               end_op = strchr (base_string, ',');
8780               if (end_op)
8781                 *end_op = '\0';
8782               as_bad (_("bad register name `%s'"), base_string);
8783               return 0;
8784             }
8785         }
8786
8787       /* If there's an expression beginning the operand, parse it,
8788          assuming displacement_string_start and
8789          displacement_string_end are meaningful.  */
8790       if (displacement_string_start != displacement_string_end)
8791         {
8792           if (!i386_displacement (displacement_string_start,
8793                                   displacement_string_end))
8794             return 0;
8795         }
8796
8797       /* Special case for (%dx) while doing input/output op.  */
8798       if (i.base_reg
8799           && operand_type_equal (&i.base_reg->reg_type,
8800                                  &reg16_inoutportreg)
8801           && i.index_reg == 0
8802           && i.log2_scale_factor == 0
8803           && i.seg[i.mem_operands] == 0
8804           && !operand_type_check (i.types[this_operand], disp))
8805         {
8806           i.types[this_operand] = inoutportreg;
8807           return 1;
8808         }
8809
8810       if (i386_index_check (operand_string) == 0)
8811         return 0;
8812       i.types[this_operand].bitfield.mem = 1;
8813       i.mem_operands++;
8814     }
8815   else
8816     {
8817       /* It's not a memory operand; argh!  */
8818       as_bad (_("invalid char %s beginning operand %d `%s'"),
8819               output_invalid (*op_string),
8820               this_operand + 1,
8821               op_string);
8822       return 0;
8823     }
8824   return 1;                     /* Normal return.  */
8825 }
8826 \f
8827 /* Calculate the maximum variable size (i.e., excluding fr_fix)
8828    that an rs_machine_dependent frag may reach.  */
8829
8830 unsigned int
8831 i386_frag_max_var (fragS *frag)
8832 {
8833   /* The only relaxable frags are for jumps.
8834      Unconditional jumps can grow by 4 bytes and others by 5 bytes.  */
8835   gas_assert (frag->fr_type == rs_machine_dependent);
8836   return TYPE_FROM_RELAX_STATE (frag->fr_subtype) == UNCOND_JUMP ? 4 : 5;
8837 }
8838
8839 /* md_estimate_size_before_relax()
8840
8841    Called just before relax() for rs_machine_dependent frags.  The x86
8842    assembler uses these frags to handle variable size jump
8843    instructions.
8844
8845    Any symbol that is now undefined will not become defined.
8846    Return the correct fr_subtype in the frag.
8847    Return the initial "guess for variable size of frag" to caller.
8848    The guess is actually the growth beyond the fixed part.  Whatever
8849    we do to grow the fixed or variable part contributes to our
8850    returned value.  */
8851
8852 int
8853 md_estimate_size_before_relax (fragS *fragP, segT segment)
8854 {
8855   /* We've already got fragP->fr_subtype right;  all we have to do is
8856      check for un-relaxable symbols.  On an ELF system, we can't relax
8857      an externally visible symbol, because it may be overridden by a
8858      shared library.  */
8859   if (S_GET_SEGMENT (fragP->fr_symbol) != segment
8860 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
8861       || (IS_ELF
8862           && (S_IS_EXTERNAL (fragP->fr_symbol)
8863               || S_IS_WEAK (fragP->fr_symbol)
8864               || ((symbol_get_bfdsym (fragP->fr_symbol)->flags
8865                    & BSF_GNU_INDIRECT_FUNCTION))))
8866 #endif
8867 #if defined (OBJ_COFF) && defined (TE_PE)
8868       || (OUTPUT_FLAVOR == bfd_target_coff_flavour
8869           && S_IS_WEAK (fragP->fr_symbol))
8870 #endif
8871       )
8872     {
8873       /* Symbol is undefined in this segment, or we need to keep a
8874          reloc so that weak symbols can be overridden.  */
8875       int size = (fragP->fr_subtype & CODE16) ? 2 : 4;
8876       enum bfd_reloc_code_real reloc_type;
8877       unsigned char *opcode;
8878       int old_fr_fix;
8879
8880       if (fragP->fr_var != NO_RELOC)
8881         reloc_type = (enum bfd_reloc_code_real) fragP->fr_var;
8882       else if (size == 2)
8883         reloc_type = BFD_RELOC_16_PCREL;
8884       else
8885         reloc_type = BFD_RELOC_32_PCREL;
8886
8887       old_fr_fix = fragP->fr_fix;
8888       opcode = (unsigned char *) fragP->fr_opcode;
8889
8890       switch (TYPE_FROM_RELAX_STATE (fragP->fr_subtype))
8891         {
8892         case UNCOND_JUMP:
8893           /* Make jmp (0xeb) a (d)word displacement jump.  */
8894           opcode[0] = 0xe9;
8895           fragP->fr_fix += size;
8896           fix_new (fragP, old_fr_fix, size,
8897                    fragP->fr_symbol,
8898                    fragP->fr_offset, 1,
8899                    reloc_type);
8900           break;
8901
8902         case COND_JUMP86:
8903           if (size == 2
8904               && (!no_cond_jump_promotion || fragP->fr_var != NO_RELOC))
8905             {
8906               /* Negate the condition, and branch past an
8907                  unconditional jump.  */
8908               opcode[0] ^= 1;
8909               opcode[1] = 3;
8910               /* Insert an unconditional jump.  */
8911               opcode[2] = 0xe9;
8912               /* We added two extra opcode bytes, and have a two byte
8913                  offset.  */
8914               fragP->fr_fix += 2 + 2;
8915               fix_new (fragP, old_fr_fix + 2, 2,
8916                        fragP->fr_symbol,
8917                        fragP->fr_offset, 1,
8918                        reloc_type);
8919               break;
8920             }
8921           /* Fall through.  */
8922
8923         case COND_JUMP:
8924           if (no_cond_jump_promotion && fragP->fr_var == NO_RELOC)
8925             {
8926               fixS *fixP;
8927
8928               fragP->fr_fix += 1;
8929               fixP = fix_new (fragP, old_fr_fix, 1,
8930                               fragP->fr_symbol,
8931                               fragP->fr_offset, 1,
8932                               BFD_RELOC_8_PCREL);
8933               fixP->fx_signed = 1;
8934               break;
8935             }
8936
8937           /* This changes the byte-displacement jump 0x7N
8938              to the (d)word-displacement jump 0x0f,0x8N.  */
8939           opcode[1] = opcode[0] + 0x10;
8940           opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
8941           /* We've added an opcode byte.  */
8942           fragP->fr_fix += 1 + size;
8943           fix_new (fragP, old_fr_fix + 1, size,
8944                    fragP->fr_symbol,
8945                    fragP->fr_offset, 1,
8946                    reloc_type);
8947           break;
8948
8949         default:
8950           BAD_CASE (fragP->fr_subtype);
8951           break;
8952         }
8953       frag_wane (fragP);
8954       return fragP->fr_fix - old_fr_fix;
8955     }
8956
8957   /* Guess size depending on current relax state.  Initially the relax
8958      state will correspond to a short jump and we return 1, because
8959      the variable part of the frag (the branch offset) is one byte
8960      long.  However, we can relax a section more than once and in that
8961      case we must either set fr_subtype back to the unrelaxed state,
8962      or return the value for the appropriate branch.  */
8963   return md_relax_table[fragP->fr_subtype].rlx_length;
8964 }
8965
8966 /* Called after relax() is finished.
8967
8968    In:  Address of frag.
8969         fr_type == rs_machine_dependent.
8970         fr_subtype is what the address relaxed to.
8971
8972    Out: Any fixSs and constants are set up.
8973         Caller will turn frag into a ".space 0".  */
8974
8975 void
8976 md_convert_frag (bfd *abfd ATTRIBUTE_UNUSED, segT sec ATTRIBUTE_UNUSED,
8977                  fragS *fragP)
8978 {
8979   unsigned char *opcode;
8980   unsigned char *where_to_put_displacement = NULL;
8981   offsetT target_address;
8982   offsetT opcode_address;
8983   unsigned int extension = 0;
8984   offsetT displacement_from_opcode_start;
8985
8986   opcode = (unsigned char *) fragP->fr_opcode;
8987
8988   /* Address we want to reach in file space.  */
8989   target_address = S_GET_VALUE (fragP->fr_symbol) + fragP->fr_offset;
8990
8991   /* Address opcode resides at in file space.  */
8992   opcode_address = fragP->fr_address + fragP->fr_fix;
8993
8994   /* Displacement from opcode start to fill into instruction.  */
8995   displacement_from_opcode_start = target_address - opcode_address;
8996
8997   if ((fragP->fr_subtype & BIG) == 0)
8998     {
8999       /* Don't have to change opcode.  */
9000       extension = 1;            /* 1 opcode + 1 displacement  */
9001       where_to_put_displacement = &opcode[1];
9002     }
9003   else
9004     {
9005       if (no_cond_jump_promotion
9006           && TYPE_FROM_RELAX_STATE (fragP->fr_subtype) != UNCOND_JUMP)
9007         as_warn_where (fragP->fr_file, fragP->fr_line,
9008                        _("long jump required"));
9009
9010       switch (fragP->fr_subtype)
9011         {
9012         case ENCODE_RELAX_STATE (UNCOND_JUMP, BIG):
9013           extension = 4;                /* 1 opcode + 4 displacement  */
9014           opcode[0] = 0xe9;
9015           where_to_put_displacement = &opcode[1];
9016           break;
9017
9018         case ENCODE_RELAX_STATE (UNCOND_JUMP, BIG16):
9019           extension = 2;                /* 1 opcode + 2 displacement  */
9020           opcode[0] = 0xe9;
9021           where_to_put_displacement = &opcode[1];
9022           break;
9023
9024         case ENCODE_RELAX_STATE (COND_JUMP, BIG):
9025         case ENCODE_RELAX_STATE (COND_JUMP86, BIG):
9026           extension = 5;                /* 2 opcode + 4 displacement  */
9027           opcode[1] = opcode[0] + 0x10;
9028           opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
9029           where_to_put_displacement = &opcode[2];
9030           break;
9031
9032         case ENCODE_RELAX_STATE (COND_JUMP, BIG16):
9033           extension = 3;                /* 2 opcode + 2 displacement  */
9034           opcode[1] = opcode[0] + 0x10;
9035           opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
9036           where_to_put_displacement = &opcode[2];
9037           break;
9038
9039         case ENCODE_RELAX_STATE (COND_JUMP86, BIG16):
9040           extension = 4;
9041           opcode[0] ^= 1;
9042           opcode[1] = 3;
9043           opcode[2] = 0xe9;
9044           where_to_put_displacement = &opcode[3];
9045           break;
9046
9047         default:
9048           BAD_CASE (fragP->fr_subtype);
9049           break;
9050         }
9051     }
9052
9053   /* If size if less then four we are sure that the operand fits,
9054      but if it's 4, then it could be that the displacement is larger
9055      then -/+ 2GB.  */
9056   if (DISP_SIZE_FROM_RELAX_STATE (fragP->fr_subtype) == 4
9057       && object_64bit
9058       && ((addressT) (displacement_from_opcode_start - extension
9059                       + ((addressT) 1 << 31))
9060           > (((addressT) 2 << 31) - 1)))
9061     {
9062       as_bad_where (fragP->fr_file, fragP->fr_line,
9063                     _("jump target out of range"));
9064       /* Make us emit 0.  */
9065       displacement_from_opcode_start = extension;
9066     }
9067   /* Now put displacement after opcode.  */
9068   md_number_to_chars ((char *) where_to_put_displacement,
9069                       (valueT) (displacement_from_opcode_start - extension),
9070                       DISP_SIZE_FROM_RELAX_STATE (fragP->fr_subtype));
9071   fragP->fr_fix += extension;
9072 }
9073 \f
9074 /* Apply a fixup (fixP) to segment data, once it has been determined
9075    by our caller that we have all the info we need to fix it up.
9076
9077    Parameter valP is the pointer to the value of the bits.
9078
9079    On the 386, immediates, displacements, and data pointers are all in
9080    the same (little-endian) format, so we don't need to care about which
9081    we are handling.  */
9082
9083 void
9084 md_apply_fix (fixS *fixP, valueT *valP, segT seg ATTRIBUTE_UNUSED)
9085 {
9086   char *p = fixP->fx_where + fixP->fx_frag->fr_literal;
9087   valueT value = *valP;
9088
9089 #if !defined (TE_Mach)
9090   if (fixP->fx_pcrel)
9091     {
9092       switch (fixP->fx_r_type)
9093         {
9094         default:
9095           break;
9096
9097         case BFD_RELOC_64:
9098           fixP->fx_r_type = BFD_RELOC_64_PCREL;
9099           break;
9100         case BFD_RELOC_32:
9101         case BFD_RELOC_X86_64_32S:
9102           fixP->fx_r_type = BFD_RELOC_32_PCREL;
9103           break;
9104         case BFD_RELOC_16:
9105           fixP->fx_r_type = BFD_RELOC_16_PCREL;
9106           break;
9107         case BFD_RELOC_8:
9108           fixP->fx_r_type = BFD_RELOC_8_PCREL;
9109           break;
9110         }
9111     }
9112
9113   if (fixP->fx_addsy != NULL
9114       && (fixP->fx_r_type == BFD_RELOC_32_PCREL
9115           || fixP->fx_r_type == BFD_RELOC_64_PCREL
9116           || fixP->fx_r_type == BFD_RELOC_16_PCREL
9117           || fixP->fx_r_type == BFD_RELOC_8_PCREL
9118           || fixP->fx_r_type == BFD_RELOC_X86_64_PC32_BND)
9119       && !use_rela_relocations)
9120     {
9121       /* This is a hack.  There should be a better way to handle this.
9122          This covers for the fact that bfd_install_relocation will
9123          subtract the current location (for partial_inplace, PC relative
9124          relocations); see more below.  */
9125 #ifndef OBJ_AOUT
9126       if (IS_ELF
9127 #ifdef TE_PE
9128           || OUTPUT_FLAVOR == bfd_target_coff_flavour
9129 #endif
9130           )
9131         value += fixP->fx_where + fixP->fx_frag->fr_address;
9132 #endif
9133 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
9134       if (IS_ELF)
9135         {
9136           segT sym_seg = S_GET_SEGMENT (fixP->fx_addsy);
9137
9138           if ((sym_seg == seg
9139                || (symbol_section_p (fixP->fx_addsy)
9140                    && sym_seg != absolute_section))
9141               && !generic_force_reloc (fixP))
9142             {
9143               /* Yes, we add the values in twice.  This is because
9144                  bfd_install_relocation subtracts them out again.  I think
9145                  bfd_install_relocation is broken, but I don't dare change
9146                  it.  FIXME.  */
9147               value += fixP->fx_where + fixP->fx_frag->fr_address;
9148             }
9149         }
9150 #endif
9151 #if defined (OBJ_COFF) && defined (TE_PE)
9152       /* For some reason, the PE format does not store a
9153          section address offset for a PC relative symbol.  */
9154       if (S_GET_SEGMENT (fixP->fx_addsy) != seg
9155           || S_IS_WEAK (fixP->fx_addsy))
9156         value += md_pcrel_from (fixP);
9157 #endif
9158     }
9159 #if defined (OBJ_COFF) && defined (TE_PE)
9160   if (fixP->fx_addsy != NULL
9161       && S_IS_WEAK (fixP->fx_addsy)
9162       /* PR 16858: Do not modify weak function references.  */
9163       && ! fixP->fx_pcrel)
9164     {
9165 #if !defined (TE_PEP)
9166       /* For x86 PE weak function symbols are neither PC-relative
9167          nor do they set S_IS_FUNCTION.  So the only reliable way
9168          to detect them is to check the flags of their containing
9169          section.  */
9170       if (S_GET_SEGMENT (fixP->fx_addsy) != NULL
9171           && S_GET_SEGMENT (fixP->fx_addsy)->flags & SEC_CODE)
9172         ;
9173       else
9174 #endif
9175       value -= S_GET_VALUE (fixP->fx_addsy);
9176     }
9177 #endif
9178
9179   /* Fix a few things - the dynamic linker expects certain values here,
9180      and we must not disappoint it.  */
9181 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
9182   if (IS_ELF && fixP->fx_addsy)
9183     switch (fixP->fx_r_type)
9184       {
9185       case BFD_RELOC_386_PLT32:
9186       case BFD_RELOC_X86_64_PLT32:
9187       case BFD_RELOC_X86_64_PLT32_BND:
9188         /* Make the jump instruction point to the address of the operand.  At
9189            runtime we merely add the offset to the actual PLT entry.  */
9190         value = -4;
9191         break;
9192
9193       case BFD_RELOC_386_TLS_GD:
9194       case BFD_RELOC_386_TLS_LDM:
9195       case BFD_RELOC_386_TLS_IE_32:
9196       case BFD_RELOC_386_TLS_IE:
9197       case BFD_RELOC_386_TLS_GOTIE:
9198       case BFD_RELOC_386_TLS_GOTDESC:
9199       case BFD_RELOC_X86_64_TLSGD:
9200       case BFD_RELOC_X86_64_TLSLD:
9201       case BFD_RELOC_X86_64_GOTTPOFF:
9202       case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
9203         value = 0; /* Fully resolved at runtime.  No addend.  */
9204         /* Fallthrough */
9205       case BFD_RELOC_386_TLS_LE:
9206       case BFD_RELOC_386_TLS_LDO_32:
9207       case BFD_RELOC_386_TLS_LE_32:
9208       case BFD_RELOC_X86_64_DTPOFF32:
9209       case BFD_RELOC_X86_64_DTPOFF64:
9210       case BFD_RELOC_X86_64_TPOFF32:
9211       case BFD_RELOC_X86_64_TPOFF64:
9212         S_SET_THREAD_LOCAL (fixP->fx_addsy);
9213         break;
9214
9215       case BFD_RELOC_386_TLS_DESC_CALL:
9216       case BFD_RELOC_X86_64_TLSDESC_CALL:
9217         value = 0; /* Fully resolved at runtime.  No addend.  */
9218         S_SET_THREAD_LOCAL (fixP->fx_addsy);
9219         fixP->fx_done = 0;
9220         return;
9221
9222       case BFD_RELOC_386_GOT32:
9223       case BFD_RELOC_X86_64_GOT32:
9224         value = 0; /* Fully resolved at runtime.  No addend.  */
9225         break;
9226
9227       case BFD_RELOC_VTABLE_INHERIT:
9228       case BFD_RELOC_VTABLE_ENTRY:
9229         fixP->fx_done = 0;
9230         return;
9231
9232       default:
9233         break;
9234       }
9235 #endif /* defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)  */
9236   *valP = value;
9237 #endif /* !defined (TE_Mach)  */
9238
9239   /* Are we finished with this relocation now?  */
9240   if (fixP->fx_addsy == NULL)
9241     fixP->fx_done = 1;
9242 #if defined (OBJ_COFF) && defined (TE_PE)
9243   else if (fixP->fx_addsy != NULL && S_IS_WEAK (fixP->fx_addsy))
9244     {
9245       fixP->fx_done = 0;
9246       /* Remember value for tc_gen_reloc.  */
9247       fixP->fx_addnumber = value;
9248       /* Clear out the frag for now.  */
9249       value = 0;
9250     }
9251 #endif
9252   else if (use_rela_relocations)
9253     {
9254       fixP->fx_no_overflow = 1;
9255       /* Remember value for tc_gen_reloc.  */
9256       fixP->fx_addnumber = value;
9257       value = 0;
9258     }
9259
9260   md_number_to_chars (p, value, fixP->fx_size);
9261 }
9262 \f
9263 char *
9264 md_atof (int type, char *litP, int *sizeP)
9265 {
9266   /* This outputs the LITTLENUMs in REVERSE order;
9267      in accord with the bigendian 386.  */
9268   return ieee_md_atof (type, litP, sizeP, FALSE);
9269 }
9270 \f
9271 static char output_invalid_buf[sizeof (unsigned char) * 2 + 6];
9272
9273 static char *
9274 output_invalid (int c)
9275 {
9276   if (ISPRINT (c))
9277     snprintf (output_invalid_buf, sizeof (output_invalid_buf),
9278               "'%c'", c);
9279   else
9280     snprintf (output_invalid_buf, sizeof (output_invalid_buf),
9281               "(0x%x)", (unsigned char) c);
9282   return output_invalid_buf;
9283 }
9284
9285 /* REG_STRING starts *before* REGISTER_PREFIX.  */
9286
9287 static const reg_entry *
9288 parse_real_register (char *reg_string, char **end_op)
9289 {
9290   char *s = reg_string;
9291   char *p;
9292   char reg_name_given[MAX_REG_NAME_SIZE + 1];
9293   const reg_entry *r;
9294
9295   /* Skip possible REGISTER_PREFIX and possible whitespace.  */
9296   if (*s == REGISTER_PREFIX)
9297     ++s;
9298
9299   if (is_space_char (*s))
9300     ++s;
9301
9302   p = reg_name_given;
9303   while ((*p++ = register_chars[(unsigned char) *s]) != '\0')
9304     {
9305       if (p >= reg_name_given + MAX_REG_NAME_SIZE)
9306         return (const reg_entry *) NULL;
9307       s++;
9308     }
9309
9310   /* For naked regs, make sure that we are not dealing with an identifier.
9311      This prevents confusing an identifier like `eax_var' with register
9312      `eax'.  */
9313   if (allow_naked_reg && identifier_chars[(unsigned char) *s])
9314     return (const reg_entry *) NULL;
9315
9316   *end_op = s;
9317
9318   r = (const reg_entry *) hash_find (reg_hash, reg_name_given);
9319
9320   /* Handle floating point regs, allowing spaces in the (i) part.  */
9321   if (r == i386_regtab /* %st is first entry of table  */)
9322     {
9323       if (is_space_char (*s))
9324         ++s;
9325       if (*s == '(')
9326         {
9327           ++s;
9328           if (is_space_char (*s))
9329             ++s;
9330           if (*s >= '0' && *s <= '7')
9331             {
9332               int fpr = *s - '0';
9333               ++s;
9334               if (is_space_char (*s))
9335                 ++s;
9336               if (*s == ')')
9337                 {
9338                   *end_op = s + 1;
9339                   r = (const reg_entry *) hash_find (reg_hash, "st(0)");
9340                   know (r);
9341                   return r + fpr;
9342                 }
9343             }
9344           /* We have "%st(" then garbage.  */
9345           return (const reg_entry *) NULL;
9346         }
9347     }
9348
9349   if (r == NULL || allow_pseudo_reg)
9350     return r;
9351
9352   if (operand_type_all_zero (&r->reg_type))
9353     return (const reg_entry *) NULL;
9354
9355   if ((r->reg_type.bitfield.reg32
9356        || r->reg_type.bitfield.sreg3
9357        || r->reg_type.bitfield.control
9358        || r->reg_type.bitfield.debug
9359        || r->reg_type.bitfield.test)
9360       && !cpu_arch_flags.bitfield.cpui386)
9361     return (const reg_entry *) NULL;
9362
9363   if (r->reg_type.bitfield.floatreg
9364       && !cpu_arch_flags.bitfield.cpu8087
9365       && !cpu_arch_flags.bitfield.cpu287
9366       && !cpu_arch_flags.bitfield.cpu387)
9367     return (const reg_entry *) NULL;
9368
9369   if (r->reg_type.bitfield.regmmx && !cpu_arch_flags.bitfield.cpummx)
9370     return (const reg_entry *) NULL;
9371
9372   if (r->reg_type.bitfield.regxmm && !cpu_arch_flags.bitfield.cpusse)
9373     return (const reg_entry *) NULL;
9374
9375   if (r->reg_type.bitfield.regymm && !cpu_arch_flags.bitfield.cpuavx)
9376     return (const reg_entry *) NULL;
9377
9378   if ((r->reg_type.bitfield.regzmm || r->reg_type.bitfield.regmask)
9379        && !cpu_arch_flags.bitfield.cpuavx512f)
9380     return (const reg_entry *) NULL;
9381
9382   /* Don't allow fake index register unless allow_index_reg isn't 0. */
9383   if (!allow_index_reg
9384       && (r->reg_num == RegEiz || r->reg_num == RegRiz))
9385     return (const reg_entry *) NULL;
9386
9387   /* Upper 16 vector register is only available with VREX in 64bit
9388      mode.  */
9389   if ((r->reg_flags & RegVRex))
9390     {
9391       if (!cpu_arch_flags.bitfield.cpuvrex
9392           || flag_code != CODE_64BIT)
9393         return (const reg_entry *) NULL;
9394
9395       i.need_vrex = 1;
9396     }
9397
9398   if (((r->reg_flags & (RegRex64 | RegRex))
9399        || r->reg_type.bitfield.reg64)
9400       && (!cpu_arch_flags.bitfield.cpulm
9401           || !operand_type_equal (&r->reg_type, &control))
9402       && flag_code != CODE_64BIT)
9403     return (const reg_entry *) NULL;
9404
9405   if (r->reg_type.bitfield.sreg3 && r->reg_num == RegFlat && !intel_syntax)
9406     return (const reg_entry *) NULL;
9407
9408   return r;
9409 }
9410
9411 /* REG_STRING starts *before* REGISTER_PREFIX.  */
9412
9413 static const reg_entry *
9414 parse_register (char *reg_string, char **end_op)
9415 {
9416   const reg_entry *r;
9417
9418   if (*reg_string == REGISTER_PREFIX || allow_naked_reg)
9419     r = parse_real_register (reg_string, end_op);
9420   else
9421     r = NULL;
9422   if (!r)
9423     {
9424       char *save = input_line_pointer;
9425       char c;
9426       symbolS *symbolP;
9427
9428       input_line_pointer = reg_string;
9429       c = get_symbol_end ();
9430       symbolP = symbol_find (reg_string);
9431       if (symbolP && S_GET_SEGMENT (symbolP) == reg_section)
9432         {
9433           const expressionS *e = symbol_get_value_expression (symbolP);
9434
9435           know (e->X_op == O_register);
9436           know (e->X_add_number >= 0
9437                 && (valueT) e->X_add_number < i386_regtab_size);
9438           r = i386_regtab + e->X_add_number;
9439           if ((r->reg_flags & RegVRex))
9440             i.need_vrex = 1;
9441           *end_op = input_line_pointer;
9442         }
9443       *input_line_pointer = c;
9444       input_line_pointer = save;
9445     }
9446   return r;
9447 }
9448
9449 int
9450 i386_parse_name (char *name, expressionS *e, char *nextcharP)
9451 {
9452   const reg_entry *r;
9453   char *end = input_line_pointer;
9454
9455   *end = *nextcharP;
9456   r = parse_register (name, &input_line_pointer);
9457   if (r && end <= input_line_pointer)
9458     {
9459       *nextcharP = *input_line_pointer;
9460       *input_line_pointer = 0;
9461       e->X_op = O_register;
9462       e->X_add_number = r - i386_regtab;
9463       return 1;
9464     }
9465   input_line_pointer = end;
9466   *end = 0;
9467   return intel_syntax ? i386_intel_parse_name (name, e) : 0;
9468 }
9469
9470 void
9471 md_operand (expressionS *e)
9472 {
9473   char *end;
9474   const reg_entry *r;
9475
9476   switch (*input_line_pointer)
9477     {
9478     case REGISTER_PREFIX:
9479       r = parse_real_register (input_line_pointer, &end);
9480       if (r)
9481         {
9482           e->X_op = O_register;
9483           e->X_add_number = r - i386_regtab;
9484           input_line_pointer = end;
9485         }
9486       break;
9487
9488     case '[':
9489       gas_assert (intel_syntax);
9490       end = input_line_pointer++;
9491       expression (e);
9492       if (*input_line_pointer == ']')
9493         {
9494           ++input_line_pointer;
9495           e->X_op_symbol = make_expr_symbol (e);
9496           e->X_add_symbol = NULL;
9497           e->X_add_number = 0;
9498           e->X_op = O_index;
9499         }
9500       else
9501         {
9502           e->X_op = O_absent;
9503           input_line_pointer = end;
9504         }
9505       break;
9506     }
9507 }
9508
9509 \f
9510 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
9511 const char *md_shortopts = "kVQ:sqn";
9512 #else
9513 const char *md_shortopts = "qn";
9514 #endif
9515
9516 #define OPTION_32 (OPTION_MD_BASE + 0)
9517 #define OPTION_64 (OPTION_MD_BASE + 1)
9518 #define OPTION_DIVIDE (OPTION_MD_BASE + 2)
9519 #define OPTION_MARCH (OPTION_MD_BASE + 3)
9520 #define OPTION_MTUNE (OPTION_MD_BASE + 4)
9521 #define OPTION_MMNEMONIC (OPTION_MD_BASE + 5)
9522 #define OPTION_MSYNTAX (OPTION_MD_BASE + 6)
9523 #define OPTION_MINDEX_REG (OPTION_MD_BASE + 7)
9524 #define OPTION_MNAKED_REG (OPTION_MD_BASE + 8)
9525 #define OPTION_MOLD_GCC (OPTION_MD_BASE + 9)
9526 #define OPTION_MSSE2AVX (OPTION_MD_BASE + 10)
9527 #define OPTION_MSSE_CHECK (OPTION_MD_BASE + 11)
9528 #define OPTION_MOPERAND_CHECK (OPTION_MD_BASE + 12)
9529 #define OPTION_MAVXSCALAR (OPTION_MD_BASE + 13)
9530 #define OPTION_X32 (OPTION_MD_BASE + 14)
9531 #define OPTION_MADD_BND_PREFIX (OPTION_MD_BASE + 15)
9532 #define OPTION_MEVEXLIG (OPTION_MD_BASE + 16)
9533 #define OPTION_MEVEXWIG (OPTION_MD_BASE + 17)
9534 #define OPTION_MBIG_OBJ (OPTION_MD_BASE + 18)
9535
9536 struct option md_longopts[] =
9537 {
9538   {"32", no_argument, NULL, OPTION_32},
9539 #if (defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
9540      || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
9541   {"64", no_argument, NULL, OPTION_64},
9542 #endif
9543 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
9544   {"x32", no_argument, NULL, OPTION_X32},
9545 #endif
9546   {"divide", no_argument, NULL, OPTION_DIVIDE},
9547   {"march", required_argument, NULL, OPTION_MARCH},
9548   {"mtune", required_argument, NULL, OPTION_MTUNE},
9549   {"mmnemonic", required_argument, NULL, OPTION_MMNEMONIC},
9550   {"msyntax", required_argument, NULL, OPTION_MSYNTAX},
9551   {"mindex-reg", no_argument, NULL, OPTION_MINDEX_REG},
9552   {"mnaked-reg", no_argument, NULL, OPTION_MNAKED_REG},
9553   {"mold-gcc", no_argument, NULL, OPTION_MOLD_GCC},
9554   {"msse2avx", no_argument, NULL, OPTION_MSSE2AVX},
9555   {"msse-check", required_argument, NULL, OPTION_MSSE_CHECK},
9556   {"moperand-check", required_argument, NULL, OPTION_MOPERAND_CHECK},
9557   {"mavxscalar", required_argument, NULL, OPTION_MAVXSCALAR},
9558   {"madd-bnd-prefix", no_argument, NULL, OPTION_MADD_BND_PREFIX},
9559   {"mevexlig", required_argument, NULL, OPTION_MEVEXLIG},
9560   {"mevexwig", required_argument, NULL, OPTION_MEVEXWIG},
9561 # if defined (TE_PE) || defined (TE_PEP)
9562   {"mbig-obj", no_argument, NULL, OPTION_MBIG_OBJ},
9563 #endif
9564   {NULL, no_argument, NULL, 0}
9565 };
9566 size_t md_longopts_size = sizeof (md_longopts);
9567
9568 int
9569 md_parse_option (int c, char *arg)
9570 {
9571   unsigned int j;
9572   char *arch, *next;
9573
9574   switch (c)
9575     {
9576     case 'n':
9577       optimize_align_code = 0;
9578       break;
9579
9580     case 'q':
9581       quiet_warnings = 1;
9582       break;
9583
9584 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
9585       /* -Qy, -Qn: SVR4 arguments controlling whether a .comment section
9586          should be emitted or not.  FIXME: Not implemented.  */
9587     case 'Q':
9588       break;
9589
9590       /* -V: SVR4 argument to print version ID.  */
9591     case 'V':
9592       print_version_id ();
9593       break;
9594
9595       /* -k: Ignore for FreeBSD compatibility.  */
9596     case 'k':
9597       break;
9598
9599     case 's':
9600       /* -s: On i386 Solaris, this tells the native assembler to use
9601          .stab instead of .stab.excl.  We always use .stab anyhow.  */
9602       break;
9603 #endif
9604 #if (defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
9605      || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
9606     case OPTION_64:
9607       {
9608         const char **list, **l;
9609
9610         list = bfd_target_list ();
9611         for (l = list; *l != NULL; l++)
9612           if (CONST_STRNEQ (*l, "elf64-x86-64")
9613               || strcmp (*l, "coff-x86-64") == 0
9614               || strcmp (*l, "pe-x86-64") == 0
9615               || strcmp (*l, "pei-x86-64") == 0
9616               || strcmp (*l, "mach-o-x86-64") == 0)
9617             {
9618               default_arch = "x86_64";
9619               break;
9620             }
9621         if (*l == NULL)
9622           as_fatal (_("no compiled in support for x86_64"));
9623         free (list);
9624       }
9625       break;
9626 #endif
9627
9628 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
9629     case OPTION_X32:
9630       if (IS_ELF)
9631         {
9632           const char **list, **l;
9633
9634           list = bfd_target_list ();
9635           for (l = list; *l != NULL; l++)
9636             if (CONST_STRNEQ (*l, "elf32-x86-64"))
9637               {
9638                 default_arch = "x86_64:32";
9639                 break;
9640               }
9641           if (*l == NULL)
9642             as_fatal (_("no compiled in support for 32bit x86_64"));
9643           free (list);
9644         }
9645       else
9646         as_fatal (_("32bit x86_64 is only supported for ELF"));
9647       break;
9648 #endif
9649
9650     case OPTION_32:
9651       default_arch = "i386";
9652       break;
9653
9654     case OPTION_DIVIDE:
9655 #ifdef SVR4_COMMENT_CHARS
9656       {
9657         char *n, *t;
9658         const char *s;
9659
9660         n = (char *) xmalloc (strlen (i386_comment_chars) + 1);
9661         t = n;
9662         for (s = i386_comment_chars; *s != '\0'; s++)
9663           if (*s != '/')
9664             *t++ = *s;
9665         *t = '\0';
9666         i386_comment_chars = n;
9667       }
9668 #endif
9669       break;
9670
9671     case OPTION_MARCH:
9672       arch = xstrdup (arg);
9673       do
9674         {
9675           if (*arch == '.')
9676             as_fatal (_("invalid -march= option: `%s'"), arg);
9677           next = strchr (arch, '+');
9678           if (next)
9679             *next++ = '\0';
9680           for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
9681             {
9682               if (strcmp (arch, cpu_arch [j].name) == 0)
9683                 {
9684                   /* Processor.  */
9685                   if (! cpu_arch[j].flags.bitfield.cpui386)
9686                     continue;
9687
9688                   cpu_arch_name = cpu_arch[j].name;
9689                   cpu_sub_arch_name = NULL;
9690                   cpu_arch_flags = cpu_arch[j].flags;
9691                   cpu_arch_isa = cpu_arch[j].type;
9692                   cpu_arch_isa_flags = cpu_arch[j].flags;
9693                   if (!cpu_arch_tune_set)
9694                     {
9695                       cpu_arch_tune = cpu_arch_isa;
9696                       cpu_arch_tune_flags = cpu_arch_isa_flags;
9697                     }
9698                   break;
9699                 }
9700               else if (*cpu_arch [j].name == '.'
9701                        && strcmp (arch, cpu_arch [j].name + 1) == 0)
9702                 {
9703                   /* ISA entension.  */
9704                   i386_cpu_flags flags;
9705
9706                   if (!cpu_arch[j].negated)
9707                     flags = cpu_flags_or (cpu_arch_flags,
9708                                           cpu_arch[j].flags);
9709                   else
9710                     flags = cpu_flags_and_not (cpu_arch_flags,
9711                                                cpu_arch[j].flags);
9712                   if (!cpu_flags_equal (&flags, &cpu_arch_flags))
9713                     {
9714                       if (cpu_sub_arch_name)
9715                         {
9716                           char *name = cpu_sub_arch_name;
9717                           cpu_sub_arch_name = concat (name,
9718                                                       cpu_arch[j].name,
9719                                                       (const char *) NULL);
9720                           free (name);
9721                         }
9722                       else
9723                         cpu_sub_arch_name = xstrdup (cpu_arch[j].name);
9724                       cpu_arch_flags = flags;
9725                       cpu_arch_isa_flags = flags;
9726                     }
9727                   break;
9728                 }
9729             }
9730
9731           if (j >= ARRAY_SIZE (cpu_arch))
9732             as_fatal (_("invalid -march= option: `%s'"), arg);
9733
9734           arch = next;
9735         }
9736       while (next != NULL );
9737       break;
9738
9739     case OPTION_MTUNE:
9740       if (*arg == '.')
9741         as_fatal (_("invalid -mtune= option: `%s'"), arg);
9742       for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
9743         {
9744           if (strcmp (arg, cpu_arch [j].name) == 0)
9745             {
9746               cpu_arch_tune_set = 1;
9747               cpu_arch_tune = cpu_arch [j].type;
9748               cpu_arch_tune_flags = cpu_arch[j].flags;
9749               break;
9750             }
9751         }
9752       if (j >= ARRAY_SIZE (cpu_arch))
9753         as_fatal (_("invalid -mtune= option: `%s'"), arg);
9754       break;
9755
9756     case OPTION_MMNEMONIC:
9757       if (strcasecmp (arg, "att") == 0)
9758         intel_mnemonic = 0;
9759       else if (strcasecmp (arg, "intel") == 0)
9760         intel_mnemonic = 1;
9761       else
9762         as_fatal (_("invalid -mmnemonic= option: `%s'"), arg);
9763       break;
9764
9765     case OPTION_MSYNTAX:
9766       if (strcasecmp (arg, "att") == 0)
9767         intel_syntax = 0;
9768       else if (strcasecmp (arg, "intel") == 0)
9769         intel_syntax = 1;
9770       else
9771         as_fatal (_("invalid -msyntax= option: `%s'"), arg);
9772       break;
9773
9774     case OPTION_MINDEX_REG:
9775       allow_index_reg = 1;
9776       break;
9777
9778     case OPTION_MNAKED_REG:
9779       allow_naked_reg = 1;
9780       break;
9781
9782     case OPTION_MOLD_GCC:
9783       old_gcc = 1;
9784       break;
9785
9786     case OPTION_MSSE2AVX:
9787       sse2avx = 1;
9788       break;
9789
9790     case OPTION_MSSE_CHECK:
9791       if (strcasecmp (arg, "error") == 0)
9792         sse_check = check_error;
9793       else if (strcasecmp (arg, "warning") == 0)
9794         sse_check = check_warning;
9795       else if (strcasecmp (arg, "none") == 0)
9796         sse_check = check_none;
9797       else
9798         as_fatal (_("invalid -msse-check= option: `%s'"), arg);
9799       break;
9800
9801     case OPTION_MOPERAND_CHECK:
9802       if (strcasecmp (arg, "error") == 0)
9803         operand_check = check_error;
9804       else if (strcasecmp (arg, "warning") == 0)
9805         operand_check = check_warning;
9806       else if (strcasecmp (arg, "none") == 0)
9807         operand_check = check_none;
9808       else
9809         as_fatal (_("invalid -moperand-check= option: `%s'"), arg);
9810       break;
9811
9812     case OPTION_MAVXSCALAR:
9813       if (strcasecmp (arg, "128") == 0)
9814         avxscalar = vex128;
9815       else if (strcasecmp (arg, "256") == 0)
9816         avxscalar = vex256;
9817       else
9818         as_fatal (_("invalid -mavxscalar= option: `%s'"), arg);
9819       break;
9820
9821     case OPTION_MADD_BND_PREFIX:
9822       add_bnd_prefix = 1;
9823       break;
9824
9825     case OPTION_MEVEXLIG:
9826       if (strcmp (arg, "128") == 0)
9827         evexlig = evexl128;
9828       else if (strcmp (arg, "256") == 0)
9829         evexlig = evexl256;
9830       else  if (strcmp (arg, "512") == 0)
9831         evexlig = evexl512;
9832       else
9833         as_fatal (_("invalid -mevexlig= option: `%s'"), arg);
9834       break;
9835
9836     case OPTION_MEVEXWIG:
9837       if (strcmp (arg, "0") == 0)
9838         evexwig = evexw0;
9839       else if (strcmp (arg, "1") == 0)
9840         evexwig = evexw1;
9841       else
9842         as_fatal (_("invalid -mevexwig= option: `%s'"), arg);
9843       break;
9844
9845 # if defined (TE_PE) || defined (TE_PEP)
9846     case OPTION_MBIG_OBJ:
9847       use_big_obj = 1;
9848       break;
9849 #endif
9850
9851     default:
9852       return 0;
9853     }
9854   return 1;
9855 }
9856
9857 #define MESSAGE_TEMPLATE \
9858 "                                                                                "
9859
9860 static void
9861 show_arch (FILE *stream, int ext, int check)
9862 {
9863   static char message[] = MESSAGE_TEMPLATE;
9864   char *start = message + 27;
9865   char *p;
9866   int size = sizeof (MESSAGE_TEMPLATE);
9867   int left;
9868   const char *name;
9869   int len;
9870   unsigned int j;
9871
9872   p = start;
9873   left = size - (start - message);
9874   for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
9875     {
9876       /* Should it be skipped?  */
9877       if (cpu_arch [j].skip)
9878         continue;
9879
9880       name = cpu_arch [j].name;
9881       len = cpu_arch [j].len;
9882       if (*name == '.')
9883         {
9884           /* It is an extension.  Skip if we aren't asked to show it.  */
9885           if (ext)
9886             {
9887               name++;
9888               len--;
9889             }
9890           else
9891             continue;
9892         }
9893       else if (ext)
9894         {
9895           /* It is an processor.  Skip if we show only extension.  */
9896           continue;
9897         }
9898       else if (check && ! cpu_arch[j].flags.bitfield.cpui386)
9899         {
9900           /* It is an impossible processor - skip.  */
9901           continue;
9902         }
9903
9904       /* Reserve 2 spaces for ", " or ",\0" */
9905       left -= len + 2;
9906
9907       /* Check if there is any room.  */
9908       if (left >= 0)
9909         {
9910           if (p != start)
9911             {
9912               *p++ = ',';
9913               *p++ = ' ';
9914             }
9915           p = mempcpy (p, name, len);
9916         }
9917       else
9918         {
9919           /* Output the current message now and start a new one.  */
9920           *p++ = ',';
9921           *p = '\0';
9922           fprintf (stream, "%s\n", message);
9923           p = start;
9924           left = size - (start - message) - len - 2;
9925
9926           gas_assert (left >= 0);
9927
9928           p = mempcpy (p, name, len);
9929         }
9930     }
9931
9932   *p = '\0';
9933   fprintf (stream, "%s\n", message);
9934 }
9935
9936 void
9937 md_show_usage (FILE *stream)
9938 {
9939 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
9940   fprintf (stream, _("\
9941   -Q                      ignored\n\
9942   -V                      print assembler version number\n\
9943   -k                      ignored\n"));
9944 #endif
9945   fprintf (stream, _("\
9946   -n                      Do not optimize code alignment\n\
9947   -q                      quieten some warnings\n"));
9948 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
9949   fprintf (stream, _("\
9950   -s                      ignored\n"));
9951 #endif
9952 #if (defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
9953      || defined (TE_PE) || defined (TE_PEP))
9954   fprintf (stream, _("\
9955   --32/--64/--x32         generate 32bit/64bit/x32 code\n"));
9956 #endif
9957 #ifdef SVR4_COMMENT_CHARS
9958   fprintf (stream, _("\
9959   --divide                do not treat `/' as a comment character\n"));
9960 #else
9961   fprintf (stream, _("\
9962   --divide                ignored\n"));
9963 #endif
9964   fprintf (stream, _("\
9965   -march=CPU[,+EXTENSION...]\n\
9966                           generate code for CPU and EXTENSION, CPU is one of:\n"));
9967   show_arch (stream, 0, 1);
9968   fprintf (stream, _("\
9969                           EXTENSION is combination of:\n"));
9970   show_arch (stream, 1, 0);
9971   fprintf (stream, _("\
9972   -mtune=CPU              optimize for CPU, CPU is one of:\n"));
9973   show_arch (stream, 0, 0);
9974   fprintf (stream, _("\
9975   -msse2avx               encode SSE instructions with VEX prefix\n"));
9976   fprintf (stream, _("\
9977   -msse-check=[none|error|warning]\n\
9978                           check SSE instructions\n"));
9979   fprintf (stream, _("\
9980   -moperand-check=[none|error|warning]\n\
9981                           check operand combinations for validity\n"));
9982   fprintf (stream, _("\
9983   -mavxscalar=[128|256]   encode scalar AVX instructions with specific vector\n\
9984                            length\n"));
9985   fprintf (stream, _("\
9986   -mevexlig=[128|256|512] encode scalar EVEX instructions with specific vector\n\
9987                            length\n"));
9988   fprintf (stream, _("\
9989   -mevexwig=[0|1]         encode EVEX instructions with specific EVEX.W value\n\
9990                            for EVEX.W bit ignored instructions\n"));
9991   fprintf (stream, _("\
9992   -mmnemonic=[att|intel]  use AT&T/Intel mnemonic\n"));
9993   fprintf (stream, _("\
9994   -msyntax=[att|intel]    use AT&T/Intel syntax\n"));
9995   fprintf (stream, _("\
9996   -mindex-reg             support pseudo index registers\n"));
9997   fprintf (stream, _("\
9998   -mnaked-reg             don't require `%%' prefix for registers\n"));
9999   fprintf (stream, _("\
10000   -mold-gcc               support old (<= 2.8.1) versions of gcc\n"));
10001   fprintf (stream, _("\
10002   -madd-bnd-prefix        add BND prefix for all valid branches\n"));
10003 # if defined (TE_PE) || defined (TE_PEP)
10004   fprintf (stream, _("\
10005   -mbig-obj               generate big object files\n"));
10006 #endif
10007 }
10008
10009 #if ((defined (OBJ_MAYBE_COFF) && defined (OBJ_MAYBE_AOUT)) \
10010      || defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
10011      || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
10012
10013 /* Pick the target format to use.  */
10014
10015 const char *
10016 i386_target_format (void)
10017 {
10018   if (!strncmp (default_arch, "x86_64", 6))
10019     {
10020       update_code_flag (CODE_64BIT, 1);
10021       if (default_arch[6] == '\0')
10022         x86_elf_abi = X86_64_ABI;
10023       else
10024         x86_elf_abi = X86_64_X32_ABI;
10025     }
10026   else if (!strcmp (default_arch, "i386"))
10027     update_code_flag (CODE_32BIT, 1);
10028   else
10029     as_fatal (_("unknown architecture"));
10030
10031   if (cpu_flags_all_zero (&cpu_arch_isa_flags))
10032     cpu_arch_isa_flags = cpu_arch[flag_code == CODE_64BIT].flags;
10033   if (cpu_flags_all_zero (&cpu_arch_tune_flags))
10034     cpu_arch_tune_flags = cpu_arch[flag_code == CODE_64BIT].flags;
10035
10036   switch (OUTPUT_FLAVOR)
10037     {
10038 #if defined (OBJ_MAYBE_AOUT) || defined (OBJ_AOUT)
10039     case bfd_target_aout_flavour:
10040       return AOUT_TARGET_FORMAT;
10041 #endif
10042 #if defined (OBJ_MAYBE_COFF) || defined (OBJ_COFF)
10043 # if defined (TE_PE) || defined (TE_PEP)
10044     case bfd_target_coff_flavour:
10045       if (flag_code == CODE_64BIT)
10046         return use_big_obj ? "pe-bigobj-x86-64" : "pe-x86-64";
10047       else
10048         return "pe-i386";
10049 # elif defined (TE_GO32)
10050     case bfd_target_coff_flavour:
10051       return "coff-go32";
10052 # else
10053     case bfd_target_coff_flavour:
10054       return "coff-i386";
10055 # endif
10056 #endif
10057 #if defined (OBJ_MAYBE_ELF) || defined (OBJ_ELF)
10058     case bfd_target_elf_flavour:
10059       {
10060         const char *format;
10061
10062         switch (x86_elf_abi)
10063           {
10064           default:
10065             format = ELF_TARGET_FORMAT;
10066             break;
10067           case X86_64_ABI:
10068             use_rela_relocations = 1;
10069             object_64bit = 1;
10070             format = ELF_TARGET_FORMAT64;
10071             break;
10072           case X86_64_X32_ABI:
10073             use_rela_relocations = 1;
10074             object_64bit = 1;
10075             disallow_64bit_reloc = 1;
10076             format = ELF_TARGET_FORMAT32;
10077             break;
10078           }
10079         if (cpu_arch_isa == PROCESSOR_L1OM)
10080           {
10081             if (x86_elf_abi != X86_64_ABI)
10082               as_fatal (_("Intel L1OM is 64bit only"));
10083             return ELF_TARGET_L1OM_FORMAT;
10084           }
10085         if (cpu_arch_isa == PROCESSOR_K1OM)
10086           {
10087             if (x86_elf_abi != X86_64_ABI)
10088               as_fatal (_("Intel K1OM is 64bit only"));
10089             return ELF_TARGET_K1OM_FORMAT;
10090           }
10091         else
10092           return format;
10093       }
10094 #endif
10095 #if defined (OBJ_MACH_O)
10096     case bfd_target_mach_o_flavour:
10097       if (flag_code == CODE_64BIT)
10098         {
10099           use_rela_relocations = 1;
10100           object_64bit = 1;
10101           return "mach-o-x86-64";
10102         }
10103       else
10104         return "mach-o-i386";
10105 #endif
10106     default:
10107       abort ();
10108       return NULL;
10109     }
10110 }
10111
10112 #endif /* OBJ_MAYBE_ more than one  */
10113
10114 #if (defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF))
10115 void
10116 i386_elf_emit_arch_note (void)
10117 {
10118   if (IS_ELF && cpu_arch_name != NULL)
10119     {
10120       char *p;
10121       asection *seg = now_seg;
10122       subsegT subseg = now_subseg;
10123       Elf_Internal_Note i_note;
10124       Elf_External_Note e_note;
10125       asection *note_secp;
10126       int len;
10127
10128       /* Create the .note section.  */
10129       note_secp = subseg_new (".note", 0);
10130       bfd_set_section_flags (stdoutput,
10131                              note_secp,
10132                              SEC_HAS_CONTENTS | SEC_READONLY);
10133
10134       /* Process the arch string.  */
10135       len = strlen (cpu_arch_name);
10136
10137       i_note.namesz = len + 1;
10138       i_note.descsz = 0;
10139       i_note.type = NT_ARCH;
10140       p = frag_more (sizeof (e_note.namesz));
10141       md_number_to_chars (p, (valueT) i_note.namesz, sizeof (e_note.namesz));
10142       p = frag_more (sizeof (e_note.descsz));
10143       md_number_to_chars (p, (valueT) i_note.descsz, sizeof (e_note.descsz));
10144       p = frag_more (sizeof (e_note.type));
10145       md_number_to_chars (p, (valueT) i_note.type, sizeof (e_note.type));
10146       p = frag_more (len + 1);
10147       strcpy (p, cpu_arch_name);
10148
10149       frag_align (2, 0, 0);
10150
10151       subseg_set (seg, subseg);
10152     }
10153 }
10154 #endif
10155 \f
10156 symbolS *
10157 md_undefined_symbol (char *name)
10158 {
10159   if (name[0] == GLOBAL_OFFSET_TABLE_NAME[0]
10160       && name[1] == GLOBAL_OFFSET_TABLE_NAME[1]
10161       && name[2] == GLOBAL_OFFSET_TABLE_NAME[2]
10162       && strcmp (name, GLOBAL_OFFSET_TABLE_NAME) == 0)
10163     {
10164       if (!GOT_symbol)
10165         {
10166           if (symbol_find (name))
10167             as_bad (_("GOT already in symbol table"));
10168           GOT_symbol = symbol_new (name, undefined_section,
10169                                    (valueT) 0, &zero_address_frag);
10170         };
10171       return GOT_symbol;
10172     }
10173   return 0;
10174 }
10175
10176 /* Round up a section size to the appropriate boundary.  */
10177
10178 valueT
10179 md_section_align (segT segment ATTRIBUTE_UNUSED, valueT size)
10180 {
10181 #if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
10182   if (OUTPUT_FLAVOR == bfd_target_aout_flavour)
10183     {
10184       /* For a.out, force the section size to be aligned.  If we don't do
10185          this, BFD will align it for us, but it will not write out the
10186          final bytes of the section.  This may be a bug in BFD, but it is
10187          easier to fix it here since that is how the other a.out targets
10188          work.  */
10189       int align;
10190
10191       align = bfd_get_section_alignment (stdoutput, segment);
10192       size = ((size + (1 << align) - 1) & ((valueT) -1 << align));
10193     }
10194 #endif
10195
10196   return size;
10197 }
10198
10199 /* On the i386, PC-relative offsets are relative to the start of the
10200    next instruction.  That is, the address of the offset, plus its
10201    size, since the offset is always the last part of the insn.  */
10202
10203 long
10204 md_pcrel_from (fixS *fixP)
10205 {
10206   return fixP->fx_size + fixP->fx_where + fixP->fx_frag->fr_address;
10207 }
10208
10209 #ifndef I386COFF
10210
10211 static void
10212 s_bss (int ignore ATTRIBUTE_UNUSED)
10213 {
10214   int temp;
10215
10216 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
10217   if (IS_ELF)
10218     obj_elf_section_change_hook ();
10219 #endif
10220   temp = get_absolute_expression ();
10221   subseg_set (bss_section, (subsegT) temp);
10222   demand_empty_rest_of_line ();
10223 }
10224
10225 #endif
10226
10227 void
10228 i386_validate_fix (fixS *fixp)
10229 {
10230   if (fixp->fx_subsy && fixp->fx_subsy == GOT_symbol)
10231     {
10232       if (fixp->fx_r_type == BFD_RELOC_32_PCREL)
10233         {
10234           if (!object_64bit)
10235             abort ();
10236           fixp->fx_r_type = BFD_RELOC_X86_64_GOTPCREL;
10237         }
10238       else
10239         {
10240           if (!object_64bit)
10241             fixp->fx_r_type = BFD_RELOC_386_GOTOFF;
10242           else
10243             fixp->fx_r_type = BFD_RELOC_X86_64_GOTOFF64;
10244         }
10245       fixp->fx_subsy = 0;
10246     }
10247 }
10248
10249 arelent *
10250 tc_gen_reloc (asection *section ATTRIBUTE_UNUSED, fixS *fixp)
10251 {
10252   arelent *rel;
10253   bfd_reloc_code_real_type code;
10254
10255   switch (fixp->fx_r_type)
10256     {
10257 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
10258     case BFD_RELOC_SIZE32:
10259     case BFD_RELOC_SIZE64:
10260       if (S_IS_DEFINED (fixp->fx_addsy)
10261           && !S_IS_EXTERNAL (fixp->fx_addsy))
10262         {
10263           /* Resolve size relocation against local symbol to size of
10264              the symbol plus addend.  */
10265           valueT value = S_GET_SIZE (fixp->fx_addsy) + fixp->fx_offset;
10266           if (fixp->fx_r_type == BFD_RELOC_SIZE32
10267               && !fits_in_unsigned_long (value))
10268             as_bad_where (fixp->fx_file, fixp->fx_line,
10269                           _("symbol size computation overflow"));
10270           fixp->fx_addsy = NULL;
10271           fixp->fx_subsy = NULL;
10272           md_apply_fix (fixp, (valueT *) &value, NULL);
10273           return NULL;
10274         }
10275 #endif
10276
10277     case BFD_RELOC_X86_64_PLT32:
10278     case BFD_RELOC_X86_64_PLT32_BND:
10279     case BFD_RELOC_X86_64_GOT32:
10280     case BFD_RELOC_X86_64_GOTPCREL:
10281     case BFD_RELOC_386_PLT32:
10282     case BFD_RELOC_386_GOT32:
10283     case BFD_RELOC_386_GOTOFF:
10284     case BFD_RELOC_386_GOTPC:
10285     case BFD_RELOC_386_TLS_GD:
10286     case BFD_RELOC_386_TLS_LDM:
10287     case BFD_RELOC_386_TLS_LDO_32:
10288     case BFD_RELOC_386_TLS_IE_32:
10289     case BFD_RELOC_386_TLS_IE:
10290     case BFD_RELOC_386_TLS_GOTIE:
10291     case BFD_RELOC_386_TLS_LE_32:
10292     case BFD_RELOC_386_TLS_LE:
10293     case BFD_RELOC_386_TLS_GOTDESC:
10294     case BFD_RELOC_386_TLS_DESC_CALL:
10295     case BFD_RELOC_X86_64_TLSGD:
10296     case BFD_RELOC_X86_64_TLSLD:
10297     case BFD_RELOC_X86_64_DTPOFF32:
10298     case BFD_RELOC_X86_64_DTPOFF64:
10299     case BFD_RELOC_X86_64_GOTTPOFF:
10300     case BFD_RELOC_X86_64_TPOFF32:
10301     case BFD_RELOC_X86_64_TPOFF64:
10302     case BFD_RELOC_X86_64_GOTOFF64:
10303     case BFD_RELOC_X86_64_GOTPC32:
10304     case BFD_RELOC_X86_64_GOT64:
10305     case BFD_RELOC_X86_64_GOTPCREL64:
10306     case BFD_RELOC_X86_64_GOTPC64:
10307     case BFD_RELOC_X86_64_GOTPLT64:
10308     case BFD_RELOC_X86_64_PLTOFF64:
10309     case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
10310     case BFD_RELOC_X86_64_TLSDESC_CALL:
10311     case BFD_RELOC_RVA:
10312     case BFD_RELOC_VTABLE_ENTRY:
10313     case BFD_RELOC_VTABLE_INHERIT:
10314 #ifdef TE_PE
10315     case BFD_RELOC_32_SECREL:
10316 #endif
10317       code = fixp->fx_r_type;
10318       break;
10319     case BFD_RELOC_X86_64_32S:
10320       if (!fixp->fx_pcrel)
10321         {
10322           /* Don't turn BFD_RELOC_X86_64_32S into BFD_RELOC_32.  */
10323           code = fixp->fx_r_type;
10324           break;
10325         }
10326     default:
10327       if (fixp->fx_pcrel)
10328         {
10329           switch (fixp->fx_size)
10330             {
10331             default:
10332               as_bad_where (fixp->fx_file, fixp->fx_line,
10333                             _("can not do %d byte pc-relative relocation"),
10334                             fixp->fx_size);
10335               code = BFD_RELOC_32_PCREL;
10336               break;
10337             case 1: code = BFD_RELOC_8_PCREL;  break;
10338             case 2: code = BFD_RELOC_16_PCREL; break;
10339             case 4:
10340               code = (fixp->fx_r_type == BFD_RELOC_X86_64_PC32_BND
10341                       ? fixp-> fx_r_type : BFD_RELOC_32_PCREL);
10342               break;
10343 #ifdef BFD64
10344             case 8: code = BFD_RELOC_64_PCREL; break;
10345 #endif
10346             }
10347         }
10348       else
10349         {
10350           switch (fixp->fx_size)
10351             {
10352             default:
10353               as_bad_where (fixp->fx_file, fixp->fx_line,
10354                             _("can not do %d byte relocation"),
10355                             fixp->fx_size);
10356               code = BFD_RELOC_32;
10357               break;
10358             case 1: code = BFD_RELOC_8;  break;
10359             case 2: code = BFD_RELOC_16; break;
10360             case 4: code = BFD_RELOC_32; break;
10361 #ifdef BFD64
10362             case 8: code = BFD_RELOC_64; break;
10363 #endif
10364             }
10365         }
10366       break;
10367     }
10368
10369   if ((code == BFD_RELOC_32
10370        || code == BFD_RELOC_32_PCREL
10371        || code == BFD_RELOC_X86_64_32S)
10372       && GOT_symbol
10373       && fixp->fx_addsy == GOT_symbol)
10374     {
10375       if (!object_64bit)
10376         code = BFD_RELOC_386_GOTPC;
10377       else
10378         code = BFD_RELOC_X86_64_GOTPC32;
10379     }
10380   if ((code == BFD_RELOC_64 || code == BFD_RELOC_64_PCREL)
10381       && GOT_symbol
10382       && fixp->fx_addsy == GOT_symbol)
10383     {
10384       code = BFD_RELOC_X86_64_GOTPC64;
10385     }
10386
10387   rel = (arelent *) xmalloc (sizeof (arelent));
10388   rel->sym_ptr_ptr = (asymbol **) xmalloc (sizeof (asymbol *));
10389   *rel->sym_ptr_ptr = symbol_get_bfdsym (fixp->fx_addsy);
10390
10391   rel->address = fixp->fx_frag->fr_address + fixp->fx_where;
10392
10393   if (!use_rela_relocations)
10394     {
10395       /* HACK: Since i386 ELF uses Rel instead of Rela, encode the
10396          vtable entry to be used in the relocation's section offset.  */
10397       if (fixp->fx_r_type == BFD_RELOC_VTABLE_ENTRY)
10398         rel->address = fixp->fx_offset;
10399 #if defined (OBJ_COFF) && defined (TE_PE)
10400       else if (fixp->fx_addsy && S_IS_WEAK (fixp->fx_addsy))
10401         rel->addend = fixp->fx_addnumber - (S_GET_VALUE (fixp->fx_addsy) * 2);
10402       else
10403 #endif
10404       rel->addend = 0;
10405     }
10406   /* Use the rela in 64bit mode.  */
10407   else
10408     {
10409       if (disallow_64bit_reloc)
10410         switch (code)
10411           {
10412           case BFD_RELOC_X86_64_DTPOFF64:
10413           case BFD_RELOC_X86_64_TPOFF64:
10414           case BFD_RELOC_64_PCREL:
10415           case BFD_RELOC_X86_64_GOTOFF64:
10416           case BFD_RELOC_X86_64_GOT64:
10417           case BFD_RELOC_X86_64_GOTPCREL64:
10418           case BFD_RELOC_X86_64_GOTPC64:
10419           case BFD_RELOC_X86_64_GOTPLT64:
10420           case BFD_RELOC_X86_64_PLTOFF64:
10421             as_bad_where (fixp->fx_file, fixp->fx_line,
10422                           _("cannot represent relocation type %s in x32 mode"),
10423                           bfd_get_reloc_code_name (code));
10424             break;
10425           default:
10426             break;
10427           }
10428
10429       if (!fixp->fx_pcrel)
10430         rel->addend = fixp->fx_offset;
10431       else
10432         switch (code)
10433           {
10434           case BFD_RELOC_X86_64_PLT32:
10435           case BFD_RELOC_X86_64_PLT32_BND:
10436           case BFD_RELOC_X86_64_GOT32:
10437           case BFD_RELOC_X86_64_GOTPCREL:
10438           case BFD_RELOC_X86_64_TLSGD:
10439           case BFD_RELOC_X86_64_TLSLD:
10440           case BFD_RELOC_X86_64_GOTTPOFF:
10441           case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
10442           case BFD_RELOC_X86_64_TLSDESC_CALL:
10443             rel->addend = fixp->fx_offset - fixp->fx_size;
10444             break;
10445           default:
10446             rel->addend = (section->vma
10447                            - fixp->fx_size
10448                            + fixp->fx_addnumber
10449                            + md_pcrel_from (fixp));
10450             break;
10451           }
10452     }
10453
10454   rel->howto = bfd_reloc_type_lookup (stdoutput, code);
10455   if (rel->howto == NULL)
10456     {
10457       as_bad_where (fixp->fx_file, fixp->fx_line,
10458                     _("cannot represent relocation type %s"),
10459                     bfd_get_reloc_code_name (code));
10460       /* Set howto to a garbage value so that we can keep going.  */
10461       rel->howto = bfd_reloc_type_lookup (stdoutput, BFD_RELOC_32);
10462       gas_assert (rel->howto != NULL);
10463     }
10464
10465   return rel;
10466 }
10467
10468 #include "tc-i386-intel.c"
10469
10470 void
10471 tc_x86_parse_to_dw2regnum (expressionS *exp)
10472 {
10473   int saved_naked_reg;
10474   char saved_register_dot;
10475
10476   saved_naked_reg = allow_naked_reg;
10477   allow_naked_reg = 1;
10478   saved_register_dot = register_chars['.'];
10479   register_chars['.'] = '.';
10480   allow_pseudo_reg = 1;
10481   expression_and_evaluate (exp);
10482   allow_pseudo_reg = 0;
10483   register_chars['.'] = saved_register_dot;
10484   allow_naked_reg = saved_naked_reg;
10485
10486   if (exp->X_op == O_register && exp->X_add_number >= 0)
10487     {
10488       if ((addressT) exp->X_add_number < i386_regtab_size)
10489         {
10490           exp->X_op = O_constant;
10491           exp->X_add_number = i386_regtab[exp->X_add_number]
10492                               .dw2_regnum[flag_code >> 1];
10493         }
10494       else
10495         exp->X_op = O_illegal;
10496     }
10497 }
10498
10499 void
10500 tc_x86_frame_initial_instructions (void)
10501 {
10502   static unsigned int sp_regno[2];
10503
10504   if (!sp_regno[flag_code >> 1])
10505     {
10506       char *saved_input = input_line_pointer;
10507       char sp[][4] = {"esp", "rsp"};
10508       expressionS exp;
10509
10510       input_line_pointer = sp[flag_code >> 1];
10511       tc_x86_parse_to_dw2regnum (&exp);
10512       gas_assert (exp.X_op == O_constant);
10513       sp_regno[flag_code >> 1] = exp.X_add_number;
10514       input_line_pointer = saved_input;
10515     }
10516
10517   cfi_add_CFA_def_cfa (sp_regno[flag_code >> 1], -x86_cie_data_alignment);
10518   cfi_add_CFA_offset (x86_dwarf2_return_column, x86_cie_data_alignment);
10519 }
10520
10521 int
10522 x86_dwarf2_addr_size (void)
10523 {
10524 #if defined (OBJ_MAYBE_ELF) || defined (OBJ_ELF)
10525   if (x86_elf_abi == X86_64_X32_ABI)
10526     return 4;
10527 #endif
10528   return bfd_arch_bits_per_address (stdoutput) / 8;
10529 }
10530
10531 int
10532 i386_elf_section_type (const char *str, size_t len)
10533 {
10534   if (flag_code == CODE_64BIT
10535       && len == sizeof ("unwind") - 1
10536       && strncmp (str, "unwind", 6) == 0)
10537     return SHT_X86_64_UNWIND;
10538
10539   return -1;
10540 }
10541
10542 #ifdef TE_SOLARIS
10543 void
10544 i386_solaris_fix_up_eh_frame (segT sec)
10545 {
10546   if (flag_code == CODE_64BIT)
10547     elf_section_type (sec) = SHT_X86_64_UNWIND;
10548 }
10549 #endif
10550
10551 #ifdef TE_PE
10552 void
10553 tc_pe_dwarf2_emit_offset (symbolS *symbol, unsigned int size)
10554 {
10555   expressionS exp;
10556
10557   exp.X_op = O_secrel;
10558   exp.X_add_symbol = symbol;
10559   exp.X_add_number = 0;
10560   emit_expr (&exp, size);
10561 }
10562 #endif
10563
10564 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
10565 /* For ELF on x86-64, add support for SHF_X86_64_LARGE.  */
10566
10567 bfd_vma
10568 x86_64_section_letter (int letter, char **ptr_msg)
10569 {
10570   if (flag_code == CODE_64BIT)
10571     {
10572       if (letter == 'l')
10573         return SHF_X86_64_LARGE;
10574
10575       *ptr_msg = _("bad .section directive: want a,l,w,x,M,S,G,T in string");
10576     }
10577   else
10578     *ptr_msg = _("bad .section directive: want a,w,x,M,S,G,T in string");
10579   return -1;
10580 }
10581
10582 bfd_vma
10583 x86_64_section_word (char *str, size_t len)
10584 {
10585   if (len == 5 && flag_code == CODE_64BIT && CONST_STRNEQ (str, "large"))
10586     return SHF_X86_64_LARGE;
10587
10588   return -1;
10589 }
10590
10591 static void
10592 handle_large_common (int small ATTRIBUTE_UNUSED)
10593 {
10594   if (flag_code != CODE_64BIT)
10595     {
10596       s_comm_internal (0, elf_common_parse);
10597       as_warn (_(".largecomm supported only in 64bit mode, producing .comm"));
10598     }
10599   else
10600     {
10601       static segT lbss_section;
10602       asection *saved_com_section_ptr = elf_com_section_ptr;
10603       asection *saved_bss_section = bss_section;
10604
10605       if (lbss_section == NULL)
10606         {
10607           flagword applicable;
10608           segT seg = now_seg;
10609           subsegT subseg = now_subseg;
10610
10611           /* The .lbss section is for local .largecomm symbols.  */
10612           lbss_section = subseg_new (".lbss", 0);
10613           applicable = bfd_applicable_section_flags (stdoutput);
10614           bfd_set_section_flags (stdoutput, lbss_section,
10615                                  applicable & SEC_ALLOC);
10616           seg_info (lbss_section)->bss = 1;
10617
10618           subseg_set (seg, subseg);
10619         }
10620
10621       elf_com_section_ptr = &_bfd_elf_large_com_section;
10622       bss_section = lbss_section;
10623
10624       s_comm_internal (0, elf_common_parse);
10625
10626       elf_com_section_ptr = saved_com_section_ptr;
10627       bss_section = saved_bss_section;
10628     }
10629 }
10630 #endif /* OBJ_ELF || OBJ_MAYBE_ELF */