i386: Allow non-absolute segment values for lcall/ljmp
1 /* tc-i386.c -- Assemble code for the Intel 80386
2 Copyright (C) 1989-2020 Free Software Foundation, Inc.
3
4 This file is part of GAS, the GNU Assembler.
5
6 GAS is free software; you can redistribute it and/or modify
7 it under the terms of the GNU General Public License as published by
8 the Free Software Foundation; either version 3, or (at your option)
9 any later version.
10
11 GAS is distributed in the hope that it will be useful,
12 but WITHOUT ANY WARRANTY; without even the implied warranty of
13 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
14 GNU General Public License for more details.
15
16 You should have received a copy of the GNU General Public License
17 along with GAS; see the file COPYING. If not, write to the Free
18 Software Foundation, 51 Franklin Street - Fifth Floor, Boston, MA
19 02110-1301, USA. */
20
21 /* Intel 80386 machine specific gas.
22 Written by Eliot Dresselhaus (eliot@mgm.mit.edu).
23 x86_64 support by Jan Hubicka (jh@suse.cz)
24 VIA PadLock support by Michal Ludvig (mludvig@suse.cz)
25 Bugs & suggestions are completely welcome. This is free software.
26 Please help us make it better. */
27
28 #include "as.h"
29 #include "safe-ctype.h"
30 #include "subsegs.h"
31 #include "dwarf2dbg.h"
32 #include "dw2gencfi.h"
33 #include "elf/x86-64.h"
34 #include "opcodes/i386-init.h"
35
36 #ifdef HAVE_LIMITS_H
37 #include <limits.h>
38 #else
39 #ifdef HAVE_SYS_PARAM_H
40 #include <sys/param.h>
41 #endif
42 #ifndef INT_MAX
43 #define INT_MAX (int) (((unsigned) (-1)) >> 1)
44 #endif
45 #endif
46
47 #ifndef INFER_ADDR_PREFIX
48 #define INFER_ADDR_PREFIX 1
49 #endif
50
51 #ifndef DEFAULT_ARCH
52 #define DEFAULT_ARCH "i386"
53 #endif
54
55 #ifndef INLINE
56 #if __GNUC__ >= 2
57 #define INLINE __inline__
58 #else
59 #define INLINE
60 #endif
61 #endif
62
63 /* Prefixes will be emitted in the order defined below.
64 WAIT_PREFIX must be the first prefix since FWAIT really is an
65 instruction, and so must come before any prefixes.
66 The preferred prefix order is SEG_PREFIX, ADDR_PREFIX, DATA_PREFIX,
67 REP_PREFIX/HLE_PREFIX, LOCK_PREFIX. */
68 #define WAIT_PREFIX 0
69 #define SEG_PREFIX 1
70 #define ADDR_PREFIX 2
71 #define DATA_PREFIX 3
72 #define REP_PREFIX 4
73 #define HLE_PREFIX REP_PREFIX
74 #define BND_PREFIX REP_PREFIX
75 #define LOCK_PREFIX 5
76 #define REX_PREFIX 6 /* must come last. */
77 #define MAX_PREFIXES 7 /* max prefixes per opcode */
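/* For example, assembling "lock addl $3, %gs:(%edx)" stores the 0x65
   segment override at SEG_PREFIX and 0xf0 at LOCK_PREFIX, so the
   segment byte is emitted ahead of the LOCK byte, matching the
   preferred order above (illustrative; bytes depend on the operands). */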
78
79 /* we define the syntax here (modulo base,index,scale syntax) */
80 #define REGISTER_PREFIX '%'
81 #define IMMEDIATE_PREFIX '$'
82 #define ABSOLUTE_PREFIX '*'
83
84 /* these are the instruction mnemonic suffixes in AT&T syntax or
85 memory operand size in Intel syntax. */
86 #define WORD_MNEM_SUFFIX 'w'
87 #define BYTE_MNEM_SUFFIX 'b'
88 #define SHORT_MNEM_SUFFIX 's'
89 #define LONG_MNEM_SUFFIX 'l'
90 #define QWORD_MNEM_SUFFIX 'q'
91 /* Intel Syntax. Use a non-ascii letter since it never appears
92 in instructions. */
93 #define LONG_DOUBLE_MNEM_SUFFIX '\1'
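/* E.g. AT&T "movw %ax, %bx" carries WORD_MNEM_SUFFIX, "movl"/"movq"
   carry the 'l'/'q' suffixes, while Intel "mov word ptr [ebx], ax"
   derives the same operand size from the memory operand instead of a
   mnemonic suffix (illustrative). */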
94
95 #define END_OF_INSN '\0'
96
97 /* This matches the C -> StaticRounding alias in the opcode table. */
98 #define commutative staticrounding
99
100 /*
101 'templates' is for grouping together 'template' structures for opcodes
102 of the same name. This is only used for storing the insns in the grand
103 ole hash table of insns.
104 The templates themselves start at START and range up to (but not including)
105 END.
106 */
107 typedef struct
108 {
109 const insn_template *start;
110 const insn_template *end;
111 }
112 templates;
113
114 /* 386 operand encoding bytes: see 386 book for details of this. */
115 typedef struct
116 {
117 unsigned int regmem; /* codes register or memory operand */
118 unsigned int reg; /* codes register operand (or extended opcode) */
119 unsigned int mode; /* how to interpret regmem & reg */
120 }
121 modrm_byte;
122
123 /* x86-64 extension prefix. */
124 typedef int rex_byte;
125
126 /* 386 opcode byte to code indirect addressing. */
127 typedef struct
128 {
129 unsigned base;
130 unsigned index;
131 unsigned scale;
132 }
133 sib_byte;
134
135 /* x86 arch names, types and features */
136 typedef struct
137 {
138 const char *name; /* arch name */
139 unsigned int len; /* arch string length */
140 enum processor_type type; /* arch type */
141 i386_cpu_flags flags; /* cpu feature flags */
142 unsigned int skip; /* show_arch should skip this. */
143 }
144 arch_entry;
145
146 /* Used to turn off indicated flags. */
147 typedef struct
148 {
149 const char *name; /* arch name */
150 unsigned int len; /* arch string length */
151 i386_cpu_flags flags; /* cpu feature flags */
152 }
153 noarch_entry;
154
155 static void update_code_flag (int, int);
156 static void set_code_flag (int);
157 static void set_16bit_gcc_code_flag (int);
158 static void set_intel_syntax (int);
159 static void set_intel_mnemonic (int);
160 static void set_allow_index_reg (int);
161 static void set_check (int);
162 static void set_cpu_arch (int);
163 #ifdef TE_PE
164 static void pe_directive_secrel (int);
165 #endif
166 static void signed_cons (int);
167 static char *output_invalid (int c);
168 static int i386_finalize_immediate (segT, expressionS *, i386_operand_type,
169 const char *);
170 static int i386_finalize_displacement (segT, expressionS *, i386_operand_type,
171 const char *);
172 static int i386_att_operand (char *);
173 static int i386_intel_operand (char *, int);
174 static int i386_intel_simplify (expressionS *);
175 static int i386_intel_parse_name (const char *, expressionS *);
176 static const reg_entry *parse_register (char *, char **);
177 static char *parse_insn (char *, char *);
178 static char *parse_operands (char *, const char *);
179 static void swap_operands (void);
180 static void swap_2_operands (int, int);
181 static enum flag_code i386_addressing_mode (void);
182 static void optimize_imm (void);
183 static void optimize_disp (void);
184 static const insn_template *match_template (char);
185 static int check_string (void);
186 static int process_suffix (void);
187 static int check_byte_reg (void);
188 static int check_long_reg (void);
189 static int check_qword_reg (void);
190 static int check_word_reg (void);
191 static int finalize_imm (void);
192 static int process_operands (void);
193 static const seg_entry *build_modrm_byte (void);
194 static void output_insn (void);
195 static void output_imm (fragS *, offsetT);
196 static void output_disp (fragS *, offsetT);
197 #ifndef I386COFF
198 static void s_bss (int);
199 #endif
200 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
201 static void handle_large_common (int small ATTRIBUTE_UNUSED);
202
203 /* GNU_PROPERTY_X86_ISA_1_USED. */
204 static unsigned int x86_isa_1_used;
205 /* GNU_PROPERTY_X86_FEATURE_2_USED. */
206 static unsigned int x86_feature_2_used;
207 /* Generate x86 used ISA and feature properties. */
208 static unsigned int x86_used_note = DEFAULT_X86_USED_NOTE;
209 #endif
210
211 static const char *default_arch = DEFAULT_ARCH;
212
213 /* parse_register() returns this when a register alias cannot be used. */
214 static const reg_entry bad_reg = { "<bad>", OPERAND_TYPE_NONE, 0, 0,
215 { Dw2Inval, Dw2Inval } };
216
217 /* This struct describes rounding control and SAE in the instruction. */
218 struct RC_Operation
219 {
220 enum rc_type
221 {
222 rne = 0,
223 rd,
224 ru,
225 rz,
226 saeonly
227 } type;
228 int operand;
229 };
230
231 static struct RC_Operation rc_op;
232
233 /* This struct describes masking, applied to OPERAND in the instruction.
234    MASK is a pointer to the corresponding mask register.  ZEROING tells
235    whether a merging or a zeroing mask is used.  */
236 struct Mask_Operation
237 {
238 const reg_entry *mask;
239 unsigned int zeroing;
241   /* The operand to which this operation is applied.  */
241 int operand;
242 };
243
244 static struct Mask_Operation mask_op;
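/* E.g. "vaddps %zmm2, %zmm1, %zmm0{%k1}{z}" sets MASK to %k1 and
   ZEROING to 1; without the "{z}" a merging mask is used instead
   (illustrative). */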
245
246 /* The struct describes broadcasting, applied to OPERAND. FACTOR is
247 broadcast factor. */
248 struct Broadcast_Operation
249 {
250 /* Type of broadcast: {1to2}, {1to4}, {1to8}, or {1to16}. */
251 int type;
252
253 /* Index of broadcasted operand. */
254 int operand;
255
256 /* Number of bytes to broadcast. */
257 int bytes;
258 };
259
260 static struct Broadcast_Operation broadcast_op;
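/* E.g. "vaddps (%rax){1to16}, %zmm1, %zmm2" requests a {1to16}
   broadcast of 4-byte elements for operand 0 (illustrative). */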
261
262 /* VEX prefix. */
263 typedef struct
264 {
265 /* VEX prefix is either 2 byte or 3 byte. EVEX is 4 byte. */
266 unsigned char bytes[4];
267 unsigned int length;
268 /* Destination or source register specifier. */
269 const reg_entry *register_specifier;
270 } vex_prefix;
271
272 /* 'md_assemble ()' gathers together information and puts it into an
273 i386_insn. */
274
275 union i386_op
276 {
277 expressionS *disps;
278 expressionS *imms;
279 const reg_entry *regs;
280 };
281
282 enum i386_error
283 {
284 operand_size_mismatch,
285 operand_type_mismatch,
286 register_type_mismatch,
287 number_of_operands_mismatch,
288 invalid_instruction_suffix,
289 bad_imm4,
290 unsupported_with_intel_mnemonic,
291 unsupported_syntax,
292 unsupported,
293 invalid_sib_address,
294 invalid_vsib_address,
295 invalid_vector_register_set,
296 invalid_tmm_register_set,
297 unsupported_vector_index_register,
298 unsupported_broadcast,
299 broadcast_needed,
300 unsupported_masking,
301 mask_not_on_destination,
302 no_default_mask,
303 unsupported_rc_sae,
304 rc_sae_operand_not_last_imm,
305 invalid_register_operand,
306 };
307
308 struct _i386_insn
309 {
310     /* TM holds the template for the insn we're currently assembling.  */
311 insn_template tm;
312
313 /* SUFFIX holds the instruction size suffix for byte, word, dword
314 or qword, if given. */
315 char suffix;
316
317 /* OPERANDS gives the number of given operands. */
318 unsigned int operands;
319
320 /* REG_OPERANDS, DISP_OPERANDS, MEM_OPERANDS, IMM_OPERANDS give the number
321 of given register, displacement, memory operands and immediate
322 operands. */
323 unsigned int reg_operands, disp_operands, mem_operands, imm_operands;
324
325 /* TYPES [i] is the type (see above #defines) which tells us how to
326 use OP[i] for the corresponding operand. */
327 i386_operand_type types[MAX_OPERANDS];
328
329 /* Displacement expression, immediate expression, or register for each
330 operand. */
331 union i386_op op[MAX_OPERANDS];
332
333 /* Flags for operands. */
334 unsigned int flags[MAX_OPERANDS];
335 #define Operand_PCrel 1
336 #define Operand_Mem 2
337
338 /* Relocation type for operand */
339 enum bfd_reloc_code_real reloc[MAX_OPERANDS];
340
341 /* BASE_REG, INDEX_REG, and LOG2_SCALE_FACTOR are used to encode
342 the base index byte below. */
343 const reg_entry *base_reg;
344 const reg_entry *index_reg;
345 unsigned int log2_scale_factor;
346
347 /* SEG gives the seg_entries of this insn. They are zero unless
348 explicit segment overrides are given. */
349 const seg_entry *seg[2];
350
351 /* Copied first memory operand string, for re-checking. */
352 char *memop1_string;
353
354 /* PREFIX holds all the given prefix opcodes (usually null).
355 PREFIXES is the number of prefix opcodes. */
356 unsigned int prefixes;
357 unsigned char prefix[MAX_PREFIXES];
358
359 /* Register is in low 3 bits of opcode. */
360 bfd_boolean short_form;
361
362 /* The operand to a branch insn indicates an absolute branch. */
363 bfd_boolean jumpabsolute;
364
365 /* Extended states. */
366 enum
367 {
368 /* Use MMX state. */
369 xstate_mmx = 1 << 0,
370 /* Use XMM state. */
371 xstate_xmm = 1 << 1,
372 /* Use YMM state. */
373 xstate_ymm = 1 << 2 | xstate_xmm,
374 /* Use ZMM state. */
375 xstate_zmm = 1 << 3 | xstate_ymm,
376 /* Use TMM state. */
377 xstate_tmm = 1 << 4
378 } xstate;
379
380 /* Has GOTPC or TLS relocation. */
381 bfd_boolean has_gotpc_tls_reloc;
382
383 /* RM and SIB are the modrm byte and the sib byte where the
384 addressing modes of this insn are encoded. */
385 modrm_byte rm;
386 rex_byte rex;
387 rex_byte vrex;
388 sib_byte sib;
389 vex_prefix vex;
390
391 /* Masking attributes. */
392 struct Mask_Operation *mask;
393
394 /* Rounding control and SAE attributes. */
395 struct RC_Operation *rounding;
396
397 /* Broadcasting attributes. */
398 struct Broadcast_Operation *broadcast;
399
400 /* Compressed disp8*N attribute. */
401 unsigned int memshift;
402
403 /* Prefer load or store in encoding. */
404 enum
405 {
406 dir_encoding_default = 0,
407 dir_encoding_load,
408 dir_encoding_store,
409 dir_encoding_swap
410 } dir_encoding;
411
412 /* Prefer 8bit, 16bit, 32bit displacement in encoding. */
413 enum
414 {
415 disp_encoding_default = 0,
416 disp_encoding_8bit,
417 disp_encoding_16bit,
418 disp_encoding_32bit
419 } disp_encoding;
420
421 /* Prefer the REX byte in encoding. */
422 bfd_boolean rex_encoding;
423
424 /* Disable instruction size optimization. */
425 bfd_boolean no_optimize;
426
427 /* How to encode vector instructions. */
428 enum
429 {
430 vex_encoding_default = 0,
431 vex_encoding_vex,
432 vex_encoding_vex3,
433 vex_encoding_evex,
434 vex_encoding_error
435 } vec_encoding;
436
437 /* REP prefix. */
438 const char *rep_prefix;
439
440 /* HLE prefix. */
441 const char *hle_prefix;
442
443 /* Have BND prefix. */
444 const char *bnd_prefix;
445
446 /* Have NOTRACK prefix. */
447 const char *notrack_prefix;
448
449 /* Error message. */
450 enum i386_error error;
451 };
452
453 typedef struct _i386_insn i386_insn;
454
455 /* Links an RC type with the corresponding string that is looked for
456    in the assembly source.  */
457 struct RC_name
458 {
459 enum rc_type type;
460 const char *name;
461 unsigned int len;
462 };
463
464 static const struct RC_name RC_NamesTable[] =
465 {
466 { rne, STRING_COMMA_LEN ("rn-sae") },
467 { rd, STRING_COMMA_LEN ("rd-sae") },
468 { ru, STRING_COMMA_LEN ("ru-sae") },
469 { rz, STRING_COMMA_LEN ("rz-sae") },
470 { saeonly, STRING_COMMA_LEN ("sae") },
471 };
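/* E.g. "vaddps {rz-sae}, %zmm4, %zmm5, %zmm6" selects round toward
   zero (rz), while "{sae}" alone requests suppress-all-exceptions
   without overriding the rounding mode (illustrative). */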
472
473 /* List of chars besides those in app.c:symbol_chars that can start an
474    operand.  Used to prevent the scrubber from eating vital whitespace.  */
475 const char extra_symbol_chars[] = "*%-([{}"
476 #ifdef LEX_AT
477 "@"
478 #endif
479 #ifdef LEX_QM
480 "?"
481 #endif
482 ;
483
484 #if ((defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)) \
485 && !defined (TE_GNU) \
486 && !defined (TE_LINUX) \
487 && !defined (TE_FreeBSD) \
488 && !defined (TE_DragonFly) \
489 && !defined (TE_NetBSD))
490 /* This array holds the chars that always start a comment. If the
491 pre-processor is disabled, these aren't very useful. The option
492 --divide will remove '/' from this list. */
493 const char *i386_comment_chars = "#/";
494 #define SVR4_COMMENT_CHARS 1
495 #define PREFIX_SEPARATOR '\\'
496
497 #else
498 const char *i386_comment_chars = "#";
499 #define PREFIX_SEPARATOR '/'
500 #endif
501
502 /* This array holds the chars that only start a comment at the beginning of
503 a line. If the line seems to have the form '# 123 filename'
504 .line and .file directives will appear in the pre-processed output.
505 Note that input_file.c hand checks for '#' at the beginning of the
506 first line of the input file. This is because the compiler outputs
507 #NO_APP at the beginning of its output.
508 Also note that comments started like this one will always work if
509 '/' isn't otherwise defined. */
510 const char line_comment_chars[] = "#/";
511
512 const char line_separator_chars[] = ";";
513
514 /* Chars that can be used to separate mant from exp in floating point
515 nums. */
516 const char EXP_CHARS[] = "eE";
517
518 /* Chars that mean this number is a floating point constant
519 As in 0f12.456
520 or 0d1.2345e12. */
521 const char FLT_CHARS[] = "fFdDxX";
522
523 /* Tables for lexical analysis. */
524 static char mnemonic_chars[256];
525 static char register_chars[256];
526 static char operand_chars[256];
527 static char identifier_chars[256];
528 static char digit_chars[256];
529
530 /* Lexical macros. */
531 #define is_mnemonic_char(x) (mnemonic_chars[(unsigned char) x])
532 #define is_operand_char(x) (operand_chars[(unsigned char) x])
533 #define is_register_char(x) (register_chars[(unsigned char) x])
534 #define is_space_char(x) ((x) == ' ')
535 #define is_identifier_char(x) (identifier_chars[(unsigned char) x])
536 #define is_digit_char(x) (digit_chars[(unsigned char) x])
537
538 /* All non-digit non-letter characters that may occur in an operand. */
539 static char operand_special_chars[] = "%$-+(,)*._~/<>|&^!:[@]";
540
541 /* md_assemble() always leaves the strings it's passed unaltered. To
542 effect this we maintain a stack of saved characters that we've smashed
543 with '\0's (indicating end of strings for various sub-fields of the
544 assembler instruction). */
545 static char save_stack[32];
546 static char *save_stack_p;
547 #define END_STRING_AND_SAVE(s) \
548 do { *save_stack_p++ = *(s); *(s) = '\0'; } while (0)
549 #define RESTORE_END_STRING(s) \
550 do { *(s) = *--save_stack_p; } while (0)
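/* Typical (illustrative) use while parsing:
     END_STRING_AND_SAVE (l);	(temporarily NUL-terminate at L)
     ... examine the NUL-terminated sub-string ...
     RESTORE_END_STRING (l);	(put the smashed character back)
   Saves and restores must nest in LIFO order on save_stack.  */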
551
552 /* The instruction we're assembling. */
553 static i386_insn i;
554
555 /* Possible templates for current insn. */
556 static const templates *current_templates;
557
558 /* Per instruction expressionS buffers: max displacements & immediates. */
559 static expressionS disp_expressions[MAX_MEMORY_OPERANDS];
560 static expressionS im_expressions[MAX_IMMEDIATE_OPERANDS];
561
562 /* Current operand we are working on. */
563 static int this_operand = -1;
564
565 /* We support three different code modes (plus the code16gcc variant of
566    16-bit mode).  The FLAG_CODE variable is used to distinguish these.  */
567
568 enum flag_code {
569 CODE_32BIT,
570 CODE_16BIT,
571 CODE_64BIT };
572
573 static enum flag_code flag_code;
574 static unsigned int object_64bit;
575 static unsigned int disallow_64bit_reloc;
576 static int use_rela_relocations = 0;
577 /* __tls_get_addr/___tls_get_addr symbol for TLS. */
578 static const char *tls_get_addr;
579
580 #if ((defined (OBJ_MAYBE_COFF) && defined (OBJ_MAYBE_AOUT)) \
581 || defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
582 || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
583
584 /* The ELF ABI to use. */
585 enum x86_elf_abi
586 {
587 I386_ABI,
588 X86_64_ABI,
589 X86_64_X32_ABI
590 };
591
592 static enum x86_elf_abi x86_elf_abi = I386_ABI;
593 #endif
594
595 #if defined (TE_PE) || defined (TE_PEP)
596 /* Use big object file format. */
597 static int use_big_obj = 0;
598 #endif
599
600 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
601 /* 1 if generating code for a shared library. */
602 static int shared = 0;
603 #endif
604
605 /* 1 for intel syntax,
606 0 if att syntax. */
607 static int intel_syntax = 0;
608
609 static enum x86_64_isa
610 {
611 amd64 = 1, /* AMD64 ISA. */
612 intel64 /* Intel64 ISA. */
613 } isa64;
614
615 /* 1 for intel mnemonic,
616 0 if att mnemonic. */
617 static int intel_mnemonic = !SYSV386_COMPAT;
618
619 /* 1 if pseudo registers are permitted. */
620 static int allow_pseudo_reg = 0;
621
622 /* 1 if register prefix % not required. */
623 static int allow_naked_reg = 0;
624
625 /* 1 if the assembler should add BND prefix for all control-transferring
626 instructions supporting it, even if this prefix wasn't specified
627 explicitly. */
628 static int add_bnd_prefix = 0;
629
630 /* 1 if the pseudo index register, eiz/riz, is allowed.  */
631 static int allow_index_reg = 0;
632
633 /* 1 if the assembler should ignore LOCK prefix, even if it was
634 specified explicitly. */
635 static int omit_lock_prefix = 0;
636
637 /* 1 if the assembler should encode lfence, mfence, and sfence as
638 "lock addl $0, (%{re}sp)". */
639 static int avoid_fence = 0;
640
641 /* 1 if lfence should be inserted after every load. */
642 static int lfence_after_load = 0;
643
644 /* Non-zero if lfence should be inserted before indirect branch. */
645 static enum lfence_before_indirect_branch_kind
646 {
647 lfence_branch_none = 0,
648 lfence_branch_register,
649 lfence_branch_memory,
650 lfence_branch_all
651 }
652 lfence_before_indirect_branch;
653
654 /* Non-zero if lfence should be inserted before ret. */
655 static enum lfence_before_ret_kind
656 {
657 lfence_before_ret_none = 0,
658 lfence_before_ret_not,
659 lfence_before_ret_or,
660 lfence_before_ret_shl
661 }
662 lfence_before_ret;
663
664 /* Kind of the previous instruction: an ordinary insn, a directive such as .byte, or a prefix.  */
665 static struct
666 {
667 segT seg;
668 const char *file;
669 const char *name;
670 unsigned int line;
671 enum last_insn_kind
672 {
673 last_insn_other = 0,
674 last_insn_directive,
675 last_insn_prefix
676 } kind;
677 } last_insn;
678
679 /* 1 if the assembler should generate relax relocations. */
680
681 static int generate_relax_relocations
682 = DEFAULT_GENERATE_X86_RELAX_RELOCATIONS;
683
684 static enum check_kind
685 {
686 check_none = 0,
687 check_warning,
688 check_error
689 }
690 sse_check, operand_check = check_warning;
691
692 /* Non-zero if branches should be aligned within a power-of-2 boundary.  */
693 static int align_branch_power = 0;
694
695 /* Types of branches to align. */
696 enum align_branch_kind
697 {
698 align_branch_none = 0,
699 align_branch_jcc = 1,
700 align_branch_fused = 2,
701 align_branch_jmp = 3,
702 align_branch_call = 4,
703 align_branch_indirect = 5,
704 align_branch_ret = 6
705 };
706
707 /* Type bits of branches to align. */
708 enum align_branch_bit
709 {
710 align_branch_jcc_bit = 1 << align_branch_jcc,
711 align_branch_fused_bit = 1 << align_branch_fused,
712 align_branch_jmp_bit = 1 << align_branch_jmp,
713 align_branch_call_bit = 1 << align_branch_call,
714 align_branch_indirect_bit = 1 << align_branch_indirect,
715 align_branch_ret_bit = 1 << align_branch_ret
716 };
717
718 static unsigned int align_branch = (align_branch_jcc_bit
719 | align_branch_fused_bit
720 | align_branch_jmp_bit);
721
722 /* Types of condition jump used by macro-fusion. */
723 enum mf_jcc_kind
724 {
725 mf_jcc_jo = 0, /* base opcode 0x70 */
726 mf_jcc_jc, /* base opcode 0x72 */
727 mf_jcc_je, /* base opcode 0x74 */
728 mf_jcc_jna, /* base opcode 0x76 */
729 mf_jcc_js, /* base opcode 0x78 */
730 mf_jcc_jp, /* base opcode 0x7a */
731 mf_jcc_jl, /* base opcode 0x7c */
732 mf_jcc_jle, /* base opcode 0x7e */
733 };
734
735 /* Types of compare flag-modifying instructions used by macro-fusion.  */
736 enum mf_cmp_kind
737 {
738 mf_cmp_test_and, /* test/cmp */
739 mf_cmp_alu_cmp, /* add/sub/cmp */
740 mf_cmp_incdec /* inc/dec */
741 };
742
743 /* The maximum padding size for a fused jcc.  A CMP-like instruction
744    can be 9 bytes and a jcc can be 6 bytes.  Leave room just in case for
745 prefixes. */
746 #define MAX_FUSED_JCC_PADDING_SIZE 20
747
748 /* The maximum number of prefixes added for an instruction. */
749 static unsigned int align_branch_prefix_size = 5;
750
751 /* Optimization:
752 1. Clear the REX_W bit with register operand if possible.
753 2. Above plus use 128bit vector instruction to clear the full vector
754 register.
755 */
756 static int optimize = 0;
757
758 /* Optimization:
759 1. Clear the REX_W bit with register operand if possible.
760 2. Above plus use 128bit vector instruction to clear the full vector
761 register.
762 3. Above plus optimize "test{q,l,w} $imm8,%r{64,32,16}" to
763 "testb $imm7,%r8".
764 */
765 static int optimize_for_space = 0;
766
767 /* Register prefix used for error message. */
768 static const char *register_prefix = "%";
769
770 /* Used in 16 bit gcc mode to add an l suffix to call, ret, enter,
771 leave, push, and pop instructions so that gcc has the same stack
772 frame as in 32 bit mode. */
773 static char stackop_size = '\0';
774
775 /* Non-zero to optimize code alignment. */
776 int optimize_align_code = 1;
777
778 /* Non-zero to quieten some warnings. */
779 static int quiet_warnings = 0;
780
781 /* CPU name. */
782 static const char *cpu_arch_name = NULL;
783 static char *cpu_sub_arch_name = NULL;
784
785 /* CPU feature flags. */
786 static i386_cpu_flags cpu_arch_flags = CPU_UNKNOWN_FLAGS;
787
788 /* If we have selected a cpu we are generating instructions for. */
789 static int cpu_arch_tune_set = 0;
790
791 /* Cpu we are generating instructions for. */
792 enum processor_type cpu_arch_tune = PROCESSOR_UNKNOWN;
793
794 /* CPU feature flags of cpu we are generating instructions for. */
795 static i386_cpu_flags cpu_arch_tune_flags;
796
797 /* CPU instruction set architecture used. */
798 enum processor_type cpu_arch_isa = PROCESSOR_UNKNOWN;
799
800 /* CPU feature flags of instruction set architecture used. */
801 i386_cpu_flags cpu_arch_isa_flags;
802
803 /* If set, conditional jumps are not automatically promoted to handle
804 larger than a byte offset. */
805 static unsigned int no_cond_jump_promotion = 0;
806
807 /* Encode SSE instructions with VEX prefix. */
808 static unsigned int sse2avx;
809
810 /* Encode scalar AVX instructions with specific vector length. */
811 static enum
812 {
813 vex128 = 0,
814 vex256
815 } avxscalar;
816
817 /* Encode VEX WIG instructions with specific vex.w. */
818 static enum
819 {
820 vexw0 = 0,
821 vexw1
822 } vexwig;
823
824 /* Encode scalar EVEX LIG instructions with specific vector length. */
825 static enum
826 {
827 evexl128 = 0,
828 evexl256,
829 evexl512
830 } evexlig;
831
832 /* Encode EVEX WIG instructions with specific evex.w. */
833 static enum
834 {
835 evexw0 = 0,
836 evexw1
837 } evexwig;
838
839 /* Value to encode in EVEX RC bits, for SAE-only instructions. */
840 static enum rc_type evexrcig = rne;
841
842 /* Pre-defined "_GLOBAL_OFFSET_TABLE_". */
843 static symbolS *GOT_symbol;
844
845 /* The dwarf2 return column, adjusted for 32 or 64 bit. */
846 unsigned int x86_dwarf2_return_column;
847
848 /* The dwarf2 data alignment, adjusted for 32 or 64 bit. */
849 int x86_cie_data_alignment;
850
851 /* Interface to relax_segment.
852 There are 3 major relax states for 386 jump insns because the
853 different types of jumps add different sizes to frags when we're
854 figuring out what sort of jump to choose to reach a given label.
855
856 BRANCH_PADDING, BRANCH_PREFIX and FUSED_JCC_PADDING are used to align
857 branches which are handled by md_estimate_size_before_relax() and
858 i386_generic_table_relax_frag(). */
859
860 /* Types. */
861 #define UNCOND_JUMP 0
862 #define COND_JUMP 1
863 #define COND_JUMP86 2
864 #define BRANCH_PADDING 3
865 #define BRANCH_PREFIX 4
866 #define FUSED_JCC_PADDING 5
867
868 /* Sizes. */
869 #define CODE16 1
870 #define SMALL 0
871 #define SMALL16 (SMALL | CODE16)
872 #define BIG 2
873 #define BIG16 (BIG | CODE16)
874
875 #ifndef INLINE
876 #ifdef __GNUC__
877 #define INLINE __inline__
878 #else
879 #define INLINE
880 #endif
881 #endif
882
883 #define ENCODE_RELAX_STATE(type, size) \
884 ((relax_substateT) (((type) << 2) | (size)))
885 #define TYPE_FROM_RELAX_STATE(s) \
886 ((s) >> 2)
887 #define DISP_SIZE_FROM_RELAX_STATE(s) \
888 ((((s) & 3) == BIG ? 4 : (((s) & 3) == BIG16 ? 2 : 1)))
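/* A worked example: ENCODE_RELAX_STATE (COND_JUMP, BIG) is
   (1 << 2) | 2 == 6; TYPE_FROM_RELAX_STATE (6) recovers COND_JUMP,
   and DISP_SIZE_FROM_RELAX_STATE (6) yields a 4-byte displacement.  */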
889
890 /* This table is used by relax_frag to promote short jumps to long
891 ones where necessary. SMALL (short) jumps may be promoted to BIG
892 (32 bit long) ones, and SMALL16 jumps to BIG16 (16 bit long). We
893 don't allow a short jump in a 32 bit code segment to be promoted to
894 a 16 bit offset jump because it's slower (requires data size
895 prefix), and doesn't work, unless the destination is in the bottom
896 64k of the code segment (The top 16 bits of eip are zeroed). */
897
898 const relax_typeS md_relax_table[] =
899 {
900 /* The fields are:
901 1) most positive reach of this state,
902 2) most negative reach of this state,
903 3) how many bytes this mode will have in the variable part of the frag
904 4) which index into the table to try if we can't fit into this one. */
905
906 /* UNCOND_JUMP states. */
907 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (UNCOND_JUMP, BIG)},
908 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (UNCOND_JUMP, BIG16)},
909 /* dword jmp adds 4 bytes to frag:
910 0 extra opcode bytes, 4 displacement bytes. */
911 {0, 0, 4, 0},
912   /* word jmp adds 2 bytes to frag:
913 0 extra opcode bytes, 2 displacement bytes. */
914 {0, 0, 2, 0},
915
916 /* COND_JUMP states. */
917 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP, BIG)},
918 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP, BIG16)},
919   /* dword conditionals add 5 bytes to frag:
920 1 extra opcode byte, 4 displacement bytes. */
921 {0, 0, 5, 0},
922 /* word conditionals add 3 bytes to frag:
923 1 extra opcode byte, 2 displacement bytes. */
924 {0, 0, 3, 0},
925
926 /* COND_JUMP86 states. */
927 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP86, BIG)},
928 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP86, BIG16)},
929   /* dword conditionals add 5 bytes to frag:
930 1 extra opcode byte, 4 displacement bytes. */
931 {0, 0, 5, 0},
932 /* word conditionals add 4 bytes to frag:
933 1 displacement byte and a 3 byte long branch insn. */
934 {0, 0, 4, 0}
935 };
936
937 static const arch_entry cpu_arch[] =
938 {
939 /* Do not replace the first two entries - i386_target_format()
940 relies on them being there in this order. */
941 { STRING_COMMA_LEN ("generic32"), PROCESSOR_GENERIC32,
942 CPU_GENERIC32_FLAGS, 0 },
943 { STRING_COMMA_LEN ("generic64"), PROCESSOR_GENERIC64,
944 CPU_GENERIC64_FLAGS, 0 },
945 { STRING_COMMA_LEN ("i8086"), PROCESSOR_UNKNOWN,
946 CPU_NONE_FLAGS, 0 },
947 { STRING_COMMA_LEN ("i186"), PROCESSOR_UNKNOWN,
948 CPU_I186_FLAGS, 0 },
949 { STRING_COMMA_LEN ("i286"), PROCESSOR_UNKNOWN,
950 CPU_I286_FLAGS, 0 },
951 { STRING_COMMA_LEN ("i386"), PROCESSOR_I386,
952 CPU_I386_FLAGS, 0 },
953 { STRING_COMMA_LEN ("i486"), PROCESSOR_I486,
954 CPU_I486_FLAGS, 0 },
955 { STRING_COMMA_LEN ("i586"), PROCESSOR_PENTIUM,
956 CPU_I586_FLAGS, 0 },
957 { STRING_COMMA_LEN ("i686"), PROCESSOR_PENTIUMPRO,
958 CPU_I686_FLAGS, 0 },
959 { STRING_COMMA_LEN ("pentium"), PROCESSOR_PENTIUM,
960 CPU_I586_FLAGS, 0 },
961 { STRING_COMMA_LEN ("pentiumpro"), PROCESSOR_PENTIUMPRO,
962 CPU_PENTIUMPRO_FLAGS, 0 },
963 { STRING_COMMA_LEN ("pentiumii"), PROCESSOR_PENTIUMPRO,
964 CPU_P2_FLAGS, 0 },
965 { STRING_COMMA_LEN ("pentiumiii"),PROCESSOR_PENTIUMPRO,
966 CPU_P3_FLAGS, 0 },
967 { STRING_COMMA_LEN ("pentium4"), PROCESSOR_PENTIUM4,
968 CPU_P4_FLAGS, 0 },
969 { STRING_COMMA_LEN ("prescott"), PROCESSOR_NOCONA,
970 CPU_CORE_FLAGS, 0 },
971 { STRING_COMMA_LEN ("nocona"), PROCESSOR_NOCONA,
972 CPU_NOCONA_FLAGS, 0 },
973 { STRING_COMMA_LEN ("yonah"), PROCESSOR_CORE,
974 CPU_CORE_FLAGS, 1 },
975 { STRING_COMMA_LEN ("core"), PROCESSOR_CORE,
976 CPU_CORE_FLAGS, 0 },
977 { STRING_COMMA_LEN ("merom"), PROCESSOR_CORE2,
978 CPU_CORE2_FLAGS, 1 },
979 { STRING_COMMA_LEN ("core2"), PROCESSOR_CORE2,
980 CPU_CORE2_FLAGS, 0 },
981 { STRING_COMMA_LEN ("corei7"), PROCESSOR_COREI7,
982 CPU_COREI7_FLAGS, 0 },
983 { STRING_COMMA_LEN ("l1om"), PROCESSOR_L1OM,
984 CPU_L1OM_FLAGS, 0 },
985 { STRING_COMMA_LEN ("k1om"), PROCESSOR_K1OM,
986 CPU_K1OM_FLAGS, 0 },
987 { STRING_COMMA_LEN ("iamcu"), PROCESSOR_IAMCU,
988 CPU_IAMCU_FLAGS, 0 },
989 { STRING_COMMA_LEN ("k6"), PROCESSOR_K6,
990 CPU_K6_FLAGS, 0 },
991 { STRING_COMMA_LEN ("k6_2"), PROCESSOR_K6,
992 CPU_K6_2_FLAGS, 0 },
993 { STRING_COMMA_LEN ("athlon"), PROCESSOR_ATHLON,
994 CPU_ATHLON_FLAGS, 0 },
995 { STRING_COMMA_LEN ("sledgehammer"), PROCESSOR_K8,
996 CPU_K8_FLAGS, 1 },
997 { STRING_COMMA_LEN ("opteron"), PROCESSOR_K8,
998 CPU_K8_FLAGS, 0 },
999 { STRING_COMMA_LEN ("k8"), PROCESSOR_K8,
1000 CPU_K8_FLAGS, 0 },
1001 { STRING_COMMA_LEN ("amdfam10"), PROCESSOR_AMDFAM10,
1002 CPU_AMDFAM10_FLAGS, 0 },
1003 { STRING_COMMA_LEN ("bdver1"), PROCESSOR_BD,
1004 CPU_BDVER1_FLAGS, 0 },
1005 { STRING_COMMA_LEN ("bdver2"), PROCESSOR_BD,
1006 CPU_BDVER2_FLAGS, 0 },
1007 { STRING_COMMA_LEN ("bdver3"), PROCESSOR_BD,
1008 CPU_BDVER3_FLAGS, 0 },
1009 { STRING_COMMA_LEN ("bdver4"), PROCESSOR_BD,
1010 CPU_BDVER4_FLAGS, 0 },
1011 { STRING_COMMA_LEN ("znver1"), PROCESSOR_ZNVER,
1012 CPU_ZNVER1_FLAGS, 0 },
1013 { STRING_COMMA_LEN ("znver2"), PROCESSOR_ZNVER,
1014 CPU_ZNVER2_FLAGS, 0 },
1015 { STRING_COMMA_LEN ("btver1"), PROCESSOR_BT,
1016 CPU_BTVER1_FLAGS, 0 },
1017 { STRING_COMMA_LEN ("btver2"), PROCESSOR_BT,
1018 CPU_BTVER2_FLAGS, 0 },
1019 { STRING_COMMA_LEN (".8087"), PROCESSOR_UNKNOWN,
1020 CPU_8087_FLAGS, 0 },
1021 { STRING_COMMA_LEN (".287"), PROCESSOR_UNKNOWN,
1022 CPU_287_FLAGS, 0 },
1023 { STRING_COMMA_LEN (".387"), PROCESSOR_UNKNOWN,
1024 CPU_387_FLAGS, 0 },
1025 { STRING_COMMA_LEN (".687"), PROCESSOR_UNKNOWN,
1026 CPU_687_FLAGS, 0 },
1027 { STRING_COMMA_LEN (".cmov"), PROCESSOR_UNKNOWN,
1028 CPU_CMOV_FLAGS, 0 },
1029 { STRING_COMMA_LEN (".fxsr"), PROCESSOR_UNKNOWN,
1030 CPU_FXSR_FLAGS, 0 },
1031 { STRING_COMMA_LEN (".mmx"), PROCESSOR_UNKNOWN,
1032 CPU_MMX_FLAGS, 0 },
1033 { STRING_COMMA_LEN (".sse"), PROCESSOR_UNKNOWN,
1034 CPU_SSE_FLAGS, 0 },
1035 { STRING_COMMA_LEN (".sse2"), PROCESSOR_UNKNOWN,
1036 CPU_SSE2_FLAGS, 0 },
1037 { STRING_COMMA_LEN (".sse3"), PROCESSOR_UNKNOWN,
1038 CPU_SSE3_FLAGS, 0 },
1039 { STRING_COMMA_LEN (".sse4a"), PROCESSOR_UNKNOWN,
1040 CPU_SSE4A_FLAGS, 0 },
1041 { STRING_COMMA_LEN (".ssse3"), PROCESSOR_UNKNOWN,
1042 CPU_SSSE3_FLAGS, 0 },
1043 { STRING_COMMA_LEN (".sse4.1"), PROCESSOR_UNKNOWN,
1044 CPU_SSE4_1_FLAGS, 0 },
1045 { STRING_COMMA_LEN (".sse4.2"), PROCESSOR_UNKNOWN,
1046 CPU_SSE4_2_FLAGS, 0 },
1047 { STRING_COMMA_LEN (".sse4"), PROCESSOR_UNKNOWN,
1048 CPU_SSE4_2_FLAGS, 0 },
1049 { STRING_COMMA_LEN (".avx"), PROCESSOR_UNKNOWN,
1050 CPU_AVX_FLAGS, 0 },
1051 { STRING_COMMA_LEN (".avx2"), PROCESSOR_UNKNOWN,
1052 CPU_AVX2_FLAGS, 0 },
1053 { STRING_COMMA_LEN (".avx512f"), PROCESSOR_UNKNOWN,
1054 CPU_AVX512F_FLAGS, 0 },
1055 { STRING_COMMA_LEN (".avx512cd"), PROCESSOR_UNKNOWN,
1056 CPU_AVX512CD_FLAGS, 0 },
1057 { STRING_COMMA_LEN (".avx512er"), PROCESSOR_UNKNOWN,
1058 CPU_AVX512ER_FLAGS, 0 },
1059 { STRING_COMMA_LEN (".avx512pf"), PROCESSOR_UNKNOWN,
1060 CPU_AVX512PF_FLAGS, 0 },
1061 { STRING_COMMA_LEN (".avx512dq"), PROCESSOR_UNKNOWN,
1062 CPU_AVX512DQ_FLAGS, 0 },
1063 { STRING_COMMA_LEN (".avx512bw"), PROCESSOR_UNKNOWN,
1064 CPU_AVX512BW_FLAGS, 0 },
1065 { STRING_COMMA_LEN (".avx512vl"), PROCESSOR_UNKNOWN,
1066 CPU_AVX512VL_FLAGS, 0 },
1067 { STRING_COMMA_LEN (".vmx"), PROCESSOR_UNKNOWN,
1068 CPU_VMX_FLAGS, 0 },
1069 { STRING_COMMA_LEN (".vmfunc"), PROCESSOR_UNKNOWN,
1070 CPU_VMFUNC_FLAGS, 0 },
1071 { STRING_COMMA_LEN (".smx"), PROCESSOR_UNKNOWN,
1072 CPU_SMX_FLAGS, 0 },
1073 { STRING_COMMA_LEN (".xsave"), PROCESSOR_UNKNOWN,
1074 CPU_XSAVE_FLAGS, 0 },
1075 { STRING_COMMA_LEN (".xsaveopt"), PROCESSOR_UNKNOWN,
1076 CPU_XSAVEOPT_FLAGS, 0 },
1077 { STRING_COMMA_LEN (".xsavec"), PROCESSOR_UNKNOWN,
1078 CPU_XSAVEC_FLAGS, 0 },
1079 { STRING_COMMA_LEN (".xsaves"), PROCESSOR_UNKNOWN,
1080 CPU_XSAVES_FLAGS, 0 },
1081 { STRING_COMMA_LEN (".aes"), PROCESSOR_UNKNOWN,
1082 CPU_AES_FLAGS, 0 },
1083 { STRING_COMMA_LEN (".pclmul"), PROCESSOR_UNKNOWN,
1084 CPU_PCLMUL_FLAGS, 0 },
1085 { STRING_COMMA_LEN (".clmul"), PROCESSOR_UNKNOWN,
1086 CPU_PCLMUL_FLAGS, 1 },
1087 { STRING_COMMA_LEN (".fsgsbase"), PROCESSOR_UNKNOWN,
1088 CPU_FSGSBASE_FLAGS, 0 },
1089 { STRING_COMMA_LEN (".rdrnd"), PROCESSOR_UNKNOWN,
1090 CPU_RDRND_FLAGS, 0 },
1091 { STRING_COMMA_LEN (".f16c"), PROCESSOR_UNKNOWN,
1092 CPU_F16C_FLAGS, 0 },
1093 { STRING_COMMA_LEN (".bmi2"), PROCESSOR_UNKNOWN,
1094 CPU_BMI2_FLAGS, 0 },
1095 { STRING_COMMA_LEN (".fma"), PROCESSOR_UNKNOWN,
1096 CPU_FMA_FLAGS, 0 },
1097 { STRING_COMMA_LEN (".fma4"), PROCESSOR_UNKNOWN,
1098 CPU_FMA4_FLAGS, 0 },
1099 { STRING_COMMA_LEN (".xop"), PROCESSOR_UNKNOWN,
1100 CPU_XOP_FLAGS, 0 },
1101 { STRING_COMMA_LEN (".lwp"), PROCESSOR_UNKNOWN,
1102 CPU_LWP_FLAGS, 0 },
1103 { STRING_COMMA_LEN (".movbe"), PROCESSOR_UNKNOWN,
1104 CPU_MOVBE_FLAGS, 0 },
1105 { STRING_COMMA_LEN (".cx16"), PROCESSOR_UNKNOWN,
1106 CPU_CX16_FLAGS, 0 },
1107 { STRING_COMMA_LEN (".ept"), PROCESSOR_UNKNOWN,
1108 CPU_EPT_FLAGS, 0 },
1109 { STRING_COMMA_LEN (".lzcnt"), PROCESSOR_UNKNOWN,
1110 CPU_LZCNT_FLAGS, 0 },
1111 { STRING_COMMA_LEN (".popcnt"), PROCESSOR_UNKNOWN,
1112 CPU_POPCNT_FLAGS, 0 },
1113 { STRING_COMMA_LEN (".hle"), PROCESSOR_UNKNOWN,
1114 CPU_HLE_FLAGS, 0 },
1115 { STRING_COMMA_LEN (".rtm"), PROCESSOR_UNKNOWN,
1116 CPU_RTM_FLAGS, 0 },
1117 { STRING_COMMA_LEN (".invpcid"), PROCESSOR_UNKNOWN,
1118 CPU_INVPCID_FLAGS, 0 },
1119 { STRING_COMMA_LEN (".clflush"), PROCESSOR_UNKNOWN,
1120 CPU_CLFLUSH_FLAGS, 0 },
1121 { STRING_COMMA_LEN (".nop"), PROCESSOR_UNKNOWN,
1122 CPU_NOP_FLAGS, 0 },
1123 { STRING_COMMA_LEN (".syscall"), PROCESSOR_UNKNOWN,
1124 CPU_SYSCALL_FLAGS, 0 },
1125 { STRING_COMMA_LEN (".rdtscp"), PROCESSOR_UNKNOWN,
1126 CPU_RDTSCP_FLAGS, 0 },
1127 { STRING_COMMA_LEN (".3dnow"), PROCESSOR_UNKNOWN,
1128 CPU_3DNOW_FLAGS, 0 },
1129 { STRING_COMMA_LEN (".3dnowa"), PROCESSOR_UNKNOWN,
1130 CPU_3DNOWA_FLAGS, 0 },
1131 { STRING_COMMA_LEN (".padlock"), PROCESSOR_UNKNOWN,
1132 CPU_PADLOCK_FLAGS, 0 },
1133 { STRING_COMMA_LEN (".pacifica"), PROCESSOR_UNKNOWN,
1134 CPU_SVME_FLAGS, 1 },
1135 { STRING_COMMA_LEN (".svme"), PROCESSOR_UNKNOWN,
1136 CPU_SVME_FLAGS, 0 },
1137 { STRING_COMMA_LEN (".sse4a"), PROCESSOR_UNKNOWN,
1138 CPU_SSE4A_FLAGS, 0 },
1139 { STRING_COMMA_LEN (".abm"), PROCESSOR_UNKNOWN,
1140 CPU_ABM_FLAGS, 0 },
1141 { STRING_COMMA_LEN (".bmi"), PROCESSOR_UNKNOWN,
1142 CPU_BMI_FLAGS, 0 },
1143 { STRING_COMMA_LEN (".tbm"), PROCESSOR_UNKNOWN,
1144 CPU_TBM_FLAGS, 0 },
1145 { STRING_COMMA_LEN (".adx"), PROCESSOR_UNKNOWN,
1146 CPU_ADX_FLAGS, 0 },
1147 { STRING_COMMA_LEN (".rdseed"), PROCESSOR_UNKNOWN,
1148 CPU_RDSEED_FLAGS, 0 },
1149 { STRING_COMMA_LEN (".prfchw"), PROCESSOR_UNKNOWN,
1150 CPU_PRFCHW_FLAGS, 0 },
1151 { STRING_COMMA_LEN (".smap"), PROCESSOR_UNKNOWN,
1152 CPU_SMAP_FLAGS, 0 },
1153 { STRING_COMMA_LEN (".mpx"), PROCESSOR_UNKNOWN,
1154 CPU_MPX_FLAGS, 0 },
1155 { STRING_COMMA_LEN (".sha"), PROCESSOR_UNKNOWN,
1156 CPU_SHA_FLAGS, 0 },
1157 { STRING_COMMA_LEN (".clflushopt"), PROCESSOR_UNKNOWN,
1158 CPU_CLFLUSHOPT_FLAGS, 0 },
1159 { STRING_COMMA_LEN (".prefetchwt1"), PROCESSOR_UNKNOWN,
1160 CPU_PREFETCHWT1_FLAGS, 0 },
1161 { STRING_COMMA_LEN (".se1"), PROCESSOR_UNKNOWN,
1162 CPU_SE1_FLAGS, 0 },
1163 { STRING_COMMA_LEN (".clwb"), PROCESSOR_UNKNOWN,
1164 CPU_CLWB_FLAGS, 0 },
1165 { STRING_COMMA_LEN (".avx512ifma"), PROCESSOR_UNKNOWN,
1166 CPU_AVX512IFMA_FLAGS, 0 },
1167 { STRING_COMMA_LEN (".avx512vbmi"), PROCESSOR_UNKNOWN,
1168 CPU_AVX512VBMI_FLAGS, 0 },
1169 { STRING_COMMA_LEN (".avx512_4fmaps"), PROCESSOR_UNKNOWN,
1170 CPU_AVX512_4FMAPS_FLAGS, 0 },
1171 { STRING_COMMA_LEN (".avx512_4vnniw"), PROCESSOR_UNKNOWN,
1172 CPU_AVX512_4VNNIW_FLAGS, 0 },
1173 { STRING_COMMA_LEN (".avx512_vpopcntdq"), PROCESSOR_UNKNOWN,
1174 CPU_AVX512_VPOPCNTDQ_FLAGS, 0 },
1175 { STRING_COMMA_LEN (".avx512_vbmi2"), PROCESSOR_UNKNOWN,
1176 CPU_AVX512_VBMI2_FLAGS, 0 },
1177 { STRING_COMMA_LEN (".avx512_vnni"), PROCESSOR_UNKNOWN,
1178 CPU_AVX512_VNNI_FLAGS, 0 },
1179 { STRING_COMMA_LEN (".avx512_bitalg"), PROCESSOR_UNKNOWN,
1180 CPU_AVX512_BITALG_FLAGS, 0 },
1181 { STRING_COMMA_LEN (".clzero"), PROCESSOR_UNKNOWN,
1182 CPU_CLZERO_FLAGS, 0 },
1183 { STRING_COMMA_LEN (".mwaitx"), PROCESSOR_UNKNOWN,
1184 CPU_MWAITX_FLAGS, 0 },
1185 { STRING_COMMA_LEN (".ospke"), PROCESSOR_UNKNOWN,
1186 CPU_OSPKE_FLAGS, 0 },
1187 { STRING_COMMA_LEN (".rdpid"), PROCESSOR_UNKNOWN,
1188 CPU_RDPID_FLAGS, 0 },
1189 { STRING_COMMA_LEN (".ptwrite"), PROCESSOR_UNKNOWN,
1190 CPU_PTWRITE_FLAGS, 0 },
1191 { STRING_COMMA_LEN (".ibt"), PROCESSOR_UNKNOWN,
1192 CPU_IBT_FLAGS, 0 },
1193 { STRING_COMMA_LEN (".shstk"), PROCESSOR_UNKNOWN,
1194 CPU_SHSTK_FLAGS, 0 },
1195 { STRING_COMMA_LEN (".gfni"), PROCESSOR_UNKNOWN,
1196 CPU_GFNI_FLAGS, 0 },
1197 { STRING_COMMA_LEN (".vaes"), PROCESSOR_UNKNOWN,
1198 CPU_VAES_FLAGS, 0 },
1199 { STRING_COMMA_LEN (".vpclmulqdq"), PROCESSOR_UNKNOWN,
1200 CPU_VPCLMULQDQ_FLAGS, 0 },
1201 { STRING_COMMA_LEN (".wbnoinvd"), PROCESSOR_UNKNOWN,
1202 CPU_WBNOINVD_FLAGS, 0 },
1203 { STRING_COMMA_LEN (".pconfig"), PROCESSOR_UNKNOWN,
1204 CPU_PCONFIG_FLAGS, 0 },
1205 { STRING_COMMA_LEN (".waitpkg"), PROCESSOR_UNKNOWN,
1206 CPU_WAITPKG_FLAGS, 0 },
1207 { STRING_COMMA_LEN (".cldemote"), PROCESSOR_UNKNOWN,
1208 CPU_CLDEMOTE_FLAGS, 0 },
1209 { STRING_COMMA_LEN (".amx_int8"), PROCESSOR_UNKNOWN,
1210 CPU_AMX_INT8_FLAGS, 0 },
1211 { STRING_COMMA_LEN (".amx_bf16"), PROCESSOR_UNKNOWN,
1212 CPU_AMX_BF16_FLAGS, 0 },
1213 { STRING_COMMA_LEN (".amx_tile"), PROCESSOR_UNKNOWN,
1214 CPU_AMX_TILE_FLAGS, 0 },
1215 { STRING_COMMA_LEN (".movdiri"), PROCESSOR_UNKNOWN,
1216 CPU_MOVDIRI_FLAGS, 0 },
1217 { STRING_COMMA_LEN (".movdir64b"), PROCESSOR_UNKNOWN,
1218 CPU_MOVDIR64B_FLAGS, 0 },
1219 { STRING_COMMA_LEN (".avx512_bf16"), PROCESSOR_UNKNOWN,
1220 CPU_AVX512_BF16_FLAGS, 0 },
1221 { STRING_COMMA_LEN (".avx512_vp2intersect"), PROCESSOR_UNKNOWN,
1222 CPU_AVX512_VP2INTERSECT_FLAGS, 0 },
1223 { STRING_COMMA_LEN (".tdx"), PROCESSOR_UNKNOWN,
1224 CPU_TDX_FLAGS, 0 },
1225 { STRING_COMMA_LEN (".enqcmd"), PROCESSOR_UNKNOWN,
1226 CPU_ENQCMD_FLAGS, 0 },
1227 { STRING_COMMA_LEN (".serialize"), PROCESSOR_UNKNOWN,
1228 CPU_SERIALIZE_FLAGS, 0 },
1229 { STRING_COMMA_LEN (".rdpru"), PROCESSOR_UNKNOWN,
1230 CPU_RDPRU_FLAGS, 0 },
1231 { STRING_COMMA_LEN (".mcommit"), PROCESSOR_UNKNOWN,
1232 CPU_MCOMMIT_FLAGS, 0 },
1233 { STRING_COMMA_LEN (".sev_es"), PROCESSOR_UNKNOWN,
1234 CPU_SEV_ES_FLAGS, 0 },
1235 { STRING_COMMA_LEN (".tsxldtrk"), PROCESSOR_UNKNOWN,
1236 CPU_TSXLDTRK_FLAGS, 0 },
1237 { STRING_COMMA_LEN (".kl"), PROCESSOR_UNKNOWN,
1238 CPU_KL_FLAGS, 0 },
1239 { STRING_COMMA_LEN (".widekl"), PROCESSOR_UNKNOWN,
1240 CPU_WIDEKL_FLAGS, 0 },
1241 };
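/* These entries back the ".arch" directive and the "-march=" option;
   e.g. ".arch corei7" selects a processor entry, while a dot-prefixed
   name such as ".arch .sse4.2" enables a single feature (illustrative
   usage). */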
1242
1243 static const noarch_entry cpu_noarch[] =
1244 {
1245 { STRING_COMMA_LEN ("no87"), CPU_ANY_X87_FLAGS },
1246 { STRING_COMMA_LEN ("no287"), CPU_ANY_287_FLAGS },
1247 { STRING_COMMA_LEN ("no387"), CPU_ANY_387_FLAGS },
1248 { STRING_COMMA_LEN ("no687"), CPU_ANY_687_FLAGS },
1249 { STRING_COMMA_LEN ("nocmov"), CPU_ANY_CMOV_FLAGS },
1250 { STRING_COMMA_LEN ("nofxsr"), CPU_ANY_FXSR_FLAGS },
1251 { STRING_COMMA_LEN ("nommx"), CPU_ANY_MMX_FLAGS },
1252 { STRING_COMMA_LEN ("nosse"), CPU_ANY_SSE_FLAGS },
1253 { STRING_COMMA_LEN ("nosse2"), CPU_ANY_SSE2_FLAGS },
1254 { STRING_COMMA_LEN ("nosse3"), CPU_ANY_SSE3_FLAGS },
1255 { STRING_COMMA_LEN ("nosse4a"), CPU_ANY_SSE4A_FLAGS },
1256 { STRING_COMMA_LEN ("nossse3"), CPU_ANY_SSSE3_FLAGS },
1257 { STRING_COMMA_LEN ("nosse4.1"), CPU_ANY_SSE4_1_FLAGS },
1258 { STRING_COMMA_LEN ("nosse4.2"), CPU_ANY_SSE4_2_FLAGS },
1259 { STRING_COMMA_LEN ("nosse4"), CPU_ANY_SSE4_1_FLAGS },
1260 { STRING_COMMA_LEN ("noavx"), CPU_ANY_AVX_FLAGS },
1261 { STRING_COMMA_LEN ("noavx2"), CPU_ANY_AVX2_FLAGS },
1262 { STRING_COMMA_LEN ("noavx512f"), CPU_ANY_AVX512F_FLAGS },
1263 { STRING_COMMA_LEN ("noavx512cd"), CPU_ANY_AVX512CD_FLAGS },
1264 { STRING_COMMA_LEN ("noavx512er"), CPU_ANY_AVX512ER_FLAGS },
1265 { STRING_COMMA_LEN ("noavx512pf"), CPU_ANY_AVX512PF_FLAGS },
1266 { STRING_COMMA_LEN ("noavx512dq"), CPU_ANY_AVX512DQ_FLAGS },
1267 { STRING_COMMA_LEN ("noavx512bw"), CPU_ANY_AVX512BW_FLAGS },
1268 { STRING_COMMA_LEN ("noavx512vl"), CPU_ANY_AVX512VL_FLAGS },
1269 { STRING_COMMA_LEN ("noavx512ifma"), CPU_ANY_AVX512IFMA_FLAGS },
1270 { STRING_COMMA_LEN ("noavx512vbmi"), CPU_ANY_AVX512VBMI_FLAGS },
1271 { STRING_COMMA_LEN ("noavx512_4fmaps"), CPU_ANY_AVX512_4FMAPS_FLAGS },
1272 { STRING_COMMA_LEN ("noavx512_4vnniw"), CPU_ANY_AVX512_4VNNIW_FLAGS },
1273 { STRING_COMMA_LEN ("noavx512_vpopcntdq"), CPU_ANY_AVX512_VPOPCNTDQ_FLAGS },
1274 { STRING_COMMA_LEN ("noavx512_vbmi2"), CPU_ANY_AVX512_VBMI2_FLAGS },
1275 { STRING_COMMA_LEN ("noavx512_vnni"), CPU_ANY_AVX512_VNNI_FLAGS },
1276 { STRING_COMMA_LEN ("noavx512_bitalg"), CPU_ANY_AVX512_BITALG_FLAGS },
1277 { STRING_COMMA_LEN ("noibt"), CPU_ANY_IBT_FLAGS },
1278 { STRING_COMMA_LEN ("noshstk"), CPU_ANY_SHSTK_FLAGS },
1279 { STRING_COMMA_LEN ("noamx_int8"), CPU_ANY_AMX_INT8_FLAGS },
1280 { STRING_COMMA_LEN ("noamx_bf16"), CPU_ANY_AMX_BF16_FLAGS },
1281 { STRING_COMMA_LEN ("noamx_tile"), CPU_ANY_AMX_TILE_FLAGS },
1282 { STRING_COMMA_LEN ("nomovdiri"), CPU_ANY_MOVDIRI_FLAGS },
1283 { STRING_COMMA_LEN ("nomovdir64b"), CPU_ANY_MOVDIR64B_FLAGS },
1284 { STRING_COMMA_LEN ("noavx512_bf16"), CPU_ANY_AVX512_BF16_FLAGS },
1285 { STRING_COMMA_LEN ("noavx512_vp2intersect"),
1286 CPU_ANY_AVX512_VP2INTERSECT_FLAGS },
1287 { STRING_COMMA_LEN ("notdx"), CPU_ANY_TDX_FLAGS },
1288 { STRING_COMMA_LEN ("noenqcmd"), CPU_ANY_ENQCMD_FLAGS },
1289 { STRING_COMMA_LEN ("noserialize"), CPU_ANY_SERIALIZE_FLAGS },
1290 { STRING_COMMA_LEN ("notsxldtrk"), CPU_ANY_TSXLDTRK_FLAGS },
1291 { STRING_COMMA_LEN ("nokl"), CPU_ANY_KL_FLAGS },
1292 { STRING_COMMA_LEN ("nowidekl"), CPU_ANY_WIDEKL_FLAGS },
1293 };
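/* Conversely, e.g. ".arch .noavx512f" (or "-march=...+noavx512f" on
   the command line) clears the corresponding feature flags
   (illustrative usage). */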
1294
1295 #ifdef I386COFF
1296 /* Like s_lcomm_internal in gas/read.c but the alignment string
1297 is allowed to be optional. */
1298
1299 static symbolS *
1300 pe_lcomm_internal (int needs_align, symbolS *symbolP, addressT size)
1301 {
1302 addressT align = 0;
1303
1304 SKIP_WHITESPACE ();
1305
1306 if (needs_align
1307 && *input_line_pointer == ',')
1308 {
1309 align = parse_align (needs_align - 1);
1310
1311 if (align == (addressT) -1)
1312 return NULL;
1313 }
1314 else
1315 {
1316 if (size >= 8)
1317 align = 3;
1318 else if (size >= 4)
1319 align = 2;
1320 else if (size >= 2)
1321 align = 1;
1322 else
1323 align = 0;
1324 }
1325
1326 bss_alloc (symbolP, size, align);
1327 return symbolP;
1328 }
1329
1330 static void
1331 pe_lcomm (int needs_align)
1332 {
1333 s_comm_internal (needs_align * 2, pe_lcomm_internal);
1334 }
1335 #endif
1336
1337 const pseudo_typeS md_pseudo_table[] =
1338 {
1339 #if !defined(OBJ_AOUT) && !defined(USE_ALIGN_PTWO)
1340 {"align", s_align_bytes, 0},
1341 #else
1342 {"align", s_align_ptwo, 0},
1343 #endif
1344 {"arch", set_cpu_arch, 0},
1345 #ifndef I386COFF
1346 {"bss", s_bss, 0},
1347 #else
1348 {"lcomm", pe_lcomm, 1},
1349 #endif
1350 {"ffloat", float_cons, 'f'},
1351 {"dfloat", float_cons, 'd'},
1352 {"tfloat", float_cons, 'x'},
1353 {"value", cons, 2},
1354 {"slong", signed_cons, 4},
1355 {"noopt", s_ignore, 0},
1356 {"optim", s_ignore, 0},
1357 {"code16gcc", set_16bit_gcc_code_flag, CODE_16BIT},
1358 {"code16", set_code_flag, CODE_16BIT},
1359 {"code32", set_code_flag, CODE_32BIT},
1360 #ifdef BFD64
1361 {"code64", set_code_flag, CODE_64BIT},
1362 #endif
1363 {"intel_syntax", set_intel_syntax, 1},
1364 {"att_syntax", set_intel_syntax, 0},
1365 {"intel_mnemonic", set_intel_mnemonic, 1},
1366 {"att_mnemonic", set_intel_mnemonic, 0},
1367 {"allow_index_reg", set_allow_index_reg, 1},
1368 {"disallow_index_reg", set_allow_index_reg, 0},
1369 {"sse_check", set_check, 0},
1370 {"operand_check", set_check, 1},
1371 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
1372 {"largecomm", handle_large_common, 0},
1373 #else
1374 {"file", dwarf2_directive_file, 0},
1375 {"loc", dwarf2_directive_loc, 0},
1376 {"loc_mark_labels", dwarf2_directive_loc_mark_labels, 0},
1377 #endif
1378 #ifdef TE_PE
1379 {"secrel32", pe_directive_secrel, 0},
1380 #endif
1381 {0, 0, 0}
1382 };
1383
1384 /* For interface with expression (). */
1385 extern char *input_line_pointer;
1386
1387 /* Hash table for instruction mnemonic lookup. */
1388 static htab_t op_hash;
1389
1390 /* Hash table for register lookup. */
1391 static htab_t reg_hash;
1392 \f
1393 /* Various efficient no-op patterns for aligning code labels.
1394 Note: Don't try to assemble the instructions in the comments.
1395 0L and 0w are not legal. */
1396 static const unsigned char f32_1[] =
1397 {0x90}; /* nop */
1398 static const unsigned char f32_2[] =
1399 {0x66,0x90}; /* xchg %ax,%ax */
1400 static const unsigned char f32_3[] =
1401 {0x8d,0x76,0x00}; /* leal 0(%esi),%esi */
1402 static const unsigned char f32_4[] =
1403 {0x8d,0x74,0x26,0x00}; /* leal 0(%esi,1),%esi */
1404 static const unsigned char f32_6[] =
1405 {0x8d,0xb6,0x00,0x00,0x00,0x00}; /* leal 0L(%esi),%esi */
1406 static const unsigned char f32_7[] =
1407 {0x8d,0xb4,0x26,0x00,0x00,0x00,0x00}; /* leal 0L(%esi,1),%esi */
1408 static const unsigned char f16_3[] =
1409 {0x8d,0x74,0x00}; /* lea 0(%si),%si */
1410 static const unsigned char f16_4[] =
1411 {0x8d,0xb4,0x00,0x00}; /* lea 0W(%si),%si */
1412 static const unsigned char jump_disp8[] =
1413 {0xeb}; /* jmp disp8 */
1414 static const unsigned char jump32_disp32[] =
1415 {0xe9}; /* jmp disp32 */
1416 static const unsigned char jump16_disp32[] =
1417 {0x66,0xe9}; /* jmp disp32 */
1418 /* 32-bit NOP patterns.  */
1419 static const unsigned char *const f32_patt[] = {
1420 f32_1, f32_2, f32_3, f32_4, NULL, f32_6, f32_7
1421 };
1422 /* 16-bit NOP patterns.  */
1423 static const unsigned char *const f16_patt[] = {
1424 f32_1, f32_2, f16_3, f16_4
1425 };
1426 /* nopl (%[re]ax) */
1427 static const unsigned char alt_3[] =
1428 {0x0f,0x1f,0x00};
1429 /* nopl 0(%[re]ax) */
1430 static const unsigned char alt_4[] =
1431 {0x0f,0x1f,0x40,0x00};
1432 /* nopl 0(%[re]ax,%[re]ax,1) */
1433 static const unsigned char alt_5[] =
1434 {0x0f,0x1f,0x44,0x00,0x00};
1435 /* nopw 0(%[re]ax,%[re]ax,1) */
1436 static const unsigned char alt_6[] =
1437 {0x66,0x0f,0x1f,0x44,0x00,0x00};
1438 /* nopl 0L(%[re]ax) */
1439 static const unsigned char alt_7[] =
1440 {0x0f,0x1f,0x80,0x00,0x00,0x00,0x00};
1441 /* nopl 0L(%[re]ax,%[re]ax,1) */
1442 static const unsigned char alt_8[] =
1443 {0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1444 /* nopw 0L(%[re]ax,%[re]ax,1) */
1445 static const unsigned char alt_9[] =
1446 {0x66,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1447 /* nopw %cs:0L(%[re]ax,%[re]ax,1) */
1448 static const unsigned char alt_10[] =
1449 {0x66,0x2e,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1450 /* data16 nopw %cs:0L(%eax,%eax,1) */
1451 static const unsigned char alt_11[] =
1452 {0x66,0x66,0x2e,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1453 /* 32-bit and 64-bit NOP patterns.  */
1454 static const unsigned char *const alt_patt[] = {
1455 f32_1, f32_2, alt_3, alt_4, alt_5, alt_6, alt_7, alt_8,
1456 alt_9, alt_10, alt_11
1457 };
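/* E.g. a request for 6 bytes of padding picks patt[5] (alt_6 here,
   "nopw 0(%[re]ax,%[re]ax,1)"); 14 bytes with an 11-byte limit are
   split by i386_output_nops into alt_11 followed by alt_3, since
   14 % 11 == 3 (illustrative). */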
1458
1459 /* Generate COUNT bytes of NOPs at WHERE from PATT, with
1460    MAX_SINGLE_NOP_SIZE the maximum size of a single NOP instruction.  */
1461
1462 static void
1463 i386_output_nops (char *where, const unsigned char *const *patt,
1464 int count, int max_single_nop_size)
1465
1466 {
1467 /* Place the longer NOP first. */
1468 int last;
1469 int offset;
1470 const unsigned char *nops;
1471
1472 if (max_single_nop_size < 1)
1473 {
1474 as_fatal (_("i386_output_nops called to generate nops of at most %d bytes!"),
1475 max_single_nop_size);
1476 return;
1477 }
1478
1479 nops = patt[max_single_nop_size - 1];
1480
1481   /* Use the smaller one if the requested one isn't available.  */
1482 if (nops == NULL)
1483 {
1484 max_single_nop_size--;
1485 nops = patt[max_single_nop_size - 1];
1486 }
1487
1488 last = count % max_single_nop_size;
1489
1490 count -= last;
1491 for (offset = 0; offset < count; offset += max_single_nop_size)
1492 memcpy (where + offset, nops, max_single_nop_size);
1493
1494 if (last)
1495 {
1496 nops = patt[last - 1];
1497 if (nops == NULL)
1498 {
1499 /* Use the smaller one plus one-byte NOP if the needed one
1500 isn't available. */
1501 last--;
1502 nops = patt[last - 1];
1503 memcpy (where + offset, nops, last);
1504 where[offset + last] = *patt[0];
1505 }
1506 else
1507 memcpy (where + offset, nops, last);
1508 }
1509 }
1510
1511 static INLINE int
1512 fits_in_imm7 (offsetT num)
1513 {
1514 return (num & 0x7f) == num;
1515 }
1516
1517 static INLINE int
1518 fits_in_imm31 (offsetT num)
1519 {
1520 return (num & 0x7fffffff) == num;
1521 }
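/* E.g. fits_in_imm7 (0x5a) and fits_in_imm31 (0x5a) are both true,
   fits_in_imm7 (128) is false, and negative values fail both tests
   because the masked value no longer equals NUM. */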
1522
1523 /* Generate COUNT bytes of NOPs at WHERE, with LIMIT the maximum size
1524    of a single NOP instruction.  */
1525
1526 void
1527 i386_generate_nops (fragS *fragP, char *where, offsetT count, int limit)
1528 {
1529 const unsigned char *const *patt = NULL;
1530 int max_single_nop_size;
1531 /* Maximum number of NOPs before switching to jump over NOPs. */
1532 int max_number_of_nops;
1533
1534 switch (fragP->fr_type)
1535 {
1536 case rs_fill_nop:
1537 case rs_align_code:
1538 break;
1539 case rs_machine_dependent:
1540 /* Allow NOP padding for jumps and calls. */
1541 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PADDING
1542 || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == FUSED_JCC_PADDING)
1543 break;
1544 /* Fall through. */
1545 default:
1546 return;
1547 }
1548
1549 /* We need to decide which NOP sequence to use for 32bit and
1550 64bit. When -mtune= is used:
1551
1552 1. For PROCESSOR_I386, PROCESSOR_I486, PROCESSOR_PENTIUM and
1553 PROCESSOR_GENERIC32, f32_patt will be used.
1554 2. For the rest, alt_patt will be used.
1555
1556 When -mtune= isn't used, alt_patt will be used if
1557 cpu_arch_isa_flags has CpuNop. Otherwise, f32_patt will
1558 be used.
1559
1560 When -march= or .arch is used, we can't use anything beyond
1561 cpu_arch_isa_flags. */
1562
1563 if (flag_code == CODE_16BIT)
1564 {
1565 patt = f16_patt;
1566 max_single_nop_size = sizeof (f16_patt) / sizeof (f16_patt[0]);
1567 /* Limit number of NOPs to 2 in 16-bit mode. */
1568 max_number_of_nops = 2;
1569 }
1570 else
1571 {
1572 if (fragP->tc_frag_data.isa == PROCESSOR_UNKNOWN)
1573 {
1574 /* PROCESSOR_UNKNOWN means that all ISAs may be used. */
1575 switch (cpu_arch_tune)
1576 {
1577 case PROCESSOR_UNKNOWN:
1578 /* We use cpu_arch_isa_flags to check if we SHOULD
1579 optimize with nops. */
1580 if (fragP->tc_frag_data.isa_flags.bitfield.cpunop)
1581 patt = alt_patt;
1582 else
1583 patt = f32_patt;
1584 break;
1585 case PROCESSOR_PENTIUM4:
1586 case PROCESSOR_NOCONA:
1587 case PROCESSOR_CORE:
1588 case PROCESSOR_CORE2:
1589 case PROCESSOR_COREI7:
1590 case PROCESSOR_L1OM:
1591 case PROCESSOR_K1OM:
1592 case PROCESSOR_GENERIC64:
1593 case PROCESSOR_K6:
1594 case PROCESSOR_ATHLON:
1595 case PROCESSOR_K8:
1596 case PROCESSOR_AMDFAM10:
1597 case PROCESSOR_BD:
1598 case PROCESSOR_ZNVER:
1599 case PROCESSOR_BT:
1600 patt = alt_patt;
1601 break;
1602 case PROCESSOR_I386:
1603 case PROCESSOR_I486:
1604 case PROCESSOR_PENTIUM:
1605 case PROCESSOR_PENTIUMPRO:
1606 case PROCESSOR_IAMCU:
1607 case PROCESSOR_GENERIC32:
1608 patt = f32_patt;
1609 break;
1610 }
1611 }
1612 else
1613 {
1614 switch (fragP->tc_frag_data.tune)
1615 {
1616 case PROCESSOR_UNKNOWN:
1617 /* When cpu_arch_isa is set, cpu_arch_tune shouldn't be
1618 PROCESSOR_UNKNOWN. */
1619 abort ();
1620 break;
1621
1622 case PROCESSOR_I386:
1623 case PROCESSOR_I486:
1624 case PROCESSOR_PENTIUM:
1625 case PROCESSOR_IAMCU:
1626 case PROCESSOR_K6:
1627 case PROCESSOR_ATHLON:
1628 case PROCESSOR_K8:
1629 case PROCESSOR_AMDFAM10:
1630 case PROCESSOR_BD:
1631 case PROCESSOR_ZNVER:
1632 case PROCESSOR_BT:
1633 case PROCESSOR_GENERIC32:
1634 /* We use cpu_arch_isa_flags to check if we CAN optimize
1635 with nops. */
1636 if (fragP->tc_frag_data.isa_flags.bitfield.cpunop)
1637 patt = alt_patt;
1638 else
1639 patt = f32_patt;
1640 break;
1641 case PROCESSOR_PENTIUMPRO:
1642 case PROCESSOR_PENTIUM4:
1643 case PROCESSOR_NOCONA:
1644 case PROCESSOR_CORE:
1645 case PROCESSOR_CORE2:
1646 case PROCESSOR_COREI7:
1647 case PROCESSOR_L1OM:
1648 case PROCESSOR_K1OM:
1649 if (fragP->tc_frag_data.isa_flags.bitfield.cpunop)
1650 patt = alt_patt;
1651 else
1652 patt = f32_patt;
1653 break;
1654 case PROCESSOR_GENERIC64:
1655 patt = alt_patt;
1656 break;
1657 }
1658 }
1659
1660 if (patt == f32_patt)
1661 {
1662 max_single_nop_size = sizeof (f32_patt) / sizeof (f32_patt[0]);
1663 /* Limit number of NOPs to 2 for older processors. */
1664 max_number_of_nops = 2;
1665 }
1666 else
1667 {
1668 max_single_nop_size = sizeof (alt_patt) / sizeof (alt_patt[0]);
1669 /* Limit number of NOPs to 7 for newer processors. */
1670 max_number_of_nops = 7;
1671 }
1672 }
1673
1674 if (limit == 0)
1675 limit = max_single_nop_size;
1676
1677 if (fragP->fr_type == rs_fill_nop)
1678 {
1679 /* Output NOPs for .nop directive. */
1680 if (limit > max_single_nop_size)
1681 {
1682 as_bad_where (fragP->fr_file, fragP->fr_line,
1683 _("invalid single nop size: %d "
1684 "(expect within [0, %d])"),
1685 limit, max_single_nop_size);
1686 return;
1687 }
1688 }
1689 else if (fragP->fr_type != rs_machine_dependent)
1690 fragP->fr_var = count;
1691
1692 if ((count / max_single_nop_size) > max_number_of_nops)
1693 {
1694 /* Generate jump over NOPs. */
1695 offsetT disp = count - 2;
1696 if (fits_in_imm7 (disp))
1697 {
1698 /* Use "jmp disp8" if possible. */
1699 count = disp;
1700 where[0] = jump_disp8[0];
1701 where[1] = count;
1702 where += 2;
1703 }
1704 else
1705 {
1706 unsigned int size_of_jump;
1707
1708 if (flag_code == CODE_16BIT)
1709 {
1710 where[0] = jump16_disp32[0];
1711 where[1] = jump16_disp32[1];
1712 size_of_jump = 2;
1713 }
1714 else
1715 {
1716 where[0] = jump32_disp32[0];
1717 size_of_jump = 1;
1718 }
1719
1720 count -= size_of_jump + 4;
1721 if (!fits_in_imm31 (count))
1722 {
1723 as_bad_where (fragP->fr_file, fragP->fr_line,
1724 _("jump over nop padding out of range"));
1725 return;
1726 }
1727
1728 md_number_to_chars (where + size_of_jump, count, 4);
1729 where += size_of_jump + 4;
1730 }
1731 }
1732
1733 /* Generate multiple NOPs. */
1734 i386_output_nops (where, patt, count, limit);
1735 }
1736
1737 static INLINE int
1738 operand_type_all_zero (const union i386_operand_type *x)
1739 {
1740 switch (ARRAY_SIZE (x->array))
1741 {
1742 case 3:
1743 if (x->array[2])
1744 return 0;
1745 /* Fall through. */
1746 case 2:
1747 if (x->array[1])
1748 return 0;
1749 /* Fall through. */
1750 case 1:
1751 return !x->array[0];
1752 default:
1753 abort ();
1754 }
1755 }
1756
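/* Set every array element of operand type X to V, then reset the
   class and instance fields to ClassNone and InstanceNone. */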
1757 static INLINE void
1758 operand_type_set (union i386_operand_type *x, unsigned int v)
1759 {
1760 switch (ARRAY_SIZE (x->array))
1761 {
1762 case 3:
1763 x->array[2] = v;
1764 /* Fall through. */
1765 case 2:
1766 x->array[1] = v;
1767 /* Fall through. */
1768 case 1:
1769 x->array[0] = v;
1771 break;
1772 default:
1773 abort ();
1774 }
1775
1776 x->bitfield.class = ClassNone;
1777 x->bitfield.instance = InstanceNone;
1778 }
1779
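/* Return 1 if operand types X and Y are identical. */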
1780 static INLINE int
1781 operand_type_equal (const union i386_operand_type *x,
1782 const union i386_operand_type *y)
1783 {
1784 switch (ARRAY_SIZE (x->array))
1785 {
1786 case 3:
1787 if (x->array[2] != y->array[2])
1788 return 0;
1789 /* Fall through. */
1790 case 2:
1791 if (x->array[1] != y->array[1])
1792 return 0;
1793 /* Fall through. */
1794 case 1:
1795 return x->array[0] == y->array[0];
1796 break;
1797 default:
1798 abort ();
1799 }
1800 }
1801
1802 static INLINE int
1803 cpu_flags_all_zero (const union i386_cpu_flags *x)
1804 {
1805 switch (ARRAY_SIZE (x->array))
1806 {
1807 case 4:
1808 if (x->array[3])
1809 return 0;
1810 /* Fall through. */
1811 case 3:
1812 if (x->array[2])
1813 return 0;
1814 /* Fall through. */
1815 case 2:
1816 if (x->array[1])
1817 return 0;
1818 /* Fall through. */
1819 case 1:
1820 return !x->array[0];
1821 default:
1822 abort ();
1823 }
1824 }
1825
1826 static INLINE int
1827 cpu_flags_equal (const union i386_cpu_flags *x,
1828 const union i386_cpu_flags *y)
1829 {
1830 switch (ARRAY_SIZE (x->array))
1831 {
1832 case 4:
1833 if (x->array[3] != y->array[3])
1834 return 0;
1835 /* Fall through. */
1836 case 3:
1837 if (x->array[2] != y->array[2])
1838 return 0;
1839 /* Fall through. */
1840 case 2:
1841 if (x->array[1] != y->array[1])
1842 return 0;
1843 /* Fall through. */
1844 case 1:
1845 return x->array[0] == y->array[0];
1846 break;
1847 default:
1848 abort ();
1849 }
1850 }
1851
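/* Return 1 if the CPU flags F are compatible with the code size in
   effect: CpuNo64 templates are unusable in 64-bit mode and Cpu64
   templates are unusable outside of it. */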
1852 static INLINE int
1853 cpu_flags_check_cpu64 (i386_cpu_flags f)
1854 {
1855 return !((flag_code == CODE_64BIT && f.bitfield.cpuno64)
1856 || (flag_code != CODE_64BIT && f.bitfield.cpu64));
1857 }
1858
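/* Return the bitwise AND of CPU flag sets X and Y. */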
1859 static INLINE i386_cpu_flags
1860 cpu_flags_and (i386_cpu_flags x, i386_cpu_flags y)
1861 {
1862 switch (ARRAY_SIZE (x.array))
1863 {
1864 case 4:
1865 x.array [3] &= y.array [3];
1866 /* Fall through. */
1867 case 3:
1868 x.array [2] &= y.array [2];
1869 /* Fall through. */
1870 case 2:
1871 x.array [1] &= y.array [1];
1872 /* Fall through. */
1873 case 1:
1874 x.array [0] &= y.array [0];
1875 break;
1876 default:
1877 abort ();
1878 }
1879 return x;
1880 }
1881
1882 static INLINE i386_cpu_flags
1883 cpu_flags_or (i386_cpu_flags x, i386_cpu_flags y)
1884 {
1885 switch (ARRAY_SIZE (x.array))
1886 {
1887 case 4:
1888 x.array [3] |= y.array [3];
1889 /* Fall through. */
1890 case 3:
1891 x.array [2] |= y.array [2];
1892 /* Fall through. */
1893 case 2:
1894 x.array [1] |= y.array [1];
1895 /* Fall through. */
1896 case 1:
1897 x.array [0] |= y.array [0];
1898 break;
1899 default:
1900 abort ();
1901 }
1902 return x;
1903 }
1904
1905 static INLINE i386_cpu_flags
1906 cpu_flags_and_not (i386_cpu_flags x, i386_cpu_flags y)
1907 {
1908 switch (ARRAY_SIZE (x.array))
1909 {
1910 case 4:
1911 x.array [3] &= ~y.array [3];
1912 /* Fall through. */
1913 case 3:
1914 x.array [2] &= ~y.array [2];
1915 /* Fall through. */
1916 case 2:
1917 x.array [1] &= ~y.array [1];
1918 /* Fall through. */
1919 case 1:
1920 x.array [0] &= ~y.array [0];
1921 break;
1922 default:
1923 abort ();
1924 }
1925 return x;
1926 }
1927
1928 static const i386_cpu_flags avx512 = CPU_ANY_AVX512F_FLAGS;
1929
1930 #define CPU_FLAGS_ARCH_MATCH 0x1
1931 #define CPU_FLAGS_64BIT_MATCH 0x2
1932
1933 #define CPU_FLAGS_PERFECT_MATCH \
1934 (CPU_FLAGS_ARCH_MATCH | CPU_FLAGS_64BIT_MATCH)
1935
1936 /* Return CPU flags match bits. */
1937
1938 static int
1939 cpu_flags_match (const insn_template *t)
1940 {
1941 i386_cpu_flags x = t->cpu_flags;
1942 int match = cpu_flags_check_cpu64 (x) ? CPU_FLAGS_64BIT_MATCH : 0;
1943
1944 x.bitfield.cpu64 = 0;
1945 x.bitfield.cpuno64 = 0;
1946
1947 if (cpu_flags_all_zero (&x))
1948 {
1949 /* This instruction is available on all archs. */
1950 match |= CPU_FLAGS_ARCH_MATCH;
1951 }
1952 else
1953 {
1954 /* This instruction is available only on some archs. */
1955 i386_cpu_flags cpu = cpu_arch_flags;
1956
1957 /* AVX512VL is not a standalone feature; match it and then strip it. */
1958 if (x.bitfield.cpuavx512vl && !cpu.bitfield.cpuavx512vl)
1959 return match;
1960 x.bitfield.cpuavx512vl = 0;
1961
1962 cpu = cpu_flags_and (x, cpu);
1963 if (!cpu_flags_all_zero (&cpu))
1964 {
1965 if (x.bitfield.cpuavx)
1966 {
1967 /* We need to check a few extra flags with AVX. */
1968 if (cpu.bitfield.cpuavx
1969 && (!t->opcode_modifier.sse2avx
1970 || (sse2avx && !i.prefix[DATA_PREFIX]))
1971 && (!x.bitfield.cpuaes || cpu.bitfield.cpuaes)
1972 && (!x.bitfield.cpugfni || cpu.bitfield.cpugfni)
1973 && (!x.bitfield.cpupclmul || cpu.bitfield.cpupclmul))
1974 match |= CPU_FLAGS_ARCH_MATCH;
1975 }
1976 else if (x.bitfield.cpuavx512f)
1977 {
1978 /* We need to check a few extra flags with AVX512F. */
1979 if (cpu.bitfield.cpuavx512f
1980 && (!x.bitfield.cpugfni || cpu.bitfield.cpugfni)
1981 && (!x.bitfield.cpuvaes || cpu.bitfield.cpuvaes)
1982 && (!x.bitfield.cpuvpclmulqdq || cpu.bitfield.cpuvpclmulqdq))
1983 match |= CPU_FLAGS_ARCH_MATCH;
1984 }
1985 else
1986 match |= CPU_FLAGS_ARCH_MATCH;
1987 }
1988 }
1989 return match;
1990 }
1991
1992 static INLINE i386_operand_type
1993 operand_type_and (i386_operand_type x, i386_operand_type y)
1994 {
1995 if (x.bitfield.class != y.bitfield.class)
1996 x.bitfield.class = ClassNone;
1997 if (x.bitfield.instance != y.bitfield.instance)
1998 x.bitfield.instance = InstanceNone;
1999
2000 switch (ARRAY_SIZE (x.array))
2001 {
2002 case 3:
2003 x.array [2] &= y.array [2];
2004 /* Fall through. */
2005 case 2:
2006 x.array [1] &= y.array [1];
2007 /* Fall through. */
2008 case 1:
2009 x.array [0] &= y.array [0];
2010 break;
2011 default:
2012 abort ();
2013 }
2014 return x;
2015 }
2016
2017 static INLINE i386_operand_type
2018 operand_type_and_not (i386_operand_type x, i386_operand_type y)
2019 {
2020 gas_assert (y.bitfield.class == ClassNone);
2021 gas_assert (y.bitfield.instance == InstanceNone);
2022
2023 switch (ARRAY_SIZE (x.array))
2024 {
2025 case 3:
2026 x.array [2] &= ~y.array [2];
2027 /* Fall through. */
2028 case 2:
2029 x.array [1] &= ~y.array [1];
2030 /* Fall through. */
2031 case 1:
2032 x.array [0] &= ~y.array [0];
2033 break;
2034 default:
2035 abort ();
2036 }
2037 return x;
2038 }
2039
2040 static INLINE i386_operand_type
2041 operand_type_or (i386_operand_type x, i386_operand_type y)
2042 {
2043 gas_assert (x.bitfield.class == ClassNone ||
2044 y.bitfield.class == ClassNone ||
2045 x.bitfield.class == y.bitfield.class);
2046 gas_assert (x.bitfield.instance == InstanceNone ||
2047 y.bitfield.instance == InstanceNone ||
2048 x.bitfield.instance == y.bitfield.instance);
2049
2050 switch (ARRAY_SIZE (x.array))
2051 {
2052 case 3:
2053 x.array [2] |= y.array [2];
2054 /* Fall through. */
2055 case 2:
2056 x.array [1] |= y.array [1];
2057 /* Fall through. */
2058 case 1:
2059 x.array [0] |= y.array [0];
2060 break;
2061 default:
2062 abort ();
2063 }
2064 return x;
2065 }
2066
2067 static INLINE i386_operand_type
2068 operand_type_xor (i386_operand_type x, i386_operand_type y)
2069 {
2070 gas_assert (y.bitfield.class == ClassNone);
2071 gas_assert (y.bitfield.instance == InstanceNone);
2072
2073 switch (ARRAY_SIZE (x.array))
2074 {
2075 case 3:
2076 x.array [2] ^= y.array [2];
2077 /* Fall through. */
2078 case 2:
2079 x.array [1] ^= y.array [1];
2080 /* Fall through. */
2081 case 1:
2082 x.array [0] ^= y.array [0];
2083 break;
2084 default:
2085 abort ();
2086 }
2087 return x;
2088 }
2089
2090 static const i386_operand_type disp16 = OPERAND_TYPE_DISP16;
2091 static const i386_operand_type disp32 = OPERAND_TYPE_DISP32;
2092 static const i386_operand_type disp32s = OPERAND_TYPE_DISP32S;
2093 static const i386_operand_type disp16_32 = OPERAND_TYPE_DISP16_32;
2094 static const i386_operand_type anydisp = OPERAND_TYPE_ANYDISP;
2095 static const i386_operand_type anyimm = OPERAND_TYPE_ANYIMM;
2096 static const i386_operand_type regxmm = OPERAND_TYPE_REGXMM;
2097 static const i386_operand_type regmask = OPERAND_TYPE_REGMASK;
2098 static const i386_operand_type imm8 = OPERAND_TYPE_IMM8;
2099 static const i386_operand_type imm8s = OPERAND_TYPE_IMM8S;
2100 static const i386_operand_type imm16 = OPERAND_TYPE_IMM16;
2101 static const i386_operand_type imm32 = OPERAND_TYPE_IMM32;
2102 static const i386_operand_type imm32s = OPERAND_TYPE_IMM32S;
2103 static const i386_operand_type imm64 = OPERAND_TYPE_IMM64;
2104 static const i386_operand_type imm16_32 = OPERAND_TYPE_IMM16_32;
2105 static const i386_operand_type imm16_32s = OPERAND_TYPE_IMM16_32S;
2106 static const i386_operand_type imm16_32_32s = OPERAND_TYPE_IMM16_32_32S;
2107
2108 enum operand_type
2109 {
2110 reg,
2111 imm,
2112 disp,
2113 anymem
2114 };
2115
2116 static INLINE int
2117 operand_type_check (i386_operand_type t, enum operand_type c)
2118 {
2119 switch (c)
2120 {
2121 case reg:
2122 return t.bitfield.class == Reg;
2123
2124 case imm:
2125 return (t.bitfield.imm8
2126 || t.bitfield.imm8s
2127 || t.bitfield.imm16
2128 || t.bitfield.imm32
2129 || t.bitfield.imm32s
2130 || t.bitfield.imm64);
2131
2132 case disp:
2133 return (t.bitfield.disp8
2134 || t.bitfield.disp16
2135 || t.bitfield.disp32
2136 || t.bitfield.disp32s
2137 || t.bitfield.disp64);
2138
2139 case anymem:
2140 return (t.bitfield.disp8
2141 || t.bitfield.disp16
2142 || t.bitfield.disp32
2143 || t.bitfield.disp32s
2144 || t.bitfield.disp64
2145 || t.bitfield.baseindex);
2146
2147 default:
2148 abort ();
2149 }
2150
2151 return 0;
2152 }
2153
2154 /* Return 1 if there is no conflict in 8bit/16bit/32bit/64bit/80bit size
2155 between operand GIVEN and operand WANTED for instruction template T. */
2156
2157 static INLINE int
2158 match_operand_size (const insn_template *t, unsigned int wanted,
2159 unsigned int given)
2160 {
2161 return !((i.types[given].bitfield.byte
2162 && !t->operand_types[wanted].bitfield.byte)
2163 || (i.types[given].bitfield.word
2164 && !t->operand_types[wanted].bitfield.word)
2165 || (i.types[given].bitfield.dword
2166 && !t->operand_types[wanted].bitfield.dword)
2167 || (i.types[given].bitfield.qword
2168 && !t->operand_types[wanted].bitfield.qword)
2169 || (i.types[given].bitfield.tbyte
2170 && !t->operand_types[wanted].bitfield.tbyte));
2171 }
2172
2173 /* Return 1 if there is no conflict in SIMD register between operand
2174 GIVEN and operand WANTED for instruction template T. */
2175
2176 static INLINE int
2177 match_simd_size (const insn_template *t, unsigned int wanted,
2178 unsigned int given)
2179 {
2180 return !((i.types[given].bitfield.xmmword
2181 && !t->operand_types[wanted].bitfield.xmmword)
2182 || (i.types[given].bitfield.ymmword
2183 && !t->operand_types[wanted].bitfield.ymmword)
2184 || (i.types[given].bitfield.zmmword
2185 && !t->operand_types[wanted].bitfield.zmmword)
2186 || (i.types[given].bitfield.tmmword
2187 && !t->operand_types[wanted].bitfield.tmmword));
2188 }
2189
2190 /* Return 1 if there is no conflict in any size between operand GIVEN
2191 and operand WANTED for instruction template T. */
2192
2193 static INLINE int
2194 match_mem_size (const insn_template *t, unsigned int wanted,
2195 unsigned int given)
2196 {
2197 return (match_operand_size (t, wanted, given)
2198 && !((i.types[given].bitfield.unspecified
2199 && !i.broadcast
2200 && !t->operand_types[wanted].bitfield.unspecified)
2201 || (i.types[given].bitfield.fword
2202 && !t->operand_types[wanted].bitfield.fword)
2203 /* For scalar opcode templates to allow register and memory
2204 operands at the same time, some special casing is needed
2205 here. Also for v{,p}broadcast*, {,v}pmov{s,z}*, and
2206 down-conversion vpmov*. */
2207 || ((t->operand_types[wanted].bitfield.class == RegSIMD
2208 && t->operand_types[wanted].bitfield.byte
2209 + t->operand_types[wanted].bitfield.word
2210 + t->operand_types[wanted].bitfield.dword
2211 + t->operand_types[wanted].bitfield.qword
2212 > !!t->opcode_modifier.broadcast)
2213 ? (i.types[given].bitfield.xmmword
2214 || i.types[given].bitfield.ymmword
2215 || i.types[given].bitfield.zmmword)
2216 : !match_simd_size (t, wanted, given))));
2217 }
2218
2219 /* Return value has MATCH_STRAIGHT set if there is no size conflict on any
2220 operands for instruction template T, and it has MATCH_REVERSE set if there
2221 is no size conflict on any operands for the template with operands reversed
2222 (and the template allows for reversing in the first place). */
2223
2224 #define MATCH_STRAIGHT 1
2225 #define MATCH_REVERSE 2
2226
2227 static INLINE unsigned int
2228 operand_size_match (const insn_template *t)
2229 {
2230 unsigned int j, match = MATCH_STRAIGHT;
2231
2232 /* Don't check non-absolute jump instructions. */
2233 if (t->opcode_modifier.jump
2234 && t->opcode_modifier.jump != JUMP_ABSOLUTE)
2235 return match;
2236
2237 /* Check memory and accumulator operand size. */
2238 for (j = 0; j < i.operands; j++)
2239 {
2240 if (i.types[j].bitfield.class != Reg
2241 && i.types[j].bitfield.class != RegSIMD
2242 && t->opcode_modifier.anysize)
2243 continue;
2244
2245 if (t->operand_types[j].bitfield.class == Reg
2246 && !match_operand_size (t, j, j))
2247 {
2248 match = 0;
2249 break;
2250 }
2251
2252 if (t->operand_types[j].bitfield.class == RegSIMD
2253 && !match_simd_size (t, j, j))
2254 {
2255 match = 0;
2256 break;
2257 }
2258
2259 if (t->operand_types[j].bitfield.instance == Accum
2260 && (!match_operand_size (t, j, j) || !match_simd_size (t, j, j)))
2261 {
2262 match = 0;
2263 break;
2264 }
2265
2266 if ((i.flags[j] & Operand_Mem) && !match_mem_size (t, j, j))
2267 {
2268 match = 0;
2269 break;
2270 }
2271 }
2272
2273 if (!t->opcode_modifier.d)
2274 {
2275 mismatch:
2276 if (!match)
2277 i.error = operand_size_mismatch;
2278 return match;
2279 }
2280
2281 /* Check reverse. */
2282 gas_assert (i.operands >= 2 && i.operands <= 3);
2283
2284 for (j = 0; j < i.operands; j++)
2285 {
2286 unsigned int given = i.operands - j - 1;
2287
2288 if (t->operand_types[j].bitfield.class == Reg
2289 && !match_operand_size (t, j, given))
2290 goto mismatch;
2291
2292 if (t->operand_types[j].bitfield.class == RegSIMD
2293 && !match_simd_size (t, j, given))
2294 goto mismatch;
2295
2296 if (t->operand_types[j].bitfield.instance == Accum
2297 && (!match_operand_size (t, j, given)
2298 || !match_simd_size (t, j, given)))
2299 goto mismatch;
2300
2301 if ((i.flags[given] & Operand_Mem) && !match_mem_size (t, j, given))
2302 goto mismatch;
2303 }
2304
2305 return match | MATCH_REVERSE;
2306 }
2307
2308 static INLINE int
2309 operand_type_match (i386_operand_type overlap,
2310 i386_operand_type given)
2311 {
2312 i386_operand_type temp = overlap;
2313
2314 temp.bitfield.unspecified = 0;
2315 temp.bitfield.byte = 0;
2316 temp.bitfield.word = 0;
2317 temp.bitfield.dword = 0;
2318 temp.bitfield.fword = 0;
2319 temp.bitfield.qword = 0;
2320 temp.bitfield.tbyte = 0;
2321 temp.bitfield.xmmword = 0;
2322 temp.bitfield.ymmword = 0;
2323 temp.bitfield.zmmword = 0;
2324 temp.bitfield.tmmword = 0;
2325 if (operand_type_all_zero (&temp))
2326 goto mismatch;
2327
2328 if (given.bitfield.baseindex == overlap.bitfield.baseindex)
2329 return 1;
2330
2331 mismatch:
2332 i.error = operand_type_mismatch;
2333 return 0;
2334 }
2335
2336 /* If the given types g0 and g1 are registers, they must be of the same
2337 type unless the register overlap of the expected operand types is null.
2338 Some Intel syntax memory operand size checking also happens here. */
2339
2340 static INLINE int
2341 operand_type_register_match (i386_operand_type g0,
2342 i386_operand_type t0,
2343 i386_operand_type g1,
2344 i386_operand_type t1)
2345 {
2346 if (g0.bitfield.class != Reg
2347 && g0.bitfield.class != RegSIMD
2348 && (!operand_type_check (g0, anymem)
2349 || g0.bitfield.unspecified
2350 || (t0.bitfield.class != Reg
2351 && t0.bitfield.class != RegSIMD)))
2352 return 1;
2353
2354 if (g1.bitfield.class != Reg
2355 && g1.bitfield.class != RegSIMD
2356 && (!operand_type_check (g1, anymem)
2357 || g1.bitfield.unspecified
2358 || (t1.bitfield.class != Reg
2359 && t1.bitfield.class != RegSIMD)))
2360 return 1;
2361
2362 if (g0.bitfield.byte == g1.bitfield.byte
2363 && g0.bitfield.word == g1.bitfield.word
2364 && g0.bitfield.dword == g1.bitfield.dword
2365 && g0.bitfield.qword == g1.bitfield.qword
2366 && g0.bitfield.xmmword == g1.bitfield.xmmword
2367 && g0.bitfield.ymmword == g1.bitfield.ymmword
2368 && g0.bitfield.zmmword == g1.bitfield.zmmword)
2369 return 1;
2370
2371 if (!(t0.bitfield.byte & t1.bitfield.byte)
2372 && !(t0.bitfield.word & t1.bitfield.word)
2373 && !(t0.bitfield.dword & t1.bitfield.dword)
2374 && !(t0.bitfield.qword & t1.bitfield.qword)
2375 && !(t0.bitfield.xmmword & t1.bitfield.xmmword)
2376 && !(t0.bitfield.ymmword & t1.bitfield.ymmword)
2377 && !(t0.bitfield.zmmword & t1.bitfield.zmmword))
2378 return 1;
2379
2380 i.error = register_type_mismatch;
2381
2382 return 0;
2383 }
2384
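/* Return the encoding number of register R: reg_num, plus 8 for a
   RegRex (REX-extended) register and 16 for a RegVRex (EVEX-extended)
   one. */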
2385 static INLINE unsigned int
2386 register_number (const reg_entry *r)
2387 {
2388 unsigned int nr = r->reg_num;
2389
2390 if (r->reg_flags & RegRex)
2391 nr += 8;
2392
2393 if (r->reg_flags & RegVRex)
2394 nr += 16;
2395
2396 return nr;
2397 }
2398
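/* Return the ModRM.mod value implied by displacement type T: 1 for
   disp8, 2 for disp16/disp32, 0 when T specifies no displacement. */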
2399 static INLINE unsigned int
2400 mode_from_disp_size (i386_operand_type t)
2401 {
2402 if (t.bitfield.disp8)
2403 return 1;
2404 else if (t.bitfield.disp16
2405 || t.bitfield.disp32
2406 || t.bitfield.disp32s)
2407 return 2;
2408 else
2409 return 0;
2410 }
2411
2412 static INLINE int
2413 fits_in_signed_byte (addressT num)
2414 {
2415 return num + 0x80 <= 0xff;
2416 }
2417
2418 static INLINE int
2419 fits_in_unsigned_byte (addressT num)
2420 {
2421 return num <= 0xff;
2422 }
2423
2424 static INLINE int
2425 fits_in_unsigned_word (addressT num)
2426 {
2427 return num <= 0xffff;
2428 }
2429
2430 static INLINE int
2431 fits_in_signed_word (addressT num)
2432 {
2433 return num + 0x8000 <= 0xffff;
2434 }
2435
2436 static INLINE int
2437 fits_in_signed_long (addressT num ATTRIBUTE_UNUSED)
2438 {
2439 #ifndef BFD64
2440 return 1;
2441 #else
2442 return num + 0x80000000 <= 0xffffffff;
2443 #endif
2444 } /* fits_in_signed_long() */
2445
2446 static INLINE int
2447 fits_in_unsigned_long (addressT num ATTRIBUTE_UNUSED)
2448 {
2449 #ifndef BFD64
2450 return 1;
2451 #else
2452 return num <= 0xffffffff;
2453 #endif
2454 } /* fits_in_unsigned_long() */
2455
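/* Return 1 if NUM is usable as an EVEX compressed disp8: it must be a
   multiple of the chunk size implied by i.memshift, and the shifted
   value must fit in a signed byte. E.g. with i.memshift == 4, 0x40
   fits (encoded as 4), while 0x44 is misaligned and 0x1000 is out of
   range. */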
2456 static INLINE int
2457 fits_in_disp8 (offsetT num)
2458 {
2459 int shift = i.memshift;
2460 unsigned int mask;
2461
2462 if (shift == -1)
2463 abort ();
2464
2465 mask = (1 << shift) - 1;
2466
2467 /* Return 0 if NUM isn't properly aligned. */
2468 if ((num & mask))
2469 return 0;
2470
2471 /* Check if NUM will fit in 8bit after shift. */
2472 return fits_in_signed_byte (num >> shift);
2473 }
2474
2475 static INLINE int
2476 fits_in_imm4 (offsetT num)
2477 {
2478 return (num & 0xf) == num;
2479 }
2480
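/* Return the set of immediate operand types able to represent NUM;
   imm64 is always included. E.g. 0x7f additionally allows imm8,
   imm8s, imm16, imm32 and imm32s, while 0x80 allows the same set
   minus imm8s. */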
2481 static i386_operand_type
2482 smallest_imm_type (offsetT num)
2483 {
2484 i386_operand_type t;
2485
2486 operand_type_set (&t, 0);
2487 t.bitfield.imm64 = 1;
2488
2489 if (cpu_arch_tune != PROCESSOR_I486 && num == 1)
2490 {
2491 /* This code is disabled on the 486 because all the Imm1 forms
2492 in the opcode table are slower on the i486. They're the
2493 versions with the implicitly specified single-position
2494 displacement, which has another syntax if you really want to
2495 use that form. */
2496 t.bitfield.imm1 = 1;
2497 t.bitfield.imm8 = 1;
2498 t.bitfield.imm8s = 1;
2499 t.bitfield.imm16 = 1;
2500 t.bitfield.imm32 = 1;
2501 t.bitfield.imm32s = 1;
2502 }
2503 else if (fits_in_signed_byte (num))
2504 {
2505 t.bitfield.imm8 = 1;
2506 t.bitfield.imm8s = 1;
2507 t.bitfield.imm16 = 1;
2508 t.bitfield.imm32 = 1;
2509 t.bitfield.imm32s = 1;
2510 }
2511 else if (fits_in_unsigned_byte (num))
2512 {
2513 t.bitfield.imm8 = 1;
2514 t.bitfield.imm16 = 1;
2515 t.bitfield.imm32 = 1;
2516 t.bitfield.imm32s = 1;
2517 }
2518 else if (fits_in_signed_word (num) || fits_in_unsigned_word (num))
2519 {
2520 t.bitfield.imm16 = 1;
2521 t.bitfield.imm32 = 1;
2522 t.bitfield.imm32s = 1;
2523 }
2524 else if (fits_in_signed_long (num))
2525 {
2526 t.bitfield.imm32 = 1;
2527 t.bitfield.imm32s = 1;
2528 }
2529 else if (fits_in_unsigned_long (num))
2530 t.bitfield.imm32 = 1;
2531
2532 return t;
2533 }
2534
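/* Truncate VAL to SIZE bytes, warning when significant bits get
   discarded; e.g. offset_in_range (0x12345, 2) warns and returns
   0x2345. */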
2535 static offsetT
2536 offset_in_range (offsetT val, int size)
2537 {
2538 addressT mask;
2539
2540 switch (size)
2541 {
2542 case 1: mask = ((addressT) 1 << 8) - 1; break;
2543 case 2: mask = ((addressT) 1 << 16) - 1; break;
2544 case 4: mask = ((addressT) 2 << 31) - 1; break;
2545 #ifdef BFD64
2546 case 8: mask = ((addressT) 2 << 63) - 1; break;
2547 #endif
2548 default: abort ();
2549 }
2550
2551 if ((val & ~mask) != 0 && (val & ~mask) != ~mask)
2552 {
2553 char buf1[40], buf2[40];
2554
2555 sprint_value (buf1, val);
2556 sprint_value (buf2, val & mask);
2557 as_warn (_("%s shortened to %s"), buf1, buf2);
2558 }
2559 return val & mask;
2560 }
2561
2562 enum PREFIX_GROUP
2563 {
2564 PREFIX_EXIST = 0,
2565 PREFIX_LOCK,
2566 PREFIX_REP,
2567 PREFIX_DS,
2568 PREFIX_OTHER
2569 };
2570
2571 /* Returns
2572 a. PREFIX_EXIST if attempting to add a prefix where one from the
2573 same class already exists.
2574 b. PREFIX_LOCK if lock prefix is added.
2575 c. PREFIX_REP if rep/repne prefix is added.
2576 d. PREFIX_DS if ds prefix is added.
2577 e. PREFIX_OTHER if other prefix is added.
2578 */
2579
2580 static enum PREFIX_GROUP
2581 add_prefix (unsigned int prefix)
2582 {
2583 enum PREFIX_GROUP ret = PREFIX_OTHER;
2584 unsigned int q;
2585
2586 if (prefix >= REX_OPCODE && prefix < REX_OPCODE + 16
2587 && flag_code == CODE_64BIT)
2588 {
2589 if ((i.prefix[REX_PREFIX] & prefix & REX_W)
2590 || (i.prefix[REX_PREFIX] & prefix & REX_R)
2591 || (i.prefix[REX_PREFIX] & prefix & REX_X)
2592 || (i.prefix[REX_PREFIX] & prefix & REX_B))
2593 ret = PREFIX_EXIST;
2594 q = REX_PREFIX;
2595 }
2596 else
2597 {
2598 switch (prefix)
2599 {
2600 default:
2601 abort ();
2602
2603 case DS_PREFIX_OPCODE:
2604 ret = PREFIX_DS;
2605 /* Fall through. */
2606 case CS_PREFIX_OPCODE:
2607 case ES_PREFIX_OPCODE:
2608 case FS_PREFIX_OPCODE:
2609 case GS_PREFIX_OPCODE:
2610 case SS_PREFIX_OPCODE:
2611 q = SEG_PREFIX;
2612 break;
2613
2614 case REPNE_PREFIX_OPCODE:
2615 case REPE_PREFIX_OPCODE:
2616 q = REP_PREFIX;
2617 ret = PREFIX_REP;
2618 break;
2619
2620 case LOCK_PREFIX_OPCODE:
2621 q = LOCK_PREFIX;
2622 ret = PREFIX_LOCK;
2623 break;
2624
2625 case FWAIT_OPCODE:
2626 q = WAIT_PREFIX;
2627 break;
2628
2629 case ADDR_PREFIX_OPCODE:
2630 q = ADDR_PREFIX;
2631 break;
2632
2633 case DATA_PREFIX_OPCODE:
2634 q = DATA_PREFIX;
2635 break;
2636 }
2637 if (i.prefix[q] != 0)
2638 ret = PREFIX_EXIST;
2639 }
2640
2641 if (ret)
2642 {
2643 if (!i.prefix[q])
2644 ++i.prefixes;
2645 i.prefix[q] |= prefix;
2646 }
2647 else
2648 as_bad (_("same type of prefix used twice"));
2649
2650 return ret;
2651 }
2652
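/* Switch the assembler into 16-, 32- or 64-bit mode, keeping the
   cpu64/cpuno64 arch flags in sync and diagnosing (fatally when CHECK
   is nonzero) an arch that cannot support the requested mode. */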
2653 static void
2654 update_code_flag (int value, int check)
2655 {
2656 PRINTF_LIKE ((*as_error));
2657
2658 flag_code = (enum flag_code) value;
2659 if (flag_code == CODE_64BIT)
2660 {
2661 cpu_arch_flags.bitfield.cpu64 = 1;
2662 cpu_arch_flags.bitfield.cpuno64 = 0;
2663 }
2664 else
2665 {
2666 cpu_arch_flags.bitfield.cpu64 = 0;
2667 cpu_arch_flags.bitfield.cpuno64 = 1;
2668 }
2669 if (value == CODE_64BIT && !cpu_arch_flags.bitfield.cpulm)
2670 {
2671 if (check)
2672 as_error = as_fatal;
2673 else
2674 as_error = as_bad;
2675 (*as_error) (_("64bit mode not supported on `%s'."),
2676 cpu_arch_name ? cpu_arch_name : default_arch);
2677 }
2678 if (value == CODE_32BIT && !cpu_arch_flags.bitfield.cpui386)
2679 {
2680 if (check)
2681 as_error = as_fatal;
2682 else
2683 as_error = as_bad;
2684 (*as_error) (_("32bit mode not supported on `%s'."),
2685 cpu_arch_name ? cpu_arch_name : default_arch);
2686 }
2687 stackop_size = '\0';
2688 }
2689
2690 static void
2691 set_code_flag (int value)
2692 {
2693 update_code_flag (value, 0);
2694 }
2695
2696 static void
2697 set_16bit_gcc_code_flag (int new_code_flag)
2698 {
2699 flag_code = (enum flag_code) new_code_flag;
2700 if (flag_code != CODE_16BIT)
2701 abort ();
2702 cpu_arch_flags.bitfield.cpu64 = 0;
2703 cpu_arch_flags.bitfield.cpuno64 = 1;
2704 stackop_size = LONG_MNEM_SUFFIX;
2705 }
2706
2707 static void
2708 set_intel_syntax (int syntax_flag)
2709 {
2710 /* Find out if register prefixing is specified. */
2711 int ask_naked_reg = 0;
2712
2713 SKIP_WHITESPACE ();
2714 if (!is_end_of_line[(unsigned char) *input_line_pointer])
2715 {
2716 char *string;
2717 int e = get_symbol_name (&string);
2718
2719 if (strcmp (string, "prefix") == 0)
2720 ask_naked_reg = 1;
2721 else if (strcmp (string, "noprefix") == 0)
2722 ask_naked_reg = -1;
2723 else
2724 as_bad (_("bad argument to syntax directive."));
2725 (void) restore_line_pointer (e);
2726 }
2727 demand_empty_rest_of_line ();
2728
2729 intel_syntax = syntax_flag;
2730
2731 if (ask_naked_reg == 0)
2732 allow_naked_reg = (intel_syntax
2733 && (bfd_get_symbol_leading_char (stdoutput) != '\0'));
2734 else
2735 allow_naked_reg = (ask_naked_reg < 0);
2736
2737 expr_set_rank (O_full_ptr, syntax_flag ? 10 : 0);
2738
2739 identifier_chars['%'] = intel_syntax && allow_naked_reg ? '%' : 0;
2740 identifier_chars['$'] = intel_syntax ? '$' : 0;
2741 register_prefix = allow_naked_reg ? "" : "%";
2742 }
2743
2744 static void
2745 set_intel_mnemonic (int mnemonic_flag)
2746 {
2747 intel_mnemonic = mnemonic_flag;
2748 }
2749
2750 static void
2751 set_allow_index_reg (int flag)
2752 {
2753 allow_index_reg = flag;
2754 }
2755
2756 static void
2757 set_check (int what)
2758 {
2759 enum check_kind *kind;
2760 const char *str;
2761
2762 if (what)
2763 {
2764 kind = &operand_check;
2765 str = "operand";
2766 }
2767 else
2768 {
2769 kind = &sse_check;
2770 str = "sse";
2771 }
2772
2773 SKIP_WHITESPACE ();
2774
2775 if (!is_end_of_line[(unsigned char) *input_line_pointer])
2776 {
2777 char *string;
2778 int e = get_symbol_name (&string);
2779
2780 if (strcmp (string, "none") == 0)
2781 *kind = check_none;
2782 else if (strcmp (string, "warning") == 0)
2783 *kind = check_warning;
2784 else if (strcmp (string, "error") == 0)
2785 *kind = check_error;
2786 else
2787 as_bad (_("bad argument to %s_check directive."), str);
2788 (void) restore_line_pointer (e);
2789 }
2790 else
2791 as_bad (_("missing argument for %s_check directive"), str);
2792
2793 demand_empty_rest_of_line ();
2794 }
2795
2796 static void
2797 check_cpu_arch_compatible (const char *name ATTRIBUTE_UNUSED,
2798 i386_cpu_flags new_flag ATTRIBUTE_UNUSED)
2799 {
2800 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
2801 static const char *arch;
2802
2803 /* Intel MCU, L1OM and K1OM are only supported on ELF. */
2804 if (!IS_ELF)
2805 return;
2806
2807 if (!arch)
2808 {
2809 /* Use cpu_arch_name if it is set in md_parse_option. Otherwise
2810 use default_arch. */
2811 arch = cpu_arch_name;
2812 if (!arch)
2813 arch = default_arch;
2814 }
2815
2816 /* If we are targeting Intel MCU, we must enable it. */
2817 if (get_elf_backend_data (stdoutput)->elf_machine_code != EM_IAMCU
2818 || new_flag.bitfield.cpuiamcu)
2819 return;
2820
2821 /* If we are targeting Intel L1OM, we must enable it. */
2822 if (get_elf_backend_data (stdoutput)->elf_machine_code != EM_L1OM
2823 || new_flag.bitfield.cpul1om)
2824 return;
2825
2826 /* If we are targeting Intel K1OM, we must enable it. */
2827 if (get_elf_backend_data (stdoutput)->elf_machine_code != EM_K1OM
2828 || new_flag.bitfield.cpuk1om)
2829 return;
2830
2831 as_bad (_("`%s' is not supported on `%s'"), name, arch);
2832 #endif
2833 }
2834
2835 static void
2836 set_cpu_arch (int dummy ATTRIBUTE_UNUSED)
2837 {
2838 SKIP_WHITESPACE ();
2839
2840 if (!is_end_of_line[(unsigned char) *input_line_pointer])
2841 {
2842 char *string;
2843 int e = get_symbol_name (&string);
2844 unsigned int j;
2845 i386_cpu_flags flags;
2846
2847 for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
2848 {
2849 if (strcmp (string, cpu_arch[j].name) == 0)
2850 {
2851 check_cpu_arch_compatible (string, cpu_arch[j].flags);
2852
2853 if (*string != '.')
2854 {
2855 cpu_arch_name = cpu_arch[j].name;
2856 cpu_sub_arch_name = NULL;
2857 cpu_arch_flags = cpu_arch[j].flags;
2858 if (flag_code == CODE_64BIT)
2859 {
2860 cpu_arch_flags.bitfield.cpu64 = 1;
2861 cpu_arch_flags.bitfield.cpuno64 = 0;
2862 }
2863 else
2864 {
2865 cpu_arch_flags.bitfield.cpu64 = 0;
2866 cpu_arch_flags.bitfield.cpuno64 = 1;
2867 }
2868 cpu_arch_isa = cpu_arch[j].type;
2869 cpu_arch_isa_flags = cpu_arch[j].flags;
2870 if (!cpu_arch_tune_set)
2871 {
2872 cpu_arch_tune = cpu_arch_isa;
2873 cpu_arch_tune_flags = cpu_arch_isa_flags;
2874 }
2875 break;
2876 }
2877
2878 flags = cpu_flags_or (cpu_arch_flags,
2879 cpu_arch[j].flags);
2880
2881 if (!cpu_flags_equal (&flags, &cpu_arch_flags))
2882 {
2883 if (cpu_sub_arch_name)
2884 {
2885 char *name = cpu_sub_arch_name;
2886 cpu_sub_arch_name = concat (name,
2887 cpu_arch[j].name,
2888 (const char *) NULL);
2889 free (name);
2890 }
2891 else
2892 cpu_sub_arch_name = xstrdup (cpu_arch[j].name);
2893 cpu_arch_flags = flags;
2894 cpu_arch_isa_flags = flags;
2895 }
2896 else
2897 cpu_arch_isa_flags
2898 = cpu_flags_or (cpu_arch_isa_flags,
2899 cpu_arch[j].flags);
2900 (void) restore_line_pointer (e);
2901 demand_empty_rest_of_line ();
2902 return;
2903 }
2904 }
2905
2906 if (*string == '.' && j >= ARRAY_SIZE (cpu_arch))
2907 {
2908 /* Disable an ISA extension. */
2909 for (j = 0; j < ARRAY_SIZE (cpu_noarch); j++)
2910 if (strcmp (string + 1, cpu_noarch [j].name) == 0)
2911 {
2912 flags = cpu_flags_and_not (cpu_arch_flags,
2913 cpu_noarch[j].flags);
2914 if (!cpu_flags_equal (&flags, &cpu_arch_flags))
2915 {
2916 if (cpu_sub_arch_name)
2917 {
2918 char *name = cpu_sub_arch_name;
2919 cpu_sub_arch_name = concat (name, string,
2920 (const char *) NULL);
2921 free (name);
2922 }
2923 else
2924 cpu_sub_arch_name = xstrdup (string);
2925 cpu_arch_flags = flags;
2926 cpu_arch_isa_flags = flags;
2927 }
2928 (void) restore_line_pointer (e);
2929 demand_empty_rest_of_line ();
2930 return;
2931 }
2932
2933 j = ARRAY_SIZE (cpu_arch);
2934 }
2935
2936 if (j >= ARRAY_SIZE (cpu_arch))
2937 as_bad (_("no such architecture: `%s'"), string);
2938
2939 *input_line_pointer = e;
2940 }
2941 else
2942 as_bad (_("missing cpu architecture"));
2943
2944 no_cond_jump_promotion = 0;
2945 if (*input_line_pointer == ','
2946 && !is_end_of_line[(unsigned char) input_line_pointer[1]])
2947 {
2948 char *string;
2949 char e;
2950
2951 ++input_line_pointer;
2952 e = get_symbol_name (&string);
2953
2954 if (strcmp (string, "nojumps") == 0)
2955 no_cond_jump_promotion = 1;
2956 else if (strcmp (string, "jumps") == 0)
2957 ;
2958 else
2959 as_bad (_("no such architecture modifier: `%s'"), string);
2960
2961 (void) restore_line_pointer (e);
2962 }
2963
2964 demand_empty_rest_of_line ();
2965 }
2966
2967 enum bfd_architecture
2968 i386_arch (void)
2969 {
2970 if (cpu_arch_isa == PROCESSOR_L1OM)
2971 {
2972 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2973 || flag_code != CODE_64BIT)
2974 as_fatal (_("Intel L1OM is 64bit ELF only"));
2975 return bfd_arch_l1om;
2976 }
2977 else if (cpu_arch_isa == PROCESSOR_K1OM)
2978 {
2979 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2980 || flag_code != CODE_64BIT)
2981 as_fatal (_("Intel K1OM is 64bit ELF only"));
2982 return bfd_arch_k1om;
2983 }
2984 else if (cpu_arch_isa == PROCESSOR_IAMCU)
2985 {
2986 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2987 || flag_code == CODE_64BIT)
2988 as_fatal (_("Intel MCU is 32bit ELF only"));
2989 return bfd_arch_iamcu;
2990 }
2991 else
2992 return bfd_arch_i386;
2993 }
2994
2995 unsigned long
2996 i386_mach (void)
2997 {
2998 if (!strncmp (default_arch, "x86_64", 6))
2999 {
3000 if (cpu_arch_isa == PROCESSOR_L1OM)
3001 {
3002 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
3003 || default_arch[6] != '\0')
3004 as_fatal (_("Intel L1OM is 64bit ELF only"));
3005 return bfd_mach_l1om;
3006 }
3007 else if (cpu_arch_isa == PROCESSOR_K1OM)
3008 {
3009 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
3010 || default_arch[6] != '\0')
3011 as_fatal (_("Intel K1OM is 64bit ELF only"));
3012 return bfd_mach_k1om;
3013 }
3014 else if (default_arch[6] == '\0')
3015 return bfd_mach_x86_64;
3016 else
3017 return bfd_mach_x64_32;
3018 }
3019 else if (!strcmp (default_arch, "i386")
3020 || !strcmp (default_arch, "iamcu"))
3021 {
3022 if (cpu_arch_isa == PROCESSOR_IAMCU)
3023 {
3024 if (OUTPUT_FLAVOR != bfd_target_elf_flavour)
3025 as_fatal (_("Intel MCU is 32bit ELF only"));
3026 return bfd_mach_i386_iamcu;
3027 }
3028 else
3029 return bfd_mach_i386_i386;
3030 }
3031 else
3032 as_fatal (_("unknown architecture"));
3033 }
3034 \f
3035 void
3036 md_begin (void)
3037 {
3038 /* Support pseudo prefixes like {disp32}. */
3039 lex_type ['{'] = LEX_BEGIN_NAME;
3040
3041 /* Initialize op_hash hash table. */
3042 op_hash = str_htab_create ();
3043
3044 {
3045 const insn_template *optab;
3046 templates *core_optab;
3047
3048 /* Setup for loop. */
3049 optab = i386_optab;
3050 core_optab = XNEW (templates);
3051 core_optab->start = optab;
3052
3053 while (1)
3054 {
3055 ++optab;
3056 if (optab->name == NULL
3057 || strcmp (optab->name, (optab - 1)->name) != 0)
3058 {
3059 /* different name --> ship out current template list;
3060 add to hash table; & begin anew. */
3061 core_optab->end = optab;
3062 if (str_hash_insert (op_hash, (optab - 1)->name, core_optab, 0))
3063 as_fatal (_("duplicate %s"), (optab - 1)->name);
3064
3065 if (optab->name == NULL)
3066 break;
3067 core_optab = XNEW (templates);
3068 core_optab->start = optab;
3069 }
3070 }
3071 }
3072
3073 /* Initialize reg_hash hash table. */
3074 reg_hash = str_htab_create ();
3075 {
3076 const reg_entry *regtab;
3077 unsigned int regtab_size = i386_regtab_size;
3078
3079 for (regtab = i386_regtab; regtab_size--; regtab++)
3080 if (str_hash_insert (reg_hash, regtab->reg_name, regtab, 0) != NULL)
3081 as_fatal (_("duplicate %s"), regtab->reg_name);
3082 }
3083
3084 /* Fill in lexical tables: mnemonic_chars, operand_chars. */
3085 {
3086 int c;
3087 char *p;
3088
3089 for (c = 0; c < 256; c++)
3090 {
3091 if (ISDIGIT (c))
3092 {
3093 digit_chars[c] = c;
3094 mnemonic_chars[c] = c;
3095 register_chars[c] = c;
3096 operand_chars[c] = c;
3097 }
3098 else if (ISLOWER (c))
3099 {
3100 mnemonic_chars[c] = c;
3101 register_chars[c] = c;
3102 operand_chars[c] = c;
3103 }
3104 else if (ISUPPER (c))
3105 {
3106 mnemonic_chars[c] = TOLOWER (c);
3107 register_chars[c] = mnemonic_chars[c];
3108 operand_chars[c] = c;
3109 }
3110 else if (c == '{' || c == '}')
3111 {
3112 mnemonic_chars[c] = c;
3113 operand_chars[c] = c;
3114 }
3115 #ifdef SVR4_COMMENT_CHARS
3116 else if (c == '\\' && strchr (i386_comment_chars, '/'))
3117 operand_chars[c] = c;
3118 #endif
3119
3120 if (ISALPHA (c) || ISDIGIT (c))
3121 identifier_chars[c] = c;
3122 else if (c >= 128)
3123 {
3124 identifier_chars[c] = c;
3125 operand_chars[c] = c;
3126 }
3127 }
3128
3129 #ifdef LEX_AT
3130 identifier_chars['@'] = '@';
3131 #endif
3132 #ifdef LEX_QM
3133 identifier_chars['?'] = '?';
3134 operand_chars['?'] = '?';
3135 #endif
3136 digit_chars['-'] = '-';
3137 mnemonic_chars['_'] = '_';
3138 mnemonic_chars['-'] = '-';
3139 mnemonic_chars['.'] = '.';
3140 identifier_chars['_'] = '_';
3141 identifier_chars['.'] = '.';
3142
3143 for (p = operand_special_chars; *p != '\0'; p++)
3144 operand_chars[(unsigned char) *p] = *p;
3145 }
3146
3147 if (flag_code == CODE_64BIT)
3148 {
3149 #if defined (OBJ_COFF) && defined (TE_PE)
3150 x86_dwarf2_return_column = (OUTPUT_FLAVOR == bfd_target_coff_flavour
3151 ? 32 : 16);
3152 #else
3153 x86_dwarf2_return_column = 16;
3154 #endif
3155 x86_cie_data_alignment = -8;
3156 }
3157 else
3158 {
3159 x86_dwarf2_return_column = 8;
3160 x86_cie_data_alignment = -4;
3161 }
3162
3163 /* NB: FUSED_JCC_PADDING frag must have sufficient room so that it
3164 can be turned into a BRANCH_PREFIX frag. */
3165 if (align_branch_prefix_size > MAX_FUSED_JCC_PADDING_SIZE)
3166 abort ();
3167 }
3168
3169 void
3170 i386_print_statistics (FILE *file)
3171 {
3172 htab_print_statistics (file, "i386 opcode", op_hash);
3173 htab_print_statistics (file, "i386 register", reg_hash);
3174 }
3175 \f
3176 #ifdef DEBUG386
3177
3178 /* Debugging routines for md_assemble. */
3179 static void pte (insn_template *);
3180 static void pt (i386_operand_type);
3181 static void pe (expressionS *);
3182 static void ps (symbolS *);
3183
3184 static void
3185 pi (const char *line, i386_insn *x)
3186 {
3187 unsigned int j;
3188
3189 fprintf (stdout, "%s: template ", line);
3190 pte (&x->tm);
3191 fprintf (stdout, " address: base %s index %s scale %x\n",
3192 x->base_reg ? x->base_reg->reg_name : "none",
3193 x->index_reg ? x->index_reg->reg_name : "none",
3194 x->log2_scale_factor);
3195 fprintf (stdout, " modrm: mode %x reg %x reg/mem %x\n",
3196 x->rm.mode, x->rm.reg, x->rm.regmem);
3197 fprintf (stdout, " sib: base %x index %x scale %x\n",
3198 x->sib.base, x->sib.index, x->sib.scale);
3199 fprintf (stdout, " rex: 64bit %x extX %x extY %x extZ %x\n",
3200 (x->rex & REX_W) != 0,
3201 (x->rex & REX_R) != 0,
3202 (x->rex & REX_X) != 0,
3203 (x->rex & REX_B) != 0);
3204 for (j = 0; j < x->operands; j++)
3205 {
3206 fprintf (stdout, " #%d: ", j + 1);
3207 pt (x->types[j]);
3208 fprintf (stdout, "\n");
3209 if (x->types[j].bitfield.class == Reg
3210 || x->types[j].bitfield.class == RegMMX
3211 || x->types[j].bitfield.class == RegSIMD
3212 || x->types[j].bitfield.class == RegMask
3213 || x->types[j].bitfield.class == SReg
3214 || x->types[j].bitfield.class == RegCR
3215 || x->types[j].bitfield.class == RegDR
3216 || x->types[j].bitfield.class == RegTR
3217 || x->types[j].bitfield.class == RegBND)
3218 fprintf (stdout, "%s\n", x->op[j].regs->reg_name);
3219 if (operand_type_check (x->types[j], imm))
3220 pe (x->op[j].imms);
3221 if (operand_type_check (x->types[j], disp))
3222 pe (x->op[j].disps);
3223 }
3224 }
3225
3226 static void
3227 pte (insn_template *t)
3228 {
3229 unsigned int j;
3230 fprintf (stdout, " %d operands ", t->operands);
3231 fprintf (stdout, "opcode %x ", t->base_opcode);
3232 if (t->extension_opcode != None)
3233 fprintf (stdout, "ext %x ", t->extension_opcode);
3234 if (t->opcode_modifier.d)
3235 fprintf (stdout, "D");
3236 if (t->opcode_modifier.w)
3237 fprintf (stdout, "W");
3238 fprintf (stdout, "\n");
3239 for (j = 0; j < t->operands; j++)
3240 {
3241 fprintf (stdout, " #%d type ", j + 1);
3242 pt (t->operand_types[j]);
3243 fprintf (stdout, "\n");
3244 }
3245 }
3246
3247 static void
3248 pe (expressionS *e)
3249 {
3250 fprintf (stdout, " operation %d\n", e->X_op);
3251 fprintf (stdout, " add_number %ld (%lx)\n",
3252 (long) e->X_add_number, (long) e->X_add_number);
3253 if (e->X_add_symbol)
3254 {
3255 fprintf (stdout, " add_symbol ");
3256 ps (e->X_add_symbol);
3257 fprintf (stdout, "\n");
3258 }
3259 if (e->X_op_symbol)
3260 {
3261 fprintf (stdout, " op_symbol ");
3262 ps (e->X_op_symbol);
3263 fprintf (stdout, "\n");
3264 }
3265 }
3266
3267 static void
3268 ps (symbolS *s)
3269 {
3270 fprintf (stdout, "%s type %s%s",
3271 S_GET_NAME (s),
3272 S_IS_EXTERNAL (s) ? "EXTERNAL " : "",
3273 segment_name (S_GET_SEGMENT (s)));
3274 }
3275
3276 static struct type_name
3277 {
3278 i386_operand_type mask;
3279 const char *name;
3280 }
3281 const type_names[] =
3282 {
3283 { OPERAND_TYPE_REG8, "r8" },
3284 { OPERAND_TYPE_REG16, "r16" },
3285 { OPERAND_TYPE_REG32, "r32" },
3286 { OPERAND_TYPE_REG64, "r64" },
3287 { OPERAND_TYPE_ACC8, "acc8" },
3288 { OPERAND_TYPE_ACC16, "acc16" },
3289 { OPERAND_TYPE_ACC32, "acc32" },
3290 { OPERAND_TYPE_ACC64, "acc64" },
3291 { OPERAND_TYPE_IMM8, "i8" },
3292 { OPERAND_TYPE_IMM8S, "i8s" },
3293 { OPERAND_TYPE_IMM16, "i16" },
3294 { OPERAND_TYPE_IMM32, "i32" },
3295 { OPERAND_TYPE_IMM32S, "i32s" },
3296 { OPERAND_TYPE_IMM64, "i64" },
3297 { OPERAND_TYPE_IMM1, "i1" },
3298 { OPERAND_TYPE_BASEINDEX, "BaseIndex" },
3299 { OPERAND_TYPE_DISP8, "d8" },
3300 { OPERAND_TYPE_DISP16, "d16" },
3301 { OPERAND_TYPE_DISP32, "d32" },
3302 { OPERAND_TYPE_DISP32S, "d32s" },
3303 { OPERAND_TYPE_DISP64, "d64" },
3304 { OPERAND_TYPE_INOUTPORTREG, "InOutPortReg" },
3305 { OPERAND_TYPE_SHIFTCOUNT, "ShiftCount" },
3306 { OPERAND_TYPE_CONTROL, "control reg" },
3307 { OPERAND_TYPE_TEST, "test reg" },
3308 { OPERAND_TYPE_DEBUG, "debug reg" },
3309 { OPERAND_TYPE_FLOATREG, "FReg" },
3310 { OPERAND_TYPE_FLOATACC, "FAcc" },
3311 { OPERAND_TYPE_SREG, "SReg" },
3312 { OPERAND_TYPE_REGMMX, "rMMX" },
3313 { OPERAND_TYPE_REGXMM, "rXMM" },
3314 { OPERAND_TYPE_REGYMM, "rYMM" },
3315 { OPERAND_TYPE_REGZMM, "rZMM" },
3316 { OPERAND_TYPE_REGTMM, "rTMM" },
3317 { OPERAND_TYPE_REGMASK, "Mask reg" },
3318 };
3319
3320 static void
3321 pt (i386_operand_type t)
3322 {
3323 unsigned int j;
3324 i386_operand_type a;
3325
3326 for (j = 0; j < ARRAY_SIZE (type_names); j++)
3327 {
3328 a = operand_type_and (t, type_names[j].mask);
3329 if (operand_type_equal (&a, &type_names[j].mask))
3330 fprintf (stdout, "%s, ", type_names[j].name);
3331 }
3332 fflush (stdout);
3333 }
3334
3335 #endif /* DEBUG386 */
3336 \f
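/* Map a fixup of SIZE bytes, pc-relative if PCREL, signed if SIGN > 0,
   onto a BFD relocation code. A specific relocation requested via
   OTHER is validated against size, pc-relativity and signedness, and
   widened to its 64-bit variant when SIZE is 8. */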
3337 static bfd_reloc_code_real_type
3338 reloc (unsigned int size,
3339 int pcrel,
3340 int sign,
3341 bfd_reloc_code_real_type other)
3342 {
3343 if (other != NO_RELOC)
3344 {
3345 reloc_howto_type *rel;
3346
3347 if (size == 8)
3348 switch (other)
3349 {
3350 case BFD_RELOC_X86_64_GOT32:
3351 return BFD_RELOC_X86_64_GOT64;
3352 break;
3353 case BFD_RELOC_X86_64_GOTPLT64:
3354 return BFD_RELOC_X86_64_GOTPLT64;
3355 break;
3356 case BFD_RELOC_X86_64_PLTOFF64:
3357 return BFD_RELOC_X86_64_PLTOFF64;
3358 break;
3359 case BFD_RELOC_X86_64_GOTPC32:
3360 other = BFD_RELOC_X86_64_GOTPC64;
3361 break;
3362 case BFD_RELOC_X86_64_GOTPCREL:
3363 other = BFD_RELOC_X86_64_GOTPCREL64;
3364 break;
3365 case BFD_RELOC_X86_64_TPOFF32:
3366 other = BFD_RELOC_X86_64_TPOFF64;
3367 break;
3368 case BFD_RELOC_X86_64_DTPOFF32:
3369 other = BFD_RELOC_X86_64_DTPOFF64;
3370 break;
3371 default:
3372 break;
3373 }
3374
3375 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
3376 if (other == BFD_RELOC_SIZE32)
3377 {
3378 if (size == 8)
3379 other = BFD_RELOC_SIZE64;
3380 if (pcrel)
3381 {
3382 as_bad (_("there are no pc-relative size relocations"));
3383 return NO_RELOC;
3384 }
3385 }
3386 #endif
3387
3388 /* Sign-checking 4-byte relocations in 16-/32-bit code is pointless. */
3389 if (size == 4 && (flag_code != CODE_64BIT || disallow_64bit_reloc))
3390 sign = -1;
3391
3392 rel = bfd_reloc_type_lookup (stdoutput, other);
3393 if (!rel)
3394 as_bad (_("unknown relocation (%u)"), other);
3395 else if (size != bfd_get_reloc_size (rel))
3396 as_bad (_("%u-byte relocation cannot be applied to %u-byte field"),
3397 bfd_get_reloc_size (rel),
3398 size);
3399 else if (pcrel && !rel->pc_relative)
3400 as_bad (_("non-pc-relative relocation for pc-relative field"));
3401 else if ((rel->complain_on_overflow == complain_overflow_signed
3402 && !sign)
3403 || (rel->complain_on_overflow == complain_overflow_unsigned
3404 && sign > 0))
3405 as_bad (_("relocated field and relocation type differ in signedness"));
3406 else
3407 return other;
3408 return NO_RELOC;
3409 }
3410
3411 if (pcrel)
3412 {
3413 if (!sign)
3414 as_bad (_("there are no unsigned pc-relative relocations"));
3415 switch (size)
3416 {
3417 case 1: return BFD_RELOC_8_PCREL;
3418 case 2: return BFD_RELOC_16_PCREL;
3419 case 4: return BFD_RELOC_32_PCREL;
3420 case 8: return BFD_RELOC_64_PCREL;
3421 }
3422 as_bad (_("cannot do %u byte pc-relative relocation"), size);
3423 }
3424 else
3425 {
3426 if (sign > 0)
3427 switch (size)
3428 {
3429 case 4: return BFD_RELOC_X86_64_32S;
3430 }
3431 else
3432 switch (size)
3433 {
3434 case 1: return BFD_RELOC_8;
3435 case 2: return BFD_RELOC_16;
3436 case 4: return BFD_RELOC_32;
3437 case 8: return BFD_RELOC_64;
3438 }
3439 as_bad (_("cannot do %s %u byte relocation"),
3440 sign > 0 ? "signed" : "unsigned", size);
3441 }
3442
3443 return NO_RELOC;
3444 }
3445
3446 /* Here we decide which fixups can be adjusted to make them relative to
3447 the beginning of the section instead of the symbol. Basically we need
3448 to make sure that the dynamic relocations are done correctly, so in
3449 some cases we force the original symbol to be used. */
3450
3451 int
3452 tc_i386_fix_adjustable (fixS *fixP ATTRIBUTE_UNUSED)
3453 {
3454 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
3455 if (!IS_ELF)
3456 return 1;
3457
3458 /* Don't adjust pc-relative references to merge sections in 64-bit
3459 mode. */
3460 if (use_rela_relocations
3461 && (S_GET_SEGMENT (fixP->fx_addsy)->flags & SEC_MERGE) != 0
3462 && fixP->fx_pcrel)
3463 return 0;
3464
3465 /* The x86_64 GOTPCREL are represented as 32bit PCrel relocations
3466 and changed later by validate_fix. */
3467 if (GOT_symbol && fixP->fx_subsy == GOT_symbol
3468 && fixP->fx_r_type == BFD_RELOC_32_PCREL)
3469 return 0;
3470
3471 /* Adjust_reloc_syms doesn't know about the GOT. Need to keep symbol
3472 for size relocations. */
3473 if (fixP->fx_r_type == BFD_RELOC_SIZE32
3474 || fixP->fx_r_type == BFD_RELOC_SIZE64
3475 || fixP->fx_r_type == BFD_RELOC_386_GOTOFF
3476 || fixP->fx_r_type == BFD_RELOC_386_GOT32
3477 || fixP->fx_r_type == BFD_RELOC_386_GOT32X
3478 || fixP->fx_r_type == BFD_RELOC_386_TLS_GD
3479 || fixP->fx_r_type == BFD_RELOC_386_TLS_LDM
3480 || fixP->fx_r_type == BFD_RELOC_386_TLS_LDO_32
3481 || fixP->fx_r_type == BFD_RELOC_386_TLS_IE_32
3482 || fixP->fx_r_type == BFD_RELOC_386_TLS_IE
3483 || fixP->fx_r_type == BFD_RELOC_386_TLS_GOTIE
3484 || fixP->fx_r_type == BFD_RELOC_386_TLS_LE_32
3485 || fixP->fx_r_type == BFD_RELOC_386_TLS_LE
3486 || fixP->fx_r_type == BFD_RELOC_386_TLS_GOTDESC
3487 || fixP->fx_r_type == BFD_RELOC_386_TLS_DESC_CALL
3488 || fixP->fx_r_type == BFD_RELOC_X86_64_GOT32
3489 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTPCREL
3490 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTPCRELX
3491 || fixP->fx_r_type == BFD_RELOC_X86_64_REX_GOTPCRELX
3492 || fixP->fx_r_type == BFD_RELOC_X86_64_TLSGD
3493 || fixP->fx_r_type == BFD_RELOC_X86_64_TLSLD
3494 || fixP->fx_r_type == BFD_RELOC_X86_64_DTPOFF32
3495 || fixP->fx_r_type == BFD_RELOC_X86_64_DTPOFF64
3496 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTTPOFF
3497 || fixP->fx_r_type == BFD_RELOC_X86_64_TPOFF32
3498 || fixP->fx_r_type == BFD_RELOC_X86_64_TPOFF64
3499 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTOFF64
3500 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTPC32_TLSDESC
3501 || fixP->fx_r_type == BFD_RELOC_X86_64_TLSDESC_CALL
3502 || fixP->fx_r_type == BFD_RELOC_VTABLE_INHERIT
3503 || fixP->fx_r_type == BFD_RELOC_VTABLE_ENTRY)
3504 return 0;
3505 #endif
3506 return 1;
3507 }
3508
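/* Classify an FPU mnemonic for Intel syntax operand handling: return
   0 for non-FPU mnemonics (and fxsave/fxrstor), 2 for integer ops
   (fi*), 3 for control/state ops (fldcw/fldenv, fn* other than fnop,
   frstor, fsave, fstcw/fstenv etc.), and 1 for ordinary FPU math
   ops. */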
3509 static int
3510 intel_float_operand (const char *mnemonic)
3511 {
3512 /* Note that the value returned is meaningful only for opcodes with (memory)
3513 operands, hence the code here is free to improperly handle opcodes that
3514 have no operands (for better performance and smaller code). */
3515
3516 if (mnemonic[0] != 'f')
3517 return 0; /* non-math */
3518
3519 switch (mnemonic[1])
3520 {
3521 /* fclex, fdecstp, fdisi, femms, feni, fincstp, finit, fsetpm, and
3522 the fs segment override prefix are not currently handled because no
3523 call path can make opcodes without operands get here. */
3524 case 'i':
3525 return 2 /* integer op */;
3526 case 'l':
3527 if (mnemonic[2] == 'd' && (mnemonic[3] == 'c' || mnemonic[3] == 'e'))
3528 return 3; /* fldcw/fldenv */
3529 break;
3530 case 'n':
3531 if (mnemonic[2] != 'o' /* fnop */)
3532 return 3; /* non-waiting control op */
3533 break;
3534 case 'r':
3535 if (mnemonic[2] == 's')
3536 return 3; /* frstor/frstpm */
3537 break;
3538 case 's':
3539 if (mnemonic[2] == 'a')
3540 return 3; /* fsave */
3541 if (mnemonic[2] == 't')
3542 {
3543 switch (mnemonic[3])
3544 {
3545 case 'c': /* fstcw */
3546 case 'd': /* fstdw */
3547 case 'e': /* fstenv */
3548 case 's': /* fsts[gw] */
3549 return 3;
3550 }
3551 }
3552 break;
3553 case 'x':
3554 if (mnemonic[2] == 'r' || mnemonic[2] == 's')
3555 return 0; /* fxsave/fxrstor are not really math ops */
3556 break;
3557 }
3558
3559 return 1;
3560 }
3561
3562 /* Build the VEX prefix. */
3563
3564 static void
3565 build_vex_prefix (const insn_template *t)
3566 {
3567 unsigned int register_specifier;
3568 unsigned int implied_prefix;
3569 unsigned int vector_length;
3570 unsigned int w;
3571
3572 /* Check register specifier. */
3573 if (i.vex.register_specifier)
3574 {
3575 register_specifier =
3576 ~register_number (i.vex.register_specifier) & 0xf;
3577 gas_assert ((i.vex.register_specifier->reg_flags & RegVRex) == 0);
3578 }
3579 else
3580 register_specifier = 0xf;
3581
3582 /* Use 2-byte VEX prefix by swapping destination and source operand
3583 if there is more than one register operand. */
3584 if (i.reg_operands > 1
3585 && i.vec_encoding != vex_encoding_vex3
3586 && i.dir_encoding == dir_encoding_default
3587 && i.operands == i.reg_operands
3588 && operand_type_equal (&i.types[0], &i.types[i.operands - 1])
3589 && i.tm.opcode_modifier.vexopcode == VEX0F
3590 && (i.tm.opcode_modifier.load || i.tm.opcode_modifier.d)
3591 && i.rex == REX_B)
3592 {
3593 unsigned int xchg = i.operands - 1;
3594 union i386_op temp_op;
3595 i386_operand_type temp_type;
3596
3597 temp_type = i.types[xchg];
3598 i.types[xchg] = i.types[0];
3599 i.types[0] = temp_type;
3600 temp_op = i.op[xchg];
3601 i.op[xchg] = i.op[0];
3602 i.op[0] = temp_op;
3603
3604 gas_assert (i.rm.mode == 3);
3605
3606 i.rex = REX_R;
3607 xchg = i.rm.regmem;
3608 i.rm.regmem = i.rm.reg;
3609 i.rm.reg = xchg;
3610
3611 if (i.tm.opcode_modifier.d)
3612 i.tm.base_opcode ^= (i.tm.base_opcode & 0xee) != 0x6e
3613 ? Opcode_SIMD_FloatD : Opcode_SIMD_IntD;
3614 else /* Use the next insn. */
3615 i.tm = t[1];
3616 }
3617
3618 /* Use 2-byte VEX prefix by swapping commutative source operands if there
3619 are no memory operands and at least 3 register ones. */
3620 if (i.reg_operands >= 3
3621 && i.vec_encoding != vex_encoding_vex3
3622 && i.reg_operands == i.operands - i.imm_operands
3623 && i.tm.opcode_modifier.vex
3624 && i.tm.opcode_modifier.commutative
3625 && (i.tm.opcode_modifier.sse2avx || optimize > 1)
3626 && i.rex == REX_B
3627 && i.vex.register_specifier
3628 && !(i.vex.register_specifier->reg_flags & RegRex))
3629 {
3630 unsigned int xchg = i.operands - i.reg_operands;
3631 union i386_op temp_op;
3632 i386_operand_type temp_type;
3633
3634 gas_assert (i.tm.opcode_modifier.vexopcode == VEX0F);
3635 gas_assert (!i.tm.opcode_modifier.sae);
3636 gas_assert (operand_type_equal (&i.types[i.operands - 2],
3637 &i.types[i.operands - 3]));
3638 gas_assert (i.rm.mode == 3);
3639
3640 temp_type = i.types[xchg];
3641 i.types[xchg] = i.types[xchg + 1];
3642 i.types[xchg + 1] = temp_type;
3643 temp_op = i.op[xchg];
3644 i.op[xchg] = i.op[xchg + 1];
3645 i.op[xchg + 1] = temp_op;
3646
3647 i.rex = 0;
3648 xchg = i.rm.regmem | 8;
3649 i.rm.regmem = ~register_specifier & 0xf;
3650 gas_assert (!(i.rm.regmem & 8));
3651 i.vex.register_specifier += xchg - i.rm.regmem;
3652 register_specifier = ~xchg & 0xf;
3653 }
3654
3655 if (i.tm.opcode_modifier.vex == VEXScalar)
3656 vector_length = avxscalar;
3657 else if (i.tm.opcode_modifier.vex == VEX256)
3658 vector_length = 1;
3659 else
3660 {
3661 unsigned int op;
3662
3663 /* Determine vector length from the last multi-length vector
3664 operand. */
3665 vector_length = 0;
3666 for (op = t->operands; op--;)
3667 if (t->operand_types[op].bitfield.xmmword
3668 && t->operand_types[op].bitfield.ymmword
3669 && i.types[op].bitfield.ymmword)
3670 {
3671 vector_length = 1;
3672 break;
3673 }
3674 }
3675
3676 switch ((i.tm.base_opcode >> (i.tm.opcode_length << 3)) & 0xff)
3677 {
3678 case 0:
3679 implied_prefix = 0;
3680 break;
3681 case DATA_PREFIX_OPCODE:
3682 implied_prefix = 1;
3683 break;
3684 case REPE_PREFIX_OPCODE:
3685 implied_prefix = 2;
3686 break;
3687 case REPNE_PREFIX_OPCODE:
3688 implied_prefix = 3;
3689 break;
3690 default:
3691 abort ();
3692 }
3693
3694 /* Check the REX.W bit and VEXW. */
3695 if (i.tm.opcode_modifier.vexw == VEXWIG)
3696 w = (vexwig == vexw1 || (i.rex & REX_W)) ? 1 : 0;
3697 else if (i.tm.opcode_modifier.vexw)
3698 w = i.tm.opcode_modifier.vexw == VEXW1 ? 1 : 0;
3699 else
3700 w = (flag_code == CODE_64BIT ? i.rex & REX_W : vexwig == vexw1) ? 1 : 0;
3701
3702 /* Use 2-byte VEX prefix if possible. */
3703 if (w == 0
3704 && i.vec_encoding != vex_encoding_vex3
3705 && i.tm.opcode_modifier.vexopcode == VEX0F
3706 && (i.rex & (REX_W | REX_X | REX_B)) == 0)
3707 {
3708 /* 2-byte VEX prefix. */
3709 unsigned int r;
3710
3711 i.vex.length = 2;
3712 i.vex.bytes[0] = 0xc5;
3713
3714 /* Check the REX.R bit. */
3715 r = (i.rex & REX_R) ? 0 : 1;
3716 i.vex.bytes[1] = (r << 7
3717 | register_specifier << 3
3718 | vector_length << 2
3719 | implied_prefix);
3720 }
3721 else
3722 {
3723 /* 3-byte VEX prefix. */
3724 unsigned int m;
3725
3726 i.vex.length = 3;
3727
3728 switch (i.tm.opcode_modifier.vexopcode)
3729 {
3730 case VEX0F:
3731 m = 0x1;
3732 i.vex.bytes[0] = 0xc4;
3733 break;
3734 case VEX0F38:
3735 m = 0x2;
3736 i.vex.bytes[0] = 0xc4;
3737 break;
3738 case VEX0F3A:
3739 m = 0x3;
3740 i.vex.bytes[0] = 0xc4;
3741 break;
3742 case XOP08:
3743 m = 0x8;
3744 i.vex.bytes[0] = 0x8f;
3745 break;
3746 case XOP09:
3747 m = 0x9;
3748 i.vex.bytes[0] = 0x8f;
3749 break;
3750 case XOP0A:
3751 m = 0xa;
3752 i.vex.bytes[0] = 0x8f;
3753 break;
3754 default:
3755 abort ();
3756 }
3757
3758 /* The high 3 bits of the second VEX byte are 1's complement
3759 of RXB bits from REX. */
3760 i.vex.bytes[1] = (~i.rex & 0x7) << 5 | m;
3761
3762 i.vex.bytes[2] = (w << 7
3763 | register_specifier << 3
3764 | vector_length << 2
3765 | implied_prefix);
3766 }
3767 }
3768
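/* Return whether template T needs the EVEX encoding, i.e. it is
   marked EVEX-only or uses EVEX-specific functionality (compressed
   disp8, broadcast, masking or SAE). */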
3769 static INLINE bfd_boolean
3770 is_evex_encoding (const insn_template *t)
3771 {
3772 return t->opcode_modifier.evex || t->opcode_modifier.disp8memshift
3773 || t->opcode_modifier.broadcast || t->opcode_modifier.masking
3774 || t->opcode_modifier.sae;
3775 }
3776
3777 static INLINE bfd_boolean
3778 is_any_vex_encoding (const insn_template *t)
3779 {
3780 return t->opcode_modifier.vex || t->opcode_modifier.vexopcode
3781 || is_evex_encoding (t);
3782 }
3783
3784 /* Build the EVEX prefix. */
3785
3786 static void
3787 build_evex_prefix (void)
3788 {
3789 unsigned int register_specifier;
3790 unsigned int implied_prefix;
3791 unsigned int m, w;
3792 rex_byte vrex_used = 0;
3793
3794 /* Check register specifier. */
3795 if (i.vex.register_specifier)
3796 {
3797 gas_assert ((i.vrex & REX_X) == 0);
3798
3799 register_specifier = i.vex.register_specifier->reg_num;
3800 if ((i.vex.register_specifier->reg_flags & RegRex))
3801 register_specifier += 8;
3802 /* The upper 16 registers are encoded in the fourth byte of the
3803 EVEX prefix. */
3804 if (!(i.vex.register_specifier->reg_flags & RegVRex))
3805 i.vex.bytes[3] = 0x8;
3806 register_specifier = ~register_specifier & 0xf;
3807 }
3808 else
3809 {
3810 register_specifier = 0xf;
3811
3812 /* Encode upper 16 vector index register in the fourth byte of
3813 the EVEX prefix. */
3814 if (!(i.vrex & REX_X))
3815 i.vex.bytes[3] = 0x8;
3816 else
3817 vrex_used |= REX_X;
3818 }
3819
3820 switch ((i.tm.base_opcode >> 8) & 0xff)
3821 {
3822 case 0:
3823 implied_prefix = 0;
3824 break;
3825 case DATA_PREFIX_OPCODE:
3826 implied_prefix = 1;
3827 break;
3828 case REPE_PREFIX_OPCODE:
3829 implied_prefix = 2;
3830 break;
3831 case REPNE_PREFIX_OPCODE:
3832 implied_prefix = 3;
3833 break;
3834 default:
3835 abort ();
3836 }
3837
3838 /* 4 byte EVEX prefix. */
3839 i.vex.length = 4;
3840 i.vex.bytes[0] = 0x62;
3841
3842 /* mmmm bits. */
3843 switch (i.tm.opcode_modifier.vexopcode)
3844 {
3845 case VEX0F:
3846 m = 1;
3847 break;
3848 case VEX0F38:
3849 m = 2;
3850 break;
3851 case VEX0F3A:
3852 m = 3;
3853 break;
3854 default:
3855 abort ();
3856 break;
3857 }
3858
3859 /* The high 3 bits of the second EVEX byte are 1's complement of RXB
3860 bits from REX. */
3861 i.vex.bytes[1] = (~i.rex & 0x7) << 5 | m;
3862
3863 /* The fifth bit of the second EVEX byte is 1's complement of the
3864 REX_R bit in VREX. */
3865 if (!(i.vrex & REX_R))
3866 i.vex.bytes[1] |= 0x10;
3867 else
3868 vrex_used |= REX_R;
3869
3870 if ((i.reg_operands + i.imm_operands) == i.operands)
3871 {
3872 /* When all operands are registers, the REX_X bit in REX is not
3873 used. We reuse it to encode the upper 16 registers, which is
3874 indicated by the REX_B bit in VREX. The REX_X bit is encoded
3875 as 1's complement. */
3876 if ((i.vrex & REX_B))
3877 {
3878 vrex_used |= REX_B;
3879 i.vex.bytes[1] &= ~0x40;
3880 }
3881 }
3882
3883 /* EVEX instructions shouldn't need the REX prefix. */
3884 i.vrex &= ~vrex_used;
3885 gas_assert (i.vrex == 0);
3886
3887 /* Check the REX.W bit and VEXW. */
3888 if (i.tm.opcode_modifier.vexw == VEXWIG)
3889 w = (evexwig == evexw1 || (i.rex & REX_W)) ? 1 : 0;
3890 else if (i.tm.opcode_modifier.vexw)
3891 w = i.tm.opcode_modifier.vexw == VEXW1 ? 1 : 0;
3892 else
3893 w = (flag_code == CODE_64BIT ? i.rex & REX_W : evexwig == evexw1) ? 1 : 0;
3894
3895 /* Encode the U bit. */
3896 implied_prefix |= 0x4;
3897
3898 /* The third byte of the EVEX prefix. */
3899 i.vex.bytes[2] = (w << 7 | register_specifier << 3 | implied_prefix);
3900
3901 /* The fourth byte of the EVEX prefix. */
3902 /* The zeroing-masking bit. */
3903 if (i.mask && i.mask->zeroing)
3904 i.vex.bytes[3] |= 0x80;
3905
  /* The vector length and broadcast bits double as rounding control,
     so only encode them when there is no RC.  */
3907 if (!i.rounding)
3908 {
3909 /* Encode the vector length. */
3910 unsigned int vec_length;
3911
3912 if (!i.tm.opcode_modifier.evex
3913 || i.tm.opcode_modifier.evex == EVEXDYN)
3914 {
3915 unsigned int op;
3916
3917 /* Determine vector length from the last multi-length vector
3918 operand. */
3919 for (op = i.operands; op--;)
3920 if (i.tm.operand_types[op].bitfield.xmmword
3921 + i.tm.operand_types[op].bitfield.ymmword
3922 + i.tm.operand_types[op].bitfield.zmmword > 1)
3923 {
3924 if (i.types[op].bitfield.zmmword)
3925 {
3926 i.tm.opcode_modifier.evex = EVEX512;
3927 break;
3928 }
3929 else if (i.types[op].bitfield.ymmword)
3930 {
3931 i.tm.opcode_modifier.evex = EVEX256;
3932 break;
3933 }
3934 else if (i.types[op].bitfield.xmmword)
3935 {
3936 i.tm.opcode_modifier.evex = EVEX128;
3937 break;
3938 }
3939 else if (i.broadcast && (int) op == i.broadcast->operand)
3940 {
3941 switch (i.broadcast->bytes)
3942 {
3943 case 64:
3944 i.tm.opcode_modifier.evex = EVEX512;
3945 break;
3946 case 32:
3947 i.tm.opcode_modifier.evex = EVEX256;
3948 break;
3949 case 16:
3950 i.tm.opcode_modifier.evex = EVEX128;
3951 break;
3952 default:
3953 abort ();
3954 }
3955 break;
3956 }
3957 }
3958
3959 if (op >= MAX_OPERANDS)
3960 abort ();
3961 }
3962
3963 switch (i.tm.opcode_modifier.evex)
3964 {
3965 case EVEXLIG: /* LL' is ignored */
3966 vec_length = evexlig << 5;
3967 break;
3968 case EVEX128:
3969 vec_length = 0 << 5;
3970 break;
3971 case EVEX256:
3972 vec_length = 1 << 5;
3973 break;
3974 case EVEX512:
3975 vec_length = 2 << 5;
3976 break;
3977 default:
3978 abort ();
3979 break;
3980 }
3981 i.vex.bytes[3] |= vec_length;
3982 /* Encode the broadcast bit. */
3983 if (i.broadcast)
3984 i.vex.bytes[3] |= 0x10;
3985 }
3986 else
3987 {
3988 if (i.rounding->type != saeonly)
3989 i.vex.bytes[3] |= 0x10 | (i.rounding->type << 5);
3990 else
3991 i.vex.bytes[3] |= 0x10 | (evexrcig << 5);
3992 }
3993
3994 if (i.mask && i.mask->mask)
3995 i.vex.bytes[3] |= i.mask->mask->reg_num;
3996 }
3997
3998 static void
3999 process_immext (void)
4000 {
4001 expressionS *exp;
4002
4003 /* These AMD 3DNow! and SSE2 instructions have an opcode suffix
4004 which is coded in the same place as an 8-bit immediate field
4005 would be. Here we fake an 8-bit immediate operand from the
4006 opcode suffix stored in tm.extension_opcode.
4007
     AVX instructions also use this encoding for some of the
     3-argument instructions.  */
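  /* For example (an illustration, not an exhaustive list): 3DNow!
     "pfadd %mm1, %mm0" is 0x0f 0x0f /r with opcode suffix 0x9e, and
     that suffix byte is emitted here as if it were an imm8.  */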
4010
4011 gas_assert (i.imm_operands <= 1
4012 && (i.operands <= 2
4013 || (is_any_vex_encoding (&i.tm)
4014 && i.operands <= 4)));
4015
4016 exp = &im_expressions[i.imm_operands++];
4017 i.op[i.operands].imms = exp;
4018 i.types[i.operands] = imm8;
4019 i.operands++;
4020 exp->X_op = O_constant;
4021 exp->X_add_number = i.tm.extension_opcode;
4022 i.tm.extension_opcode = None;
4023 }
4024
4025
4026 static int
4027 check_hle (void)
4028 {
4029 switch (i.tm.opcode_modifier.hleprefixok)
4030 {
4031 default:
4032 abort ();
4033 case HLEPrefixNone:
4034 as_bad (_("invalid instruction `%s' after `%s'"),
4035 i.tm.name, i.hle_prefix);
4036 return 0;
4037 case HLEPrefixLock:
4038 if (i.prefix[LOCK_PREFIX])
4039 return 1;
4040 as_bad (_("missing `lock' with `%s'"), i.hle_prefix);
4041 return 0;
4042 case HLEPrefixAny:
4043 return 1;
4044 case HLEPrefixRelease:
4045 if (i.prefix[HLE_PREFIX] != XRELEASE_PREFIX_OPCODE)
4046 {
4047 as_bad (_("instruction `%s' after `xacquire' not allowed"),
4048 i.tm.name);
4049 return 0;
4050 }
4051 if (i.mem_operands == 0 || !(i.flags[i.operands - 1] & Operand_Mem))
4052 {
4053 as_bad (_("memory destination needed for instruction `%s'"
4054 " after `xrelease'"), i.tm.name);
4055 return 0;
4056 }
4057 return 1;
4058 }
4059 }
4060
4061 /* Try the shortest encoding by shortening operand size. */
4062
4063 static void
4064 optimize_encoding (void)
4065 {
4066 unsigned int j;
4067
4068 if (optimize_for_space
4069 && !is_any_vex_encoding (&i.tm)
4070 && i.reg_operands == 1
4071 && i.imm_operands == 1
4072 && !i.types[1].bitfield.byte
4073 && i.op[0].imms->X_op == O_constant
4074 && fits_in_imm7 (i.op[0].imms->X_add_number)
4075 && (i.tm.base_opcode == 0xa8
4076 || (i.tm.base_opcode == 0xf6
4077 && i.tm.extension_opcode == 0x0)))
4078 {
4079 /* Optimize: -Os:
4080 test $imm7, %r64/%r32/%r16 -> test $imm7, %r8
4081 */
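      /* A worked size example (hypothetical bytes): "testl $1, %ecx"
	 is f7 c1 01 00 00 00 (6 bytes) while "testb $1, %cl" is
	 f6 c1 01 (3 bytes); the flag results agree because the
	 immediate fits in 7 bits.  */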
4082 unsigned int base_regnum = i.op[1].regs->reg_num;
4083 if (flag_code == CODE_64BIT || base_regnum < 4)
4084 {
4085 i.types[1].bitfield.byte = 1;
4086 /* Ignore the suffix. */
4087 i.suffix = 0;
4088 /* Convert to byte registers. */
4089 if (i.types[1].bitfield.word)
4090 j = 16;
4091 else if (i.types[1].bitfield.dword)
4092 j = 32;
4093 else
4094 j = 48;
4095 if (!(i.op[1].regs->reg_flags & RegRex) && base_regnum < 4)
4096 j += 8;
4097 i.op[1].regs -= j;
4098 }
4099 }
4100 else if (flag_code == CODE_64BIT
4101 && !is_any_vex_encoding (&i.tm)
4102 && ((i.types[1].bitfield.qword
4103 && i.reg_operands == 1
4104 && i.imm_operands == 1
4105 && i.op[0].imms->X_op == O_constant
4106 && ((i.tm.base_opcode == 0xb8
4107 && i.tm.extension_opcode == None
4108 && fits_in_unsigned_long (i.op[0].imms->X_add_number))
4109 || (fits_in_imm31 (i.op[0].imms->X_add_number)
4110 && ((i.tm.base_opcode == 0x24
4111 || i.tm.base_opcode == 0xa8)
4112 || (i.tm.base_opcode == 0x80
4113 && i.tm.extension_opcode == 0x4)
4114 || ((i.tm.base_opcode == 0xf6
4115 || (i.tm.base_opcode | 1) == 0xc7)
4116 && i.tm.extension_opcode == 0x0)))
4117 || (fits_in_imm7 (i.op[0].imms->X_add_number)
4118 && i.tm.base_opcode == 0x83
4119 && i.tm.extension_opcode == 0x4)))
4120 || (i.types[0].bitfield.qword
4121 && ((i.reg_operands == 2
4122 && i.op[0].regs == i.op[1].regs
4123 && (i.tm.base_opcode == 0x30
4124 || i.tm.base_opcode == 0x28))
4125 || (i.reg_operands == 1
4126 && i.operands == 1
4127 && i.tm.base_opcode == 0x30)))))
4128 {
4129 /* Optimize: -O:
4130 andq $imm31, %r64 -> andl $imm31, %r32
4131 andq $imm7, %r64 -> andl $imm7, %r32
4132 testq $imm31, %r64 -> testl $imm31, %r32
4133 xorq %r64, %r64 -> xorl %r32, %r32
4134 subq %r64, %r64 -> subl %r32, %r32
4135 movq $imm31, %r64 -> movl $imm31, %r32
4136 movq $imm32, %r64 -> movl $imm32, %r32
4137 */
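      /* E.g. "xorq %rax, %rax" (48 31 c0) shrinks to "xorl %eax, %eax"
	 (31 c0): a 32-bit register write zero-extends into the full
	 64-bit register, so dropping REX.W loses nothing (a worked
	 example, not taken from the sources).  */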
4138 i.tm.opcode_modifier.norex64 = 1;
4139 if (i.tm.base_opcode == 0xb8 || (i.tm.base_opcode | 1) == 0xc7)
4140 {
4141 /* Handle
4142 movq $imm31, %r64 -> movl $imm31, %r32
4143 movq $imm32, %r64 -> movl $imm32, %r32
4144 */
4145 i.tm.operand_types[0].bitfield.imm32 = 1;
4146 i.tm.operand_types[0].bitfield.imm32s = 0;
4147 i.tm.operand_types[0].bitfield.imm64 = 0;
4148 i.types[0].bitfield.imm32 = 1;
4149 i.types[0].bitfield.imm32s = 0;
4150 i.types[0].bitfield.imm64 = 0;
4151 i.types[1].bitfield.dword = 1;
4152 i.types[1].bitfield.qword = 0;
4153 if ((i.tm.base_opcode | 1) == 0xc7)
4154 {
4155 /* Handle
4156 movq $imm31, %r64 -> movl $imm31, %r32
4157 */
4158 i.tm.base_opcode = 0xb8;
4159 i.tm.extension_opcode = None;
4160 i.tm.opcode_modifier.w = 0;
4161 i.tm.opcode_modifier.modrm = 0;
4162 }
4163 }
4164 }
4165 else if (optimize > 1
4166 && !optimize_for_space
4167 && !is_any_vex_encoding (&i.tm)
4168 && i.reg_operands == 2
4169 && i.op[0].regs == i.op[1].regs
4170 && ((i.tm.base_opcode & ~(Opcode_D | 1)) == 0x8
4171 || (i.tm.base_opcode & ~(Opcode_D | 1)) == 0x20)
4172 && (flag_code != CODE_64BIT || !i.types[0].bitfield.dword))
4173 {
4174 /* Optimize: -O2:
4175 andb %rN, %rN -> testb %rN, %rN
4176 andw %rN, %rN -> testw %rN, %rN
4177 andq %rN, %rN -> testq %rN, %rN
4178 orb %rN, %rN -> testb %rN, %rN
4179 orw %rN, %rN -> testw %rN, %rN
4180 orq %rN, %rN -> testq %rN, %rN
4181
4182 and outside of 64-bit mode
4183
4184 andl %rN, %rN -> testl %rN, %rN
4185 orl %rN, %rN -> testl %rN, %rN
4186 */
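      /* E.g. "andl %eax, %eax" (21 c0) becomes "testl %eax, %eax"
	 (85 c0): same length and identical flag results, but test
	 does not write %eax (an editorial note on the presumed
	 motivation).  */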
4187 i.tm.base_opcode = 0x84 | (i.tm.base_opcode & 1);
4188 }
4189 else if (i.reg_operands == 3
4190 && i.op[0].regs == i.op[1].regs
4191 && !i.types[2].bitfield.xmmword
4192 && (i.tm.opcode_modifier.vex
4193 || ((!i.mask || i.mask->zeroing)
4194 && !i.rounding
4195 && is_evex_encoding (&i.tm)
4196 && (i.vec_encoding != vex_encoding_evex
4197 || cpu_arch_isa_flags.bitfield.cpuavx512vl
4198 || i.tm.cpu_flags.bitfield.cpuavx512vl
4199 || (i.tm.operand_types[2].bitfield.zmmword
4200 && i.types[2].bitfield.ymmword))))
4201 && ((i.tm.base_opcode == 0x55
4202 || i.tm.base_opcode == 0x6655
4203 || i.tm.base_opcode == 0x66df
4204 || i.tm.base_opcode == 0x57
4205 || i.tm.base_opcode == 0x6657
4206 || i.tm.base_opcode == 0x66ef
4207 || i.tm.base_opcode == 0x66f8
4208 || i.tm.base_opcode == 0x66f9
4209 || i.tm.base_opcode == 0x66fa
4210 || i.tm.base_opcode == 0x66fb
4211 || i.tm.base_opcode == 0x42
4212 || i.tm.base_opcode == 0x6642
4213 || i.tm.base_opcode == 0x47
4214 || i.tm.base_opcode == 0x6647)
4215 && i.tm.extension_opcode == None))
4216 {
4217 /* Optimize: -O1:
4218 VOP, one of vandnps, vandnpd, vxorps, vxorpd, vpsubb, vpsubd,
4219 vpsubq and vpsubw:
4220 EVEX VOP %zmmM, %zmmM, %zmmN
4221 -> VEX VOP %xmmM, %xmmM, %xmmN (M and N < 16)
4222 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4223 EVEX VOP %ymmM, %ymmM, %ymmN
4224 -> VEX VOP %xmmM, %xmmM, %xmmN (M and N < 16)
4225 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4226 VEX VOP %ymmM, %ymmM, %ymmN
4227 -> VEX VOP %xmmM, %xmmM, %xmmN
4228 VOP, one of vpandn and vpxor:
4229 VEX VOP %ymmM, %ymmM, %ymmN
4230 -> VEX VOP %xmmM, %xmmM, %xmmN
4231 VOP, one of vpandnd and vpandnq:
4232 EVEX VOP %zmmM, %zmmM, %zmmN
4233 -> VEX vpandn %xmmM, %xmmM, %xmmN (M and N < 16)
4234 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4235 EVEX VOP %ymmM, %ymmM, %ymmN
4236 -> VEX vpandn %xmmM, %xmmM, %xmmN (M and N < 16)
4237 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4238 VOP, one of vpxord and vpxorq:
4239 EVEX VOP %zmmM, %zmmM, %zmmN
4240 -> VEX vpxor %xmmM, %xmmM, %xmmN (M and N < 16)
4241 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4242 EVEX VOP %ymmM, %ymmM, %ymmN
4243 -> VEX vpxor %xmmM, %xmmM, %xmmN (M and N < 16)
4244 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4245 VOP, one of kxord and kxorq:
4246 VEX VOP %kM, %kM, %kN
4247 -> VEX kxorw %kM, %kM, %kN
4248 VOP, one of kandnd and kandnq:
4249 VEX VOP %kM, %kM, %kN
4250 -> VEX kandnw %kM, %kM, %kN
4251 */
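      /* E.g. "vpxord %zmm1, %zmm1, %zmm1" (a 6-byte EVEX instruction)
	 can be emitted as VEX "vpxor %xmm1, %xmm1, %xmm1" (4 bytes):
	 a VEX XMM write zeroes the rest of the ZMM register, so the
	 effect is identical (a worked illustration).  */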
4252 if (is_evex_encoding (&i.tm))
4253 {
4254 if (i.vec_encoding != vex_encoding_evex)
4255 {
4256 i.tm.opcode_modifier.vex = VEX128;
4257 i.tm.opcode_modifier.vexw = VEXW0;
4258 i.tm.opcode_modifier.evex = 0;
4259 }
4260 else if (optimize > 1)
4261 i.tm.opcode_modifier.evex = EVEX128;
4262 else
4263 return;
4264 }
4265 else if (i.tm.operand_types[0].bitfield.class == RegMask)
4266 {
4267 i.tm.base_opcode &= 0xff;
4268 i.tm.opcode_modifier.vexw = VEXW0;
4269 }
4270 else
4271 i.tm.opcode_modifier.vex = VEX128;
4272
4273 if (i.tm.opcode_modifier.vex)
4274 for (j = 0; j < 3; j++)
4275 {
4276 i.types[j].bitfield.xmmword = 1;
4277 i.types[j].bitfield.ymmword = 0;
4278 }
4279 }
4280 else if (i.vec_encoding != vex_encoding_evex
4281 && !i.types[0].bitfield.zmmword
4282 && !i.types[1].bitfield.zmmword
4283 && !i.mask
4284 && !i.broadcast
4285 && is_evex_encoding (&i.tm)
4286 && ((i.tm.base_opcode & ~Opcode_SIMD_IntD) == 0x666f
4287 || (i.tm.base_opcode & ~Opcode_SIMD_IntD) == 0xf36f
4288 || (i.tm.base_opcode & ~Opcode_SIMD_IntD) == 0xf26f
4289 || (i.tm.base_opcode & ~4) == 0x66db
4290 || (i.tm.base_opcode & ~4) == 0x66eb)
4291 && i.tm.extension_opcode == None)
4292 {
4293 /* Optimize: -O1:
4294 VOP, one of vmovdqa32, vmovdqa64, vmovdqu8, vmovdqu16,
4295 vmovdqu32 and vmovdqu64:
4296 EVEX VOP %xmmM, %xmmN
4297 -> VEX vmovdqa|vmovdqu %xmmM, %xmmN (M and N < 16)
4298 EVEX VOP %ymmM, %ymmN
4299 -> VEX vmovdqa|vmovdqu %ymmM, %ymmN (M and N < 16)
4300 EVEX VOP %xmmM, mem
4301 -> VEX vmovdqa|vmovdqu %xmmM, mem (M < 16)
4302 EVEX VOP %ymmM, mem
4303 -> VEX vmovdqa|vmovdqu %ymmM, mem (M < 16)
4304 EVEX VOP mem, %xmmN
	   -> VEX vmovdqa|vmovdqu mem, %xmmN (N < 16)
4306 EVEX VOP mem, %ymmN
4307 -> VEX vmovdqa|vmovdqu mem, %ymmN (N < 16)
4308 VOP, one of vpand, vpandn, vpor, vpxor:
4309 EVEX VOP{d,q} %xmmL, %xmmM, %xmmN
4310 -> VEX VOP %xmmL, %xmmM, %xmmN (L, M, and N < 16)
4311 EVEX VOP{d,q} %ymmL, %ymmM, %ymmN
4312 -> VEX VOP %ymmL, %ymmM, %ymmN (L, M, and N < 16)
4313 EVEX VOP{d,q} mem, %xmmM, %xmmN
4314 -> VEX VOP mem, %xmmM, %xmmN (M and N < 16)
4315 EVEX VOP{d,q} mem, %ymmM, %ymmN
4316 -> VEX VOP mem, %ymmM, %ymmN (M and N < 16)
4317 */
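      /* E.g. "vmovdqu64 %ymm1, (%rax)" can be emitted as plain VEX
	 "vmovdqu %ymm1, (%rax)", saving the extra EVEX prefix byte
	 (illustrative; the masking/broadcast cases excluded above
	 keep their EVEX form).  */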
4318 for (j = 0; j < i.operands; j++)
4319 if (operand_type_check (i.types[j], disp)
4320 && i.op[j].disps->X_op == O_constant)
4321 {
	    /* The VEX prefix has 2 or 3 bytes and the EVEX prefix has
	       4 bytes, but EVEX Disp8 has 1 byte while VEX Disp32 has
	       4 bytes, so we choose EVEX Disp8 over VEX Disp32.  */
4325 int evex_disp8, vex_disp8;
4326 unsigned int memshift = i.memshift;
4327 offsetT n = i.op[j].disps->X_add_number;
4328
4329 evex_disp8 = fits_in_disp8 (n);
4330 i.memshift = 0;
4331 vex_disp8 = fits_in_disp8 (n);
4332 if (evex_disp8 != vex_disp8)
4333 {
4334 i.memshift = memshift;
4335 return;
4336 }
4337
4338 i.types[j].bitfield.disp8 = vex_disp8;
4339 break;
4340 }
4341 if ((i.tm.base_opcode & ~Opcode_SIMD_IntD) == 0xf26f)
4342 i.tm.base_opcode ^= 0xf36f ^ 0xf26f;
4343 i.tm.opcode_modifier.vex
4344 = i.types[0].bitfield.ymmword ? VEX256 : VEX128;
4345 i.tm.opcode_modifier.vexw = VEXW0;
4346 /* VPAND, VPOR, and VPXOR are commutative. */
4347 if (i.reg_operands == 3 && i.tm.base_opcode != 0x66df)
4348 i.tm.opcode_modifier.commutative = 1;
4349 i.tm.opcode_modifier.evex = 0;
4350 i.tm.opcode_modifier.masking = 0;
4351 i.tm.opcode_modifier.broadcast = 0;
4352 i.tm.opcode_modifier.disp8memshift = 0;
4353 i.memshift = 0;
4354 if (j < i.operands)
4355 i.types[j].bitfield.disp8
4356 = fits_in_disp8 (i.op[j].disps->X_add_number);
4357 }
4358 }
4359
4360 /* Return non-zero for load instruction. */
4361
4362 static int
4363 load_insn_p (void)
4364 {
4365 unsigned int dest;
4366 int any_vex_p = is_any_vex_encoding (&i.tm);
4367 unsigned int base_opcode = i.tm.base_opcode | 1;
4368
4369 if (!any_vex_p)
4370 {
4371 /* Anysize insns: lea, invlpg, clflush, prefetchnta, prefetcht0,
	 prefetcht1, prefetcht2, prefetchw, bndmk, bndcl, bndcu, bndcn,
4373 bndstx, bndldx, prefetchwt1, clflushopt, clwb, cldemote. */
4374 if (i.tm.opcode_modifier.anysize)
4375 return 0;
4376
4377 /* pop, popf, popa. */
4378 if (strcmp (i.tm.name, "pop") == 0
4379 || i.tm.base_opcode == 0x9d
4380 || i.tm.base_opcode == 0x61)
4381 return 1;
4382
4383 /* movs, cmps, lods, scas. */
4384 if ((i.tm.base_opcode | 0xb) == 0xaf)
4385 return 1;
4386
4387 /* outs, xlatb. */
4388 if (base_opcode == 0x6f
4389 || i.tm.base_opcode == 0xd7)
4390 return 1;
      /* NB: AMD-specific insns with implicit memory operands are
	 intentionally not covered.  */
4393 }
4394
4395 /* No memory operand. */
4396 if (!i.mem_operands)
4397 return 0;
4398
4399 if (any_vex_p)
4400 {
4401 /* vldmxcsr. */
4402 if (i.tm.base_opcode == 0xae
4403 && i.tm.opcode_modifier.vex
4404 && i.tm.opcode_modifier.vexopcode == VEX0F
4405 && i.tm.extension_opcode == 2)
4406 return 1;
4407 }
4408 else
4409 {
4410 /* test, not, neg, mul, imul, div, idiv. */
4411 if ((i.tm.base_opcode == 0xf6 || i.tm.base_opcode == 0xf7)
4412 && i.tm.extension_opcode != 1)
4413 return 1;
4414
4415 /* inc, dec. */
4416 if (base_opcode == 0xff && i.tm.extension_opcode <= 1)
4417 return 1;
4418
4419 /* add, or, adc, sbb, and, sub, xor, cmp. */
4420 if (i.tm.base_opcode >= 0x80 && i.tm.base_opcode <= 0x83)
4421 return 1;
4422
4423 /* bt, bts, btr, btc. */
4424 if (i.tm.base_opcode == 0xfba
4425 && (i.tm.extension_opcode >= 4 && i.tm.extension_opcode <= 7))
4426 return 1;
4427
4428 /* rol, ror, rcl, rcr, shl/sal, shr, sar. */
4429 if ((base_opcode == 0xc1
4430 || (i.tm.base_opcode >= 0xd0 && i.tm.base_opcode <= 0xd3))
4431 && i.tm.extension_opcode != 6)
4432 return 1;
4433
4434 /* cmpxchg8b, cmpxchg16b, xrstors. */
4435 if (i.tm.base_opcode == 0xfc7
4436 && (i.tm.extension_opcode == 1 || i.tm.extension_opcode == 3))
4437 return 1;
4438
4439 /* fxrstor, ldmxcsr, xrstor. */
4440 if (i.tm.base_opcode == 0xfae
4441 && (i.tm.extension_opcode == 1
4442 || i.tm.extension_opcode == 2
4443 || i.tm.extension_opcode == 5))
4444 return 1;
4445
4446 /* lgdt, lidt, lmsw. */
4447 if (i.tm.base_opcode == 0xf01
4448 && (i.tm.extension_opcode == 2
4449 || i.tm.extension_opcode == 3
4450 || i.tm.extension_opcode == 6))
4451 return 1;
4452
4453 /* vmptrld */
4454 if (i.tm.base_opcode == 0xfc7
4455 && i.tm.extension_opcode == 6)
4456 return 1;
4457
4458 /* Check for x87 instructions. */
4459 if (i.tm.base_opcode >= 0xd8 && i.tm.base_opcode <= 0xdf)
4460 {
4461 /* Skip fst, fstp, fstenv, fstcw. */
4462 if (i.tm.base_opcode == 0xd9
4463 && (i.tm.extension_opcode == 2
4464 || i.tm.extension_opcode == 3
4465 || i.tm.extension_opcode == 6
4466 || i.tm.extension_opcode == 7))
4467 return 0;
4468
4469 /* Skip fisttp, fist, fistp, fstp. */
4470 if (i.tm.base_opcode == 0xdb
4471 && (i.tm.extension_opcode == 1
4472 || i.tm.extension_opcode == 2
4473 || i.tm.extension_opcode == 3
4474 || i.tm.extension_opcode == 7))
4475 return 0;
4476
4477 /* Skip fisttp, fst, fstp, fsave, fstsw. */
4478 if (i.tm.base_opcode == 0xdd
4479 && (i.tm.extension_opcode == 1
4480 || i.tm.extension_opcode == 2
4481 || i.tm.extension_opcode == 3
4482 || i.tm.extension_opcode == 6
4483 || i.tm.extension_opcode == 7))
4484 return 0;
4485
4486 /* Skip fisttp, fist, fistp, fbstp, fistp. */
4487 if (i.tm.base_opcode == 0xdf
4488 && (i.tm.extension_opcode == 1
4489 || i.tm.extension_opcode == 2
4490 || i.tm.extension_opcode == 3
4491 || i.tm.extension_opcode == 6
4492 || i.tm.extension_opcode == 7))
4493 return 0;
4494
4495 return 1;
4496 }
4497 }
4498
4499 dest = i.operands - 1;
4500
4501 /* Check fake imm8 operand and 3 source operands. */
4502 if ((i.tm.opcode_modifier.immext
4503 || i.tm.opcode_modifier.vexsources == VEX3SOURCES)
4504 && i.types[dest].bitfield.imm8)
4505 dest--;
4506
4507 /* add, or, adc, sbb, and, sub, xor, cmp, test, xchg, xadd */
4508 if (!any_vex_p
4509 && (base_opcode == 0x1
4510 || base_opcode == 0x9
4511 || base_opcode == 0x11
4512 || base_opcode == 0x19
4513 || base_opcode == 0x21
4514 || base_opcode == 0x29
4515 || base_opcode == 0x31
4516 || base_opcode == 0x39
4517 || (i.tm.base_opcode >= 0x84 && i.tm.base_opcode <= 0x87)
4518 || base_opcode == 0xfc1))
4519 return 1;
4520
4521 /* Check for load instruction. */
4522 return (i.types[dest].bitfield.class != ClassNone
4523 || i.types[dest].bitfield.instance == Accum);
4524 }
4525
/* Output lfence (opcode bytes 0x0f 0xae 0xe8) after instruction.  */
4527
4528 static void
4529 insert_lfence_after (void)
4530 {
4531 if (lfence_after_load && load_insn_p ())
4532 {
4533 /* There are also two REP string instructions that require
4534 special treatment. Specifically, the compare string (CMPS)
4535 and scan string (SCAS) instructions set EFLAGS in a manner
4536 that depends on the data being compared/scanned. When used
4537 with a REP prefix, the number of iterations may therefore
4538 vary depending on this data. If the data is a program secret
4539 chosen by the adversary using an LVI method,
4540 then this data-dependent behavior may leak some aspect
4541 of the secret. */
4542 if (((i.tm.base_opcode | 0x1) == 0xa7
4543 || (i.tm.base_opcode | 0x1) == 0xaf)
4544 && i.prefix[REP_PREFIX])
4545 {
4546 as_warn (_("`%s` changes flags which would affect control flow behavior"),
4547 i.tm.name);
4548 }
4549 char *p = frag_more (3);
4550 *p++ = 0xf;
4551 *p++ = 0xae;
4552 *p = 0xe8;
4553 }
4554 }
4555
/* Output lfence (opcode bytes 0x0f 0xae 0xe8) before instruction.  */
4557
4558 static void
4559 insert_lfence_before (void)
4560 {
4561 char *p;
4562
4563 if (is_any_vex_encoding (&i.tm))
4564 return;
4565
4566 if (i.tm.base_opcode == 0xff
4567 && (i.tm.extension_opcode == 2 || i.tm.extension_opcode == 4))
4568 {
4569 /* Insert lfence before indirect branch if needed. */
4570
4571 if (lfence_before_indirect_branch == lfence_branch_none)
4572 return;
4573
4574 if (i.operands != 1)
4575 abort ();
4576
4577 if (i.reg_operands == 1)
4578 {
4579 /* Indirect branch via register. Don't insert lfence with
4580 -mlfence-after-load=yes. */
4581 if (lfence_after_load
4582 || lfence_before_indirect_branch == lfence_branch_memory)
4583 return;
4584 }
4585 else if (i.mem_operands == 1
4586 && lfence_before_indirect_branch != lfence_branch_register)
4587 {
4588 as_warn (_("indirect `%s` with memory operand should be avoided"),
4589 i.tm.name);
4590 return;
4591 }
4592 else
4593 return;
4594
4595 if (last_insn.kind != last_insn_other
4596 && last_insn.seg == now_seg)
4597 {
4598 as_warn_where (last_insn.file, last_insn.line,
4599 _("`%s` skips -mlfence-before-indirect-branch on `%s`"),
4600 last_insn.name, i.tm.name);
4601 return;
4602 }
4603
4604 p = frag_more (3);
4605 *p++ = 0xf;
4606 *p++ = 0xae;
4607 *p = 0xe8;
4608 return;
4609 }
4610
4611 /* Output or/not/shl and lfence before near ret. */
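  /* E.g. with -mlfence-before-ret=or in 64-bit code, "ret" is
     preceded by "orq $0, (%rsp)" and "lfence"
     (48 83 0c 24 00 0f ae e8), so the return address load is fenced
     (a worked example of the bytes emitted below).  */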
4612 if (lfence_before_ret != lfence_before_ret_none
4613 && (i.tm.base_opcode == 0xc2
4614 || i.tm.base_opcode == 0xc3))
4615 {
4616 if (last_insn.kind != last_insn_other
4617 && last_insn.seg == now_seg)
4618 {
4619 as_warn_where (last_insn.file, last_insn.line,
4620 _("`%s` skips -mlfence-before-ret on `%s`"),
4621 last_insn.name, i.tm.name);
4622 return;
4623 }
4624
      /* Near ret ignores the operand size override in 64-bit code.  */
4626 char prefix = flag_code == CODE_64BIT
4627 ? 0x48
4628 : i.prefix[DATA_PREFIX] ? 0x66 : 0x0;
4629
4630 if (lfence_before_ret == lfence_before_ret_not)
4631 {
4632 /* not: 0xf71424, may add prefix
4633 for operand size override or 64-bit code. */
4634 p = frag_more ((prefix ? 2 : 0) + 6 + 3);
4635 if (prefix)
4636 *p++ = prefix;
4637 *p++ = 0xf7;
4638 *p++ = 0x14;
4639 *p++ = 0x24;
4640 if (prefix)
4641 *p++ = prefix;
4642 *p++ = 0xf7;
4643 *p++ = 0x14;
4644 *p++ = 0x24;
4645 }
4646 else
4647 {
4648 p = frag_more ((prefix ? 1 : 0) + 4 + 3);
4649 if (prefix)
4650 *p++ = prefix;
4651 if (lfence_before_ret == lfence_before_ret_or)
4652 {
4653 /* or: 0x830c2400, may add prefix
4654 for operand size override or 64-bit code. */
4655 *p++ = 0x83;
4656 *p++ = 0x0c;
4657 }
4658 else
4659 {
4660 /* shl: 0xc1242400, may add prefix
4661 for operand size override or 64-bit code. */
4662 *p++ = 0xc1;
4663 *p++ = 0x24;
4664 }
4665
4666 *p++ = 0x24;
4667 *p++ = 0x0;
4668 }
4669
4670 *p++ = 0xf;
4671 *p++ = 0xae;
4672 *p = 0xe8;
4673 }
4674 }
4675
4676 /* This is the guts of the machine-dependent assembler. LINE points to a
4677 machine dependent instruction. This function is supposed to emit
4678 the frags/bytes it assembles to. */
4679
4680 void
4681 md_assemble (char *line)
4682 {
4683 unsigned int j;
4684 char mnemonic[MAX_MNEM_SIZE], mnem_suffix;
4685 const insn_template *t;
4686
4687 /* Initialize globals. */
4688 memset (&i, '\0', sizeof (i));
4689 for (j = 0; j < MAX_OPERANDS; j++)
4690 i.reloc[j] = NO_RELOC;
4691 memset (disp_expressions, '\0', sizeof (disp_expressions));
4692 memset (im_expressions, '\0', sizeof (im_expressions));
4693 save_stack_p = save_stack;
4694
4695 /* First parse an instruction mnemonic & call i386_operand for the operands.
4696 We assume that the scrubber has arranged it so that line[0] is the valid
4697 start of a (possibly prefixed) mnemonic. */
4698
4699 line = parse_insn (line, mnemonic);
4700 if (line == NULL)
4701 return;
4702 mnem_suffix = i.suffix;
4703
4704 line = parse_operands (line, mnemonic);
4705 this_operand = -1;
4706 xfree (i.memop1_string);
4707 i.memop1_string = NULL;
4708 if (line == NULL)
4709 return;
4710
4711 /* Now we've parsed the mnemonic into a set of templates, and have the
4712 operands at hand. */
4713
4714 /* All Intel opcodes have reversed operands except for "bound", "enter",
4715 "monitor*", "mwait*", "tpause", and "umwait". We also don't reverse
4716 intersegment "jmp" and "call" instructions with 2 immediate operands so
4717 that the immediate segment precedes the offset, as it does when in AT&T
4718 mode. */
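  /* E.g. Intel "add eax, ebx" parses with eax first, while templates
     are stored in AT&T order ("add %ebx, %eax"), hence the swap
     (an illustrative pairing).  */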
4719 if (intel_syntax
4720 && i.operands > 1
4721 && (strcmp (mnemonic, "bound") != 0)
4722 && (strcmp (mnemonic, "invlpga") != 0)
4723 && (strncmp (mnemonic, "monitor", 7) != 0)
4724 && (strncmp (mnemonic, "mwait", 5) != 0)
4725 && (strcmp (mnemonic, "tpause") != 0)
4726 && (strcmp (mnemonic, "umwait") != 0)
4727 && !(operand_type_check (i.types[0], imm)
4728 && operand_type_check (i.types[1], imm)))
4729 swap_operands ();
4730
4731 /* The order of the immediates should be reversed
4732 for 2 immediates extrq and insertq instructions */
4733 if (i.imm_operands == 2
4734 && (strcmp (mnemonic, "extrq") == 0
4735 || strcmp (mnemonic, "insertq") == 0))
4736 swap_2_operands (0, 1);
4737
4738 if (i.imm_operands)
4739 optimize_imm ();
4740
  /* Don't optimize displacement for movabs since it only takes a 64bit
4742 displacement. */
4743 if (i.disp_operands
4744 && i.disp_encoding != disp_encoding_32bit
4745 && (flag_code != CODE_64BIT
4746 || strcmp (mnemonic, "movabs") != 0))
4747 optimize_disp ();
4748
4749 /* Next, we find a template that matches the given insn,
4750 making sure the overlap of the given operands types is consistent
4751 with the template operand types. */
4752
4753 if (!(t = match_template (mnem_suffix)))
4754 return;
4755
4756 if (sse_check != check_none
4757 && !i.tm.opcode_modifier.noavx
4758 && !i.tm.cpu_flags.bitfield.cpuavx
4759 && !i.tm.cpu_flags.bitfield.cpuavx512f
4760 && (i.tm.cpu_flags.bitfield.cpusse
4761 || i.tm.cpu_flags.bitfield.cpusse2
4762 || i.tm.cpu_flags.bitfield.cpusse3
4763 || i.tm.cpu_flags.bitfield.cpussse3
4764 || i.tm.cpu_flags.bitfield.cpusse4_1
4765 || i.tm.cpu_flags.bitfield.cpusse4_2
4766 || i.tm.cpu_flags.bitfield.cpupclmul
4767 || i.tm.cpu_flags.bitfield.cpuaes
4768 || i.tm.cpu_flags.bitfield.cpusha
4769 || i.tm.cpu_flags.bitfield.cpugfni))
4770 {
4771 (sse_check == check_warning
4772 ? as_warn
4773 : as_bad) (_("SSE instruction `%s' is used"), i.tm.name);
4774 }
4775
4776 if (i.tm.opcode_modifier.fwait)
4777 if (!add_prefix (FWAIT_OPCODE))
4778 return;
4779
4780 /* Check if REP prefix is OK. */
4781 if (i.rep_prefix && !i.tm.opcode_modifier.repprefixok)
4782 {
4783 as_bad (_("invalid instruction `%s' after `%s'"),
4784 i.tm.name, i.rep_prefix);
4785 return;
4786 }
4787
4788 /* Check for lock without a lockable instruction. Destination operand
4789 must be memory unless it is xchg (0x86). */
4790 if (i.prefix[LOCK_PREFIX]
4791 && (!i.tm.opcode_modifier.islockable
4792 || i.mem_operands == 0
4793 || (i.tm.base_opcode != 0x86
4794 && !(i.flags[i.operands - 1] & Operand_Mem))))
4795 {
4796 as_bad (_("expecting lockable instruction after `lock'"));
4797 return;
4798 }
4799
4800 /* Check for data size prefix on VEX/XOP/EVEX encoded and SIMD insns. */
4801 if (i.prefix[DATA_PREFIX]
4802 && (is_any_vex_encoding (&i.tm)
4803 || i.tm.operand_types[i.imm_operands].bitfield.class >= RegMMX
4804 || i.tm.operand_types[i.imm_operands + 1].bitfield.class >= RegMMX))
4805 {
4806 as_bad (_("data size prefix invalid with `%s'"), i.tm.name);
4807 return;
4808 }
4809
4810 /* Check if HLE prefix is OK. */
4811 if (i.hle_prefix && !check_hle ())
4812 return;
4813
4814 /* Check BND prefix. */
4815 if (i.bnd_prefix && !i.tm.opcode_modifier.bndprefixok)
4816 as_bad (_("expecting valid branch instruction after `bnd'"));
4817
4818 /* Check NOTRACK prefix. */
4819 if (i.notrack_prefix && !i.tm.opcode_modifier.notrackprefixok)
4820 as_bad (_("expecting indirect branch instruction after `notrack'"));
4821
4822 if (i.tm.cpu_flags.bitfield.cpumpx)
4823 {
4824 if (flag_code == CODE_64BIT && i.prefix[ADDR_PREFIX])
4825 as_bad (_("32-bit address isn't allowed in 64-bit MPX instructions."));
4826 else if (flag_code != CODE_16BIT
4827 ? i.prefix[ADDR_PREFIX]
4828 : i.mem_operands && !i.prefix[ADDR_PREFIX])
4829 as_bad (_("16-bit address isn't allowed in MPX instructions"));
4830 }
4831
4832 /* Insert BND prefix. */
4833 if (add_bnd_prefix && i.tm.opcode_modifier.bndprefixok)
4834 {
4835 if (!i.prefix[BND_PREFIX])
4836 add_prefix (BND_PREFIX_OPCODE);
4837 else if (i.prefix[BND_PREFIX] != BND_PREFIX_OPCODE)
4838 {
4839 as_warn (_("replacing `rep'/`repe' prefix by `bnd'"));
4840 i.prefix[BND_PREFIX] = BND_PREFIX_OPCODE;
4841 }
4842 }
4843
4844 /* Check string instruction segment overrides. */
4845 if (i.tm.opcode_modifier.isstring >= IS_STRING_ES_OP0)
4846 {
4847 gas_assert (i.mem_operands);
4848 if (!check_string ())
4849 return;
4850 i.disp_operands = 0;
4851 }
4852
4853 if (optimize && !i.no_optimize && i.tm.opcode_modifier.optimize)
4854 optimize_encoding ();
4855
4856 if (!process_suffix ())
4857 return;
4858
4859 /* Update operand types and check extended states. */
4860 for (j = 0; j < i.operands; j++)
4861 {
4862 i.types[j] = operand_type_and (i.types[j], i.tm.operand_types[j]);
4863 switch (i.tm.operand_types[j].bitfield.class)
4864 {
4865 default:
4866 break;
4867 case RegMMX:
4868 i.xstate |= xstate_mmx;
4869 break;
4870 case RegMask:
4871 i.xstate |= xstate_zmm;
4872 break;
4873 case RegSIMD:
4874 if (i.tm.operand_types[j].bitfield.tmmword)
4875 i.xstate |= xstate_tmm;
4876 else if (i.tm.operand_types[j].bitfield.zmmword)
4877 i.xstate |= xstate_zmm;
4878 else if (i.tm.operand_types[j].bitfield.ymmword)
4879 i.xstate |= xstate_ymm;
4880 else if (i.tm.operand_types[j].bitfield.xmmword)
4881 i.xstate |= xstate_xmm;
4882 break;
4883 }
4884 }
4885
4886 /* Make still unresolved immediate matches conform to size of immediate
4887 given in i.suffix. */
4888 if (!finalize_imm ())
4889 return;
4890
4891 if (i.types[0].bitfield.imm1)
4892 i.imm_operands = 0; /* kludge for shift insns. */
4893
4894 /* We only need to check those implicit registers for instructions
4895 with 3 operands or less. */
4896 if (i.operands <= 3)
4897 for (j = 0; j < i.operands; j++)
4898 if (i.types[j].bitfield.instance != InstanceNone
4899 && !i.types[j].bitfield.xmmword)
4900 i.reg_operands--;
4901
4902 /* For insns with operands there are more diddles to do to the opcode. */
4903 if (i.operands)
4904 {
4905 if (!process_operands ())
4906 return;
4907 }
4908 else if (!quiet_warnings && i.tm.opcode_modifier.ugh)
4909 {
4910 /* UnixWare fsub no args is alias for fsubp, fadd -> faddp, etc. */
4911 as_warn (_("translating to `%sp'"), i.tm.name);
4912 }
4913
4914 if (is_any_vex_encoding (&i.tm))
4915 {
4916 if (!cpu_arch_flags.bitfield.cpui286)
4917 {
4918 as_bad (_("instruction `%s' isn't supported outside of protected mode."),
4919 i.tm.name);
4920 return;
4921 }
4922
4923 /* Check for explicit REX prefix. */
4924 if (i.prefix[REX_PREFIX] || i.rex_encoding)
4925 {
4926 as_bad (_("REX prefix invalid with `%s'"), i.tm.name);
4927 return;
4928 }
4929
4930 if (i.tm.opcode_modifier.vex)
4931 build_vex_prefix (t);
4932 else
4933 build_evex_prefix ();
4934
4935 /* The individual REX.RXBW bits got consumed. */
4936 i.rex &= REX_OPCODE;
4937 }
4938
4939 /* Handle conversion of 'int $3' --> special int3 insn. XOP or FMA4
4940 instructions may define INT_OPCODE as well, so avoid this corner
4941 case for those instructions that use MODRM. */
4942 if (i.tm.base_opcode == INT_OPCODE
4943 && !i.tm.opcode_modifier.modrm
4944 && i.op[0].imms->X_add_number == 3)
4945 {
4946 i.tm.base_opcode = INT3_OPCODE;
4947 i.imm_operands = 0;
4948 }
4949
4950 if ((i.tm.opcode_modifier.jump == JUMP
4951 || i.tm.opcode_modifier.jump == JUMP_BYTE
4952 || i.tm.opcode_modifier.jump == JUMP_DWORD)
4953 && i.op[0].disps->X_op == O_constant)
4954 {
4955 /* Convert "jmp constant" (and "call constant") to a jump (call) to
4956 the absolute address given by the constant. Since ix86 jumps and
4957 calls are pc relative, we need to generate a reloc. */
4958 i.op[0].disps->X_add_symbol = &abs_symbol;
4959 i.op[0].disps->X_op = O_symbol;
4960 }
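  /* E.g. "jmp 0x1000" is thus assembled as a pc-relative branch
     against the absolute-section symbol plus 0x1000, leaving the
     final distance to the fixup/relocation machinery (a sketch of
     the effect; the reloc type depends on the target).  */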
4961
4962 /* For 8 bit registers we need an empty rex prefix. Also if the
4963 instruction already has a prefix, we need to convert old
4964 registers to new ones. */
4965
4966 if ((i.types[0].bitfield.class == Reg && i.types[0].bitfield.byte
4967 && (i.op[0].regs->reg_flags & RegRex64) != 0)
4968 || (i.types[1].bitfield.class == Reg && i.types[1].bitfield.byte
4969 && (i.op[1].regs->reg_flags & RegRex64) != 0)
4970 || (((i.types[0].bitfield.class == Reg && i.types[0].bitfield.byte)
4971 || (i.types[1].bitfield.class == Reg && i.types[1].bitfield.byte))
4972 && i.rex != 0))
4973 {
4974 int x;
4975
4976 i.rex |= REX_OPCODE;
4977 for (x = 0; x < 2; x++)
4978 {
4979 /* Look for 8 bit operand that uses old registers. */
4980 if (i.types[x].bitfield.class == Reg && i.types[x].bitfield.byte
4981 && (i.op[x].regs->reg_flags & RegRex64) == 0)
4982 {
4983 gas_assert (!(i.op[x].regs->reg_flags & RegRex));
4984 /* In case it is "hi" register, give up. */
4985 if (i.op[x].regs->reg_num > 3)
4986 as_bad (_("can't encode register '%s%s' in an "
4987 "instruction requiring REX prefix."),
4988 register_prefix, i.op[x].regs->reg_name);
4989
4990 /* Otherwise it is equivalent to the extended register.
4991 Since the encoding doesn't change this is merely
4992 cosmetic cleanup for debug output. */
4993
4994 i.op[x].regs = i.op[x].regs + 8;
4995 }
4996 }
4997 }
4998
4999 if (i.rex == 0 && i.rex_encoding)
5000 {
5001 /* Check if we can add a REX_OPCODE byte. Look for 8 bit operand
5002 that uses legacy register. If it is "hi" register, don't add
5003 the REX_OPCODE byte. */
5004 int x;
5005 for (x = 0; x < 2; x++)
5006 if (i.types[x].bitfield.class == Reg
5007 && i.types[x].bitfield.byte
5008 && (i.op[x].regs->reg_flags & RegRex64) == 0
5009 && i.op[x].regs->reg_num > 3)
5010 {
5011 gas_assert (!(i.op[x].regs->reg_flags & RegRex));
5012 i.rex_encoding = FALSE;
5013 break;
5014 }
5015
5016 if (i.rex_encoding)
5017 i.rex = REX_OPCODE;
5018 }
5019
5020 if (i.rex != 0)
5021 add_prefix (REX_OPCODE | i.rex);
5022
5023 insert_lfence_before ();
5024
5025 /* We are ready to output the insn. */
5026 output_insn ();
5027
5028 insert_lfence_after ();
5029
5030 last_insn.seg = now_seg;
5031
5032 if (i.tm.opcode_modifier.isprefix)
5033 {
5034 last_insn.kind = last_insn_prefix;
5035 last_insn.name = i.tm.name;
5036 last_insn.file = as_where (&last_insn.line);
5037 }
5038 else
5039 last_insn.kind = last_insn_other;
5040 }
5041
5042 static char *
5043 parse_insn (char *line, char *mnemonic)
5044 {
5045 char *l = line;
5046 char *token_start = l;
5047 char *mnem_p;
5048 int supported;
5049 const insn_template *t;
5050 char *dot_p = NULL;
5051
5052 while (1)
5053 {
5054 mnem_p = mnemonic;
5055 while ((*mnem_p = mnemonic_chars[(unsigned char) *l]) != 0)
5056 {
5057 if (*mnem_p == '.')
5058 dot_p = mnem_p;
5059 mnem_p++;
5060 if (mnem_p >= mnemonic + MAX_MNEM_SIZE)
5061 {
5062 as_bad (_("no such instruction: `%s'"), token_start);
5063 return NULL;
5064 }
5065 l++;
5066 }
5067 if (!is_space_char (*l)
5068 && *l != END_OF_INSN
5069 && (intel_syntax
5070 || (*l != PREFIX_SEPARATOR
5071 && *l != ',')))
5072 {
5073 as_bad (_("invalid character %s in mnemonic"),
5074 output_invalid (*l));
5075 return NULL;
5076 }
5077 if (token_start == l)
5078 {
5079 if (!intel_syntax && *l == PREFIX_SEPARATOR)
5080 as_bad (_("expecting prefix; got nothing"));
5081 else
5082 as_bad (_("expecting mnemonic; got nothing"));
5083 return NULL;
5084 }
5085
5086 /* Look up instruction (or prefix) via hash table. */
5087 current_templates = (const templates *) str_hash_find (op_hash, mnemonic);
5088
5089 if (*l != END_OF_INSN
5090 && (!is_space_char (*l) || l[1] != END_OF_INSN)
5091 && current_templates
5092 && current_templates->start->opcode_modifier.isprefix)
5093 {
5094 if (!cpu_flags_check_cpu64 (current_templates->start->cpu_flags))
5095 {
5096 as_bad ((flag_code != CODE_64BIT
5097 ? _("`%s' is only supported in 64-bit mode")
5098 : _("`%s' is not supported in 64-bit mode")),
5099 current_templates->start->name);
5100 return NULL;
5101 }
5102 /* If we are in 16-bit mode, do not allow addr16 or data16.
5103 Similarly, in 32-bit mode, do not allow addr32 or data32. */
5104 if ((current_templates->start->opcode_modifier.size == SIZE16
5105 || current_templates->start->opcode_modifier.size == SIZE32)
5106 && flag_code != CODE_64BIT
5107 && ((current_templates->start->opcode_modifier.size == SIZE32)
5108 ^ (flag_code == CODE_16BIT)))
5109 {
5110 as_bad (_("redundant %s prefix"),
5111 current_templates->start->name);
5112 return NULL;
5113 }
5114 if (current_templates->start->opcode_length == 0)
5115 {
5116 /* Handle pseudo prefixes. */
5117 switch (current_templates->start->base_opcode)
5118 {
5119 case Prefix_Disp8:
5120 /* {disp8} */
5121 i.disp_encoding = disp_encoding_8bit;
5122 break;
5123 case Prefix_Disp16:
5124 /* {disp16} */
5125 i.disp_encoding = disp_encoding_16bit;
5126 break;
5127 case Prefix_Disp32:
5128 /* {disp32} */
5129 i.disp_encoding = disp_encoding_32bit;
5130 break;
5131 case Prefix_Load:
5132 /* {load} */
5133 i.dir_encoding = dir_encoding_load;
5134 break;
5135 case Prefix_Store:
5136 /* {store} */
5137 i.dir_encoding = dir_encoding_store;
5138 break;
5139 case Prefix_VEX:
5140 /* {vex} */
5141 i.vec_encoding = vex_encoding_vex;
5142 break;
5143 case Prefix_VEX3:
5144 /* {vex3} */
5145 i.vec_encoding = vex_encoding_vex3;
5146 break;
5147 case Prefix_EVEX:
5148 /* {evex} */
5149 i.vec_encoding = vex_encoding_evex;
5150 break;
5151 case Prefix_REX:
5152 /* {rex} */
5153 i.rex_encoding = TRUE;
5154 break;
5155 case Prefix_NoOptimize:
5156 /* {nooptimize} */
5157 i.no_optimize = TRUE;
5158 break;
5159 default:
5160 abort ();
5161 }
5162 }
5163 else
5164 {
5165 /* Add prefix, checking for repeated prefixes. */
5166 switch (add_prefix (current_templates->start->base_opcode))
5167 {
5168 case PREFIX_EXIST:
5169 return NULL;
5170 case PREFIX_DS:
5171 if (current_templates->start->cpu_flags.bitfield.cpuibt)
5172 i.notrack_prefix = current_templates->start->name;
5173 break;
5174 case PREFIX_REP:
5175 if (current_templates->start->cpu_flags.bitfield.cpuhle)
5176 i.hle_prefix = current_templates->start->name;
5177 else if (current_templates->start->cpu_flags.bitfield.cpumpx)
5178 i.bnd_prefix = current_templates->start->name;
5179 else
5180 i.rep_prefix = current_templates->start->name;
5181 break;
5182 default:
5183 break;
5184 }
5185 }
5186 /* Skip past PREFIX_SEPARATOR and reset token_start. */
5187 token_start = ++l;
5188 }
5189 else
5190 break;
5191 }
5192
5193 if (!current_templates)
5194 {
5195 /* Deprecated functionality (new code should use pseudo-prefixes instead):
	 Check if we should swap operands or force a 32bit displacement
	 in the encoding.  */
5198 if (mnem_p - 2 == dot_p && dot_p[1] == 's')
5199 i.dir_encoding = dir_encoding_swap;
5200 else if (mnem_p - 3 == dot_p
5201 && dot_p[1] == 'd'
5202 && dot_p[2] == '8')
5203 i.disp_encoding = disp_encoding_8bit;
5204 else if (mnem_p - 4 == dot_p
5205 && dot_p[1] == 'd'
5206 && dot_p[2] == '3'
5207 && dot_p[3] == '2')
5208 i.disp_encoding = disp_encoding_32bit;
5209 else
5210 goto check_suffix;
5211 mnem_p = dot_p;
5212 *dot_p = '\0';
5213 current_templates = (const templates *) str_hash_find (op_hash, mnemonic);
5214 }
5215
5216 if (!current_templates)
5217 {
5218 check_suffix:
5219 if (mnem_p > mnemonic)
5220 {
5221 /* See if we can get a match by trimming off a suffix. */
5222 switch (mnem_p[-1])
5223 {
5224 case WORD_MNEM_SUFFIX:
5225 if (intel_syntax && (intel_float_operand (mnemonic) & 2))
5226 i.suffix = SHORT_MNEM_SUFFIX;
5227 else
5228 /* Fall through. */
5229 case BYTE_MNEM_SUFFIX:
5230 case QWORD_MNEM_SUFFIX:
5231 i.suffix = mnem_p[-1];
5232 mnem_p[-1] = '\0';
5233 current_templates
5234 = (const templates *) str_hash_find (op_hash, mnemonic);
5235 break;
5236 case SHORT_MNEM_SUFFIX:
5237 case LONG_MNEM_SUFFIX:
5238 if (!intel_syntax)
5239 {
5240 i.suffix = mnem_p[-1];
5241 mnem_p[-1] = '\0';
5242 current_templates
5243 = (const templates *) str_hash_find (op_hash, mnemonic);
5244 }
5245 break;
5246
5247 /* Intel Syntax. */
5248 case 'd':
5249 if (intel_syntax)
5250 {
5251 if (intel_float_operand (mnemonic) == 1)
5252 i.suffix = SHORT_MNEM_SUFFIX;
5253 else
5254 i.suffix = LONG_MNEM_SUFFIX;
5255 mnem_p[-1] = '\0';
5256 current_templates
5257 = (const templates *) str_hash_find (op_hash, mnemonic);
5258 }
5259 break;
5260 }
5261 }
5262
5263 if (!current_templates)
5264 {
5265 as_bad (_("no such instruction: `%s'"), token_start);
5266 return NULL;
5267 }
5268 }
5269
5270 if (current_templates->start->opcode_modifier.jump == JUMP
5271 || current_templates->start->opcode_modifier.jump == JUMP_BYTE)
5272 {
5273 /* Check for a branch hint. We allow ",pt" and ",pn" for
5274 predict taken and predict not taken respectively.
5275 I'm not sure that branch hints actually do anything on loop
5276 and jcxz insns (JumpByte) for current Pentium4 chips. They
5277 may work in the future and it doesn't hurt to accept them
5278 now. */
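      /* E.g. "jne,pt target" gets the ds prefix byte 0x3e and
	 "jne,pn target" gets cs 0x2e, the documented taken/not-taken
	 static hint encodings (illustrative).  */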
5279 if (l[0] == ',' && l[1] == 'p')
5280 {
5281 if (l[2] == 't')
5282 {
5283 if (!add_prefix (DS_PREFIX_OPCODE))
5284 return NULL;
5285 l += 3;
5286 }
5287 else if (l[2] == 'n')
5288 {
5289 if (!add_prefix (CS_PREFIX_OPCODE))
5290 return NULL;
5291 l += 3;
5292 }
5293 }
5294 }
5295 /* Any other comma loses. */
5296 if (*l == ',')
5297 {
5298 as_bad (_("invalid character %s in mnemonic"),
5299 output_invalid (*l));
5300 return NULL;
5301 }
5302
5303 /* Check if instruction is supported on specified architecture. */
5304 supported = 0;
5305 for (t = current_templates->start; t < current_templates->end; ++t)
5306 {
5307 supported |= cpu_flags_match (t);
5308 if (supported == CPU_FLAGS_PERFECT_MATCH)
5309 {
5310 if (!cpu_arch_flags.bitfield.cpui386 && (flag_code != CODE_16BIT))
5311 as_warn (_("use .code16 to ensure correct addressing mode"));
5312
5313 return l;
5314 }
5315 }
5316
5317 if (!(supported & CPU_FLAGS_64BIT_MATCH))
5318 as_bad (flag_code == CODE_64BIT
5319 ? _("`%s' is not supported in 64-bit mode")
5320 : _("`%s' is only supported in 64-bit mode"),
5321 current_templates->start->name);
5322 else
5323 as_bad (_("`%s' is not supported on `%s%s'"),
5324 current_templates->start->name,
5325 cpu_arch_name ? cpu_arch_name : default_arch,
5326 cpu_sub_arch_name ? cpu_sub_arch_name : "");
5327
5328 return NULL;
5329 }
5330
5331 static char *
5332 parse_operands (char *l, const char *mnemonic)
5333 {
5334 char *token_start;
5335
5336 /* 1 if operand is pending after ','. */
5337 unsigned int expecting_operand = 0;
5338
5339 /* Non-zero if operand parens not balanced. */
5340 unsigned int paren_not_balanced;
5341
5342 while (*l != END_OF_INSN)
5343 {
5344 /* Skip optional white space before operand. */
5345 if (is_space_char (*l))
5346 ++l;
5347 if (!is_operand_char (*l) && *l != END_OF_INSN && *l != '"')
5348 {
5349 as_bad (_("invalid character %s before operand %d"),
5350 output_invalid (*l),
5351 i.operands + 1);
5352 return NULL;
5353 }
5354 token_start = l; /* After white space. */
5355 paren_not_balanced = 0;
5356 while (paren_not_balanced || *l != ',')
5357 {
5358 if (*l == END_OF_INSN)
5359 {
5360 if (paren_not_balanced)
5361 {
5362 if (!intel_syntax)
5363 as_bad (_("unbalanced parenthesis in operand %d."),
5364 i.operands + 1);
5365 else
5366 as_bad (_("unbalanced brackets in operand %d."),
5367 i.operands + 1);
5368 return NULL;
5369 }
5370 else
5371 break; /* we are done */
5372 }
5373 else if (!is_operand_char (*l) && !is_space_char (*l) && *l != '"')
5374 {
5375 as_bad (_("invalid character %s in operand %d"),
5376 output_invalid (*l),
5377 i.operands + 1);
5378 return NULL;
5379 }
5380 if (!intel_syntax)
5381 {
5382 if (*l == '(')
5383 ++paren_not_balanced;
5384 if (*l == ')')
5385 --paren_not_balanced;
5386 }
5387 else
5388 {
5389 if (*l == '[')
5390 ++paren_not_balanced;
5391 if (*l == ']')
5392 --paren_not_balanced;
5393 }
5394 l++;
5395 }
5396 if (l != token_start)
5397 { /* Yes, we've read in another operand. */
5398 unsigned int operand_ok;
5399 this_operand = i.operands++;
5400 if (i.operands > MAX_OPERANDS)
5401 {
5402 as_bad (_("spurious operands; (%d operands/instruction max)"),
5403 MAX_OPERANDS);
5404 return NULL;
5405 }
5406 i.types[this_operand].bitfield.unspecified = 1;
5407 /* Now parse operand adding info to 'i' as we go along. */
5408 END_STRING_AND_SAVE (l);
5409
5410 if (i.mem_operands > 1)
5411 {
5412 as_bad (_("too many memory references for `%s'"),
5413 mnemonic);
5414 return 0;
5415 }
5416
5417 if (intel_syntax)
5418 operand_ok =
5419 i386_intel_operand (token_start,
5420 intel_float_operand (mnemonic));
5421 else
5422 operand_ok = i386_att_operand (token_start);
5423
5424 RESTORE_END_STRING (l);
5425 if (!operand_ok)
5426 return NULL;
5427 }
5428 else
5429 {
5430 if (expecting_operand)
5431 {
5432 expecting_operand_after_comma:
5433 as_bad (_("expecting operand after ','; got nothing"));
5434 return NULL;
5435 }
5436 if (*l == ',')
5437 {
5438 as_bad (_("expecting operand before ','; got nothing"));
5439 return NULL;
5440 }
5441 }
5442
5443 /* Now *l must be either ',' or END_OF_INSN. */
5444 if (*l == ',')
5445 {
5446 if (*++l == END_OF_INSN)
5447 {
	      /* Just skip it; if it's \n, complain.  */
5449 goto expecting_operand_after_comma;
5450 }
5451 expecting_operand = 1;
5452 }
5453 }
5454 return l;
5455 }
5456
5457 static void
5458 swap_2_operands (int xchg1, int xchg2)
5459 {
5460 union i386_op temp_op;
5461 i386_operand_type temp_type;
5462 unsigned int temp_flags;
5463 enum bfd_reloc_code_real temp_reloc;
5464
5465 temp_type = i.types[xchg2];
5466 i.types[xchg2] = i.types[xchg1];
5467 i.types[xchg1] = temp_type;
5468
5469 temp_flags = i.flags[xchg2];
5470 i.flags[xchg2] = i.flags[xchg1];
5471 i.flags[xchg1] = temp_flags;
5472
5473 temp_op = i.op[xchg2];
5474 i.op[xchg2] = i.op[xchg1];
5475 i.op[xchg1] = temp_op;
5476
5477 temp_reloc = i.reloc[xchg2];
5478 i.reloc[xchg2] = i.reloc[xchg1];
5479 i.reloc[xchg1] = temp_reloc;
5480
5481 if (i.mask)
5482 {
5483 if (i.mask->operand == xchg1)
5484 i.mask->operand = xchg2;
5485 else if (i.mask->operand == xchg2)
5486 i.mask->operand = xchg1;
5487 }
5488 if (i.broadcast)
5489 {
5490 if (i.broadcast->operand == xchg1)
5491 i.broadcast->operand = xchg2;
5492 else if (i.broadcast->operand == xchg2)
5493 i.broadcast->operand = xchg1;
5494 }
5495 if (i.rounding)
5496 {
5497 if (i.rounding->operand == xchg1)
5498 i.rounding->operand = xchg2;
5499 else if (i.rounding->operand == xchg2)
5500 i.rounding->operand = xchg1;
5501 }
5502 }
5503
5504 static void
5505 swap_operands (void)
5506 {
5507 switch (i.operands)
5508 {
5509 case 5:
5510 case 4:
5511 swap_2_operands (1, i.operands - 2);
5512 /* Fall through. */
5513 case 3:
5514 case 2:
5515 swap_2_operands (0, i.operands - 1);
5516 break;
5517 default:
5518 abort ();
5519 }
5520
5521 if (i.mem_operands == 2)
5522 {
5523 const seg_entry *temp_seg;
5524 temp_seg = i.seg[0];
5525 i.seg[0] = i.seg[1];
5526 i.seg[1] = temp_seg;
5527 }
5528 }
5529
5530 /* Try to ensure constant immediates are represented in the smallest
5531 opcode possible. */
5532 static void
5533 optimize_imm (void)
5534 {
5535 char guess_suffix = 0;
5536 int op;
5537
5538 if (i.suffix)
5539 guess_suffix = i.suffix;
5540 else if (i.reg_operands)
5541 {
5542 /* Figure out a suffix from the last register operand specified.
5543 We can't do this properly yet, i.e. excluding special register
5544 instances, but the following works for instructions with
5545 immediates. In any case, we can't set i.suffix yet. */
5546 for (op = i.operands; --op >= 0;)
5547 if (i.types[op].bitfield.class != Reg)
5548 continue;
5549 else if (i.types[op].bitfield.byte)
5550 {
5551 guess_suffix = BYTE_MNEM_SUFFIX;
5552 break;
5553 }
5554 else if (i.types[op].bitfield.word)
5555 {
5556 guess_suffix = WORD_MNEM_SUFFIX;
5557 break;
5558 }
5559 else if (i.types[op].bitfield.dword)
5560 {
5561 guess_suffix = LONG_MNEM_SUFFIX;
5562 break;
5563 }
5564 else if (i.types[op].bitfield.qword)
5565 {
5566 guess_suffix = QWORD_MNEM_SUFFIX;
5567 break;
5568 }
5569 }
5570 else if ((flag_code == CODE_16BIT) ^ (i.prefix[DATA_PREFIX] != 0))
5571 guess_suffix = WORD_MNEM_SUFFIX;
5572
5573 for (op = i.operands; --op >= 0;)
5574 if (operand_type_check (i.types[op], imm))
5575 {
5576 switch (i.op[op].imms->X_op)
5577 {
5578 case O_constant:
5579 /* If a suffix is given, this operand may be shortened. */
5580 switch (guess_suffix)
5581 {
5582 case LONG_MNEM_SUFFIX:
5583 i.types[op].bitfield.imm32 = 1;
5584 i.types[op].bitfield.imm64 = 1;
5585 break;
5586 case WORD_MNEM_SUFFIX:
5587 i.types[op].bitfield.imm16 = 1;
5588 i.types[op].bitfield.imm32 = 1;
5589 i.types[op].bitfield.imm32s = 1;
5590 i.types[op].bitfield.imm64 = 1;
5591 break;
5592 case BYTE_MNEM_SUFFIX:
5593 i.types[op].bitfield.imm8 = 1;
5594 i.types[op].bitfield.imm8s = 1;
5595 i.types[op].bitfield.imm16 = 1;
5596 i.types[op].bitfield.imm32 = 1;
5597 i.types[op].bitfield.imm32s = 1;
5598 i.types[op].bitfield.imm64 = 1;
5599 break;
5600 }
5601
5602 /* If this operand is at most 16 bits, convert it
5603 to a signed 16 bit number before trying to see
5604 whether it will fit in an even smaller size.
5605 This allows a 16-bit operand such as $0xffe0 to
5606 be recognised as within Imm8S range. */
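	  /* (0xffe0 sign-extended from 16 bits is -32, which fits in
	     a signed 8-bit immediate.)  */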
5607 if ((i.types[op].bitfield.imm16)
5608 && (i.op[op].imms->X_add_number & ~(offsetT) 0xffff) == 0)
5609 {
5610 i.op[op].imms->X_add_number =
5611 (((i.op[op].imms->X_add_number & 0xffff) ^ 0x8000) - 0x8000);
5612 }
5613 #ifdef BFD64
5614 /* Store 32-bit immediate in 64-bit for 64-bit BFD. */
5615 if ((i.types[op].bitfield.imm32)
5616 && ((i.op[op].imms->X_add_number & ~(((offsetT) 2 << 31) - 1))
5617 == 0))
5618 {
5619 i.op[op].imms->X_add_number = ((i.op[op].imms->X_add_number
5620 ^ ((offsetT) 1 << 31))
5621 - ((offsetT) 1 << 31));
5622 }
5623 #endif
5624 i.types[op]
5625 = operand_type_or (i.types[op],
5626 smallest_imm_type (i.op[op].imms->X_add_number));
5627
	  /* We must avoid matching Imm32 templates when a 64bit
	     immediate is expected.  */
5630 if (guess_suffix == QWORD_MNEM_SUFFIX)
5631 i.types[op].bitfield.imm32 = 0;
5632 break;
5633
5634 case O_absent:
5635 case O_register:
5636 abort ();
5637
5638 /* Symbols and expressions. */
5639 default:
5640 /* Convert symbolic operand to proper sizes for matching, but don't
5641 prevent matching a set of insns that only supports sizes other
5642 than those matching the insn suffix. */
5643 {
5644 i386_operand_type mask, allowed;
5645 const insn_template *t;
5646
5647 operand_type_set (&mask, 0);
5648 operand_type_set (&allowed, 0);
5649
5650 for (t = current_templates->start;
5651 t < current_templates->end;
5652 ++t)
5653 {
5654 allowed = operand_type_or (allowed, t->operand_types[op]);
5655 allowed = operand_type_and (allowed, anyimm);
5656 }
5657 switch (guess_suffix)
5658 {
5659 case QWORD_MNEM_SUFFIX:
5660 mask.bitfield.imm64 = 1;
5661 mask.bitfield.imm32s = 1;
5662 break;
5663 case LONG_MNEM_SUFFIX:
5664 mask.bitfield.imm32 = 1;
5665 break;
5666 case WORD_MNEM_SUFFIX:
5667 mask.bitfield.imm16 = 1;
5668 break;
5669 case BYTE_MNEM_SUFFIX:
5670 mask.bitfield.imm8 = 1;
5671 break;
5672 default:
5673 break;
5674 }
5675 allowed = operand_type_and (mask, allowed);
5676 if (!operand_type_all_zero (&allowed))
5677 i.types[op] = operand_type_and (i.types[op], mask);
5678 }
5679 break;
5680 }
5681 }
5682 }
5683
5684 /* Try to use the smallest displacement type too. */
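/* E.g. "movl %eax, 4(%rbx)" needs only a 1-byte disp8 of 0x04 rather
   than a 4-byte disp32 (an illustration of the shrinking done
   below).  */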
5685 static void
5686 optimize_disp (void)
5687 {
5688 int op;
5689
5690 for (op = i.operands; --op >= 0;)
5691 if (operand_type_check (i.types[op], disp))
5692 {
5693 if (i.op[op].disps->X_op == O_constant)
5694 {
5695 offsetT op_disp = i.op[op].disps->X_add_number;
5696
5697 if (i.types[op].bitfield.disp16
5698 && (op_disp & ~(offsetT) 0xffff) == 0)
5699 {
5700 /* If this operand is at most 16 bits, convert
5701 to a signed 16 bit number and don't use 64bit
5702 displacement. */
5703 op_disp = (((op_disp & 0xffff) ^ 0x8000) - 0x8000);
5704 i.types[op].bitfield.disp64 = 0;
5705 }
5706 #ifdef BFD64
5707 /* Optimize 64-bit displacement to 32-bit for 64-bit BFD. */
5708 if (i.types[op].bitfield.disp32
5709 && (op_disp & ~(((offsetT) 2 << 31) - 1)) == 0)
5710 {
5711 /* If this operand is at most 32 bits, convert
5712 to a signed 32 bit number and don't use 64bit
5713 displacement. */
5714 op_disp &= (((offsetT) 2 << 31) - 1);
5715 op_disp = (op_disp ^ ((offsetT) 1 << 31)) - ((addressT) 1 << 31);
5716 i.types[op].bitfield.disp64 = 0;
5717 }
5718 #endif
5719 if (!op_disp && i.types[op].bitfield.baseindex)
5720 {
5721 i.types[op].bitfield.disp8 = 0;
5722 i.types[op].bitfield.disp16 = 0;
5723 i.types[op].bitfield.disp32 = 0;
5724 i.types[op].bitfield.disp32s = 0;
5725 i.types[op].bitfield.disp64 = 0;
5726 i.op[op].disps = 0;
5727 i.disp_operands--;
5728 }
5729 else if (flag_code == CODE_64BIT)
5730 {
5731 if (fits_in_signed_long (op_disp))
5732 {
5733 i.types[op].bitfield.disp64 = 0;
5734 i.types[op].bitfield.disp32s = 1;
5735 }
5736 if (i.prefix[ADDR_PREFIX]
5737 && fits_in_unsigned_long (op_disp))
5738 i.types[op].bitfield.disp32 = 1;
5739 }
5740 if ((i.types[op].bitfield.disp32
5741 || i.types[op].bitfield.disp32s
5742 || i.types[op].bitfield.disp16)
5743 && fits_in_disp8 (op_disp))
5744 i.types[op].bitfield.disp8 = 1;
5745 }
5746 else if (i.reloc[op] == BFD_RELOC_386_TLS_DESC_CALL
5747 || i.reloc[op] == BFD_RELOC_X86_64_TLSDESC_CALL)
5748 {
5749 fix_new_exp (frag_now, frag_more (0) - frag_now->fr_literal, 0,
5750 i.op[op].disps, 0, i.reloc[op]);
5751 i.types[op].bitfield.disp8 = 0;
5752 i.types[op].bitfield.disp16 = 0;
5753 i.types[op].bitfield.disp32 = 0;
5754 i.types[op].bitfield.disp32s = 0;
5755 i.types[op].bitfield.disp64 = 0;
5756 }
5757 else
	/* We only support a 64bit displacement on constants.  */
5759 i.types[op].bitfield.disp64 = 0;
5760 }
5761 }
5762
5763 /* Return 1 if there is a match in broadcast bytes between operand
5764 GIVEN and instruction template T. */
5765
5766 static INLINE int
5767 match_broadcast_size (const insn_template *t, unsigned int given)
5768 {
5769 return ((t->opcode_modifier.broadcast == BYTE_BROADCAST
5770 && i.types[given].bitfield.byte)
5771 || (t->opcode_modifier.broadcast == WORD_BROADCAST
5772 && i.types[given].bitfield.word)
5773 || (t->opcode_modifier.broadcast == DWORD_BROADCAST
5774 && i.types[given].bitfield.dword)
5775 || (t->opcode_modifier.broadcast == QWORD_BROADCAST
5776 && i.types[given].bitfield.qword));
5777 }
5778
5779 /* Check if operands are valid for the instruction. */
5780
5781 static int
5782 check_VecOperands (const insn_template *t)
5783 {
5784 unsigned int op;
5785 i386_cpu_flags cpu;
5786
5787 /* Templates allowing for ZMMword as well as YMMword and/or XMMword for
     any one operand implicitly require AVX512VL support if the actual
5789 operand size is YMMword or XMMword. Since this function runs after
5790 template matching, there's no need to check for YMMword/XMMword in
5791 the template. */
5792 cpu = cpu_flags_and (t->cpu_flags, avx512);
5793 if (!cpu_flags_all_zero (&cpu)
5794 && !t->cpu_flags.bitfield.cpuavx512vl
5795 && !cpu_arch_flags.bitfield.cpuavx512vl)
5796 {
5797 for (op = 0; op < t->operands; ++op)
5798 {
5799 if (t->operand_types[op].bitfield.zmmword
5800 && (i.types[op].bitfield.ymmword
5801 || i.types[op].bitfield.xmmword))
5802 {
5803 i.error = unsupported;
5804 return 1;
5805 }
5806 }
5807 }
5808
5809 /* Without VSIB byte, we can't have a vector register for index. */
5810 if (!t->opcode_modifier.sib
5811 && i.index_reg
5812 && (i.index_reg->reg_type.bitfield.xmmword
5813 || i.index_reg->reg_type.bitfield.ymmword
5814 || i.index_reg->reg_type.bitfield.zmmword))
5815 {
5816 i.error = unsupported_vector_index_register;
5817 return 1;
5818 }
5819
5820 /* Check if default mask is allowed. */
5821 if (t->opcode_modifier.nodefmask
5822 && (!i.mask || i.mask->mask->reg_num == 0))
5823 {
5824 i.error = no_default_mask;
5825 return 1;
5826 }
5827
5828 /* For VSIB byte, we need a vector register for index, and all vector
5829 registers must be distinct. */
5830 if (t->opcode_modifier.sib && t->opcode_modifier.sib != SIBMEM)
5831 {
5832 if (!i.index_reg
5833 || !((t->opcode_modifier.sib == VECSIB128
5834 && i.index_reg->reg_type.bitfield.xmmword)
5835 || (t->opcode_modifier.sib == VECSIB256
5836 && i.index_reg->reg_type.bitfield.ymmword)
5837 || (t->opcode_modifier.sib == VECSIB512
5838 && i.index_reg->reg_type.bitfield.zmmword)))
5839 {
5840 i.error = invalid_vsib_address;
5841 return 1;
5842 }
5843
5844 gas_assert (i.reg_operands == 2 || i.mask);
5845 if (i.reg_operands == 2 && !i.mask)
5846 {
5847 gas_assert (i.types[0].bitfield.class == RegSIMD);
5848 gas_assert (i.types[0].bitfield.xmmword
5849 || i.types[0].bitfield.ymmword);
5850 gas_assert (i.types[2].bitfield.class == RegSIMD);
5851 gas_assert (i.types[2].bitfield.xmmword
5852 || i.types[2].bitfield.ymmword);
5853 if (operand_check == check_none)
5854 return 0;
5855 if (register_number (i.op[0].regs)
5856 != register_number (i.index_reg)
5857 && register_number (i.op[2].regs)
5858 != register_number (i.index_reg)
5859 && register_number (i.op[0].regs)
5860 != register_number (i.op[2].regs))
5861 return 0;
5862 if (operand_check == check_error)
5863 {
5864 i.error = invalid_vector_register_set;
5865 return 1;
5866 }
5867 as_warn (_("mask, index, and destination registers should be distinct"));
5868 }
5869 else if (i.reg_operands == 1 && i.mask)
5870 {
5871 if (i.types[1].bitfield.class == RegSIMD
5872 && (i.types[1].bitfield.xmmword
5873 || i.types[1].bitfield.ymmword
5874 || i.types[1].bitfield.zmmword)
5875 && (register_number (i.op[1].regs)
5876 == register_number (i.index_reg)))
5877 {
5878 if (operand_check == check_error)
5879 {
5880 i.error = invalid_vector_register_set;
5881 return 1;
5882 }
5883 if (operand_check != check_none)
5884 as_warn (_("index and destination registers should be distinct"));
5885 }
5886 }
5887 }
5888
5889 /* For AMX instructions with three tmmword operands, all tmmword
5890 operands must be distinct.  */
5891 if (t->operand_types[0].bitfield.tmmword
5892 && i.reg_operands == 3)
5893 {
5894 if (register_number (i.op[0].regs)
5895 == register_number (i.op[1].regs)
5896 || register_number (i.op[0].regs)
5897 == register_number (i.op[2].regs)
5898 || register_number (i.op[1].regs)
5899 == register_number (i.op[2].regs))
5900 {
5901 i.error = invalid_tmm_register_set;
5902 return 1;
5903 }
5904 }
5905
5906 /* Check if broadcast is supported by the instruction and is applied
5907 to the memory operand. */
5908 if (i.broadcast)
5909 {
5910 i386_operand_type type, overlap;
5911
5912 /* Check if specified broadcast is supported in this instruction,
5913 and its broadcast bytes match the memory operand. */
5914 op = i.broadcast->operand;
5915 if (!t->opcode_modifier.broadcast
5916 || !(i.flags[op] & Operand_Mem)
5917 || (!i.types[op].bitfield.unspecified
5918 && !match_broadcast_size (t, op)))
5919 {
5920 bad_broadcast:
5921 i.error = unsupported_broadcast;
5922 return 1;
5923 }
5924
5925 i.broadcast->bytes = ((1 << (t->opcode_modifier.broadcast - 1))
5926 * i.broadcast->type);
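/* E.g. for "vaddps (%rax){1to16}, %zmm1, %zmm2": DWORD_BROADCAST
   yields a 4-byte element, and with a "1to16" broadcast this
   computes 4 * 16 == 64 bytes, i.e. a ZMMword, mapped below.  */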
5927 operand_type_set (&type, 0);
5928 switch (i.broadcast->bytes)
5929 {
5930 case 2:
5931 type.bitfield.word = 1;
5932 break;
5933 case 4:
5934 type.bitfield.dword = 1;
5935 break;
5936 case 8:
5937 type.bitfield.qword = 1;
5938 break;
5939 case 16:
5940 type.bitfield.xmmword = 1;
5941 break;
5942 case 32:
5943 type.bitfield.ymmword = 1;
5944 break;
5945 case 64:
5946 type.bitfield.zmmword = 1;
5947 break;
5948 default:
5949 goto bad_broadcast;
5950 }
5951
5952 overlap = operand_type_and (type, t->operand_types[op]);
5953 if (t->operand_types[op].bitfield.class == RegSIMD
5954 && t->operand_types[op].bitfield.byte
5955 + t->operand_types[op].bitfield.word
5956 + t->operand_types[op].bitfield.dword
5957 + t->operand_types[op].bitfield.qword > 1)
5958 {
5959 overlap.bitfield.xmmword = 0;
5960 overlap.bitfield.ymmword = 0;
5961 overlap.bitfield.zmmword = 0;
5962 }
5963 if (operand_type_all_zero (&overlap))
5964 goto bad_broadcast;
5965
5966 if (t->opcode_modifier.checkregsize)
5967 {
5968 unsigned int j;
5969
5970 type.bitfield.baseindex = 1;
5971 for (j = 0; j < i.operands; ++j)
5972 {
5973 if (j != op
5974 && !operand_type_register_match (i.types[j],
5975 t->operand_types[j],
5976 type,
5977 t->operand_types[op]))
5978 goto bad_broadcast;
5979 }
5980 }
5981 }
5982 /* If broadcast is supported by this instruction, we need to check
5983 that an operand of one-element size isn't specified without broadcast.  */
5984 else if (t->opcode_modifier.broadcast && i.mem_operands)
5985 {
5986 /* Find memory operand. */
5987 for (op = 0; op < i.operands; op++)
5988 if (i.flags[op] & Operand_Mem)
5989 break;
5990 gas_assert (op < i.operands);
5991 /* Check size of the memory operand. */
5992 if (match_broadcast_size (t, op))
5993 {
5994 i.error = broadcast_needed;
5995 return 1;
5996 }
5997 }
5998 else
5999 op = MAX_OPERANDS - 1; /* Avoid uninitialized variable warning. */
6000
6001 /* Check if requested masking is supported. */
6002 if (i.mask)
6003 {
6004 switch (t->opcode_modifier.masking)
6005 {
6006 case BOTH_MASKING:
6007 break;
6008 case MERGING_MASKING:
6009 if (i.mask->zeroing)
6010 {
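/* NB: the "case 0" below makes templates without any masking
   support jump straight into this error path.  */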
6011 case 0:
6012 i.error = unsupported_masking;
6013 return 1;
6014 }
6015 break;
6016 case DYNAMIC_MASKING:
6017 /* Memory destinations allow only merging masking. */
6018 if (i.mask->zeroing && i.mem_operands)
6019 {
6020 /* Find memory operand. */
6021 for (op = 0; op < i.operands; op++)
6022 if (i.flags[op] & Operand_Mem)
6023 break;
6024 gas_assert (op < i.operands);
6025 if (op == i.operands - 1)
6026 {
6027 i.error = unsupported_masking;
6028 return 1;
6029 }
6030 }
6031 break;
6032 default:
6033 abort ();
6034 }
6035 }
6036
6037 /* Check if masking is applied to dest operand. */
6038 if (i.mask && (i.mask->operand != (int) (i.operands - 1)))
6039 {
6040 i.error = mask_not_on_destination;
6041 return 1;
6042 }
6043
6044 /* Check RC/SAE. */
6045 if (i.rounding)
6046 {
6047 if (!t->opcode_modifier.sae
6048 || (i.rounding->type != saeonly && !t->opcode_modifier.staticrounding))
6049 {
6050 i.error = unsupported_rc_sae;
6051 return 1;
6052 }
6053 /* If the instruction has several immediate operands and one of
6054 them is rounding, the rounding operand should be the last
6055 immediate operand. */
6056 if (i.imm_operands > 1
6057 && i.rounding->operand != (int) (i.imm_operands - 1))
6058 {
6059 i.error = rc_sae_operand_not_last_imm;
6060 return 1;
6061 }
6062 }
6063
6064 /* Check the special Imm4 cases; must be the first operand. */
6065 if (t->cpu_flags.bitfield.cpuxop && t->operands == 5)
6066 {
6067 if (i.op[0].imms->X_op != O_constant
6068 || !fits_in_imm4 (i.op[0].imms->X_add_number))
6069 {
6070 i.error = bad_imm4;
6071 return 1;
6072 }
6073
6074 /* Turn off Imm<N> so that update_imm won't complain. */
6075 operand_type_set (&i.types[0], 0);
6076 }
6077
6078 /* Check vector Disp8 operand. */
6079 if (t->opcode_modifier.disp8memshift
6080 && i.disp_encoding != disp_encoding_32bit)
6081 {
6082 if (i.broadcast)
6083 i.memshift = t->opcode_modifier.broadcast - 1;
6084 else if (t->opcode_modifier.disp8memshift != DISP8_SHIFT_VL)
6085 i.memshift = t->opcode_modifier.disp8memshift;
6086 else
6087 {
6088 const i386_operand_type *type = NULL;
6089
6090 i.memshift = 0;
6091 for (op = 0; op < i.operands; op++)
6092 if (i.flags[op] & Operand_Mem)
6093 {
6094 if (t->opcode_modifier.evex == EVEXLIG)
6095 i.memshift = 2 + (i.suffix == QWORD_MNEM_SUFFIX);
6096 else if (t->operand_types[op].bitfield.xmmword
6097 + t->operand_types[op].bitfield.ymmword
6098 + t->operand_types[op].bitfield.zmmword <= 1)
6099 type = &t->operand_types[op];
6100 else if (!i.types[op].bitfield.unspecified)
6101 type = &i.types[op];
6102 }
6103 else if (i.types[op].bitfield.class == RegSIMD
6104 && t->opcode_modifier.evex != EVEXLIG)
6105 {
6106 if (i.types[op].bitfield.zmmword)
6107 i.memshift = 6;
6108 else if (i.types[op].bitfield.ymmword && i.memshift < 5)
6109 i.memshift = 5;
6110 else if (i.types[op].bitfield.xmmword && i.memshift < 4)
6111 i.memshift = 4;
6112 }
6113
6114 if (type)
6115 {
6116 if (type->bitfield.zmmword)
6117 i.memshift = 6;
6118 else if (type->bitfield.ymmword)
6119 i.memshift = 5;
6120 else if (type->bitfield.xmmword)
6121 i.memshift = 4;
6122 }
6123
6124 /* For the check in fits_in_disp8(). */
6125 if (i.memshift == 0)
6126 i.memshift = -1;
6127 }
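/* An EVEX disp8 is implicitly scaled by 2**memshift ("compressed
   displacement").  E.g. "vmovaps 0x100(%rax), %zmm0" has memshift 6,
   so 0x100 is representable as the disp8 value 4.  */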
6128
6129 for (op = 0; op < i.operands; op++)
6130 if (operand_type_check (i.types[op], disp)
6131 && i.op[op].disps->X_op == O_constant)
6132 {
6133 if (fits_in_disp8 (i.op[op].disps->X_add_number))
6134 {
6135 i.types[op].bitfield.disp8 = 1;
6136 return 0;
6137 }
6138 i.types[op].bitfield.disp8 = 0;
6139 }
6140 }
6141
6142 i.memshift = 0;
6143
6144 return 0;
6145 }
6146
6147 /* Check if encoding requirements are met by the instruction. */
6148
6149 static int
6150 VEX_check_encoding (const insn_template *t)
6151 {
6152 if (i.vec_encoding == vex_encoding_error)
6153 {
6154 i.error = unsupported;
6155 return 1;
6156 }
6157
6158 if (i.vec_encoding == vex_encoding_evex)
6159 {
6160 /* This instruction must be encoded with EVEX prefix. */
6161 if (!is_evex_encoding (t))
6162 {
6163 i.error = unsupported;
6164 return 1;
6165 }
6166 return 0;
6167 }
6168
6169 if (!t->opcode_modifier.vex)
6170 {
6171 /* This instruction template doesn't have VEX prefix. */
6172 if (i.vec_encoding != vex_encoding_default)
6173 {
6174 i.error = unsupported;
6175 return 1;
6176 }
6177 return 0;
6178 }
6179
6180 return 0;
6181 }
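/* E.g. the "{evex}" pseudo-prefix sets i.vec_encoding to
   vex_encoding_evex, so templates that lack an EVEX encoding are
   rejected above.  */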
6182
6183 static const insn_template *
6184 match_template (char mnem_suffix)
6185 {
6186 /* Points to template once we've found it. */
6187 const insn_template *t;
6188 i386_operand_type overlap0, overlap1, overlap2, overlap3;
6189 i386_operand_type overlap4;
6190 unsigned int found_reverse_match;
6191 i386_opcode_modifier suffix_check;
6192 i386_operand_type operand_types [MAX_OPERANDS];
6193 int addr_prefix_disp;
6194 unsigned int j, size_match, check_register;
6195 enum i386_error specific_error = 0;
6196
6197 #if MAX_OPERANDS != 5
6198 # error "MAX_OPERANDS must be 5."
6199 #endif
6200
6201 found_reverse_match = 0;
6202 addr_prefix_disp = -1;
6203
6204 /* Prepare for mnemonic suffix check. */
6205 memset (&suffix_check, 0, sizeof (suffix_check));
6206 switch (mnem_suffix)
6207 {
6208 case BYTE_MNEM_SUFFIX:
6209 suffix_check.no_bsuf = 1;
6210 break;
6211 case WORD_MNEM_SUFFIX:
6212 suffix_check.no_wsuf = 1;
6213 break;
6214 case SHORT_MNEM_SUFFIX:
6215 suffix_check.no_ssuf = 1;
6216 break;
6217 case LONG_MNEM_SUFFIX:
6218 suffix_check.no_lsuf = 1;
6219 break;
6220 case QWORD_MNEM_SUFFIX:
6221 suffix_check.no_qsuf = 1;
6222 break;
6223 default:
6224 /* NB: In Intel syntax, normally we can check for memory operand
6225 size when there is no mnemonic suffix. But jmp and call have
6226 2 different encodings with Dword memory operand size, one with
6227 No_ldSuf and the other without. i.suffix is set to
6228 LONG_DOUBLE_MNEM_SUFFIX to skip the one with No_ldSuf. */
6229 if (i.suffix == LONG_DOUBLE_MNEM_SUFFIX)
6230 suffix_check.no_ldsuf = 1;
6231 }
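  /* E.g. for "addl" the 'l' suffix sets no_lsuf in suffix_check;
     any template marked No_lSuf is then skipped in the loop below.  */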
6232
6233 /* Must have right number of operands. */
6234 i.error = number_of_operands_mismatch;
6235
6236 for (t = current_templates->start; t < current_templates->end; t++)
6237 {
6238 addr_prefix_disp = -1;
6239 found_reverse_match = 0;
6240
6241 if (i.operands != t->operands)
6242 continue;
6243
6244 /* Check processor support. */
6245 i.error = unsupported;
6246 if (cpu_flags_match (t) != CPU_FLAGS_PERFECT_MATCH)
6247 continue;
6248
6249 /* Check AT&T mnemonic. */
6250 i.error = unsupported_with_intel_mnemonic;
6251 if (intel_mnemonic && t->opcode_modifier.attmnemonic)
6252 continue;
6253
6254 /* Check AT&T/Intel syntax. */
6255 i.error = unsupported_syntax;
6256 if ((intel_syntax && t->opcode_modifier.attsyntax)
6257 || (!intel_syntax && t->opcode_modifier.intelsyntax))
6258 continue;
6259
6260 /* Check Intel64/AMD64 ISA. */
6261 switch (isa64)
6262 {
6263 default:
6264 /* Default: Don't accept Intel64. */
6265 if (t->opcode_modifier.isa64 == INTEL64)
6266 continue;
6267 break;
6268 case amd64:
6269 /* -mamd64: Don't accept Intel64 and Intel64-only templates. */
6270 if (t->opcode_modifier.isa64 >= INTEL64)
6271 continue;
6272 break;
6273 case intel64:
6274 /* -mintel64: Don't accept AMD64. */
6275 if (t->opcode_modifier.isa64 == AMD64 && flag_code == CODE_64BIT)
6276 continue;
6277 break;
6278 }
6279
6280 /* Check the suffix. */
6281 i.error = invalid_instruction_suffix;
6282 if ((t->opcode_modifier.no_bsuf && suffix_check.no_bsuf)
6283 || (t->opcode_modifier.no_wsuf && suffix_check.no_wsuf)
6284 || (t->opcode_modifier.no_lsuf && suffix_check.no_lsuf)
6285 || (t->opcode_modifier.no_ssuf && suffix_check.no_ssuf)
6286 || (t->opcode_modifier.no_qsuf && suffix_check.no_qsuf)
6287 || (t->opcode_modifier.no_ldsuf && suffix_check.no_ldsuf))
6288 continue;
6289
6290 size_match = operand_size_match (t);
6291 if (!size_match)
6292 continue;
6293
6294 /* This is intentionally not
6295
6296 if (i.jumpabsolute != (t->opcode_modifier.jump == JUMP_ABSOLUTE))
6297
6298 as the case of a missing * on the operand is accepted (perhaps with
6299 a warning, issued further down). */
6300 if (i.jumpabsolute && t->opcode_modifier.jump != JUMP_ABSOLUTE)
6301 {
6302 i.error = operand_type_mismatch;
6303 continue;
6304 }
6305
6306 for (j = 0; j < MAX_OPERANDS; j++)
6307 operand_types[j] = t->operand_types[j];
6308
6309 /* In general, don't allow
6310 - 64-bit operands outside of 64-bit mode,
6311 - 32-bit operands on pre-386. */
6312 j = i.imm_operands + (t->operands > i.imm_operands + 1);
6313 if (((i.suffix == QWORD_MNEM_SUFFIX
6314 && flag_code != CODE_64BIT
6315 && (t->base_opcode != 0x0fc7
6316 || t->extension_opcode != 1 /* cmpxchg8b */))
6317 || (i.suffix == LONG_MNEM_SUFFIX
6318 && !cpu_arch_flags.bitfield.cpui386))
6319 && (intel_syntax
6320 ? (t->opcode_modifier.mnemonicsize != IGNORESIZE
6321 && !intel_float_operand (t->name))
6322 : intel_float_operand (t->name) != 2)
6323 && (t->operands == i.imm_operands
6324 || (operand_types[i.imm_operands].bitfield.class != RegMMX
6325 && operand_types[i.imm_operands].bitfield.class != RegSIMD
6326 && operand_types[i.imm_operands].bitfield.class != RegMask)
6327 || (operand_types[j].bitfield.class != RegMMX
6328 && operand_types[j].bitfield.class != RegSIMD
6329 && operand_types[j].bitfield.class != RegMask))
6330 && !t->opcode_modifier.sib)
6331 continue;
6332
6333 /* Do not verify operands when there are none. */
6334 if (!t->operands)
6335 {
6336 if (VEX_check_encoding (t))
6337 {
6338 specific_error = i.error;
6339 continue;
6340 }
6341
6342 /* We've found a match; break out of loop. */
6343 break;
6344 }
6345
6346 if (!t->opcode_modifier.jump
6347 || t->opcode_modifier.jump == JUMP_ABSOLUTE)
6348 {
6349 /* There should be only one Disp operand. */
6350 for (j = 0; j < MAX_OPERANDS; j++)
6351 if (operand_type_check (operand_types[j], disp))
6352 break;
6353 if (j < MAX_OPERANDS)
6354 {
6355 bfd_boolean override = (i.prefix[ADDR_PREFIX] != 0);
6356
6357 addr_prefix_disp = j;
6358
6359 /* An address size prefix turns a Disp64/Disp32S/Disp32/Disp16
6360 operand into a Disp32/Disp32/Disp16/Disp32 one, respectively. */
6361 switch (flag_code)
6362 {
6363 case CODE_16BIT:
6364 override = !override;
6365 /* Fall through. */
6366 case CODE_32BIT:
6367 if (operand_types[j].bitfield.disp32
6368 && operand_types[j].bitfield.disp16)
6369 {
6370 operand_types[j].bitfield.disp16 = override;
6371 operand_types[j].bitfield.disp32 = !override;
6372 }
6373 operand_types[j].bitfield.disp32s = 0;
6374 operand_types[j].bitfield.disp64 = 0;
6375 break;
6376
6377 case CODE_64BIT:
6378 if (operand_types[j].bitfield.disp32s
6379 || operand_types[j].bitfield.disp64)
6380 {
6381 operand_types[j].bitfield.disp64 &= !override;
6382 operand_types[j].bitfield.disp32s &= !override;
6383 operand_types[j].bitfield.disp32 = override;
6384 }
6385 operand_types[j].bitfield.disp16 = 0;
6386 break;
6387 }
6388 }
6389 }
6390
6391 /* Force 0x8b encoding for "mov foo@GOT, %eax". */
6392 if (i.reloc[0] == BFD_RELOC_386_GOT32 && t->base_opcode == 0xa0)
6393 continue;
6394
6395 /* We check register size if needed. */
6396 if (t->opcode_modifier.checkregsize)
6397 {
6398 check_register = (1 << t->operands) - 1;
6399 if (i.broadcast)
6400 check_register &= ~(1 << i.broadcast->operand);
6401 }
6402 else
6403 check_register = 0;
6404
6405 overlap0 = operand_type_and (i.types[0], operand_types[0]);
6406 switch (t->operands)
6407 {
6408 case 1:
6409 if (!operand_type_match (overlap0, i.types[0]))
6410 continue;
6411 break;
6412 case 2:
6413 /* xchg %eax, %eax is a special case. It is an alias for nop
6414 only in 32bit mode and we can use opcode 0x90. In 64bit
6415 mode, we can't use 0x90 for xchg %eax, %eax since it should
6416 zero-extend %eax to %rax. */
6417 if (flag_code == CODE_64BIT
6418 && t->base_opcode == 0x90
6419 && i.types[0].bitfield.instance == Accum
6420 && i.types[0].bitfield.dword
6421 && i.types[1].bitfield.instance == Accum
6422 && i.types[1].bitfield.dword)
6423 continue;
6424 /* xrelease mov %eax, <disp> is another special case. It must not
6425 match the accumulator-only encoding of mov. */
6426 if (flag_code != CODE_64BIT
6427 && i.hle_prefix
6428 && t->base_opcode == 0xa0
6429 && i.types[0].bitfield.instance == Accum
6430 && (i.flags[1] & Operand_Mem))
6431 continue;
6432 /* Fall through. */
6433
6434 case 3:
6435 if (!(size_match & MATCH_STRAIGHT))
6436 goto check_reverse;
6437 /* Reverse direction of operands if swapping is possible in the first
6438 place (operands need to be symmetric) and
6439 - the load form is requested, and the template is a store form,
6440 - the store form is requested, and the template is a load form,
6441 - the non-default (swapped) form is requested. */
6442 overlap1 = operand_type_and (operand_types[0], operand_types[1]);
6443 if (t->opcode_modifier.d && i.reg_operands == i.operands
6444 && !operand_type_all_zero (&overlap1))
6445 switch (i.dir_encoding)
6446 {
6447 case dir_encoding_load:
6448 if (operand_type_check (operand_types[i.operands - 1], anymem)
6449 || t->opcode_modifier.regmem)
6450 goto check_reverse;
6451 break;
6452
6453 case dir_encoding_store:
6454 if (!operand_type_check (operand_types[i.operands - 1], anymem)
6455 && !t->opcode_modifier.regmem)
6456 goto check_reverse;
6457 break;
6458
6459 case dir_encoding_swap:
6460 goto check_reverse;
6461
6462 case dir_encoding_default:
6463 break;
6464 }
6465 /* If we want store form, we skip the current load. */
6466 if ((i.dir_encoding == dir_encoding_store
6467 || i.dir_encoding == dir_encoding_swap)
6468 && i.mem_operands == 0
6469 && t->opcode_modifier.load)
6470 continue;
6471 /* Fall through. */
6472 case 4:
6473 case 5:
6474 overlap1 = operand_type_and (i.types[1], operand_types[1]);
6475 if (!operand_type_match (overlap0, i.types[0])
6476 || !operand_type_match (overlap1, i.types[1])
6477 || ((check_register & 3) == 3
6478 && !operand_type_register_match (i.types[0],
6479 operand_types[0],
6480 i.types[1],
6481 operand_types[1])))
6482 {
6483 /* Check if other direction is valid ... */
6484 if (!t->opcode_modifier.d)
6485 continue;
6486
6487 check_reverse:
6488 if (!(size_match & MATCH_REVERSE))
6489 continue;
6490 /* Try reversing direction of operands. */
6491 overlap0 = operand_type_and (i.types[0], operand_types[i.operands - 1]);
6492 overlap1 = operand_type_and (i.types[i.operands - 1], operand_types[0]);
6493 if (!operand_type_match (overlap0, i.types[0])
6494 || !operand_type_match (overlap1, i.types[i.operands - 1])
6495 || (check_register
6496 && !operand_type_register_match (i.types[0],
6497 operand_types[i.operands - 1],
6498 i.types[i.operands - 1],
6499 operand_types[0])))
6500 {
6501 /* Does not match either direction. */
6502 continue;
6503 }
6504 /* found_reverse_match holds which of D or FloatR
6505 we've found. */
6506 if (!t->opcode_modifier.d)
6507 found_reverse_match = 0;
6508 else if (operand_types[0].bitfield.tbyte)
6509 found_reverse_match = Opcode_FloatD;
6510 else if (operand_types[0].bitfield.xmmword
6511 || operand_types[i.operands - 1].bitfield.xmmword
6512 || operand_types[0].bitfield.class == RegMMX
6513 || operand_types[i.operands - 1].bitfield.class == RegMMX
6514 || is_any_vex_encoding(t))
6515 found_reverse_match = (t->base_opcode & 0xee) != 0x6e
6516 ? Opcode_SIMD_FloatD : Opcode_SIMD_IntD;
6517 else
6518 found_reverse_match = Opcode_D;
6519 if (t->opcode_modifier.floatr)
6520 found_reverse_match |= Opcode_FloatR;
6521 }
6522 else
6523 {
6524 /* Found a forward 2 operand match here. */
6525 switch (t->operands)
6526 {
6527 case 5:
6528 overlap4 = operand_type_and (i.types[4],
6529 operand_types[4]);
6530 /* Fall through. */
6531 case 4:
6532 overlap3 = operand_type_and (i.types[3],
6533 operand_types[3]);
6534 /* Fall through. */
6535 case 3:
6536 overlap2 = operand_type_and (i.types[2],
6537 operand_types[2]);
6538 break;
6539 }
6540
6541 switch (t->operands)
6542 {
6543 case 5:
6544 if (!operand_type_match (overlap4, i.types[4])
6545 || !operand_type_register_match (i.types[3],
6546 operand_types[3],
6547 i.types[4],
6548 operand_types[4]))
6549 continue;
6550 /* Fall through. */
6551 case 4:
6552 if (!operand_type_match (overlap3, i.types[3])
6553 || ((check_register & 0xa) == 0xa
6554 && !operand_type_register_match (i.types[1],
6555 operand_types[1],
6556 i.types[3],
6557 operand_types[3]))
6558 || ((check_register & 0xc) == 0xc
6559 && !operand_type_register_match (i.types[2],
6560 operand_types[2],
6561 i.types[3],
6562 operand_types[3])))
6563 continue;
6564 /* Fall through. */
6565 case 3:
6566 /* Here we make use of the fact that there are no
6567 reverse match 3 operand instructions. */
6568 if (!operand_type_match (overlap2, i.types[2])
6569 || ((check_register & 5) == 5
6570 && !operand_type_register_match (i.types[0],
6571 operand_types[0],
6572 i.types[2],
6573 operand_types[2]))
6574 || ((check_register & 6) == 6
6575 && !operand_type_register_match (i.types[1],
6576 operand_types[1],
6577 i.types[2],
6578 operand_types[2])))
6579 continue;
6580 break;
6581 }
6582 }
6583 /* Found either forward/reverse 2, 3 or 4 operand match here:
6584 slip through to break. */
6585 }
6586
6587 /* Check if vector operands are valid. */
6588 if (check_VecOperands (t))
6589 {
6590 specific_error = i.error;
6591 continue;
6592 }
6593
6594 /* Check if VEX/EVEX encoding requirements can be satisfied. */
6595 if (VEX_check_encoding (t))
6596 {
6597 specific_error = i.error;
6598 continue;
6599 }
6600
6601 /* We've found a match; break out of loop. */
6602 break;
6603 }
6604
6605 if (t == current_templates->end)
6606 {
6607 /* We found no match. */
6608 const char *err_msg;
6609 switch (specific_error ? specific_error : i.error)
6610 {
6611 default:
6612 abort ();
6613 case operand_size_mismatch:
6614 err_msg = _("operand size mismatch");
6615 break;
6616 case operand_type_mismatch:
6617 err_msg = _("operand type mismatch");
6618 break;
6619 case register_type_mismatch:
6620 err_msg = _("register type mismatch");
6621 break;
6622 case number_of_operands_mismatch:
6623 err_msg = _("number of operands mismatch");
6624 break;
6625 case invalid_instruction_suffix:
6626 err_msg = _("invalid instruction suffix");
6627 break;
6628 case bad_imm4:
6629 err_msg = _("constant doesn't fit in 4 bits");
6630 break;
6631 case unsupported_with_intel_mnemonic:
6632 err_msg = _("unsupported with Intel mnemonic");
6633 break;
6634 case unsupported_syntax:
6635 err_msg = _("unsupported syntax");
6636 break;
6637 case unsupported:
6638 as_bad (_("unsupported instruction `%s'"),
6639 current_templates->start->name);
6640 return NULL;
6641 case invalid_sib_address:
6642 err_msg = _("invalid SIB address");
6643 break;
6644 case invalid_vsib_address:
6645 err_msg = _("invalid VSIB address");
6646 break;
6647 case invalid_vector_register_set:
6648 err_msg = _("mask, index, and destination registers must be distinct");
6649 break;
6650 case invalid_tmm_register_set:
6651 err_msg = _("all tmm registers must be distinct");
6652 break;
6653 case unsupported_vector_index_register:
6654 err_msg = _("unsupported vector index register");
6655 break;
6656 case unsupported_broadcast:
6657 err_msg = _("unsupported broadcast");
6658 break;
6659 case broadcast_needed:
6660 err_msg = _("broadcast is needed for operand of such type");
6661 break;
6662 case unsupported_masking:
6663 err_msg = _("unsupported masking");
6664 break;
6665 case mask_not_on_destination:
6666 err_msg = _("mask not on destination operand");
6667 break;
6668 case no_default_mask:
6669 err_msg = _("default mask isn't allowed");
6670 break;
6671 case unsupported_rc_sae:
6672 err_msg = _("unsupported static rounding/sae");
6673 break;
6674 case rc_sae_operand_not_last_imm:
6675 if (intel_syntax)
6676 err_msg = _("RC/SAE operand must precede immediate operands");
6677 else
6678 err_msg = _("RC/SAE operand must follow immediate operands");
6679 break;
6680 case invalid_register_operand:
6681 err_msg = _("invalid register operand");
6682 break;
6683 }
6684 as_bad (_("%s for `%s'"), err_msg,
6685 current_templates->start->name);
6686 return NULL;
6687 }
6688
6689 if (!quiet_warnings)
6690 {
6691 if (!intel_syntax
6692 && (i.jumpabsolute != (t->opcode_modifier.jump == JUMP_ABSOLUTE)))
6693 as_warn (_("indirect %s without `*'"), t->name);
6694
6695 if (t->opcode_modifier.isprefix
6696 && t->opcode_modifier.mnemonicsize == IGNORESIZE)
6697 {
6698 /* Warn them that a data or address size prefix doesn't
6699 affect assembly of the next line of code. */
6700 as_warn (_("stand-alone `%s' prefix"), t->name);
6701 }
6702 }
6703
6704 /* Copy the template we found. */
6705 i.tm = *t;
6706
6707 if (addr_prefix_disp != -1)
6708 i.tm.operand_types[addr_prefix_disp]
6709 = operand_types[addr_prefix_disp];
6710
6711 if (found_reverse_match)
6712 {
6713 /* If we found a reverse match we must alter the opcode direction
6714 bit and clear/flip the regmem modifier one. found_reverse_match
6715 holds bits to change (different for int & float insns). */
6716
6717 i.tm.base_opcode ^= found_reverse_match;
6718
6719 i.tm.operand_types[0] = operand_types[i.operands - 1];
6720 i.tm.operand_types[i.operands - 1] = operand_types[0];
6721
6722 /* Certain SIMD insns have their load forms specified in the opcode
6723 table, and hence we need to _set_ RegMem instead of clearing it.
6724 We need to avoid setting the bit though on insns like KMOVW. */
6725 i.tm.opcode_modifier.regmem
6726 = i.tm.opcode_modifier.modrm && i.tm.opcode_modifier.d
6727 && i.tm.operands > 2U - i.tm.opcode_modifier.sse2avx
6728 && !i.tm.opcode_modifier.regmem;
6729 }
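  /* For instance, XORing with Opcode_D (0x2, the direction bit)
     turns the 0x11 store form of "adc" into its 0x13 load form,
     matching the operand swap done above.  */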
6730
6731 return t;
6732 }
6733
6734 static int
6735 check_string (void)
6736 {
6737 unsigned int es_op = i.tm.opcode_modifier.isstring - IS_STRING_ES_OP0;
6738 unsigned int op = i.tm.operand_types[0].bitfield.baseindex ? es_op : 0;
6739
6740 if (i.seg[op] != NULL && i.seg[op] != &es)
6741 {
6742 as_bad (_("`%s' operand %u must use `%ses' segment"),
6743 i.tm.name,
6744 intel_syntax ? i.tm.operands - es_op : es_op + 1,
6745 register_prefix);
6746 return 0;
6747 }
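  /* E.g. "stos %al, %fs:(%edi)" is rejected above: the destination
     of a string insn is hardwired to %es.  */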
6748
6749 /* There's only ever one segment override allowed per instruction.
6750 This instruction possibly has a legal segment override on the
6751 second operand, so copy the segment to where non-string
6752 instructions store it, allowing common code. */
6753 i.seg[op] = i.seg[1];
6754
6755 return 1;
6756 }
6757
6758 static int
6759 process_suffix (void)
6760 {
6761 /* If matched instruction specifies an explicit instruction mnemonic
6762 suffix, use it. */
6763 if (i.tm.opcode_modifier.size == SIZE16)
6764 i.suffix = WORD_MNEM_SUFFIX;
6765 else if (i.tm.opcode_modifier.size == SIZE32)
6766 i.suffix = LONG_MNEM_SUFFIX;
6767 else if (i.tm.opcode_modifier.size == SIZE64)
6768 i.suffix = QWORD_MNEM_SUFFIX;
6769 else if (i.reg_operands
6770 && (i.operands > 1 || i.types[0].bitfield.class == Reg)
6771 && !i.tm.opcode_modifier.addrprefixopreg)
6772 {
6773 unsigned int numop = i.operands;
6774
6775 /* movsx/movzx want only their source operand considered here, for the
6776 ambiguity checking below. The suffix will be replaced afterwards
6777 to represent the destination (register). */
6778 if (((i.tm.base_opcode | 8) == 0xfbe && i.tm.opcode_modifier.w)
6779 || (i.tm.base_opcode == 0x63 && i.tm.cpu_flags.bitfield.cpu64))
6780 --i.operands;
6781
6782 /* crc32 needs REX.W set regardless of suffix / source operand size. */
6783 if (i.tm.base_opcode == 0xf20f38f0
6784 && i.tm.operand_types[1].bitfield.qword)
6785 i.rex |= REX_W;
6786
6787 /* If there's no instruction mnemonic suffix we try to invent one
6788 based on GPR operands. */
6789 if (!i.suffix)
6790 {
6791 /* We take i.suffix from the last register operand specified.
6792 Destination register type is more significant than source
6793 register type. crc32 in SSE4.2 prefers source register
6794 type. */
6795 unsigned int op = i.tm.base_opcode != 0xf20f38f0 ? i.operands : 1;
6796
6797 while (op--)
6798 if (i.tm.operand_types[op].bitfield.instance == InstanceNone
6799 || i.tm.operand_types[op].bitfield.instance == Accum)
6800 {
6801 if (i.types[op].bitfield.class != Reg)
6802 continue;
6803 if (i.types[op].bitfield.byte)
6804 i.suffix = BYTE_MNEM_SUFFIX;
6805 else if (i.types[op].bitfield.word)
6806 i.suffix = WORD_MNEM_SUFFIX;
6807 else if (i.types[op].bitfield.dword)
6808 i.suffix = LONG_MNEM_SUFFIX;
6809 else if (i.types[op].bitfield.qword)
6810 i.suffix = QWORD_MNEM_SUFFIX;
6811 else
6812 continue;
6813 break;
6814 }
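/* E.g. "mov $1, %ebx" carries no suffix; the %ebx destination
   scanned above yields LONG_MNEM_SUFFIX, selecting the 32-bit
   form of the insn.  */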
6815
6816 /* As an exception, movsx/movzx silently default to a byte source
6817 in AT&T mode. */
6818 if ((i.tm.base_opcode | 8) == 0xfbe && i.tm.opcode_modifier.w
6819 && !i.suffix && !intel_syntax)
6820 i.suffix = BYTE_MNEM_SUFFIX;
6821 }
6822 else if (i.suffix == BYTE_MNEM_SUFFIX)
6823 {
6824 if (intel_syntax
6825 && i.tm.opcode_modifier.mnemonicsize == IGNORESIZE
6826 && i.tm.opcode_modifier.no_bsuf)
6827 i.suffix = 0;
6828 else if (!check_byte_reg ())
6829 return 0;
6830 }
6831 else if (i.suffix == LONG_MNEM_SUFFIX)
6832 {
6833 if (intel_syntax
6834 && i.tm.opcode_modifier.mnemonicsize == IGNORESIZE
6835 && i.tm.opcode_modifier.no_lsuf
6836 && !i.tm.opcode_modifier.todword
6837 && !i.tm.opcode_modifier.toqword)
6838 i.suffix = 0;
6839 else if (!check_long_reg ())
6840 return 0;
6841 }
6842 else if (i.suffix == QWORD_MNEM_SUFFIX)
6843 {
6844 if (intel_syntax
6845 && i.tm.opcode_modifier.mnemonicsize == IGNORESIZE
6846 && i.tm.opcode_modifier.no_qsuf
6847 && !i.tm.opcode_modifier.todword
6848 && !i.tm.opcode_modifier.toqword)
6849 i.suffix = 0;
6850 else if (!check_qword_reg ())
6851 return 0;
6852 }
6853 else if (i.suffix == WORD_MNEM_SUFFIX)
6854 {
6855 if (intel_syntax
6856 && i.tm.opcode_modifier.mnemonicsize == IGNORESIZE
6857 && i.tm.opcode_modifier.no_wsuf)
6858 i.suffix = 0;
6859 else if (!check_word_reg ())
6860 return 0;
6861 }
6862 else if (intel_syntax
6863 && i.tm.opcode_modifier.mnemonicsize == IGNORESIZE)
6864 /* Do nothing if the instruction is going to ignore the prefix. */
6865 ;
6866 else
6867 abort ();
6868
6869 /* Undo the movsx/movzx change done above. */
6870 i.operands = numop;
6871 }
6872 else if (i.tm.opcode_modifier.mnemonicsize == DEFAULTSIZE
6873 && !i.suffix)
6874 {
6875 i.suffix = stackop_size;
6876 if (stackop_size == LONG_MNEM_SUFFIX)
6877 {
6878 /* stackop_size is set to LONG_MNEM_SUFFIX for the
6879 .code16gcc directive to support 16-bit mode with
6880 32-bit address. For IRET without a suffix, generate
6881 16-bit IRET (opcode 0xcf) to return from an interrupt
6882 handler. */
6883 if (i.tm.base_opcode == 0xcf)
6884 {
6885 i.suffix = WORD_MNEM_SUFFIX;
6886 as_warn (_("generating 16-bit `iret' for .code16gcc directive"));
6887 }
6888 /* Warn about changed behavior for segment register push/pop. */
6889 else if ((i.tm.base_opcode | 1) == 0x07)
6890 as_warn (_("generating 32-bit `%s', unlike earlier gas versions"),
6891 i.tm.name);
6892 }
6893 }
6894 else if (!i.suffix
6895 && (i.tm.opcode_modifier.jump == JUMP_ABSOLUTE
6896 || i.tm.opcode_modifier.jump == JUMP_BYTE
6897 || i.tm.opcode_modifier.jump == JUMP_INTERSEGMENT
6898 || (i.tm.base_opcode == 0x0f01 /* [ls][gi]dt */
6899 && i.tm.extension_opcode <= 3)))
6900 {
6901 switch (flag_code)
6902 {
6903 case CODE_64BIT:
6904 if (!i.tm.opcode_modifier.no_qsuf)
6905 {
6906 if (i.tm.opcode_modifier.jump == JUMP_BYTE
6907 || i.tm.opcode_modifier.no_lsuf)
6908 i.suffix = QWORD_MNEM_SUFFIX;
6909 break;
6910 }
6911 /* Fall through. */
6912 case CODE_32BIT:
6913 if (!i.tm.opcode_modifier.no_lsuf)
6914 i.suffix = LONG_MNEM_SUFFIX;
6915 break;
6916 case CODE_16BIT:
6917 if (!i.tm.opcode_modifier.no_wsuf)
6918 i.suffix = WORD_MNEM_SUFFIX;
6919 break;
6920 }
6921 }
6922
6923 if (!i.suffix
6924 && (i.tm.opcode_modifier.mnemonicsize != DEFAULTSIZE
6925 /* Also cover lret/retf/iret in 64-bit mode. */
6926 || (flag_code == CODE_64BIT
6927 && !i.tm.opcode_modifier.no_lsuf
6928 && !i.tm.opcode_modifier.no_qsuf))
6929 && i.tm.opcode_modifier.mnemonicsize != IGNORESIZE
6930 /* Explicit sizing prefixes are assumed to disambiguate insns. */
6931 && !i.prefix[DATA_PREFIX] && !(i.prefix[REX_PREFIX] & REX_W)
6932 /* Accept FLDENV et al without suffix. */
6933 && (i.tm.opcode_modifier.no_ssuf || i.tm.opcode_modifier.floatmf))
6934 {
6935 unsigned int suffixes, evex = 0;
6936
6937 suffixes = !i.tm.opcode_modifier.no_bsuf;
6938 if (!i.tm.opcode_modifier.no_wsuf)
6939 suffixes |= 1 << 1;
6940 if (!i.tm.opcode_modifier.no_lsuf)
6941 suffixes |= 1 << 2;
6942 if (!i.tm.opcode_modifier.no_ldsuf)
6943 suffixes |= 1 << 3;
6944 if (!i.tm.opcode_modifier.no_ssuf)
6945 suffixes |= 1 << 4;
6946 if (flag_code == CODE_64BIT && !i.tm.opcode_modifier.no_qsuf)
6947 suffixes |= 1 << 5;
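/* Bits 0..5 stand for the b/w/l/ld/s/q suffixes; bits 6..8 are set
   below for XMM/YMM/ZMM memory operand sizes.  "suffixes &
   (suffixes - 1)" further down is nonzero exactly when more than
   one bit -- i.e. more than one operand size -- remains.  */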
6948
6949 /* For [XYZ]MMWORD operands inspect operand sizes. While generally
6950 also suitable for AT&T syntax mode, it was requested that this be
6951 restricted to just Intel syntax. */
6952 if (intel_syntax && is_any_vex_encoding (&i.tm) && !i.broadcast)
6953 {
6954 unsigned int op;
6955
6956 for (op = 0; op < i.tm.operands; ++op)
6957 {
6958 if (is_evex_encoding (&i.tm)
6959 && !cpu_arch_flags.bitfield.cpuavx512vl)
6960 {
6961 if (i.tm.operand_types[op].bitfield.ymmword)
6962 i.tm.operand_types[op].bitfield.xmmword = 0;
6963 if (i.tm.operand_types[op].bitfield.zmmword)
6964 i.tm.operand_types[op].bitfield.ymmword = 0;
6965 if (!i.tm.opcode_modifier.evex
6966 || i.tm.opcode_modifier.evex == EVEXDYN)
6967 i.tm.opcode_modifier.evex = EVEX512;
6968 }
6969
6970 if (i.tm.operand_types[op].bitfield.xmmword
6971 + i.tm.operand_types[op].bitfield.ymmword
6972 + i.tm.operand_types[op].bitfield.zmmword < 2)
6973 continue;
6974
6975 /* Any properly sized operand disambiguates the insn. */
6976 if (i.types[op].bitfield.xmmword
6977 || i.types[op].bitfield.ymmword
6978 || i.types[op].bitfield.zmmword)
6979 {
6980 suffixes &= ~(7 << 6);
6981 evex = 0;
6982 break;
6983 }
6984
6985 if ((i.flags[op] & Operand_Mem)
6986 && i.tm.operand_types[op].bitfield.unspecified)
6987 {
6988 if (i.tm.operand_types[op].bitfield.xmmword)
6989 suffixes |= 1 << 6;
6990 if (i.tm.operand_types[op].bitfield.ymmword)
6991 suffixes |= 1 << 7;
6992 if (i.tm.operand_types[op].bitfield.zmmword)
6993 suffixes |= 1 << 8;
6994 if (is_evex_encoding (&i.tm))
6995 evex = EVEX512;
6996 }
6997 }
6998 }
6999
7000 /* Are multiple suffixes / operand sizes allowed? */
7001 if (suffixes & (suffixes - 1))
7002 {
7003 if (intel_syntax
7004 && (i.tm.opcode_modifier.mnemonicsize != DEFAULTSIZE
7005 || operand_check == check_error))
7006 {
7007 as_bad (_("ambiguous operand size for `%s'"), i.tm.name);
7008 return 0;
7009 }
7010 if (operand_check == check_error)
7011 {
7012 as_bad (_("no instruction mnemonic suffix given and "
7013 "no register operands; can't size `%s'"), i.tm.name);
7014 return 0;
7015 }
7016 if (operand_check == check_warning)
7017 as_warn (_("%s; using default for `%s'"),
7018 intel_syntax
7019 ? _("ambiguous operand size")
7020 : _("no instruction mnemonic suffix given and "
7021 "no register operands"),
7022 i.tm.name);
7023
7024 if (i.tm.opcode_modifier.floatmf)
7025 i.suffix = SHORT_MNEM_SUFFIX;
7026 else if ((i.tm.base_opcode | 8) == 0xfbe
7027 || (i.tm.base_opcode == 0x63
7028 && i.tm.cpu_flags.bitfield.cpu64))
7029 /* handled below */;
7030 else if (evex)
7031 i.tm.opcode_modifier.evex = evex;
7032 else if (flag_code == CODE_16BIT)
7033 i.suffix = WORD_MNEM_SUFFIX;
7034 else if (!i.tm.opcode_modifier.no_lsuf)
7035 i.suffix = LONG_MNEM_SUFFIX;
7036 else
7037 i.suffix = QWORD_MNEM_SUFFIX;
7038 }
7039 }
7040
7041 if ((i.tm.base_opcode | 8) == 0xfbe
7042 || (i.tm.base_opcode == 0x63 && i.tm.cpu_flags.bitfield.cpu64))
7043 {
7044 /* In Intel syntax, movsx/movzx must have a "suffix" (checked above).
7045 In AT&T syntax, if there is no suffix (warned about above), the default
7046 will be byte extension. */
7047 if (i.tm.opcode_modifier.w && i.suffix && i.suffix != BYTE_MNEM_SUFFIX)
7048 i.tm.base_opcode |= 1;
7049
7050 /* For further processing, the suffix should represent the destination
7051 (register). This is already the case when one was used with
7052 mov[sz][bw]*, but we need to replace it for mov[sz]x, or if there was
7053 no suffix to begin with. */
7054 if (i.tm.opcode_modifier.w || i.tm.base_opcode == 0x63 || !i.suffix)
7055 {
7056 if (i.types[1].bitfield.word)
7057 i.suffix = WORD_MNEM_SUFFIX;
7058 else if (i.types[1].bitfield.qword)
7059 i.suffix = QWORD_MNEM_SUFFIX;
7060 else
7061 i.suffix = LONG_MNEM_SUFFIX;
7062
7063 i.tm.opcode_modifier.w = 0;
7064 }
7065 }
7066
7067 if (!i.tm.opcode_modifier.modrm && i.reg_operands && i.tm.operands < 3)
7068 i.short_form = (i.tm.operand_types[0].bitfield.class == Reg)
7069 != (i.tm.operand_types[1].bitfield.class == Reg);
7070
7071 /* Change the opcode based on the operand size given by i.suffix. */
7072 switch (i.suffix)
7073 {
7074 /* Size floating point instruction. */
7075 case LONG_MNEM_SUFFIX:
7076 if (i.tm.opcode_modifier.floatmf)
7077 {
7078 i.tm.base_opcode ^= 4;
7079 break;
7080 }
7081 /* fall through */
7082 case WORD_MNEM_SUFFIX:
7083 case QWORD_MNEM_SUFFIX:
7084 /* It's not a byte, select word/dword operation. */
7085 if (i.tm.opcode_modifier.w)
7086 {
7087 if (i.short_form)
7088 i.tm.base_opcode |= 8;
7089 else
7090 i.tm.base_opcode |= 1;
7091 }
7092 /* fall through */
7093 case SHORT_MNEM_SUFFIX:
7094 /* Now select between word & dword operations via the operand
7095 size prefix, except for instructions that will ignore this
7096 prefix anyway. */
7097 if (i.suffix != QWORD_MNEM_SUFFIX
7098 && i.tm.opcode_modifier.mnemonicsize != IGNORESIZE
7099 && !i.tm.opcode_modifier.floatmf
7100 && !is_any_vex_encoding (&i.tm)
7101 && ((i.suffix == LONG_MNEM_SUFFIX) == (flag_code == CODE_16BIT)
7102 || (flag_code == CODE_64BIT
7103 && i.tm.opcode_modifier.jump == JUMP_BYTE)))
7104 {
7105 unsigned int prefix = DATA_PREFIX_OPCODE;
7106
7107 if (i.tm.opcode_modifier.jump == JUMP_BYTE) /* jcxz, loop */
7108 prefix = ADDR_PREFIX_OPCODE;
7109
7110 if (!add_prefix (prefix))
7111 return 0;
7112 }
7113
7114 /* Set mode64 for an operand. */
7115 if (i.suffix == QWORD_MNEM_SUFFIX
7116 && flag_code == CODE_64BIT
7117 && !i.tm.opcode_modifier.norex64
7118 && !i.tm.opcode_modifier.vexw
7119 /* Special case for xchg %rax,%rax. It is a NOP and doesn't
7120 need rex64. */
7121 && ! (i.operands == 2
7122 && i.tm.base_opcode == 0x90
7123 && i.tm.extension_opcode == None
7124 && i.types[0].bitfield.instance == Accum
7125 && i.types[0].bitfield.qword
7126 && i.types[1].bitfield.instance == Accum
7127 && i.types[1].bitfield.qword))
7128 i.rex |= REX_W;
7129
7130 break;
7131
7132 case 0:
7133 /* Select word/dword/qword operation with explicit data sizing prefix
7134 when there are no suitable register operands. */
7135 if (i.tm.opcode_modifier.w
7136 && (i.prefix[DATA_PREFIX] || (i.prefix[REX_PREFIX] & REX_W))
7137 && (!i.reg_operands
7138 || (i.reg_operands == 1
7139 /* ShiftCount */
7140 && (i.tm.operand_types[0].bitfield.instance == RegC
7141 /* InOutPortReg */
7142 || i.tm.operand_types[0].bitfield.instance == RegD
7143 || i.tm.operand_types[1].bitfield.instance == RegD
7144 /* CRC32 */
7145 || i.tm.base_opcode == 0xf20f38f0))))
7146 i.tm.base_opcode |= 1;
7147 break;
7148 }
7149
7150 if (i.tm.opcode_modifier.addrprefixopreg)
7151 {
7152 gas_assert (!i.suffix);
7153 gas_assert (i.reg_operands);
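/* E.g. "monitor %eax, %ecx, %edx" in 64-bit mode: the implicit
   address register defaults to %rax, so the %eax form needs a 0x67
   address-size prefix, added below.  */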
7154
7155 if (i.tm.operand_types[0].bitfield.instance == Accum
7156 || i.operands == 1)
7157 {
7158 /* The address size override prefix changes the size of the
7159 first operand. */
7160 if (flag_code == CODE_64BIT
7161 && i.op[0].regs->reg_type.bitfield.word)
7162 {
7163 as_bad (_("16-bit addressing unavailable for `%s'"),
7164 i.tm.name);
7165 return 0;
7166 }
7167
7168 if ((flag_code == CODE_32BIT
7169 ? i.op[0].regs->reg_type.bitfield.word
7170 : i.op[0].regs->reg_type.bitfield.dword)
7171 && !add_prefix (ADDR_PREFIX_OPCODE))
7172 return 0;
7173 }
7174 else
7175 {
7176 /* Check for invalid register operands when the address size
7177 override prefix changes the size of register operands. */
7178 unsigned int op;
7179 enum { need_word, need_dword, need_qword } need;
7180
7181 /* Check the register operand for the address size prefix if
7182 the memory operand has no real registers, like symbol, DISP
7183 or symbol(%rip). */
7184 if (i.mem_operands == 1
7185 && i.reg_operands == 1
7186 && i.operands == 2
7187 && i.types[1].bitfield.class == Reg
7188 && (flag_code == CODE_32BIT
7189 ? i.op[1].regs->reg_type.bitfield.word
7190 : i.op[1].regs->reg_type.bitfield.dword)
7191 && ((i.base_reg == NULL && i.index_reg == NULL)
7192 || (i.base_reg
7193 && i.base_reg->reg_num == RegIP
7194 && i.base_reg->reg_type.bitfield.qword))
7195 && !add_prefix (ADDR_PREFIX_OPCODE))
7196 return 0;
7197
7198 if (flag_code == CODE_32BIT)
7199 need = i.prefix[ADDR_PREFIX] ? need_word : need_dword;
7200 else if (i.prefix[ADDR_PREFIX])
7201 need = need_dword;
7202 else
7203 need = flag_code == CODE_64BIT ? need_qword : need_word;
7204
7205 for (op = 0; op < i.operands; op++)
7206 {
7207 if (i.types[op].bitfield.class != Reg)
7208 continue;
7209
7210 switch (need)
7211 {
7212 case need_word:
7213 if (i.op[op].regs->reg_type.bitfield.word)
7214 continue;
7215 break;
7216 case need_dword:
7217 if (i.op[op].regs->reg_type.bitfield.dword)
7218 continue;
7219 break;
7220 case need_qword:
7221 if (i.op[op].regs->reg_type.bitfield.qword)
7222 continue;
7223 break;
7224 }
7225
7226 as_bad (_("invalid register operand size for `%s'"),
7227 i.tm.name);
7228 return 0;
7229 }
7230 }
7231 }
7232
7233 return 1;
7234 }
7235
7236 static int
7237 check_byte_reg (void)
7238 {
7239 int op;
7240
7241 for (op = i.operands; --op >= 0;)
7242 {
7243 /* Skip non-register operands. */
7244 if (i.types[op].bitfield.class != Reg)
7245 continue;
7246
7247 /* An eight bit register operand is always OK here; wider
7248 registers are acceptable only in the special cases checked
7249 below. */
7250 if (i.types[op].bitfield.byte)
7251 continue;
7252
7253 /* I/O port address operands are OK too. */
7254 if (i.tm.operand_types[op].bitfield.instance == RegD
7255 && i.tm.operand_types[op].bitfield.word)
7256 continue;
7257
7258 /* crc32 only wants its source operand checked here. */
7259 if (i.tm.base_opcode == 0xf20f38f0 && op)
7260 continue;
7261
7262 /* Any other register is bad. */
7263 as_bad (_("`%s%s' not allowed with `%s%c'"),
7264 register_prefix, i.op[op].regs->reg_name,
7265 i.tm.name, i.suffix);
7266 return 0;
7267 }
7268 return 1;
7269 }
7270
7271 static int
7272 check_long_reg (void)
7273 {
7274 int op;
7275
7276 for (op = i.operands; --op >= 0;)
7277 /* Skip non-register operands. */
7278 if (i.types[op].bitfield.class != Reg)
7279 continue;
7280 /* Reject eight bit registers, except where the template requires
7281 them. (e.g. movzb) */
7282 else if (i.types[op].bitfield.byte
7283 && (i.tm.operand_types[op].bitfield.class == Reg
7284 || i.tm.operand_types[op].bitfield.instance == Accum)
7285 && (i.tm.operand_types[op].bitfield.word
7286 || i.tm.operand_types[op].bitfield.dword))
7287 {
7288 as_bad (_("`%s%s' not allowed with `%s%c'"),
7289 register_prefix,
7290 i.op[op].regs->reg_name,
7291 i.tm.name,
7292 i.suffix);
7293 return 0;
7294 }
7295 /* Error if the e prefix on a general reg is missing. */
7296 else if (i.types[op].bitfield.word
7297 && (i.tm.operand_types[op].bitfield.class == Reg
7298 || i.tm.operand_types[op].bitfield.instance == Accum)
7299 && i.tm.operand_types[op].bitfield.dword)
7300 {
7301 as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
7302 register_prefix, i.op[op].regs->reg_name,
7303 i.suffix);
7304 return 0;
7305 }
7306 /* Error if the r prefix on a general reg is present (unless the
Intel-syntax conversion below applies). */
7307 else if (i.types[op].bitfield.qword
7308 && (i.tm.operand_types[op].bitfield.class == Reg
7309 || i.tm.operand_types[op].bitfield.instance == Accum)
7310 && i.tm.operand_types[op].bitfield.dword)
7311 {
7312 if (intel_syntax
7313 && i.tm.opcode_modifier.toqword
7314 && i.types[0].bitfield.class != RegSIMD)
7315 {
7316 /* Convert to QWORD. We want REX byte. */
7317 i.suffix = QWORD_MNEM_SUFFIX;
7318 }
7319 else
7320 {
7321 as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
7322 register_prefix, i.op[op].regs->reg_name,
7323 i.suffix);
7324 return 0;
7325 }
7326 }
7327 return 1;
7328 }
7329
7330 static int
7331 check_qword_reg (void)
7332 {
7333 int op;
7334
7335 for (op = i.operands; --op >= 0; )
7336 /* Skip non-register operands. */
7337 if (i.types[op].bitfield.class != Reg)
7338 continue;
7339 /* Reject eight bit registers, except where the template requires
7340 them. (e.g. movzb) */
7341 else if (i.types[op].bitfield.byte
7342 && (i.tm.operand_types[op].bitfield.class == Reg
7343 || i.tm.operand_types[op].bitfield.instance == Accum)
7344 && (i.tm.operand_types[op].bitfield.word
7345 || i.tm.operand_types[op].bitfield.dword))
7346 {
7347 as_bad (_("`%s%s' not allowed with `%s%c'"),
7348 register_prefix,
7349 i.op[op].regs->reg_name,
7350 i.tm.name,
7351 i.suffix);
7352 return 0;
7353 }
7354 /* Error if the r prefix on a general reg is missing (unless the
Intel-syntax conversion below applies). */
7355 else if ((i.types[op].bitfield.word
7356 || i.types[op].bitfield.dword)
7357 && (i.tm.operand_types[op].bitfield.class == Reg
7358 || i.tm.operand_types[op].bitfield.instance == Accum)
7359 && i.tm.operand_types[op].bitfield.qword)
7360 {
7361 /* Prohibit these changes in the 64bit mode, since the
7362 lowering is more complicated. */
7363 if (intel_syntax
7364 && i.tm.opcode_modifier.todword
7365 && i.types[0].bitfield.class != RegSIMD)
7366 {
7367 /* Convert to DWORD. We don't want REX byte. */
7368 i.suffix = LONG_MNEM_SUFFIX;
7369 }
7370 else
7371 {
7372 as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
7373 register_prefix, i.op[op].regs->reg_name,
7374 i.suffix);
7375 return 0;
7376 }
7377 }
7378 return 1;
7379 }
7380
7381 static int
7382 check_word_reg (void)
7383 {
7384 int op;
7385 for (op = i.operands; --op >= 0;)
7386 /* Skip non-register operands. */
7387 if (i.types[op].bitfield.class != Reg)
7388 continue;
7389 /* Reject eight bit registers, except where the template requires
7390 them. (e.g. movzb) */
7391 else if (i.types[op].bitfield.byte
7392 && (i.tm.operand_types[op].bitfield.class == Reg
7393 || i.tm.operand_types[op].bitfield.instance == Accum)
7394 && (i.tm.operand_types[op].bitfield.word
7395 || i.tm.operand_types[op].bitfield.dword))
7396 {
7397 as_bad (_("`%s%s' not allowed with `%s%c'"),
7398 register_prefix,
7399 i.op[op].regs->reg_name,
7400 i.tm.name,
7401 i.suffix);
7402 return 0;
7403 }
7404 /* Error if the e or r prefix on a general reg is present. */
7405 else if ((i.types[op].bitfield.dword
7406 || i.types[op].bitfield.qword)
7407 && (i.tm.operand_types[op].bitfield.class == Reg
7408 || i.tm.operand_types[op].bitfield.instance == Accum)
7409 && i.tm.operand_types[op].bitfield.word)
7410 {
7411 as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
7412 register_prefix, i.op[op].regs->reg_name,
7413 i.suffix);
7414 return 0;
7415 }
7416 return 1;
7417 }
7418
7419 static int
7420 update_imm (unsigned int j)
7421 {
7422 i386_operand_type overlap = i.types[j];
7423 if ((overlap.bitfield.imm8
7424 || overlap.bitfield.imm8s
7425 || overlap.bitfield.imm16
7426 || overlap.bitfield.imm32
7427 || overlap.bitfield.imm32s
7428 || overlap.bitfield.imm64)
7429 && !operand_type_equal (&overlap, &imm8)
7430 && !operand_type_equal (&overlap, &imm8s)
7431 && !operand_type_equal (&overlap, &imm16)
7432 && !operand_type_equal (&overlap, &imm32)
7433 && !operand_type_equal (&overlap, &imm32s)
7434 && !operand_type_equal (&overlap, &imm64))
7435 {
7436 if (i.suffix)
7437 {
7438 i386_operand_type temp;
7439
7440 operand_type_set (&temp, 0);
7441 if (i.suffix == BYTE_MNEM_SUFFIX)
7442 {
7443 temp.bitfield.imm8 = overlap.bitfield.imm8;
7444 temp.bitfield.imm8s = overlap.bitfield.imm8s;
7445 }
7446 else if (i.suffix == WORD_MNEM_SUFFIX)
7447 temp.bitfield.imm16 = overlap.bitfield.imm16;
7448 else if (i.suffix == QWORD_MNEM_SUFFIX)
7449 {
7450 temp.bitfield.imm64 = overlap.bitfield.imm64;
7451 temp.bitfield.imm32s = overlap.bitfield.imm32s;
7452 }
7453 else
7454 temp.bitfield.imm32 = overlap.bitfield.imm32;
7455 overlap = temp;
7456 }
7457 else if (operand_type_equal (&overlap, &imm16_32_32s)
7458 || operand_type_equal (&overlap, &imm16_32)
7459 || operand_type_equal (&overlap, &imm16_32s))
7460 {
7461 if ((flag_code == CODE_16BIT) ^ (i.prefix[DATA_PREFIX] != 0))
7462 overlap = imm16;
7463 else
7464 overlap = imm32s;
7465 }
7466 else if (i.prefix[REX_PREFIX] & REX_W)
7467 overlap = operand_type_and (overlap, imm32s);
7468 else if (i.prefix[DATA_PREFIX])
7469 overlap = operand_type_and (overlap,
7470 flag_code != CODE_16BIT ? imm16 : imm32);
7471 if (!operand_type_equal (&overlap, &imm8)
7472 && !operand_type_equal (&overlap, &imm8s)
7473 && !operand_type_equal (&overlap, &imm16)
7474 && !operand_type_equal (&overlap, &imm32)
7475 && !operand_type_equal (&overlap, &imm32s)
7476 && !operand_type_equal (&overlap, &imm64))
7477 {
7478 as_bad (_("no instruction mnemonic suffix given; "
7479 "can't determine immediate size"));
7480 return 0;
7481 }
7482 }
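  /* E.g. "addw $0x1234, %ax": the 'w' suffix narrowed the template's
     Imm16|Imm32|Imm32S overlap down to plain Imm16 above.  */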
7483 i.types[j] = overlap;
7484
7485 return 1;
7486 }
7487
7488 static int
7489 finalize_imm (void)
7490 {
7491 unsigned int j, n;
7492
7493 /* Update the first 2 immediate operands. */
7494 n = i.operands > 2 ? 2 : i.operands;
7495 if (n)
7496 {
7497 for (j = 0; j < n; j++)
7498 if (update_imm (j) == 0)
7499 return 0;
7500
7501 /* The 3rd operand can't be an immediate operand. */
7502 gas_assert (operand_type_check (i.types[2], imm) == 0);
7503 }
7504
7505 return 1;
7506 }
7507
7508 static int
7509 process_operands (void)
7510 {
7511 /* Default segment register this instruction will use for memory
7512 accesses. 0 means unknown. This is only for optimizing out
7513 unnecessary segment overrides. */
7514 const seg_entry *default_seg = 0;
7515
7516 if (i.tm.opcode_modifier.sse2avx)
7517 {
7518 /* Legacy encoded insns allow explicit REX prefixes, so these prefixes
7519 need converting. */
7520 i.rex |= i.prefix[REX_PREFIX] & (REX_W | REX_R | REX_X | REX_B);
7521 i.prefix[REX_PREFIX] = 0;
7522 i.rex_encoding = 0;
7523 }
7524 /* ImmExt should be processed after SSE2AVX. */
7525 else if (i.tm.opcode_modifier.immext)
7526 process_immext ();
7527
7528 if (i.tm.opcode_modifier.sse2avx && i.tm.opcode_modifier.vexvvvv)
7529 {
7530 unsigned int dupl = i.operands;
7531 unsigned int dest = dupl - 1;
7532 unsigned int j;
7533
7534 /* The destination must be an xmm register. */
7535 gas_assert (i.reg_operands
7536 && MAX_OPERANDS > dupl
7537 && operand_type_equal (&i.types[dest], &regxmm));
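/* E.g. with -msse2avx, "addps %xmm1, %xmm2" is emitted as
   "vaddps %xmm1, %xmm2, %xmm2": the destination register is
   duplicated into the extra VEX source slot set up here.  */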
7538
7539 if (i.tm.operand_types[0].bitfield.instance == Accum
7540 && i.tm.operand_types[0].bitfield.xmmword)
7541 {
7542 if (i.tm.opcode_modifier.vexsources == VEX3SOURCES)
7543 {
7544 /* Keep xmm0 for instructions with VEX prefix and 3
7545 sources. */
7546 i.tm.operand_types[0].bitfield.instance = InstanceNone;
7547 i.tm.operand_types[0].bitfield.class = RegSIMD;
7548 goto duplicate;
7549 }
7550 else
7551 {
7552 /* We remove the first xmm0 and keep the number of
7553 operands unchanged, which in fact duplicates the
7554 destination. */
7555 for (j = 1; j < i.operands; j++)
7556 {
7557 i.op[j - 1] = i.op[j];
7558 i.types[j - 1] = i.types[j];
7559 i.tm.operand_types[j - 1] = i.tm.operand_types[j];
7560 i.flags[j - 1] = i.flags[j];
7561 }
7562 }
7563 }
7564 else if (i.tm.opcode_modifier.implicit1stxmm0)
7565 {
7566 gas_assert ((MAX_OPERANDS - 1) > dupl
7567 && (i.tm.opcode_modifier.vexsources
7568 == VEX3SOURCES));
7569
7570 /* Add the implicit xmm0 for instructions with VEX prefix
7571 and 3 sources. */
7572 for (j = i.operands; j > 0; j--)
7573 {
7574 i.op[j] = i.op[j - 1];
7575 i.types[j] = i.types[j - 1];
7576 i.tm.operand_types[j] = i.tm.operand_types[j - 1];
7577 i.flags[j] = i.flags[j - 1];
7578 }
7579 i.op[0].regs
7580 = (const reg_entry *) str_hash_find (reg_hash, "xmm0");
7581 i.types[0] = regxmm;
7582 i.tm.operand_types[0] = regxmm;
7583
7584 i.operands += 2;
7585 i.reg_operands += 2;
7586 i.tm.operands += 2;
7587
7588 dupl++;
7589 dest++;
7590 i.op[dupl] = i.op[dest];
7591 i.types[dupl] = i.types[dest];
7592 i.tm.operand_types[dupl] = i.tm.operand_types[dest];
7593 i.flags[dupl] = i.flags[dest];
7594 }
7595 else
7596 {
7597 duplicate:
7598 i.operands++;
7599 i.reg_operands++;
7600 i.tm.operands++;
7601
7602 i.op[dupl] = i.op[dest];
7603 i.types[dupl] = i.types[dest];
7604 i.tm.operand_types[dupl] = i.tm.operand_types[dest];
7605 i.flags[dupl] = i.flags[dest];
7606 }
7607
7608 if (i.tm.opcode_modifier.immext)
7609 process_immext ();
7610 }
7611 else if (i.tm.operand_types[0].bitfield.instance == Accum
7612 && i.tm.operand_types[0].bitfield.xmmword)
7613 {
7614 unsigned int j;
7615
7616 for (j = 1; j < i.operands; j++)
7617 {
7618 i.op[j - 1] = i.op[j];
7619 i.types[j - 1] = i.types[j];
7620
7621 /* We need to adjust fields in i.tm since they are used by
7622 build_modrm_byte. */
7623 i.tm.operand_types [j - 1] = i.tm.operand_types [j];
7624
7625 i.flags[j - 1] = i.flags[j];
7626 }
7627
7628 i.operands--;
7629 i.reg_operands--;
7630 i.tm.operands--;
7631 }
7632 else if (i.tm.opcode_modifier.implicitquadgroup)
7633 {
7634 unsigned int regnum, first_reg_in_group, last_reg_in_group;
7635
7636 /* The second operand must be {x,y,z}mmN, where N is a multiple of 4. */
7637 gas_assert (i.operands >= 2 && i.types[1].bitfield.class == RegSIMD);
7638 regnum = register_number (i.op[1].regs);
7639 first_reg_in_group = regnum & ~3;
7640 last_reg_in_group = first_reg_in_group + 3;
7641 if (regnum != first_reg_in_group)
7642 as_warn (_("source register `%s%s' implicitly denotes"
7643 " `%s%.3s%u' to `%s%.3s%u' source group in `%s'"),
7644 register_prefix, i.op[1].regs->reg_name,
7645 register_prefix, i.op[1].regs->reg_name, first_reg_in_group,
7646 register_prefix, i.op[1].regs->reg_name, last_reg_in_group,
7647 i.tm.name);
7648 }
7649 else if (i.tm.opcode_modifier.regkludge)
7650 {
7651 /* The imul $imm, %reg instruction is converted into
7652 imul $imm, %reg, %reg, and the clr %reg instruction
7653 is converted into xor %reg, %reg. */
7654
7655 unsigned int first_reg_op;
7656
7657 if (operand_type_check (i.types[0], reg))
7658 first_reg_op = 0;
7659 else
7660 first_reg_op = 1;
7661 /* Pretend we saw the extra register operand. */
7662 gas_assert (i.reg_operands == 1
7663 && i.op[first_reg_op + 1].regs == 0);
7664 i.op[first_reg_op + 1].regs = i.op[first_reg_op].regs;
7665 i.types[first_reg_op + 1] = i.types[first_reg_op];
7666 i.operands++;
7667 i.reg_operands++;
7668 }
7669
7670 if (i.tm.opcode_modifier.modrm)
7671 {
7672 /* The opcode is completed (modulo i.tm.extension_opcode which
7673 must be put into the modrm byte). Now, we make the modrm and
7674 index base bytes based on all the info we've collected. */
7675
7676 default_seg = build_modrm_byte ();
7677 }
7678 else if (i.types[0].bitfield.class == SReg)
7679 {
7680 if (flag_code != CODE_64BIT
7681 ? i.tm.base_opcode == POP_SEG_SHORT
7682 && i.op[0].regs->reg_num == 1
7683 : (i.tm.base_opcode | 1) == POP_SEG386_SHORT
7684 && i.op[0].regs->reg_num < 4)
7685 {
7686 as_bad (_("you can't `%s %s%s'"),
7687 i.tm.name, register_prefix, i.op[0].regs->reg_name);
7688 return 0;
7689 }
7690 if (i.op[0].regs->reg_num > 3 && i.tm.opcode_length == 1)
7691 {
7692 i.tm.base_opcode ^= POP_SEG_SHORT ^ POP_SEG386_SHORT;
7693 i.tm.opcode_length = 2;
7694 }
7695 i.tm.base_opcode |= (i.op[0].regs->reg_num << 3);
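/* E.g. "push %fs": %fs/%gs have no one-byte push/pop encoding, so
   the two-byte 0x0f form was selected above; "pop %cs" was rejected
   earlier, as no such encoding exists.  */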
7696 }
7697 else if ((i.tm.base_opcode & ~0x3) == MOV_AX_DISP32)
7698 {
7699 default_seg = &ds;
7700 }
7701 else if (i.tm.opcode_modifier.isstring)
7702 {
7703 /* For the string instructions that allow a segment override
7704 on one of their operands, the default segment is ds. */
7705 default_seg = &ds;
7706 }
7707 else if (i.short_form)
7708 {
7709 /* The register or float register operand is in operand
7710 0 or 1. */
7711 unsigned int op = i.tm.operand_types[0].bitfield.class != Reg;
7712
7713 /* Register goes in low 3 bits of opcode. */
7714 i.tm.base_opcode |= i.op[op].regs->reg_num;
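/* E.g. "push %rbp" becomes 0x50 | 5 == 0x55; for %r13 the RegRex
   flag additionally sets REX.B just below.  */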
7715 if ((i.op[op].regs->reg_flags & RegRex) != 0)
7716 i.rex |= REX_B;
7717 if (!quiet_warnings && i.tm.opcode_modifier.ugh)
7718 {
7719 /* Warn about some common errors, but press on regardless.
7720 The first case can be generated by gcc (<= 2.8.1). */
7721 if (i.operands == 2)
7722 {
7723 /* Reversed arguments on faddp, fsubp, etc. */
7724 as_warn (_("translating to `%s %s%s,%s%s'"), i.tm.name,
7725 register_prefix, i.op[!intel_syntax].regs->reg_name,
7726 register_prefix, i.op[intel_syntax].regs->reg_name);
7727 }
7728 else
7729 {
7730 /* Extraneous `l' suffix on fp insn. */
7731 as_warn (_("translating to `%s %s%s'"), i.tm.name,
7732 register_prefix, i.op[0].regs->reg_name);
7733 }
7734 }
7735 }
7736
7737 if ((i.seg[0] || i.prefix[SEG_PREFIX])
7738 && i.tm.base_opcode == 0x8d /* lea */
7739 && !is_any_vex_encoding (&i.tm))
7740 {
7741 if (!quiet_warnings)
7742 as_warn (_("segment override on `%s' is ineffectual"), i.tm.name);
7743 if (optimize)
7744 {
7745 i.seg[0] = NULL;
7746 i.prefix[SEG_PREFIX] = 0;
7747 }
7748 }
7749
7750 /* If a segment was explicitly specified, and the specified segment
7751 is neither the default nor the one already recorded from a prefix,
7752 use an opcode prefix to select it. If we never figured out what
7753 the default segment is, then default_seg will be zero at this
7754 point, and the specified segment prefix will always be used. */
7755 if (i.seg[0]
7756 && i.seg[0] != default_seg
7757 && i.seg[0]->seg_prefix != i.prefix[SEG_PREFIX])
7758 {
7759 if (!add_prefix (i.seg[0]->seg_prefix))
7760 return 0;
7761 }
7762 return 1;
7763 }
7764
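/* A descriptive note, inferred from the code below: record REX bit
   REX_BIT implied by register R, diagnosing duplicate REX prefixes;
   with DO_SSE2AVX, an already-recorded VEX register specifier equal
   to R is instead advanced by 8 registers (e.g. %xmm2 -> %xmm10);
   the bit is mirrored into i.vrex for the upper-16 SIMD registers. */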
7765 static INLINE void set_rex_vrex (const reg_entry *r, unsigned int rex_bit,
7766 bfd_boolean do_sse2avx)
7767 {
7768 if (r->reg_flags & RegRex)
7769 {
7770 if (i.rex & rex_bit)
7771 as_bad (_("same type of prefix used twice"));
7772 i.rex |= rex_bit;
7773 }
7774 else if (do_sse2avx && (i.rex & rex_bit) && i.vex.register_specifier)
7775 {
7776 gas_assert (i.vex.register_specifier == r);
7777 i.vex.register_specifier += 8;
7778 }
7779
7780 if (r->reg_flags & RegVRex)
7781 i.vrex |= rex_bit;
7782 }
7783
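/* Build i.rm (and i.sib when needed) from the operand information
   collected so far, and return the default segment implied by the
   addressing mode, or 0 if none was determined. */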
7784 static const seg_entry *
7785 build_modrm_byte (void)
7786 {
7787 const seg_entry *default_seg = 0;
7788 unsigned int source, dest;
7789 int vex_3_sources;
7790
7791 vex_3_sources = i.tm.opcode_modifier.vexsources == VEX3SOURCES;
7792 if (vex_3_sources)
7793 {
7794 unsigned int nds, reg_slot;
7795 expressionS *exp;
7796
7797 dest = i.operands - 1;
7798 nds = dest - 1;
7799
7800 /* There are 2 kinds of instructions:
7801 1. 5 operands: 4 register operands or 3 register operands
7802 plus 1 memory operand plus one Imm4 operand, VexXDS, and
7803 VexW0 or VexW1. The destination must be an XMM, YMM or
7804 ZMM register.
7805 2. 4 operands: 4 register operands or 3 register operands
7806 plus 1 memory operand, with VexXDS. */
7807 gas_assert ((i.reg_operands == 4
7808 || (i.reg_operands == 3 && i.mem_operands == 1))
7809 && i.tm.opcode_modifier.vexvvvv == VEXXDS
7810 && i.tm.opcode_modifier.vexw
7811 && i.tm.operand_types[dest].bitfield.class == RegSIMD);
7812
7813 /* If VexW1 is set, the first non-immediate operand is the source and
7814 the second non-immediate one is encoded in the immediate operand. */
7815 if (i.tm.opcode_modifier.vexw == VEXW1)
7816 {
7817 source = i.imm_operands;
7818 reg_slot = i.imm_operands + 1;
7819 }
7820 else
7821 {
7822 source = i.imm_operands + 1;
7823 reg_slot = i.imm_operands;
7824 }
7825
7826 if (i.imm_operands == 0)
7827 {
7828 /* When there is no immediate operand, generate an 8bit
7829 immediate operand to encode the first operand. */
7830 exp = &im_expressions[i.imm_operands++];
7831 i.op[i.operands].imms = exp;
7832 i.types[i.operands] = imm8;
7833 i.operands++;
7834
7835 gas_assert (i.tm.operand_types[reg_slot].bitfield.class == RegSIMD);
7836 exp->X_op = O_constant;
7837 exp->X_add_number = register_number (i.op[reg_slot].regs) << 4;
7838 gas_assert ((i.op[reg_slot].regs->reg_flags & RegVRex) == 0);
7839 }
7840 else
7841 {
7842 gas_assert (i.imm_operands == 1);
7843 gas_assert (fits_in_imm4 (i.op[0].imms->X_add_number));
7844 gas_assert (!i.tm.opcode_modifier.immext);
7845
7846 /* Turn on Imm8 again so that output_imm will generate it. */
7847 i.types[0].bitfield.imm8 = 1;
7848
7849 gas_assert (i.tm.operand_types[reg_slot].bitfield.class == RegSIMD);
7850 i.op[0].imms->X_add_number
7851 |= register_number (i.op[reg_slot].regs) << 4;
7852 gas_assert ((i.op[reg_slot].regs->reg_flags & RegVRex) == 0);
7853 }
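/* Either way the register in REG_SLOT lands in the high nibble of the
   imm8: encoding %xmm5 there, for instance, contributes 5 << 4 == 0x50
   to the immediate byte. */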
7854
7855 gas_assert (i.tm.operand_types[nds].bitfield.class == RegSIMD);
7856 i.vex.register_specifier = i.op[nds].regs;
7857 }
7858 else
7859 source = dest = 0;
7860
7861 /* i.reg_operands MUST be the number of real register operands;
7862 implicit registers do not count. If there are 3 register
7863 operands, it must be an instruction with VexNDS. For an
7864 instruction with VexNDD, the destination register is encoded
7865 in the VEX prefix. If there are 4 register operands, it must be
7866 an instruction with a VEX prefix and 3 sources. */
7867 if (i.mem_operands == 0
7868 && ((i.reg_operands == 2
7869 && i.tm.opcode_modifier.vexvvvv <= VEXXDS)
7870 || (i.reg_operands == 3
7871 && i.tm.opcode_modifier.vexvvvv == VEXXDS)
7872 || (i.reg_operands == 4 && vex_3_sources)))
7873 {
7874 switch (i.operands)
7875 {
7876 case 2:
7877 source = 0;
7878 break;
7879 case 3:
7880 /* When there are 3 operands, one of them may be immediate,
7881 which may be the first or the last operand. Otherwise,
7882 the first operand must be the shift count register (cl) or it
7883 is an instruction with VexNDS. */
7884 gas_assert (i.imm_operands == 1
7885 || (i.imm_operands == 0
7886 && (i.tm.opcode_modifier.vexvvvv == VEXXDS
7887 || (i.types[0].bitfield.instance == RegC
7888 && i.types[0].bitfield.byte))));
7889 if (operand_type_check (i.types[0], imm)
7890 || (i.types[0].bitfield.instance == RegC
7891 && i.types[0].bitfield.byte))
7892 source = 1;
7893 else
7894 source = 0;
7895 break;
7896 case 4:
7897 /* When there are 4 operands, the first two must be 8bit
7898 immediate operands. The source operand will be the 3rd
7899 one.
7900
7901 For instructions with VexNDS, if the first operand is
7902 an imm8, the source operand is the 2nd one. If the last
7903 operand is imm8, the source operand is the first one. */
7904 gas_assert ((i.imm_operands == 2
7905 && i.types[0].bitfield.imm8
7906 && i.types[1].bitfield.imm8)
7907 || (i.tm.opcode_modifier.vexvvvv == VEXXDS
7908 && i.imm_operands == 1
7909 && (i.types[0].bitfield.imm8
7910 || i.types[i.operands - 1].bitfield.imm8
7911 || i.rounding)));
7912 if (i.imm_operands == 2)
7913 source = 2;
7914 else
7915 {
7916 if (i.types[0].bitfield.imm8)
7917 source = 1;
7918 else
7919 source = 0;
7920 }
7921 break;
7922 case 5:
7923 if (is_evex_encoding (&i.tm))
7924 {
7925 /* For EVEX instructions, when there are 5 operands, the
7926 first one must be an immediate operand. If the second one
7927 is an immediate operand, the source operand is the 3rd
7928 one. If the last one is an immediate operand, the source
7929 operand is the 2nd one. */
7930 gas_assert (i.imm_operands == 2
7931 && i.tm.opcode_modifier.sae
7932 && operand_type_check (i.types[0], imm));
7933 if (operand_type_check (i.types[1], imm))
7934 source = 2;
7935 else if (operand_type_check (i.types[4], imm))
7936 source = 1;
7937 else
7938 abort ();
7939 }
7940 break;
7941 default:
7942 abort ();
7943 }
7944
7945 if (!vex_3_sources)
7946 {
7947 dest = source + 1;
7948
7949 /* RC/SAE operand could be between DEST and SRC. That happens
7950 when one operand is a GPR and the other one is an XMM/YMM/ZMM
7951 register. */
7952 if (i.rounding && i.rounding->operand == (int) dest)
7953 dest++;
7954
7955 if (i.tm.opcode_modifier.vexvvvv == VEXXDS)
7956 {
7957 /* For instructions with VexNDS, the register-only source
7958 operand must be a 32/64bit integer, XMM, YMM, ZMM, or mask
7959 register. It is encoded in VEX prefix. */
7960
7961 i386_operand_type op;
7962 unsigned int vvvv;
7963
7964 /* Swap two source operands if needed. */
7965 if (i.tm.opcode_modifier.swapsources)
7966 {
7967 vvvv = source;
7968 source = dest;
7969 }
7970 else
7971 vvvv = dest;
7972
7973 op = i.tm.operand_types[vvvv];
7974 if ((dest + 1) >= i.operands
7975 || ((op.bitfield.class != Reg
7976 || (!op.bitfield.dword && !op.bitfield.qword))
7977 && op.bitfield.class != RegSIMD
7978 && !operand_type_equal (&op, &regmask)))
7979 abort ();
7980 i.vex.register_specifier = i.op[vvvv].regs;
7981 dest++;
7982 }
7983 }
7984
7985 i.rm.mode = 3;
7986 /* One of the register operands will be encoded in the i.rm.reg
7987 field, the other in the combined i.rm.mode and i.rm.regmem
7988 fields. If no form of this instruction supports a memory
7989 destination operand, then we assume the source operand may
7990 sometimes be a memory operand and so we need to store the
7991 destination in the i.rm.reg field. */
7992 if (!i.tm.opcode_modifier.regmem
7993 && operand_type_check (i.tm.operand_types[dest], anymem) == 0)
7994 {
7995 i.rm.reg = i.op[dest].regs->reg_num;
7996 i.rm.regmem = i.op[source].regs->reg_num;
7997 set_rex_vrex (i.op[dest].regs, REX_R, i.tm.opcode_modifier.sse2avx);
7998 set_rex_vrex (i.op[source].regs, REX_B, FALSE);
7999 }
8000 else
8001 {
8002 i.rm.reg = i.op[source].regs->reg_num;
8003 i.rm.regmem = i.op[dest].regs->reg_num;
8004 set_rex_vrex (i.op[dest].regs, REX_B, i.tm.opcode_modifier.sse2avx);
8005 set_rex_vrex (i.op[source].regs, REX_R, FALSE);
8006 }
8007 if (flag_code != CODE_64BIT && (i.rex & REX_R))
8008 {
8009 if (i.types[!i.tm.opcode_modifier.regmem].bitfield.class != RegCR)
8010 abort ();
8011 i.rex &= ~REX_R;
8012 add_prefix (LOCK_PREFIX_OPCODE);
8013 }
8014 }
8015 else
8016 { /* If it's not 2 reg operands... */
8017 unsigned int mem;
8018
8019 if (i.mem_operands)
8020 {
8021 unsigned int fake_zero_displacement = 0;
8022 unsigned int op;
8023
8024 for (op = 0; op < i.operands; op++)
8025 if (i.flags[op] & Operand_Mem)
8026 break;
8027 gas_assert (op < i.operands);
8028
8029 if (i.tm.opcode_modifier.sib)
8030 {
8031 /* The index register of VSIB shouldn't be RegIZ. */
8032 if (i.tm.opcode_modifier.sib != SIBMEM
8033 && i.index_reg->reg_num == RegIZ)
8034 abort ();
8035
8036 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
8037 if (!i.base_reg)
8038 {
8039 i.sib.base = NO_BASE_REGISTER;
8040 i.sib.scale = i.log2_scale_factor;
8041 i.types[op].bitfield.disp8 = 0;
8042 i.types[op].bitfield.disp16 = 0;
8043 i.types[op].bitfield.disp64 = 0;
8044 if (flag_code != CODE_64BIT || i.prefix[ADDR_PREFIX])
8045 {
8046 /* Must be 32 bit */
8047 i.types[op].bitfield.disp32 = 1;
8048 i.types[op].bitfield.disp32s = 0;
8049 }
8050 else
8051 {
8052 i.types[op].bitfield.disp32 = 0;
8053 i.types[op].bitfield.disp32s = 1;
8054 }
8055 }
8056
8057 /* Since the mandatory SIB always has an index register, the
8058 code logic remains unchanged. A non-mandatory SIB
8059 without an index register is allowed and will be handled
8060 later. */
8061 if (i.index_reg)
8062 {
8063 if (i.index_reg->reg_num == RegIZ)
8064 i.sib.index = NO_INDEX_REGISTER;
8065 else
8066 i.sib.index = i.index_reg->reg_num;
8067 set_rex_vrex (i.index_reg, REX_X, FALSE);
8068 }
8069 }
8070
8071 default_seg = &ds;
8072
8073 if (i.base_reg == 0)
8074 {
8075 i.rm.mode = 0;
8076 if (!i.disp_operands)
8077 fake_zero_displacement = 1;
8078 if (i.index_reg == 0)
8079 {
8080 i386_operand_type newdisp;
8081
8082 /* Check both for VSIB and for a mandatory non-vector SIB. */
8083 gas_assert (!i.tm.opcode_modifier.sib
8084 || i.tm.opcode_modifier.sib == SIBMEM);
8085 /* Operand is just <disp> */
8086 if (flag_code == CODE_64BIT)
8087 {
8088 /* 64bit mode replaces 32bit absolute
8089 addressing with RIP relative addressing, and
8090 absolute addressing is encoded by one of the
8091 redundant SIB forms. */
8092 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
8093 i.sib.base = NO_BASE_REGISTER;
8094 i.sib.index = NO_INDEX_REGISTER;
8095 newdisp = (!i.prefix[ADDR_PREFIX] ? disp32s : disp32);
8096 }
8097 else if ((flag_code == CODE_16BIT)
8098 ^ (i.prefix[ADDR_PREFIX] != 0))
8099 {
8100 i.rm.regmem = NO_BASE_REGISTER_16;
8101 newdisp = disp16;
8102 }
8103 else
8104 {
8105 i.rm.regmem = NO_BASE_REGISTER;
8106 newdisp = disp32;
8107 }
8108 i.types[op] = operand_type_and_not (i.types[op], anydisp);
8109 i.types[op] = operand_type_or (i.types[op], newdisp);
8110 }
8111 else if (!i.tm.opcode_modifier.sib)
8112 {
8113 /* !i.base_reg && i.index_reg */
8114 if (i.index_reg->reg_num == RegIZ)
8115 i.sib.index = NO_INDEX_REGISTER;
8116 else
8117 i.sib.index = i.index_reg->reg_num;
8118 i.sib.base = NO_BASE_REGISTER;
8119 i.sib.scale = i.log2_scale_factor;
8120 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
8121 i.types[op].bitfield.disp8 = 0;
8122 i.types[op].bitfield.disp16 = 0;
8123 i.types[op].bitfield.disp64 = 0;
8124 if (flag_code != CODE_64BIT || i.prefix[ADDR_PREFIX])
8125 {
8126 /* Must be 32 bit */
8127 i.types[op].bitfield.disp32 = 1;
8128 i.types[op].bitfield.disp32s = 0;
8129 }
8130 else
8131 {
8132 i.types[op].bitfield.disp32 = 0;
8133 i.types[op].bitfield.disp32s = 1;
8134 }
8135 if ((i.index_reg->reg_flags & RegRex) != 0)
8136 i.rex |= REX_X;
8137 }
8138 }
8139 /* RIP addressing for 64bit mode. */
8140 else if (i.base_reg->reg_num == RegIP)
8141 {
8142 gas_assert (!i.tm.opcode_modifier.sib);
8143 i.rm.regmem = NO_BASE_REGISTER;
8144 i.types[op].bitfield.disp8 = 0;
8145 i.types[op].bitfield.disp16 = 0;
8146 i.types[op].bitfield.disp32 = 0;
8147 i.types[op].bitfield.disp32s = 1;
8148 i.types[op].bitfield.disp64 = 0;
8149 i.flags[op] |= Operand_PCrel;
8150 if (! i.disp_operands)
8151 fake_zero_displacement = 1;
8152 }
8153 else if (i.base_reg->reg_type.bitfield.word)
8154 {
8155 gas_assert (!i.tm.opcode_modifier.sib);
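/* For reference, the 16-bit ModRM r/m encodings: 0 (%bx,%si),
   1 (%bx,%di), 2 (%bp,%si), 3 (%bp,%di), 4 (%si), 5 (%di),
   6 (%bp) or bare disp16, 7 (%bx). */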
8156 switch (i.base_reg->reg_num)
8157 {
8158 case 3: /* (%bx) */
8159 if (i.index_reg == 0)
8160 i.rm.regmem = 7;
8161 else /* (%bx,%si) -> 0, or (%bx,%di) -> 1 */
8162 i.rm.regmem = i.index_reg->reg_num - 6;
8163 break;
8164 case 5: /* (%bp) */
8165 default_seg = &ss;
8166 if (i.index_reg == 0)
8167 {
8168 i.rm.regmem = 6;
8169 if (operand_type_check (i.types[op], disp) == 0)
8170 {
8171 /* fake (%bp) into 0(%bp) */
8172 if (i.disp_encoding == disp_encoding_16bit)
8173 i.types[op].bitfield.disp16 = 1;
8174 else
8175 i.types[op].bitfield.disp8 = 1;
8176 fake_zero_displacement = 1;
8177 }
8178 }
8179 else /* (%bp,%si) -> 2, or (%bp,%di) -> 3 */
8180 i.rm.regmem = i.index_reg->reg_num - 6 + 2;
8181 break;
8182 default: /* (%si) -> 4 or (%di) -> 5 */
8183 i.rm.regmem = i.base_reg->reg_num - 6 + 4;
8184 }
8185 if (!fake_zero_displacement
8186 && !i.disp_operands
8187 && i.disp_encoding)
8188 {
8189 fake_zero_displacement = 1;
8190 if (i.disp_encoding == disp_encoding_8bit)
8191 i.types[op].bitfield.disp8 = 1;
8192 else
8193 i.types[op].bitfield.disp16 = 1;
8194 }
8195 i.rm.mode = mode_from_disp_size (i.types[op]);
8196 }
8197 else /* i.base_reg and 32/64 bit mode */
8198 {
8199 if (flag_code == CODE_64BIT
8200 && operand_type_check (i.types[op], disp))
8201 {
8202 i.types[op].bitfield.disp16 = 0;
8203 i.types[op].bitfield.disp64 = 0;
8204 if (i.prefix[ADDR_PREFIX] == 0)
8205 {
8206 i.types[op].bitfield.disp32 = 0;
8207 i.types[op].bitfield.disp32s = 1;
8208 }
8209 else
8210 {
8211 i.types[op].bitfield.disp32 = 1;
8212 i.types[op].bitfield.disp32s = 0;
8213 }
8214 }
8215
8216 if (!i.tm.opcode_modifier.sib)
8217 i.rm.regmem = i.base_reg->reg_num;
8218 if ((i.base_reg->reg_flags & RegRex) != 0)
8219 i.rex |= REX_B;
8220 i.sib.base = i.base_reg->reg_num;
8221 /* x86-64 ignores the REX prefix bit here to avoid decoder
8222 complications. */
8223 if (!(i.base_reg->reg_flags & RegRex)
8224 && (i.base_reg->reg_num == EBP_REG_NUM
8225 || i.base_reg->reg_num == ESP_REG_NUM))
8226 default_seg = &ss;
8227 if (i.base_reg->reg_num == 5 && i.disp_operands == 0)
8228 {
8229 fake_zero_displacement = 1;
8230 if (i.disp_encoding == disp_encoding_32bit)
8231 i.types[op].bitfield.disp32 = 1;
8232 else
8233 i.types[op].bitfield.disp8 = 1;
8234 }
8235 i.sib.scale = i.log2_scale_factor;
8236 if (i.index_reg == 0)
8237 {
8238 /* Only check for VSIB. */
8239 gas_assert (i.tm.opcode_modifier.sib != VECSIB128
8240 && i.tm.opcode_modifier.sib != VECSIB256
8241 && i.tm.opcode_modifier.sib != VECSIB512);
8242
8243 /* <disp>(%esp) becomes a two byte modrm with no index
8244 register. We've already stored the code for esp
8245 in i.rm.regmem, i.e. ESCAPE_TO_TWO_BYTE_ADDRESSING.
8246 Any base register besides %esp will not use the
8247 extra modrm byte. */
8248 i.sib.index = NO_INDEX_REGISTER;
8249 }
8250 else if (!i.tm.opcode_modifier.sib)
8251 {
8252 if (i.index_reg->reg_num == RegIZ)
8253 i.sib.index = NO_INDEX_REGISTER;
8254 else
8255 i.sib.index = i.index_reg->reg_num;
8256 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
8257 if ((i.index_reg->reg_flags & RegRex) != 0)
8258 i.rex |= REX_X;
8259 }
8260
8261 if (i.disp_operands
8262 && (i.reloc[op] == BFD_RELOC_386_TLS_DESC_CALL
8263 || i.reloc[op] == BFD_RELOC_X86_64_TLSDESC_CALL))
8264 i.rm.mode = 0;
8265 else
8266 {
8267 if (!fake_zero_displacement
8268 && !i.disp_operands
8269 && i.disp_encoding)
8270 {
8271 fake_zero_displacement = 1;
8272 if (i.disp_encoding == disp_encoding_8bit)
8273 i.types[op].bitfield.disp8 = 1;
8274 else
8275 i.types[op].bitfield.disp32 = 1;
8276 }
8277 i.rm.mode = mode_from_disp_size (i.types[op]);
8278 }
8279 }
8280
8281 if (fake_zero_displacement)
8282 {
8283 /* Fakes a zero displacement assuming that i.types[op]
8284 holds the correct displacement size. */
8285 expressionS *exp;
8286
8287 gas_assert (i.op[op].disps == 0);
8288 exp = &disp_expressions[i.disp_operands++];
8289 i.op[op].disps = exp;
8290 exp->X_op = O_constant;
8291 exp->X_add_number = 0;
8292 exp->X_add_symbol = (symbolS *) 0;
8293 exp->X_op_symbol = (symbolS *) 0;
8294 }
8295
8296 mem = op;
8297 }
8298 else
8299 mem = ~0;
8300
8301 if (i.tm.opcode_modifier.vexsources == XOP2SOURCES)
8302 {
8303 if (operand_type_check (i.types[0], imm))
8304 i.vex.register_specifier = NULL;
8305 else
8306 {
8307 /* VEX.vvvv encodes one of the sources when the first
8308 operand is not an immediate. */
8309 if (i.tm.opcode_modifier.vexw == VEXW0)
8310 i.vex.register_specifier = i.op[0].regs;
8311 else
8312 i.vex.register_specifier = i.op[1].regs;
8313 }
8314
8315 /* Destination is an XMM register encoded in the ModRM.reg
8316 and VEX.R bit. */
8317 i.rm.reg = i.op[2].regs->reg_num;
8318 if ((i.op[2].regs->reg_flags & RegRex) != 0)
8319 i.rex |= REX_R;
8320
8321 /* ModRM.rm and VEX.B encode the other source. */
8322 if (!i.mem_operands)
8323 {
8324 i.rm.mode = 3;
8325
8326 if (i.tm.opcode_modifier.vexw == VEXW0)
8327 i.rm.regmem = i.op[1].regs->reg_num;
8328 else
8329 i.rm.regmem = i.op[0].regs->reg_num;
8330
8331 if ((i.op[1].regs->reg_flags & RegRex) != 0)
8332 i.rex |= REX_B;
8333 }
8334 }
8335 else if (i.tm.opcode_modifier.vexvvvv == VEXLWP)
8336 {
8337 i.vex.register_specifier = i.op[2].regs;
8338 if (!i.mem_operands)
8339 {
8340 i.rm.mode = 3;
8341 i.rm.regmem = i.op[1].regs->reg_num;
8342 if ((i.op[1].regs->reg_flags & RegRex) != 0)
8343 i.rex |= REX_B;
8344 }
8345 }
8346 /* Fill in i.rm.reg or i.rm.regmem field with register operand
8347 (if any) based on i.tm.extension_opcode. Again, we must be
8348 careful to make sure that segment/control/debug/test/MMX
8349 registers are coded into the i.rm.reg field. */
8350 else if (i.reg_operands)
8351 {
8352 unsigned int op;
8353 unsigned int vex_reg = ~0;
8354
8355 for (op = 0; op < i.operands; op++)
8356 if (i.types[op].bitfield.class == Reg
8357 || i.types[op].bitfield.class == RegBND
8358 || i.types[op].bitfield.class == RegMask
8359 || i.types[op].bitfield.class == SReg
8360 || i.types[op].bitfield.class == RegCR
8361 || i.types[op].bitfield.class == RegDR
8362 || i.types[op].bitfield.class == RegTR
8363 || i.types[op].bitfield.class == RegSIMD
8364 || i.types[op].bitfield.class == RegMMX)
8365 break;
8366
8367 if (vex_3_sources)
8368 op = dest;
8369 else if (i.tm.opcode_modifier.vexvvvv == VEXXDS)
8370 {
8371 /* For instructions with VexNDS, the register-only
8372 source operand is encoded in VEX prefix. */
8373 gas_assert (mem != (unsigned int) ~0);
8374
8375 if (op > mem)
8376 {
8377 vex_reg = op++;
8378 gas_assert (op < i.operands);
8379 }
8380 else
8381 {
8382 /* Check register-only source operand when two source
8383 operands are swapped. */
8384 if (!i.tm.operand_types[op].bitfield.baseindex
8385 && i.tm.operand_types[op + 1].bitfield.baseindex)
8386 {
8387 vex_reg = op;
8388 op += 2;
8389 gas_assert (mem == (vex_reg + 1)
8390 && op < i.operands);
8391 }
8392 else
8393 {
8394 vex_reg = op + 1;
8395 gas_assert (vex_reg < i.operands);
8396 }
8397 }
8398 }
8399 else if (i.tm.opcode_modifier.vexvvvv == VEXNDD)
8400 {
8401 /* For instructions with VexNDD, the register destination
8402 is encoded in VEX prefix. */
8403 if (i.mem_operands == 0)
8404 {
8405 /* There is no memory operand. */
8406 gas_assert ((op + 2) == i.operands);
8407 vex_reg = op + 1;
8408 }
8409 else
8410 {
8411 /* There are only 2 non-immediate operands. */
8412 gas_assert (op < i.imm_operands + 2
8413 && i.operands == i.imm_operands + 2);
8414 vex_reg = i.imm_operands + 1;
8415 }
8416 }
8417 else
8418 gas_assert (op < i.operands);
8419
8420 if (vex_reg != (unsigned int) ~0)
8421 {
8422 i386_operand_type *type = &i.tm.operand_types[vex_reg];
8423
8424 if ((type->bitfield.class != Reg
8425 || (!type->bitfield.dword && !type->bitfield.qword))
8426 && type->bitfield.class != RegSIMD
8427 && !operand_type_equal (type, &regmask))
8428 abort ();
8429
8430 i.vex.register_specifier = i.op[vex_reg].regs;
8431 }
8432
8433 /* Don't set OP operand twice. */
8434 if (vex_reg != op)
8435 {
8436 /* If there is an extension opcode to put here, the
8437 register number must be put into the regmem field. */
8438 if (i.tm.extension_opcode != None)
8439 {
8440 i.rm.regmem = i.op[op].regs->reg_num;
8441 set_rex_vrex (i.op[op].regs, REX_B,
8442 i.tm.opcode_modifier.sse2avx);
8443 }
8444 else
8445 {
8446 i.rm.reg = i.op[op].regs->reg_num;
8447 set_rex_vrex (i.op[op].regs, REX_R,
8448 i.tm.opcode_modifier.sse2avx);
8449 }
8450 }
8451
8452 /* Now, if no memory operand has set i.rm.mode = 0, 1, or 2, we
8453 must set it to 3 to indicate this is a register operand
8454 in the regmem field. */
8455 if (!i.mem_operands)
8456 i.rm.mode = 3;
8457 }
8458
8459 /* Fill in i.rm.reg field with extension opcode (if any). */
8460 if (i.tm.extension_opcode != None)
8461 i.rm.reg = i.tm.extension_opcode;
8462 }
8463 return default_seg;
8464 }
8465
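/* Emit BYTE into the current frag, or just account for its size when
   assembling into the absolute section. */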
8466 static INLINE void
8467 frag_opcode_byte (unsigned char byte)
8468 {
8469 if (now_seg != absolute_section)
8470 FRAG_APPEND_1_CHAR (byte);
8471 else
8472 ++abs_section_offset;
8473 }
8474
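/* Given the current CODE16 state of a single-operand branch, return
   CODE16 if a data size prefix would flip the displacement to the other
   size, and 0 otherwise (e.g. when REX.W pins the operand size). */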
8475 static unsigned int
8476 flip_code16 (unsigned int code16)
8477 {
8478 gas_assert (i.tm.operands == 1);
8479
8480 return !(i.prefix[REX_PREFIX] & REX_W)
8481 && (code16 ? i.tm.operand_types[0].bitfield.disp32
8482 || i.tm.operand_types[0].bitfield.disp32s
8483 : i.tm.operand_types[0].bitfield.disp16)
8484 ? CODE16 : 0;
8485 }
8486
8487 static void
8488 output_branch (void)
8489 {
8490 char *p;
8491 int size;
8492 int code16;
8493 int prefix;
8494 relax_substateT subtype;
8495 symbolS *sym;
8496 offsetT off;
8497
8498 if (now_seg == absolute_section)
8499 {
8500 as_bad (_("relaxable branches not supported in absolute section"));
8501 return;
8502 }
8503
8504 code16 = flag_code == CODE_16BIT ? CODE16 : 0;
8505 size = i.disp_encoding == disp_encoding_32bit ? BIG : SMALL;
8506
8507 prefix = 0;
8508 if (i.prefix[DATA_PREFIX] != 0)
8509 {
8510 prefix = 1;
8511 i.prefixes -= 1;
8512 code16 ^= flip_code16 (code16);
8513 }
8514 /* Pentium4 branch hints. */
8515 if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE /* not taken */
8516 || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE /* taken */)
8517 {
8518 prefix++;
8519 i.prefixes--;
8520 }
8521 if (i.prefix[REX_PREFIX] != 0)
8522 {
8523 prefix++;
8524 i.prefixes--;
8525 }
8526
8527 /* BND prefixed jump. */
8528 if (i.prefix[BND_PREFIX] != 0)
8529 {
8530 prefix++;
8531 i.prefixes--;
8532 }
8533
8534 if (i.prefixes != 0)
8535 as_warn (_("skipping prefixes on `%s'"), i.tm.name);
8536
8537 /* It's always a symbol; end the frag & set up for relax.
8538 Make sure there is enough room in this frag for the largest
8539 instruction we may generate in md_convert_frag. This is 2
8540 bytes for the opcode and room for the prefix and largest
8541 displacement. */
8542 frag_grow (prefix + 2 + 4);
8543 /* Prefix and 1 opcode byte go in fr_fix. */
8544 p = frag_more (prefix + 1);
8545 if (i.prefix[DATA_PREFIX] != 0)
8546 *p++ = DATA_PREFIX_OPCODE;
8547 if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE
8548 || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE)
8549 *p++ = i.prefix[SEG_PREFIX];
8550 if (i.prefix[BND_PREFIX] != 0)
8551 *p++ = BND_PREFIX_OPCODE;
8552 if (i.prefix[REX_PREFIX] != 0)
8553 *p++ = i.prefix[REX_PREFIX];
8554 *p = i.tm.base_opcode;
8555
8556 if ((unsigned char) *p == JUMP_PC_RELATIVE)
8557 subtype = ENCODE_RELAX_STATE (UNCOND_JUMP, size);
8558 else if (cpu_arch_flags.bitfield.cpui386)
8559 subtype = ENCODE_RELAX_STATE (COND_JUMP, size);
8560 else
8561 subtype = ENCODE_RELAX_STATE (COND_JUMP86, size);
8562 subtype |= code16;
8563
8564 sym = i.op[0].disps->X_add_symbol;
8565 off = i.op[0].disps->X_add_number;
8566
8567 if (i.op[0].disps->X_op != O_constant
8568 && i.op[0].disps->X_op != O_symbol)
8569 {
8570 /* Handle complex expressions. */
8571 sym = make_expr_symbol (i.op[0].disps);
8572 off = 0;
8573 }
8574
8575 /* 1 possible extra opcode + 4 byte displacement go in var part.
8576 Pass reloc in fr_var. */
8577 frag_var (rs_machine_dependent, 5, i.reloc[0], subtype, sym, off, p);
8578 }
8579
8580 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
8581 /* Return TRUE iff PLT32 relocation should be used for branching to
8582 symbol S. */
8583
8584 static bfd_boolean
8585 need_plt32_p (symbolS *s)
8586 {
8587 /* PLT32 relocation is ELF only. */
8588 if (!IS_ELF)
8589 return FALSE;
8590
8591 #ifdef TE_SOLARIS
8592 /* Don't emit PLT32 relocation on Solaris: neither native linker nor
8593 krtld support it. */
8594 return FALSE;
8595 #endif
8596
8597 /* Since there is no need to prepare for a PLT branch on x86-64, we
8598 can generate R_X86_64_PLT32, instead of R_X86_64_PC32, which can
8599 be used as a marker for 32-bit PC-relative branches. */
8600 if (!object_64bit)
8601 return FALSE;
8602
8603 /* Weak or undefined symbols need a PLT32 relocation. */
8604 if (S_IS_WEAK (s) || !S_IS_DEFINED (s))
8605 return TRUE;
8606
8607 /* A non-global symbol doesn't need a PLT32 relocation. */
8608 if (! S_IS_EXTERNAL (s))
8609 return FALSE;
8610
8611 /* Other global symbols need a PLT32 relocation. NB: Symbols with
8612 non-default visibility are treated as normal global symbols
8613 so that PLT32 relocation can be used as a marker for 32-bit
8614 PC-relative branches. It is useful for linker relaxation. */
8615 return TRUE;
8616 }
8617 #endif
8618
8619 static void
8620 output_jump (void)
8621 {
8622 char *p;
8623 int size;
8624 fixS *fixP;
8625 bfd_reloc_code_real_type jump_reloc = i.reloc[0];
8626
8627 if (i.tm.opcode_modifier.jump == JUMP_BYTE)
8628 {
8629 /* This is a loop or jecxz type instruction. */
8630 size = 1;
8631 if (i.prefix[ADDR_PREFIX] != 0)
8632 {
8633 frag_opcode_byte (ADDR_PREFIX_OPCODE);
8634 i.prefixes -= 1;
8635 }
8636 /* Pentium4 branch hints. */
8637 if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE /* not taken */
8638 || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE /* taken */)
8639 {
8640 frag_opcode_byte (i.prefix[SEG_PREFIX]);
8641 i.prefixes--;
8642 }
8643 }
8644 else
8645 {
8646 int code16;
8647
8648 code16 = 0;
8649 if (flag_code == CODE_16BIT)
8650 code16 = CODE16;
8651
8652 if (i.prefix[DATA_PREFIX] != 0)
8653 {
8654 frag_opcode_byte (DATA_PREFIX_OPCODE);
8655 i.prefixes -= 1;
8656 code16 ^= flip_code16 (code16);
8657 }
8658
8659 size = 4;
8660 if (code16)
8661 size = 2;
8662 }
8663
8664 /* BND prefixed jump. */
8665 if (i.prefix[BND_PREFIX] != 0)
8666 {
8667 frag_opcode_byte (i.prefix[BND_PREFIX]);
8668 i.prefixes -= 1;
8669 }
8670
8671 if (i.prefix[REX_PREFIX] != 0)
8672 {
8673 frag_opcode_byte (i.prefix[REX_PREFIX]);
8674 i.prefixes -= 1;
8675 }
8676
8677 if (i.prefixes != 0)
8678 as_warn (_("skipping prefixes on `%s'"), i.tm.name);
8679
8680 if (now_seg == absolute_section)
8681 {
8682 abs_section_offset += i.tm.opcode_length + size;
8683 return;
8684 }
8685
8686 p = frag_more (i.tm.opcode_length + size);
8687 switch (i.tm.opcode_length)
8688 {
8689 case 2:
8690 *p++ = i.tm.base_opcode >> 8;
8691 /* Fall through. */
8692 case 1:
8693 *p++ = i.tm.base_opcode;
8694 break;
8695 default:
8696 abort ();
8697 }
8698
8699 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
8700 if (size == 4
8701 && jump_reloc == NO_RELOC
8702 && need_plt32_p (i.op[0].disps->X_add_symbol))
8703 jump_reloc = BFD_RELOC_X86_64_PLT32;
8704 #endif
8705
8706 jump_reloc = reloc (size, 1, 1, jump_reloc);
8707
8708 fixP = fix_new_exp (frag_now, p - frag_now->fr_literal, size,
8709 i.op[0].disps, 1, jump_reloc);
8710
8711 /* All jumps handled here are signed, but don't use a signed limit
8712 check for 32 and 16 bit jumps as we want to allow wrap around at
8713 4G and 64k respectively. */
8714 if (size == 1)
8715 fixP->fx_signed = 1;
8716 }
8717
8718 static void
8719 output_interseg_jump (void)
8720 {
8721 char *p;
8722 int size;
8723 int prefix;
8724 int code16;
8725
8726 code16 = 0;
8727 if (flag_code == CODE_16BIT)
8728 code16 = CODE16;
8729
8730 prefix = 0;
8731 if (i.prefix[DATA_PREFIX] != 0)
8732 {
8733 prefix = 1;
8734 i.prefixes -= 1;
8735 code16 ^= CODE16;
8736 }
8737
8738 gas_assert (!i.prefix[REX_PREFIX]);
8739
8740 size = 4;
8741 if (code16)
8742 size = 2;
8743
8744 if (i.prefixes != 0)
8745 as_warn (_("skipping prefixes on `%s'"), i.tm.name);
8746
8747 if (now_seg == absolute_section)
8748 {
8749 abs_section_offset += prefix + 1 + 2 + size;
8750 return;
8751 }
8752
8753 /* 1 opcode byte, 2 segment selector bytes, plus the offset. */
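/* As an illustration (selector value hypothetical): `ljmp $0x10, $target'
   in 32-bit code emits 0xea, a 4-byte offset for `target', then the
   2-byte selector 0x10; a non-constant segment expression instead gets
   a 2-byte fixup, per the code below. */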
8754 p = frag_more (prefix + 1 + 2 + size);
8755
8756 if (i.prefix[DATA_PREFIX] != 0)
8757 *p++ = DATA_PREFIX_OPCODE;
8758
8759 if (i.prefix[REX_PREFIX] != 0)
8760 *p++ = i.prefix[REX_PREFIX];
8761
8762 *p++ = i.tm.base_opcode;
8763 if (i.op[1].imms->X_op == O_constant)
8764 {
8765 offsetT n = i.op[1].imms->X_add_number;
8766
8767 if (size == 2
8768 && !fits_in_unsigned_word (n)
8769 && !fits_in_signed_word (n))
8770 {
8771 as_bad (_("16-bit jump out of range"));
8772 return;
8773 }
8774 md_number_to_chars (p, n, size);
8775 }
8776 else
8777 fix_new_exp (frag_now, p - frag_now->fr_literal, size,
8778 i.op[1].imms, 0, reloc (size, 0, 0, i.reloc[1]));
8779
8780 p += size;
8781 if (i.op[0].imms->X_op == O_constant)
8782 md_number_to_chars (p, (valueT) i.op[0].imms->X_add_number, 2);
8783 else
8784 fix_new_exp (frag_now, p - frag_now->fr_literal, 2,
8785 i.op[0].imms, 0, reloc (2, 0, 0, i.reloc[0]));
8786 }
8787
8788 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
8789 void
8790 x86_cleanup (void)
8791 {
8792 char *p;
8793 asection *seg = now_seg;
8794 subsegT subseg = now_subseg;
8795 asection *sec;
8796 unsigned int alignment, align_size_1;
8797 unsigned int isa_1_descsz, feature_2_descsz, descsz;
8798 unsigned int isa_1_descsz_raw, feature_2_descsz_raw;
8799 unsigned int padding;
8800
8801 if (!IS_ELF || !x86_used_note)
8802 return;
8803
8804 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_X86;
8805
8806 /* The .note.gnu.property section layout:
8807
8808 Field Length Contents
8809 ---- ---- ----
8810 n_namsz 4 4
8811 n_descsz 4 The note descriptor size
8812 n_type 4 NT_GNU_PROPERTY_TYPE_0
8813 n_name 4 "GNU"
8814 n_desc n_descsz The program property array
8815 .... .... ....
8816 */
8817
8818 /* Create the .note.gnu.property section. */
8819 sec = subseg_new (NOTE_GNU_PROPERTY_SECTION_NAME, 0);
8820 bfd_set_section_flags (sec,
8821 (SEC_ALLOC
8822 | SEC_LOAD
8823 | SEC_DATA
8824 | SEC_HAS_CONTENTS
8825 | SEC_READONLY));
8826
8827 if (get_elf_backend_data (stdoutput)->s->elfclass == ELFCLASS64)
8828 {
8829 align_size_1 = 7;
8830 alignment = 3;
8831 }
8832 else
8833 {
8834 align_size_1 = 3;
8835 alignment = 2;
8836 }
8837
8838 bfd_set_section_alignment (sec, alignment);
8839 elf_section_type (sec) = SHT_NOTE;
8840
8841 /* GNU_PROPERTY_X86_ISA_1_USED: 4-byte type + 4-byte data size
8842 + 4-byte data */
8843 isa_1_descsz_raw = 4 + 4 + 4;
8844 /* Align GNU_PROPERTY_X86_ISA_1_USED. */
8845 isa_1_descsz = (isa_1_descsz_raw + align_size_1) & ~align_size_1;
8846
8847 feature_2_descsz_raw = isa_1_descsz;
8848 /* GNU_PROPERTY_X86_FEATURE_2_USED: 4-byte type + 4-byte data size
8849 + 4-byte data */
8850 feature_2_descsz_raw += 4 + 4 + 4;
8851 /* Align GNU_PROPERTY_X86_FEATURE_2_USED. */
8852 feature_2_descsz = ((feature_2_descsz_raw + align_size_1)
8853 & ~align_size_1);
8854
8855 descsz = feature_2_descsz;
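/* For example, for ELFCLASS64 (align_size_1 == 7): isa_1_descsz_raw is
   12 and rounds up to 16, feature_2_descsz_raw is 16 + 12 == 28 and
   rounds up to 32, so descsz == 32 and the note contents below occupy
   4 * 4 + 32 == 48 bytes. */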
8856 /* Section size: n_namsz + n_descsz + n_type + n_name + n_descsz. */
8857 p = frag_more (4 + 4 + 4 + 4 + descsz);
8858
8859 /* Write n_namsz. */
8860 md_number_to_chars (p, (valueT) 4, 4);
8861
8862 /* Write n_descsz. */
8863 md_number_to_chars (p + 4, (valueT) descsz, 4);
8864
8865 /* Write n_type. */
8866 md_number_to_chars (p + 4 * 2, (valueT) NT_GNU_PROPERTY_TYPE_0, 4);
8867
8868 /* Write n_name. */
8869 memcpy (p + 4 * 3, "GNU", 4);
8870
8871 /* Write 4-byte type. */
8872 md_number_to_chars (p + 4 * 4,
8873 (valueT) GNU_PROPERTY_X86_ISA_1_USED, 4);
8874
8875 /* Write 4-byte data size. */
8876 md_number_to_chars (p + 4 * 5, (valueT) 4, 4);
8877
8878 /* Write 4-byte data. */
8879 md_number_to_chars (p + 4 * 6, (valueT) x86_isa_1_used, 4);
8880
8881 /* Zero out the padding. */
8882 padding = isa_1_descsz - isa_1_descsz_raw;
8883 if (padding)
8884 memset (p + 4 * 7, 0, padding);
8885
8886 /* Write 4-byte type. */
8887 md_number_to_chars (p + isa_1_descsz + 4 * 4,
8888 (valueT) GNU_PROPERTY_X86_FEATURE_2_USED, 4);
8889
8890 /* Write 4-byte data size. */
8891 md_number_to_chars (p + isa_1_descsz + 4 * 5, (valueT) 4, 4);
8892
8893 /* Write 4-byte data. */
8894 md_number_to_chars (p + isa_1_descsz + 4 * 6,
8895 (valueT) x86_feature_2_used, 4);
8896
8897 /* Zero out the padding. */
8898 padding = feature_2_descsz - feature_2_descsz_raw;
8899 if (padding)
8900 memset (p + isa_1_descsz + 4 * 7, 0, padding);
8901
8902 /* We probably can't restore the current segment, for there likely
8903 isn't one yet... */
8904 if (seg && subseg)
8905 subseg_set (seg, subseg);
8906 }
8907 #endif
8908
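/* Return the number of bytes emitted for the current instruction so
   far: from offset START_OFF within START_FRAG, across any intervening
   frags, up to FRAG_NOW_PTR within frag_now. */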
8909 static unsigned int
8910 encoding_length (const fragS *start_frag, offsetT start_off,
8911 const char *frag_now_ptr)
8912 {
8913 unsigned int len = 0;
8914
8915 if (start_frag != frag_now)
8916 {
8917 const fragS *fr = start_frag;
8918
8919 do {
8920 len += fr->fr_fix;
8921 fr = fr->fr_next;
8922 } while (fr && fr != frag_now);
8923 }
8924
8925 return len - start_off + (frag_now_ptr - frag_now->fr_literal);
8926 }
8927
8928 /* Return 1 for test, and, cmp, add, sub, inc and dec which may
8929 be macro-fused with conditional jumps.
8930 NB: If TEST/AND/CMP/ADD/SUB/INC/DEC uses a RIP relative address,
8931 or is in one of the following formats:
8932
8933 cmp m, imm
8934 add m, imm
8935 sub m, imm
8936 test m, imm
8937 and m, imm
8938 inc m
8939 dec m
8940
8941 it cannot be fused. */
8942
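/* For instance, `cmp %eax, (%ebx)' followed by `jne' remains a fusion
   candidate, while `cmpl $1, (%ebx)' does not, since it has both a
   memory and an immediate operand. */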
8943 static int
8944 maybe_fused_with_jcc_p (enum mf_cmp_kind* mf_cmp_p)
8945 {
8946 /* No RIP address. */
8947 if (i.base_reg && i.base_reg->reg_num == RegIP)
8948 return 0;
8949
8950 /* No VEX/EVEX encoding. */
8951 if (is_any_vex_encoding (&i.tm))
8952 return 0;
8953
8954 /* add, sub without add/sub m, imm. */
8955 if (i.tm.base_opcode <= 5
8956 || (i.tm.base_opcode >= 0x28 && i.tm.base_opcode <= 0x2d)
8957 || ((i.tm.base_opcode | 3) == 0x83
8958 && (i.tm.extension_opcode == 0x5
8959 || i.tm.extension_opcode == 0x0)))
8960 {
8961 *mf_cmp_p = mf_cmp_alu_cmp;
8962 return !(i.mem_operands && i.imm_operands);
8963 }
8964
8965 /* and without and m, imm. */
8966 if ((i.tm.base_opcode >= 0x20 && i.tm.base_opcode <= 0x25)
8967 || ((i.tm.base_opcode | 3) == 0x83
8968 && i.tm.extension_opcode == 0x4))
8969 {
8970 *mf_cmp_p = mf_cmp_test_and;
8971 return !(i.mem_operands && i.imm_operands);
8972 }
8973
8974 /* test without test m, imm. */
8975 if ((i.tm.base_opcode | 1) == 0x85
8976 || (i.tm.base_opcode | 1) == 0xa9
8977 || ((i.tm.base_opcode | 1) == 0xf7
8978 && i.tm.extension_opcode == 0))
8979 {
8980 *mf_cmp_p = mf_cmp_test_and;
8981 return !(i.mem_operands && i.imm_operands);
8982 }
8983
8984 /* cmp without cmp m, imm. */
8985 if ((i.tm.base_opcode >= 0x38 && i.tm.base_opcode <= 0x3d)
8986 || ((i.tm.base_opcode | 3) == 0x83
8987 && (i.tm.extension_opcode == 0x7)))
8988 {
8989 *mf_cmp_p = mf_cmp_alu_cmp;
8990 return !(i.mem_operands && i.imm_operands);
8991 }
8992
8993 /* inc, dec without inc/dec m. */
8994 if ((i.tm.cpu_flags.bitfield.cpuno64
8995 && (i.tm.base_opcode | 0xf) == 0x4f)
8996 || ((i.tm.base_opcode | 1) == 0xff
8997 && i.tm.extension_opcode <= 0x1))
8998 {
8999 *mf_cmp_p = mf_cmp_incdec;
9000 return !i.mem_operands;
9001 }
9002
9003 return 0;
9004 }
9005
9006 /* Return 1 if a FUSED_JCC_PADDING frag should be generated. */
9007
9008 static int
9009 add_fused_jcc_padding_frag_p (enum mf_cmp_kind* mf_cmp_p)
9010 {
9011 /* NB: This doesn't work with COND_JUMP86 without i386. */
9012 if (!align_branch_power
9013 || now_seg == absolute_section
9014 || !cpu_arch_flags.bitfield.cpui386
9015 || !(align_branch & align_branch_fused_bit))
9016 return 0;
9017
9018 if (maybe_fused_with_jcc_p (mf_cmp_p))
9019 {
9020 if (last_insn.kind == last_insn_other
9021 || last_insn.seg != now_seg)
9022 return 1;
9023 if (flag_debug)
9024 as_warn_where (last_insn.file, last_insn.line,
9025 _("`%s` skips -malign-branch-boundary on `%s`"),
9026 last_insn.name, i.tm.name);
9027 }
9028
9029 return 0;
9030 }
9031
9032 /* Return 1 if a BRANCH_PREFIX frag should be generated. */
9033
9034 static int
9035 add_branch_prefix_frag_p (void)
9036 {
9037 /* NB: This doesn't work with COND_JUMP86 without i386. Don't add a
9038 prefix to PadLock instructions since they include prefixes in the opcode. */
9039 if (!align_branch_power
9040 || !align_branch_prefix_size
9041 || now_seg == absolute_section
9042 || i.tm.cpu_flags.bitfield.cpupadlock
9043 || !cpu_arch_flags.bitfield.cpui386)
9044 return 0;
9045
9046 /* Don't add a prefix if the insn is itself a prefix, or if there is
9047 no operand, in case the segment prefix is special. */
9048 if (!i.operands || i.tm.opcode_modifier.isprefix)
9049 return 0;
9050
9051 if (last_insn.kind == last_insn_other
9052 || last_insn.seg != now_seg)
9053 return 1;
9054
9055 if (flag_debug)
9056 as_warn_where (last_insn.file, last_insn.line,
9057 _("`%s` skips -malign-branch-boundary on `%s`"),
9058 last_insn.name, i.tm.name);
9059
9060 return 0;
9061 }
9062
9063 /* Return 1 if a BRANCH_PADDING frag should be generated. */
9064
9065 static int
9066 add_branch_padding_frag_p (enum align_branch_kind *branch_p,
9067 enum mf_jcc_kind *mf_jcc_p)
9068 {
9069 int add_padding;
9070
9071 /* NB: This doesn't work with COND_JUMP86 without i386. */
9072 if (!align_branch_power
9073 || now_seg == absolute_section
9074 || !cpu_arch_flags.bitfield.cpui386)
9075 return 0;
9076
9077 add_padding = 0;
9078
9079 /* Check for jcc and direct jmp. */
9080 if (i.tm.opcode_modifier.jump == JUMP)
9081 {
9082 if (i.tm.base_opcode == JUMP_PC_RELATIVE)
9083 {
9084 *branch_p = align_branch_jmp;
9085 add_padding = align_branch & align_branch_jmp_bit;
9086 }
9087 else
9088 {
9089 /* Because J<cc> and JN<cc> share the same group in the macro-fusible
9090 table, ignore the lowest bit: e.g. je (0x74) and jne (0x75) map the same. */
9091 *mf_jcc_p = (i.tm.base_opcode & 0x0e) >> 1;
9092 *branch_p = align_branch_jcc;
9093 if ((align_branch & align_branch_jcc_bit))
9094 add_padding = 1;
9095 }
9096 }
9097 else if (is_any_vex_encoding (&i.tm))
9098 return 0;
9099 else if ((i.tm.base_opcode | 1) == 0xc3)
9100 {
9101 /* Near ret. */
9102 *branch_p = align_branch_ret;
9103 if ((align_branch & align_branch_ret_bit))
9104 add_padding = 1;
9105 }
9106 else
9107 {
9108 /* Check for indirect jmp, direct and indirect calls. */
9109 if (i.tm.base_opcode == 0xe8)
9110 {
9111 /* Direct call. */
9112 *branch_p = align_branch_call;
9113 if ((align_branch & align_branch_call_bit))
9114 add_padding = 1;
9115 }
9116 else if (i.tm.base_opcode == 0xff
9117 && (i.tm.extension_opcode == 2
9118 || i.tm.extension_opcode == 4))
9119 {
9120 /* Indirect call and jmp. */
9121 *branch_p = align_branch_indirect;
9122 if ((align_branch & align_branch_indirect_bit))
9123 add_padding = 1;
9124 }
9125
9126 if (add_padding
9127 && i.disp_operands
9128 && tls_get_addr
9129 && (i.op[0].disps->X_op == O_symbol
9130 || (i.op[0].disps->X_op == O_subtract
9131 && i.op[0].disps->X_op_symbol == GOT_symbol)))
9132 {
9133 symbolS *s = i.op[0].disps->X_add_symbol;
9134 /* No padding to call to global or undefined tls_get_addr. */
9135 if ((S_IS_EXTERNAL (s) || !S_IS_DEFINED (s))
9136 && strcmp (S_GET_NAME (s), tls_get_addr) == 0)
9137 return 0;
9138 }
9139 }
9140
9141 if (add_padding
9142 && last_insn.kind != last_insn_other
9143 && last_insn.seg == now_seg)
9144 {
9145 if (flag_debug)
9146 as_warn_where (last_insn.file, last_insn.line,
9147 _("`%s` skips -malign-branch-boundary on `%s`"),
9148 last_insn.name, i.tm.name);
9149 return 0;
9150 }
9151
9152 return add_padding;
9153 }
9154
9155 static void
9156 output_insn (void)
9157 {
9158 fragS *insn_start_frag;
9159 offsetT insn_start_off;
9160 fragS *fragP = NULL;
9161 enum align_branch_kind branch = align_branch_none;
9162 /* The initializer is arbitrary, just to avoid an uninitialized-use
9163 error; it's actually either assigned in add_branch_padding_frag_p
9164 or never used. */
9165 enum mf_jcc_kind mf_jcc = mf_jcc_jo;
9166
9167 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
9168 if (IS_ELF && x86_used_note && now_seg != absolute_section)
9169 {
9170 if (i.tm.cpu_flags.bitfield.cpucmov)
9171 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_CMOV;
9172 if (i.tm.cpu_flags.bitfield.cpusse)
9173 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSE;
9174 if (i.tm.cpu_flags.bitfield.cpusse2)
9175 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSE2;
9176 if (i.tm.cpu_flags.bitfield.cpusse3)
9177 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSE3;
9178 if (i.tm.cpu_flags.bitfield.cpussse3)
9179 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSSE3;
9180 if (i.tm.cpu_flags.bitfield.cpusse4_1)
9181 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSE4_1;
9182 if (i.tm.cpu_flags.bitfield.cpusse4_2)
9183 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_SSE4_2;
9184 if (i.tm.cpu_flags.bitfield.cpuavx)
9185 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX;
9186 if (i.tm.cpu_flags.bitfield.cpuavx2)
9187 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX2;
9188 if (i.tm.cpu_flags.bitfield.cpufma)
9189 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_FMA;
9190 if (i.tm.cpu_flags.bitfield.cpuavx512f)
9191 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512F;
9192 if (i.tm.cpu_flags.bitfield.cpuavx512cd)
9193 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512CD;
9194 if (i.tm.cpu_flags.bitfield.cpuavx512er)
9195 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512ER;
9196 if (i.tm.cpu_flags.bitfield.cpuavx512pf)
9197 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512PF;
9198 if (i.tm.cpu_flags.bitfield.cpuavx512vl)
9199 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512VL;
9200 if (i.tm.cpu_flags.bitfield.cpuavx512dq)
9201 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512DQ;
9202 if (i.tm.cpu_flags.bitfield.cpuavx512bw)
9203 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512BW;
9204 if (i.tm.cpu_flags.bitfield.cpuavx512_4fmaps)
9205 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_4FMAPS;
9206 if (i.tm.cpu_flags.bitfield.cpuavx512_4vnniw)
9207 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_4VNNIW;
9208 if (i.tm.cpu_flags.bitfield.cpuavx512_bitalg)
9209 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_BITALG;
9210 if (i.tm.cpu_flags.bitfield.cpuavx512ifma)
9211 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_IFMA;
9212 if (i.tm.cpu_flags.bitfield.cpuavx512vbmi)
9213 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_VBMI;
9214 if (i.tm.cpu_flags.bitfield.cpuavx512_vbmi2)
9215 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_VBMI2;
9216 if (i.tm.cpu_flags.bitfield.cpuavx512_vnni)
9217 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_VNNI;
9218 if (i.tm.cpu_flags.bitfield.cpuavx512_bf16)
9219 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_AVX512_BF16;
9220
9221 if (i.tm.cpu_flags.bitfield.cpu8087
9222 || i.tm.cpu_flags.bitfield.cpu287
9223 || i.tm.cpu_flags.bitfield.cpu387
9224 || i.tm.cpu_flags.bitfield.cpu687
9225 || i.tm.cpu_flags.bitfield.cpufisttp)
9226 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_X87;
9227 if ((i.xstate & xstate_mmx)
9228 || i.tm.base_opcode == 0xf77 /* emms */
9229 || i.tm.base_opcode == 0xf0e /* femms */)
9230 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_MMX;
9231 if ((i.xstate & xstate_xmm)
9232 || i.tm.cpu_flags.bitfield.cpuwidekl
9233 || i.tm.cpu_flags.bitfield.cpukl)
9234 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XMM;
9235 if ((i.xstate & xstate_ymm) == xstate_ymm)
9236 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_YMM;
9237 if ((i.xstate & xstate_zmm) == xstate_zmm)
9238 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_ZMM;
9239 if (i.tm.cpu_flags.bitfield.cpufxsr)
9240 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_FXSR;
9241 if (i.tm.cpu_flags.bitfield.cpuxsave)
9242 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XSAVE;
9243 if (i.tm.cpu_flags.bitfield.cpuxsaveopt)
9244 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XSAVEOPT;
9245 if (i.tm.cpu_flags.bitfield.cpuxsavec)
9246 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XSAVEC;
9247
9248 if ((i.xstate & xstate_tmm) == xstate_tmm
9249 || i.tm.cpu_flags.bitfield.cpuamx_tile)
9250 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_TMM;
9251 }
9252 #endif
9253
9254 /* Tie dwarf2 debug info to the address at the start of the insn.
9255 We can't do this after the insn has been output as the current
9256 frag may have been closed off, e.g. by frag_var. */
9257 dwarf2_emit_insn (0);
9258
9259 insn_start_frag = frag_now;
9260 insn_start_off = frag_now_fix ();
9261
9262 if (add_branch_padding_frag_p (&branch, &mf_jcc))
9263 {
9264 char *p;
9265 /* Branch can be 8 bytes. Leave some room for prefixes. */
9266 unsigned int max_branch_padding_size = 14;
9267
9268 /* Align section to boundary. */
9269 record_alignment (now_seg, align_branch_power);
9270
9271 /* Make room for padding. */
9272 frag_grow (max_branch_padding_size);
9273
9274 /* Start of the padding. */
9275 p = frag_more (0);
9276
9277 fragP = frag_now;
9278
9279 frag_var (rs_machine_dependent, max_branch_padding_size, 0,
9280 ENCODE_RELAX_STATE (BRANCH_PADDING, 0),
9281 NULL, 0, p);
9282
9283 fragP->tc_frag_data.mf_type = mf_jcc;
9284 fragP->tc_frag_data.branch_type = branch;
9285 fragP->tc_frag_data.max_bytes = max_branch_padding_size;
9286 }
9287
9288 /* Output jumps. */
9289 if (i.tm.opcode_modifier.jump == JUMP)
9290 output_branch ();
9291 else if (i.tm.opcode_modifier.jump == JUMP_BYTE
9292 || i.tm.opcode_modifier.jump == JUMP_DWORD)
9293 output_jump ();
9294 else if (i.tm.opcode_modifier.jump == JUMP_INTERSEGMENT)
9295 output_interseg_jump ();
9296 else
9297 {
9298 /* Output normal instructions here. */
9299 char *p;
9300 unsigned char *q;
9301 unsigned int j;
9302 unsigned int prefix;
9303 enum mf_cmp_kind mf_cmp;
9304
9305 if (avoid_fence
9306 && (i.tm.base_opcode == 0xfaee8
9307 || i.tm.base_opcode == 0xfaef0
9308 || i.tm.base_opcode == 0xfaef8))
9309 {
9310 /* Encode lfence, mfence, and sfence as
9311 f0 83 04 24 00 lock addl $0x0, (%{re}sp). */
9312 if (now_seg != absolute_section)
9313 {
9314 offsetT val = 0x240483f0ULL;
9315
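/* md_number_to_chars stores VAL little-endian, yielding exactly the
   f0 83 04 24 00 sequence quoted above. */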
9316 p = frag_more (5);
9317 md_number_to_chars (p, val, 5);
9318 }
9319 else
9320 abs_section_offset += 5;
9321 return;
9322 }
9323
9324 /* Some processors fail on the LOCK prefix. This option makes the
9325 assembler ignore the LOCK prefix and serves as a workaround. */
9326 if (omit_lock_prefix)
9327 {
9328 if (i.tm.base_opcode == LOCK_PREFIX_OPCODE)
9329 return;
9330 i.prefix[LOCK_PREFIX] = 0;
9331 }
9332
9333 if (branch)
9334 /* Skip if this is a branch. */
9335 ;
9336 else if (add_fused_jcc_padding_frag_p (&mf_cmp))
9337 {
9338 /* Make room for padding. */
9339 frag_grow (MAX_FUSED_JCC_PADDING_SIZE);
9340 p = frag_more (0);
9341
9342 fragP = frag_now;
9343
9344 frag_var (rs_machine_dependent, MAX_FUSED_JCC_PADDING_SIZE, 0,
9345 ENCODE_RELAX_STATE (FUSED_JCC_PADDING, 0),
9346 NULL, 0, p);
9347
9348 fragP->tc_frag_data.mf_type = mf_cmp;
9349 fragP->tc_frag_data.branch_type = align_branch_fused;
9350 fragP->tc_frag_data.max_bytes = MAX_FUSED_JCC_PADDING_SIZE;
9351 }
9352 else if (add_branch_prefix_frag_p ())
9353 {
9354 unsigned int max_prefix_size = align_branch_prefix_size;
9355
9356 /* Make room for padding. */
9357 frag_grow (max_prefix_size);
9358 p = frag_more (0);
9359
9360 fragP = frag_now;
9361
9362 frag_var (rs_machine_dependent, max_prefix_size, 0,
9363 ENCODE_RELAX_STATE (BRANCH_PREFIX, 0),
9364 NULL, 0, p);
9365
9366 fragP->tc_frag_data.max_bytes = max_prefix_size;
9367 }
9368
9369 /* Since the VEX/EVEX prefix contains the implicit prefix, we
9370 don't need the explicit prefix. */
9371 if (!i.tm.opcode_modifier.vex && !i.tm.opcode_modifier.evex)
9372 {
9373 switch (i.tm.opcode_length)
9374 {
9375 case 3:
9376 if (i.tm.base_opcode & 0xff000000)
9377 {
9378 prefix = (i.tm.base_opcode >> 24) & 0xff;
9379 if (!i.tm.cpu_flags.bitfield.cpupadlock
9380 || prefix != REPE_PREFIX_OPCODE
9381 || (i.prefix[REP_PREFIX] != REPE_PREFIX_OPCODE))
9382 add_prefix (prefix);
9383 }
9384 break;
9385 case 2:
9386 if ((i.tm.base_opcode & 0xff0000) != 0)
9387 {
9388 prefix = (i.tm.base_opcode >> 16) & 0xff;
9389 add_prefix (prefix);
9390 }
9391 break;
9392 case 1:
9393 break;
9394 case 0:
9395 /* Check for pseudo prefixes. */
9396 as_bad_where (insn_start_frag->fr_file,
9397 insn_start_frag->fr_line,
9398 _("pseudo prefix without instruction"));
9399 return;
9400 default:
9401 abort ();
9402 }
9403
9404 #if defined (OBJ_MAYBE_ELF) || defined (OBJ_ELF)
9405 /* For x32, add a dummy REX_OPCODE prefix for mov/add with
9406 R_X86_64_GOTTPOFF relocation so that the linker can safely
9407 perform IE->LE optimization. A dummy REX_OPCODE prefix
9408 is also needed for lea with R_X86_64_GOTPC32_TLSDESC
9409 relocation for GDesc -> IE/LE optimization. */
9410 if (x86_elf_abi == X86_64_X32_ABI
9411 && i.operands == 2
9412 && (i.reloc[0] == BFD_RELOC_X86_64_GOTTPOFF
9413 || i.reloc[0] == BFD_RELOC_X86_64_GOTPC32_TLSDESC)
9414 && i.prefix[REX_PREFIX] == 0)
9415 add_prefix (REX_OPCODE);
9416 #endif
9417
9418 /* The prefix bytes. */
9419 for (j = ARRAY_SIZE (i.prefix), q = i.prefix; j > 0; j--, q++)
9420 if (*q)
9421 frag_opcode_byte (*q);
9422 }
9423 else
9424 {
9425 for (j = 0, q = i.prefix; j < ARRAY_SIZE (i.prefix); j++, q++)
9426 if (*q)
9427 switch (j)
9428 {
9429 case SEG_PREFIX:
9430 case ADDR_PREFIX:
9431 frag_opcode_byte (*q);
9432 break;
9433 default:
9434 /* There should be no other prefixes for instructions
9435 with VEX prefix. */
9436 abort ();
9437 }
9438
9439 /* For EVEX instructions i.vrex should become 0 after
9440 build_evex_prefix. For VEX instructions the upper 16 registers
9441 aren't available, so VREX should be 0. */
9442 if (i.vrex)
9443 abort ();
9444 /* Now the VEX prefix. */
9445 if (now_seg != absolute_section)
9446 {
9447 p = frag_more (i.vex.length);
9448 for (j = 0; j < i.vex.length; j++)
9449 p[j] = i.vex.bytes[j];
9450 }
9451 else
9452 abs_section_offset += i.vex.length;
9453 }
9454
9455 /* Now the opcode; be careful about word order here! */
9456 if (now_seg == absolute_section)
9457 abs_section_offset += i.tm.opcode_length;
9458 else if (i.tm.opcode_length == 1)
9459 {
9460 FRAG_APPEND_1_CHAR (i.tm.base_opcode);
9461 }
9462 else
9463 {
9464 switch (i.tm.opcode_length)
9465 {
9466 case 4:
9467 p = frag_more (4);
9468 *p++ = (i.tm.base_opcode >> 24) & 0xff;
9469 *p++ = (i.tm.base_opcode >> 16) & 0xff;
9470 break;
9471 case 3:
9472 p = frag_more (3);
9473 *p++ = (i.tm.base_opcode >> 16) & 0xff;
9474 break;
9475 case 2:
9476 p = frag_more (2);
9477 break;
9478 default:
9479 abort ();
9480 break;
9481 }
9482
9483 /* Put out high byte first: can't use md_number_to_chars! */
9484 *p++ = (i.tm.base_opcode >> 8) & 0xff;
9485 *p = i.tm.base_opcode & 0xff;
9486 }
9487
9488 /* Now the modrm byte and sib byte (if present). */
9489 if (i.tm.opcode_modifier.modrm)
9490 {
9491 frag_opcode_byte ((i.rm.regmem << 0)
9492 | (i.rm.reg << 3)
9493 | (i.rm.mode << 6));
9494 /* If i.rm.regmem == ESP (4)
9495 && i.rm.mode != (Register mode)
9496 && not 16 bit
9497 ==> need a second modrm (SIB) byte. */
9498 if (i.rm.regmem == ESCAPE_TO_TWO_BYTE_ADDRESSING
9499 && i.rm.mode != 3
9500 && !(i.base_reg && i.base_reg->reg_type.bitfield.word))
9501 frag_opcode_byte ((i.sib.base << 0)
9502 | (i.sib.index << 3)
9503 | (i.sib.scale << 6));
9504 }
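/* As an illustration: for `mov %eax, (%esp)' the bytes emitted above
   are ModRM 0x04 (mode 0, reg 0 for %eax, regmem 4, the SIB escape)
   followed by SIB 0x24 (scale 0, index 4 for "none", base 4 for
   %esp). */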
9505
9506 if (i.disp_operands)
9507 output_disp (insn_start_frag, insn_start_off);
9508
9509 if (i.imm_operands)
9510 output_imm (insn_start_frag, insn_start_off);
9511
9512 /*
9513 * frag_now_fix () returning plain abs_section_offset when we're in the
9514 * absolute section, and abs_section_offset not getting updated as data
9515 * gets added to the frag breaks the logic below.
9516 */
9517 if (now_seg != absolute_section)
9518 {
9519 j = encoding_length (insn_start_frag, insn_start_off, frag_more (0));
9520 if (j > 15)
9521 as_warn (_("instruction length of %u bytes exceeds the limit of 15"),
9522 j);
9523 else if (fragP)
9524 {
9525 /* NB: Don't add prefix with GOTPC relocation since
9526 output_disp() above depends on the fixed encoding
9527 length. Can't add prefix with TLS relocation since
9528 it breaks TLS linker optimization. */
9529 unsigned int max = i.has_gotpc_tls_reloc ? 0 : 15 - j;
9530 /* Prefix count on the current instruction. */
9531 unsigned int count = i.vex.length;
9532 unsigned int k;
9533 for (k = 0; k < ARRAY_SIZE (i.prefix); k++)
9534 /* REX byte is encoded in VEX/EVEX prefix. */
9535 if (i.prefix[k] && (k != REX_PREFIX || !i.vex.length))
9536 count++;
9537
9538 /* Count prefixes for extended opcode maps. */
9539 if (!i.vex.length)
9540 switch (i.tm.opcode_length)
9541 {
9542 case 3:
9543 if (((i.tm.base_opcode >> 16) & 0xff) == 0xf)
9544 {
9545 count++;
9546 switch ((i.tm.base_opcode >> 8) & 0xff)
9547 {
9548 case 0x38:
9549 case 0x3a:
9550 count++;
9551 break;
9552 default:
9553 break;
9554 }
9555 }
9556 break;
9557 case 2:
9558 if (((i.tm.base_opcode >> 8) & 0xff) == 0xf)
9559 count++;
9560 break;
9561 case 1:
9562 break;
9563 default:
9564 abort ();
9565 }
9566
9567 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype)
9568 == BRANCH_PREFIX)
9569 {
9570 /* Set the maximum prefix size in BRANCH_PREFIX
9571 frag. */
9572 if (fragP->tc_frag_data.max_bytes > max)
9573 fragP->tc_frag_data.max_bytes = max;
9574 if (fragP->tc_frag_data.max_bytes > count)
9575 fragP->tc_frag_data.max_bytes -= count;
9576 else
9577 fragP->tc_frag_data.max_bytes = 0;
9578 }
9579 else
9580 {
9581 /* Remember the maximum prefix size in FUSED_JCC_PADDING
9582 frag. */
9583 unsigned int max_prefix_size;
9584 if (align_branch_prefix_size > max)
9585 max_prefix_size = max;
9586 else
9587 max_prefix_size = align_branch_prefix_size;
9588 if (max_prefix_size > count)
9589 fragP->tc_frag_data.max_prefix_length
9590 = max_prefix_size - count;
9591 }
9592
9593 /* Use existing segment prefix if possible. Use CS
9594 segment prefix in 64-bit mode. In 32-bit mode, use SS
9595 segment prefix with ESP/EBP base register and use DS
9596 segment prefix without ESP/EBP base register. */
9597 if (i.prefix[SEG_PREFIX])
9598 fragP->tc_frag_data.default_prefix = i.prefix[SEG_PREFIX];
9599 else if (flag_code == CODE_64BIT)
9600 fragP->tc_frag_data.default_prefix = CS_PREFIX_OPCODE;
9601 else if (i.base_reg
9602 && (i.base_reg->reg_num == 4
9603 || i.base_reg->reg_num == 5))
9604 fragP->tc_frag_data.default_prefix = SS_PREFIX_OPCODE;
9605 else
9606 fragP->tc_frag_data.default_prefix = DS_PREFIX_OPCODE;
9607 }
9608 }
9609 }
9610
9611 /* NB: This doesn't work with COND_JUMP86 without i386. */
9612 if (align_branch_power
9613 && now_seg != absolute_section
9614 && cpu_arch_flags.bitfield.cpui386)
9615 {
9616 /* Terminate each frag so that we can add prefix and check for
9617 fused jcc. */
9618 frag_wane (frag_now);
9619 frag_new (0);
9620 }
9621
9622 #ifdef DEBUG386
9623 if (flag_debug)
9624 {
9625 pi ("" /*line*/, &i);
9626 }
9627 #endif /* DEBUG386 */
9628 }
9629
9630 /* Return the size of the displacement operand N. */
9631
9632 static int
9633 disp_size (unsigned int n)
9634 {
9635 int size = 4;
9636
9637 if (i.types[n].bitfield.disp64)
9638 size = 8;
9639 else if (i.types[n].bitfield.disp8)
9640 size = 1;
9641 else if (i.types[n].bitfield.disp16)
9642 size = 2;
9643 return size;
9644 }
9645
9646 /* Return the size of the immediate operand N. */
9647
9648 static int
9649 imm_size (unsigned int n)
9650 {
9651 int size = 4;
9652 if (i.types[n].bitfield.imm64)
9653 size = 8;
9654 else if (i.types[n].bitfield.imm8 || i.types[n].bitfield.imm8s)
9655 size = 1;
9656 else if (i.types[n].bitfield.imm16)
9657 size = 2;
9658 return size;
9659 }
9660
9661 static void
9662 output_disp (fragS *insn_start_frag, offsetT insn_start_off)
9663 {
9664 char *p;
9665 unsigned int n;
9666
9667 for (n = 0; n < i.operands; n++)
9668 {
9669 if (operand_type_check (i.types[n], disp))
9670 {
9671 int size = disp_size (n);
9672
9673 if (now_seg == absolute_section)
9674 abs_section_offset += size;
9675 else if (i.op[n].disps->X_op == O_constant)
9676 {
9677 offsetT val = i.op[n].disps->X_add_number;
9678
9679 val = offset_in_range (val >> (size == 1 ? i.memshift : 0),
9680 size);
9681 p = frag_more (size);
9682 md_number_to_chars (p, val, size);
9683 }
9684 else
9685 {
9686 enum bfd_reloc_code_real reloc_type;
9687 int sign = i.types[n].bitfield.disp32s;
9688 int pcrel = (i.flags[n] & Operand_PCrel) != 0;
9689 fixS *fixP;
9690
9691 /* We can't have 8 bit displacement here. */
9692 gas_assert (!i.types[n].bitfield.disp8);
9693
9694 /* The PC relative address is computed relative
9695 to the instruction boundary, so in case an immediate
9696 field follows, we need to adjust the value. */
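/* E.g., for "testl $0x12345678, sym(%rip)" (an illustrative case)
   the 4-byte immediate follows the displacement, so the loop below
   subtracts 4 from the displacement's addend. */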
9697 if (pcrel && i.imm_operands)
9698 {
9699 unsigned int n1;
9700 int sz = 0;
9701
9702 for (n1 = 0; n1 < i.operands; n1++)
9703 if (operand_type_check (i.types[n1], imm))
9704 {
9705 /* Only one immediate is allowed for PC
9706 relative address. */
9707 gas_assert (sz == 0);
9708 sz = imm_size (n1);
9709 i.op[n].disps->X_add_number -= sz;
9710 }
9711 /* We should find the immediate. */
9712 gas_assert (sz != 0);
9713 }
9714
9715 p = frag_more (size);
9716 reloc_type = reloc (size, pcrel, sign, i.reloc[n]);
9717 if (GOT_symbol
9718 && GOT_symbol == i.op[n].disps->X_add_symbol
9719 && (((reloc_type == BFD_RELOC_32
9720 || reloc_type == BFD_RELOC_X86_64_32S
9721 || (reloc_type == BFD_RELOC_64
9722 && object_64bit))
9723 && (i.op[n].disps->X_op == O_symbol
9724 || (i.op[n].disps->X_op == O_add
9725 && ((symbol_get_value_expression
9726 (i.op[n].disps->X_op_symbol)->X_op)
9727 == O_subtract))))
9728 || reloc_type == BFD_RELOC_32_PCREL))
9729 {
9730 if (!object_64bit)
9731 {
9732 reloc_type = BFD_RELOC_386_GOTPC;
9733 i.has_gotpc_tls_reloc = TRUE;
9734 i.op[n].imms->X_add_number +=
9735 encoding_length (insn_start_frag, insn_start_off, p);
9736 }
9737 else if (reloc_type == BFD_RELOC_64)
9738 reloc_type = BFD_RELOC_X86_64_GOTPC64;
9739 else
9740 /* Don't do the adjustment for x86-64, as there
9741 the pcrel addressing is relative to the _next_
9742 insn, and that is taken care of in other code. */
9743 reloc_type = BFD_RELOC_X86_64_GOTPC32;
9744 }
9745 else if (align_branch_power)
9746 {
9747 switch (reloc_type)
9748 {
9749 case BFD_RELOC_386_TLS_GD:
9750 case BFD_RELOC_386_TLS_LDM:
9751 case BFD_RELOC_386_TLS_IE:
9752 case BFD_RELOC_386_TLS_IE_32:
9753 case BFD_RELOC_386_TLS_GOTIE:
9754 case BFD_RELOC_386_TLS_GOTDESC:
9755 case BFD_RELOC_386_TLS_DESC_CALL:
9756 case BFD_RELOC_X86_64_TLSGD:
9757 case BFD_RELOC_X86_64_TLSLD:
9758 case BFD_RELOC_X86_64_GOTTPOFF:
9759 case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
9760 case BFD_RELOC_X86_64_TLSDESC_CALL:
9761 i.has_gotpc_tls_reloc = TRUE;
9762 default:
9763 break;
9764 }
9765 }
9766 fixP = fix_new_exp (frag_now, p - frag_now->fr_literal,
9767 size, i.op[n].disps, pcrel,
9768 reloc_type);
9769 /* Check for "call/jmp *mem", "mov mem, %reg",
9770 "test %reg, mem" and "binop mem, %reg" where binop
9771 is one of adc, add, and, cmp, or, sbb, sub, xor
9772 instructions without data prefix. Always generate
9773 R_386_GOT32X for "sym*GOT" operand in 32-bit mode. */
9774 if (i.prefix[DATA_PREFIX] == 0
9775 && (generate_relax_relocations
9776 || (!object_64bit
9777 && i.rm.mode == 0
9778 && i.rm.regmem == 5))
9779 && (i.rm.mode == 2
9780 || (i.rm.mode == 0 && i.rm.regmem == 5))
9781 && !is_any_vex_encoding(&i.tm)
9782 && ((i.operands == 1
9783 && i.tm.base_opcode == 0xff
9784 && (i.rm.reg == 2 || i.rm.reg == 4))
9785 || (i.operands == 2
9786 && (i.tm.base_opcode == 0x8b
9787 || i.tm.base_opcode == 0x85
9788 || (i.tm.base_opcode & ~0x38) == 0x03))))
9789 {
9790 if (object_64bit)
9791 {
9792 fixP->fx_tcbit = i.rex != 0;
9793 if (i.base_reg
9794 && (i.base_reg->reg_num == RegIP))
9795 fixP->fx_tcbit2 = 1;
9796 }
9797 else
9798 fixP->fx_tcbit2 = 1;
9799 }
9800 }
9801 }
9802 }
9803 }
9804
9805 static void
9806 output_imm (fragS *insn_start_frag, offsetT insn_start_off)
9807 {
9808 char *p;
9809 unsigned int n;
9810
9811 for (n = 0; n < i.operands; n++)
9812 {
9813 /* Skip SAE/RC Imm operand in EVEX. It is already handled. */
9814 if (i.rounding && (int) n == i.rounding->operand)
9815 continue;
9816
9817 if (operand_type_check (i.types[n], imm))
9818 {
9819 int size = imm_size (n);
9820
9821 if (now_seg == absolute_section)
9822 abs_section_offset += size;
9823 else if (i.op[n].imms->X_op == O_constant)
9824 {
9825 offsetT val;
9826
9827 val = offset_in_range (i.op[n].imms->X_add_number,
9828 size);
9829 p = frag_more (size);
9830 md_number_to_chars (p, val, size);
9831 }
9832 else
9833 {
9834 /* Not absolute_section.
9835 Need a 32-bit fixup (we don't support 8-bit
9836 non-absolute immediates). Try to support other
9837 sizes ... */
9838 enum bfd_reloc_code_real reloc_type;
9839 int sign;
9840
9841 if (i.types[n].bitfield.imm32s
9842 && (i.suffix == QWORD_MNEM_SUFFIX
9843 || (!i.suffix && i.tm.opcode_modifier.no_lsuf)))
9844 sign = 1;
9845 else
9846 sign = 0;
9847
9848 p = frag_more (size);
9849 reloc_type = reloc (size, 0, sign, i.reloc[n]);
9850
9851 /* This is tough to explain. We end up with this one if we
9852 * have operands that look like
9853 * "_GLOBAL_OFFSET_TABLE_+[.-.L284]". The goal here is to
9854 * obtain the absolute address of the GOT, and it is strongly
9855 * preferable from a performance point of view to avoid using
9856 * a runtime relocation for this. The actual sequence of
9857 * instructions often looks something like:
9858 *
9859 * call .L66
9860 * .L66:
9861 * popl %ebx
9862 * addl $_GLOBAL_OFFSET_TABLE_+[.-.L66],%ebx
9863 *
9864 * The call and pop essentially return the absolute address
9865 * of the label .L66 and store it in %ebx. The linker itself
9866 * will ultimately change the first operand of the addl so
9867 * that %ebx points to the GOT, but to keep things simple, the
9868 * .o file must have this operand set so that it generates not
9869 * the absolute address of .L66, but the absolute address of
9870 * itself. This allows the linker itself to simply treat a GOTPC
9871 * relocation as asking for a pcrel offset to the GOT to be
9872 * added in, and the addend of the relocation is stored in the
9873 * operand field for the instruction itself.
9874 *
9875 * Our job here is to fix the operand so that it would add
9876 * the correct offset so that %ebx would point to itself. The
9877 * thing that is tricky is that .-.L66 will point to the
9878 * beginning of the instruction, so we need to further modify
9879 * the operand so that it will point to itself. There are
9880 * other cases where you have something like:
9881 *
9882 * .long $_GLOBAL_OFFSET_TABLE_+[.-.L66]
9883 *
9884 * and here no correction would be required. Internally in
9885 * the assembler we treat operands of this form as not being
9886 * pcrel since the '.' is explicitly mentioned, and I wonder
9887 * whether it would simplify matters to do it this way. Who
9888 * knows. In earlier versions of the PIC patches, the
9889 * pcrel_adjust field was used to store the correction, but
9890 * since the expression is not pcrel, I felt it would be
9891 * confusing to do it this way. */
9892
9893 if ((reloc_type == BFD_RELOC_32
9894 || reloc_type == BFD_RELOC_X86_64_32S
9895 || reloc_type == BFD_RELOC_64)
9896 && GOT_symbol
9897 && GOT_symbol == i.op[n].imms->X_add_symbol
9898 && (i.op[n].imms->X_op == O_symbol
9899 || (i.op[n].imms->X_op == O_add
9900 && ((symbol_get_value_expression
9901 (i.op[n].imms->X_op_symbol)->X_op)
9902 == O_subtract))))
9903 {
9904 if (!object_64bit)
9905 reloc_type = BFD_RELOC_386_GOTPC;
9906 else if (size == 4)
9907 reloc_type = BFD_RELOC_X86_64_GOTPC32;
9908 else if (size == 8)
9909 reloc_type = BFD_RELOC_X86_64_GOTPC64;
9910 i.has_gotpc_tls_reloc = TRUE;
9911 i.op[n].imms->X_add_number +=
9912 encoding_length (insn_start_frag, insn_start_off, p);
9913 }
9914 fix_new_exp (frag_now, p - frag_now->fr_literal, size,
9915 i.op[n].imms, 0, reloc_type);
9916 }
9917 }
9918 }
9919 }
9920 \f
9921 /* x86_cons_fix_new is called via the expression parsing code when a
9922 reloc is needed. We use this hook to get the correct .got reloc. */
9923 static int cons_sign = -1;
9924
9925 void
9926 x86_cons_fix_new (fragS *frag, unsigned int off, unsigned int len,
9927 expressionS *exp, bfd_reloc_code_real_type r)
9928 {
9929 r = reloc (len, 0, cons_sign, r);
9930
9931 #ifdef TE_PE
9932 if (exp->X_op == O_secrel)
9933 {
9934 exp->X_op = O_symbol;
9935 r = BFD_RELOC_32_SECREL;
9936 }
9937 #endif
9938
9939 fix_new_exp (frag, off, len, exp, 0, r);
9940 }
9941
9942 /* Export the ABI address size for use by TC_ADDRESS_BYTES for the
9943 purpose of the `.dc.a' internal pseudo-op. */
9944
9945 int
9946 x86_address_bytes (void)
9947 {
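/* x32 (bfd_mach_x64_32) uses 4-byte addresses even though
   bits_per_address is 64. */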
9948 if ((stdoutput->arch_info->mach & bfd_mach_x64_32))
9949 return 4;
9950 return stdoutput->arch_info->bits_per_address / 8;
9951 }
9952
9953 #if !(defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) || defined (OBJ_MACH_O)) \
9954 || defined (LEX_AT)
9955 # define lex_got(reloc, adjust, types) NULL
9956 #else
9957 /* Parse operands of the form
9958 <symbol>@GOTOFF+<nnn>
9959 and similar .plt or .got references.
9960
9961 If we find one, set up the correct relocation in RELOC and copy the
9962 input string, minus the `@GOTOFF' into a malloc'd buffer for
9963 parsing by the calling routine. Return this buffer, and if ADJUST
9964 is non-null set it to the length of the string we removed from the
9965 input line. Otherwise return NULL. */
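/* For example, given "foo@GOTOFF+4" this returns a buffer holding
   "foo +4" (the reloc token replaced by a space) and sets *rel to
   BFD_RELOC_386_GOTOFF, or BFD_RELOC_X86_64_GOTOFF64 for 64-bit. */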
9966 static char *
9967 lex_got (enum bfd_reloc_code_real *rel,
9968 int *adjust,
9969 i386_operand_type *types)
9970 {
9971 /* Some of the relocations depend on the size of the field to
9972 be relocated. But in our callers i386_immediate and i386_displacement
9973 we don't yet know the operand size (this will be set by insn
9974 matching). Hence we record the word32 relocation here,
9975 and adjust the reloc according to the real size in reloc(). */
9976 static const struct {
9977 const char *str;
9978 int len;
9979 const enum bfd_reloc_code_real rel[2];
9980 const i386_operand_type types64;
9981 } gotrel[] = {
9982 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
9983 { STRING_COMMA_LEN ("SIZE"), { BFD_RELOC_SIZE32,
9984 BFD_RELOC_SIZE32 },
9985 OPERAND_TYPE_IMM32_64 },
9986 #endif
9987 { STRING_COMMA_LEN ("PLTOFF"), { _dummy_first_bfd_reloc_code_real,
9988 BFD_RELOC_X86_64_PLTOFF64 },
9989 OPERAND_TYPE_IMM64 },
9990 { STRING_COMMA_LEN ("PLT"), { BFD_RELOC_386_PLT32,
9991 BFD_RELOC_X86_64_PLT32 },
9992 OPERAND_TYPE_IMM32_32S_DISP32 },
9993 { STRING_COMMA_LEN ("GOTPLT"), { _dummy_first_bfd_reloc_code_real,
9994 BFD_RELOC_X86_64_GOTPLT64 },
9995 OPERAND_TYPE_IMM64_DISP64 },
9996 { STRING_COMMA_LEN ("GOTOFF"), { BFD_RELOC_386_GOTOFF,
9997 BFD_RELOC_X86_64_GOTOFF64 },
9998 OPERAND_TYPE_IMM64_DISP64 },
9999 { STRING_COMMA_LEN ("GOTPCREL"), { _dummy_first_bfd_reloc_code_real,
10000 BFD_RELOC_X86_64_GOTPCREL },
10001 OPERAND_TYPE_IMM32_32S_DISP32 },
10002 { STRING_COMMA_LEN ("TLSGD"), { BFD_RELOC_386_TLS_GD,
10003 BFD_RELOC_X86_64_TLSGD },
10004 OPERAND_TYPE_IMM32_32S_DISP32 },
10005 { STRING_COMMA_LEN ("TLSLDM"), { BFD_RELOC_386_TLS_LDM,
10006 _dummy_first_bfd_reloc_code_real },
10007 OPERAND_TYPE_NONE },
10008 { STRING_COMMA_LEN ("TLSLD"), { _dummy_first_bfd_reloc_code_real,
10009 BFD_RELOC_X86_64_TLSLD },
10010 OPERAND_TYPE_IMM32_32S_DISP32 },
10011 { STRING_COMMA_LEN ("GOTTPOFF"), { BFD_RELOC_386_TLS_IE_32,
10012 BFD_RELOC_X86_64_GOTTPOFF },
10013 OPERAND_TYPE_IMM32_32S_DISP32 },
10014 { STRING_COMMA_LEN ("TPOFF"), { BFD_RELOC_386_TLS_LE_32,
10015 BFD_RELOC_X86_64_TPOFF32 },
10016 OPERAND_TYPE_IMM32_32S_64_DISP32_64 },
10017 { STRING_COMMA_LEN ("NTPOFF"), { BFD_RELOC_386_TLS_LE,
10018 _dummy_first_bfd_reloc_code_real },
10019 OPERAND_TYPE_NONE },
10020 { STRING_COMMA_LEN ("DTPOFF"), { BFD_RELOC_386_TLS_LDO_32,
10021 BFD_RELOC_X86_64_DTPOFF32 },
10022 OPERAND_TYPE_IMM32_32S_64_DISP32_64 },
10023 { STRING_COMMA_LEN ("GOTNTPOFF"),{ BFD_RELOC_386_TLS_GOTIE,
10024 _dummy_first_bfd_reloc_code_real },
10025 OPERAND_TYPE_NONE },
10026 { STRING_COMMA_LEN ("INDNTPOFF"),{ BFD_RELOC_386_TLS_IE,
10027 _dummy_first_bfd_reloc_code_real },
10028 OPERAND_TYPE_NONE },
10029 { STRING_COMMA_LEN ("GOT"), { BFD_RELOC_386_GOT32,
10030 BFD_RELOC_X86_64_GOT32 },
10031 OPERAND_TYPE_IMM32_32S_64_DISP32 },
10032 { STRING_COMMA_LEN ("TLSDESC"), { BFD_RELOC_386_TLS_GOTDESC,
10033 BFD_RELOC_X86_64_GOTPC32_TLSDESC },
10034 OPERAND_TYPE_IMM32_32S_DISP32 },
10035 { STRING_COMMA_LEN ("TLSCALL"), { BFD_RELOC_386_TLS_DESC_CALL,
10036 BFD_RELOC_X86_64_TLSDESC_CALL },
10037 OPERAND_TYPE_IMM32_32S_DISP32 },
10038 };
10039 char *cp;
10040 unsigned int j;
10041
10042 #if defined (OBJ_MAYBE_ELF)
10043 if (!IS_ELF)
10044 return NULL;
10045 #endif
10046
10047 for (cp = input_line_pointer; *cp != '@'; cp++)
10048 if (is_end_of_line[(unsigned char) *cp] || *cp == ',')
10049 return NULL;
10050
10051 for (j = 0; j < ARRAY_SIZE (gotrel); j++)
10052 {
10053 int len = gotrel[j].len;
10054 if (strncasecmp (cp + 1, gotrel[j].str, len) == 0)
10055 {
10056 if (gotrel[j].rel[object_64bit] != 0)
10057 {
10058 int first, second;
10059 char *tmpbuf, *past_reloc;
10060
10061 *rel = gotrel[j].rel[object_64bit];
10062
10063 if (types)
10064 {
10065 if (flag_code != CODE_64BIT)
10066 {
10067 types->bitfield.imm32 = 1;
10068 types->bitfield.disp32 = 1;
10069 }
10070 else
10071 *types = gotrel[j].types64;
10072 }
10073
10074 if (j != 0 && GOT_symbol == NULL)
10075 GOT_symbol = symbol_find_or_make (GLOBAL_OFFSET_TABLE_NAME);
10076
10077 /* The length of the first part of our input line. */
10078 first = cp - input_line_pointer;
10079
10080 /* The second part goes from after the reloc token until
10081 (and including) an end_of_line char or comma. */
10082 past_reloc = cp + 1 + len;
10083 cp = past_reloc;
10084 while (!is_end_of_line[(unsigned char) *cp] && *cp != ',')
10085 ++cp;
10086 second = cp + 1 - past_reloc;
10087
10088 /* Allocate and copy string. The trailing NUL shouldn't
10089 be necessary, but be safe. */
10090 tmpbuf = XNEWVEC (char, first + second + 2);
10091 memcpy (tmpbuf, input_line_pointer, first);
10092 if (second != 0 && *past_reloc != ' ')
10093 /* Replace the relocation token with ' ', so that
10094 errors like foo@GOTOFF1 will be detected. */
10095 tmpbuf[first++] = ' ';
10096 else
10097 /* Increment length by 1 if the relocation token is
10098 removed. */
10099 len++;
10100 if (adjust)
10101 *adjust = len;
10102 memcpy (tmpbuf + first, past_reloc, second);
10103 tmpbuf[first + second] = '\0';
10104 return tmpbuf;
10105 }
10106
10107 as_bad (_("@%s reloc is not supported with %d-bit output format"),
10108 gotrel[j].str, 1 << (5 + object_64bit));
10109 return NULL;
10110 }
10111 }
10112
10113 /* Might be a symbol version string. Don't as_bad here. */
10114 return NULL;
10115 }
10116 #endif
10117
10118 #ifdef TE_PE
10119 #ifdef lex_got
10120 #undef lex_got
10121 #endif
10122 /* Parse operands of the form
10123 <symbol>@SECREL32+<nnn>
10124
10125 If we find one, set up the correct relocation in RELOC and copy the
10126 input string, minus the `@SECREL32' into a malloc'd buffer for
10127 parsing by the calling routine. Return this buffer, and if ADJUST
10128 is non-null set it to the length of the string we removed from the
10129 input line. Otherwise return NULL.
10130
10131 This function is copied from the ELF version above, adjusted for PE targets. */
10132
10133 static char *
10134 lex_got (enum bfd_reloc_code_real *rel ATTRIBUTE_UNUSED,
10135 int *adjust ATTRIBUTE_UNUSED,
10136 i386_operand_type *types)
10137 {
10138 static const struct
10139 {
10140 const char *str;
10141 int len;
10142 const enum bfd_reloc_code_real rel[2];
10143 const i386_operand_type types64;
10144 }
10145 gotrel[] =
10146 {
10147 { STRING_COMMA_LEN ("SECREL32"), { BFD_RELOC_32_SECREL,
10148 BFD_RELOC_32_SECREL },
10149 OPERAND_TYPE_IMM32_32S_64_DISP32_64 },
10150 };
10151
10152 char *cp;
10153 unsigned j;
10154
10155 for (cp = input_line_pointer; *cp != '@'; cp++)
10156 if (is_end_of_line[(unsigned char) *cp] || *cp == ',')
10157 return NULL;
10158
10159 for (j = 0; j < ARRAY_SIZE (gotrel); j++)
10160 {
10161 int len = gotrel[j].len;
10162
10163 if (strncasecmp (cp + 1, gotrel[j].str, len) == 0)
10164 {
10165 if (gotrel[j].rel[object_64bit] != 0)
10166 {
10167 int first, second;
10168 char *tmpbuf, *past_reloc;
10169
10170 *rel = gotrel[j].rel[object_64bit];
10171 if (adjust)
10172 *adjust = len;
10173
10174 if (types)
10175 {
10176 if (flag_code != CODE_64BIT)
10177 {
10178 types->bitfield.imm32 = 1;
10179 types->bitfield.disp32 = 1;
10180 }
10181 else
10182 *types = gotrel[j].types64;
10183 }
10184
10185 /* The length of the first part of our input line. */
10186 first = cp - input_line_pointer;
10187
10188 /* The second part goes from after the reloc token until
10189 (and including) an end_of_line char or comma. */
10190 past_reloc = cp + 1 + len;
10191 cp = past_reloc;
10192 while (!is_end_of_line[(unsigned char) *cp] && *cp != ',')
10193 ++cp;
10194 second = cp + 1 - past_reloc;
10195
10196 /* Allocate and copy string. The trailing NUL shouldn't
10197 be necessary, but be safe. */
10198 tmpbuf = XNEWVEC (char, first + second + 2);
10199 memcpy (tmpbuf, input_line_pointer, first);
10200 if (second != 0 && *past_reloc != ' ')
10201 /* Replace the relocation token with ' ', so that
10202 errors like foo@SECREL321 will be detected. */
10203 tmpbuf[first++] = ' ';
10204 memcpy (tmpbuf + first, past_reloc, second);
10205 tmpbuf[first + second] = '\0';
10206 return tmpbuf;
10207 }
10208
10209 as_bad (_("@%s reloc is not supported with %d-bit output format"),
10210 gotrel[j].str, 1 << (5 + object_64bit));
10211 return NULL;
10212 }
10213 }
10214
10215 /* Might be a symbol version string. Don't as_bad here. */
10216 return NULL;
10217 }
10218
10219 #endif /* TE_PE */
10220
10221 bfd_reloc_code_real_type
10222 x86_cons (expressionS *exp, int size)
10223 {
10224 bfd_reloc_code_real_type got_reloc = NO_RELOC;
10225
10226 intel_syntax = -intel_syntax;
10227
10228 exp->X_md = 0;
10229 if (size == 4 || (object_64bit && size == 8))
10230 {
10231 /* Handle @GOTOFF and the like in an expression. */
10232 char *save;
10233 char *gotfree_input_line;
10234 int adjust = 0;
10235
10236 save = input_line_pointer;
10237 gotfree_input_line = lex_got (&got_reloc, &adjust, NULL);
10238 if (gotfree_input_line)
10239 input_line_pointer = gotfree_input_line;
10240
10241 expression (exp);
10242
10243 if (gotfree_input_line)
10244 {
10245 /* expression () has merrily parsed up to the end of line,
10246 or a comma - in the wrong buffer. Transfer how far
10247 input_line_pointer has moved to the right buffer. */
10248 input_line_pointer = (save
10249 + (input_line_pointer - gotfree_input_line)
10250 + adjust);
10251 free (gotfree_input_line);
10252 if (exp->X_op == O_constant
10253 || exp->X_op == O_absent
10254 || exp->X_op == O_illegal
10255 || exp->X_op == O_register
10256 || exp->X_op == O_big)
10257 {
10258 char c = *input_line_pointer;
10259 *input_line_pointer = 0;
10260 as_bad (_("missing or invalid expression `%s'"), save);
10261 *input_line_pointer = c;
10262 }
10263 else if ((got_reloc == BFD_RELOC_386_PLT32
10264 || got_reloc == BFD_RELOC_X86_64_PLT32)
10265 && exp->X_op != O_symbol)
10266 {
10267 char c = *input_line_pointer;
10268 *input_line_pointer = 0;
10269 as_bad (_("invalid PLT expression `%s'"), save);
10270 *input_line_pointer = c;
10271 }
10272 }
10273 }
10274 else
10275 expression (exp);
10276
10277 intel_syntax = -intel_syntax;
10278
10279 if (intel_syntax)
10280 i386_intel_simplify (exp);
10281
10282 return got_reloc;
10283 }
10284
10285 static void
10286 signed_cons (int size)
10287 {
10288 if (flag_code == CODE_64BIT)
10289 cons_sign = 1;
10290 cons (size);
10291 cons_sign = -1;
10292 }
10293
10294 #ifdef TE_PE
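/* Handle the ".secrel32" pseudo-op (as registered in
   md_pseudo_table): e.g. ".secrel32 sym1, sym2" emits one 32-bit
   section-relative value per expression. */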
10295 static void
10296 pe_directive_secrel (int dummy ATTRIBUTE_UNUSED)
10297 {
10298 expressionS exp;
10299
10300 do
10301 {
10302 expression (&exp);
10303 if (exp.X_op == O_symbol)
10304 exp.X_op = O_secrel;
10305
10306 emit_expr (&exp, 4);
10307 }
10308 while (*input_line_pointer++ == ',');
10309
10310 input_line_pointer--;
10311 demand_empty_rest_of_line ();
10312 }
10313 #endif
10314
10315 /* Handle Vector operations. */
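/* E.g., AT&T operands may carry trailing vector operations such as
   "{1to8}" (broadcast), "{%k1}" (write mask) and "{z}" (zeroing),
   as in "vaddpd (%rax){1to8}, %zmm1, %zmm2{%k1}{z}". */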
10316
10317 static char *
10318 check_VecOperations (char *op_string, char *op_end)
10319 {
10320 const reg_entry *mask;
10321 const char *saved;
10322 char *end_op;
10323
10324 while (*op_string
10325 && (op_end == NULL || op_string < op_end))
10326 {
10327 saved = op_string;
10328 if (*op_string == '{')
10329 {
10330 op_string++;
10331
10332 /* Check broadcasts. */
10333 if (strncmp (op_string, "1to", 3) == 0)
10334 {
10335 int bcst_type;
10336
10337 if (i.broadcast)
10338 goto duplicated_vec_op;
10339
10340 op_string += 3;
10341 if (*op_string == '8')
10342 bcst_type = 8;
10343 else if (*op_string == '4')
10344 bcst_type = 4;
10345 else if (*op_string == '2')
10346 bcst_type = 2;
10347 else if (*op_string == '1'
10348 && *(op_string+1) == '6')
10349 {
10350 bcst_type = 16;
10351 op_string++;
10352 }
10353 else
10354 {
10355 as_bad (_("Unsupported broadcast: `%s'"), saved);
10356 return NULL;
10357 }
10358 op_string++;
10359
10360 broadcast_op.type = bcst_type;
10361 broadcast_op.operand = this_operand;
10362 broadcast_op.bytes = 0;
10363 i.broadcast = &broadcast_op;
10364 }
10365 /* Check masking operation. */
10366 else if ((mask = parse_register (op_string, &end_op)) != NULL)
10367 {
10368 if (mask == &bad_reg)
10369 return NULL;
10370
10371 /* k0 can't be used for write mask. */
10372 if (mask->reg_type.bitfield.class != RegMask || !mask->reg_num)
10373 {
10374 as_bad (_("`%s%s' can't be used for write mask"),
10375 register_prefix, mask->reg_name);
10376 return NULL;
10377 }
10378
10379 if (!i.mask)
10380 {
10381 mask_op.mask = mask;
10382 mask_op.zeroing = 0;
10383 mask_op.operand = this_operand;
10384 i.mask = &mask_op;
10385 }
10386 else
10387 {
10388 if (i.mask->mask)
10389 goto duplicated_vec_op;
10390
10391 i.mask->mask = mask;
10392
10393 /* Only "{z}" is allowed here. No need to check
10394 zeroing mask explicitly. */
10395 if (i.mask->operand != this_operand)
10396 {
10397 as_bad (_("invalid write mask `%s'"), saved);
10398 return NULL;
10399 }
10400 }
10401
10402 op_string = end_op;
10403 }
10404 /* Check zeroing-flag for masking operation. */
10405 else if (*op_string == 'z')
10406 {
10407 if (!i.mask)
10408 {
10409 mask_op.mask = NULL;
10410 mask_op.zeroing = 1;
10411 mask_op.operand = this_operand;
10412 i.mask = &mask_op;
10413 }
10414 else
10415 {
10416 if (i.mask->zeroing)
10417 {
10418 duplicated_vec_op:
10419 as_bad (_("duplicated `%s'"), saved);
10420 return NULL;
10421 }
10422
10423 i.mask->zeroing = 1;
10424
10425 /* Only "{%k}" is allowed here. No need to check mask
10426 register explicitly. */
10427 if (i.mask->operand != this_operand)
10428 {
10429 as_bad (_("invalid zeroing-masking `%s'"),
10430 saved);
10431 return NULL;
10432 }
10433 }
10434
10435 op_string++;
10436 }
10437 else
10438 goto unknown_vec_op;
10439
10440 if (*op_string != '}')
10441 {
10442 as_bad (_("missing `}' in `%s'"), saved);
10443 return NULL;
10444 }
10445 op_string++;
10446
10447 /* Strip whitespace since the addition of pseudo prefixes
10448 changed how the scrubber treats '{'. */
10449 if (is_space_char (*op_string))
10450 ++op_string;
10451
10452 continue;
10453 }
10454 unknown_vec_op:
10455 /* We don't know this one. */
10456 as_bad (_("unknown vector operation: `%s'"), saved);
10457 return NULL;
10458 }
10459
10460 if (i.mask && i.mask->zeroing && !i.mask->mask)
10461 {
10462 as_bad (_("zeroing-masking only allowed with write mask"));
10463 return NULL;
10464 }
10465
10466 return op_string;
10467 }
10468
10469 static int
10470 i386_immediate (char *imm_start)
10471 {
10472 char *save_input_line_pointer;
10473 char *gotfree_input_line;
10474 segT exp_seg = 0;
10475 expressionS *exp;
10476 i386_operand_type types;
10477
10478 operand_type_set (&types, ~0);
10479
10480 if (i.imm_operands == MAX_IMMEDIATE_OPERANDS)
10481 {
10482 as_bad (_("at most %d immediate operands are allowed"),
10483 MAX_IMMEDIATE_OPERANDS);
10484 return 0;
10485 }
10486
10487 exp = &im_expressions[i.imm_operands++];
10488 i.op[this_operand].imms = exp;
10489
10490 if (is_space_char (*imm_start))
10491 ++imm_start;
10492
10493 save_input_line_pointer = input_line_pointer;
10494 input_line_pointer = imm_start;
10495
10496 gotfree_input_line = lex_got (&i.reloc[this_operand], NULL, &types);
10497 if (gotfree_input_line)
10498 input_line_pointer = gotfree_input_line;
10499
10500 exp_seg = expression (exp);
10501
10502 SKIP_WHITESPACE ();
10503
10504 /* Handle vector operations. */
10505 if (*input_line_pointer == '{')
10506 {
10507 input_line_pointer = check_VecOperations (input_line_pointer,
10508 NULL);
10509 if (input_line_pointer == NULL)
10510 return 0;
10511 }
10512
10513 if (*input_line_pointer)
10514 as_bad (_("junk `%s' after expression"), input_line_pointer);
10515
10516 input_line_pointer = save_input_line_pointer;
10517 if (gotfree_input_line)
10518 {
10519 free (gotfree_input_line);
10520
10521 if (exp->X_op == O_constant || exp->X_op == O_register)
10522 exp->X_op = O_illegal;
10523 }
10524
10525 return i386_finalize_immediate (exp_seg, exp, types, imm_start);
10526 }
10527
10528 static int
10529 i386_finalize_immediate (segT exp_seg ATTRIBUTE_UNUSED, expressionS *exp,
10530 i386_operand_type types, const char *imm_start)
10531 {
10532 if (exp->X_op == O_absent || exp->X_op == O_illegal || exp->X_op == O_big)
10533 {
10534 if (imm_start)
10535 as_bad (_("missing or invalid immediate expression `%s'"),
10536 imm_start);
10537 return 0;
10538 }
10539 else if (exp->X_op == O_constant)
10540 {
10541 /* Size it properly later. */
10542 i.types[this_operand].bitfield.imm64 = 1;
10543 /* If not 64bit, sign extend val. */
10544 if (flag_code != CODE_64BIT
10545 && (exp->X_add_number & ~(((addressT) 2 << 31) - 1)) == 0)
10546 exp->X_add_number
10547 = (exp->X_add_number ^ ((addressT) 1 << 31)) - ((addressT) 1 << 31);
10548 }
10549 #if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
10550 else if (OUTPUT_FLAVOR == bfd_target_aout_flavour
10551 && exp_seg != absolute_section
10552 && exp_seg != text_section
10553 && exp_seg != data_section
10554 && exp_seg != bss_section
10555 && exp_seg != undefined_section
10556 && !bfd_is_com_section (exp_seg))
10557 {
10558 as_bad (_("unimplemented segment %s in operand"), exp_seg->name);
10559 return 0;
10560 }
10561 #endif
10562 else if (!intel_syntax && exp_seg == reg_section)
10563 {
10564 if (imm_start)
10565 as_bad (_("illegal immediate register operand %s"), imm_start);
10566 return 0;
10567 }
10568 else
10569 {
10570 /* This is an address. The size of the address will be
10571 determined later, depending on destination register,
10572 suffix, or the default for the section. */
10573 i.types[this_operand].bitfield.imm8 = 1;
10574 i.types[this_operand].bitfield.imm16 = 1;
10575 i.types[this_operand].bitfield.imm32 = 1;
10576 i.types[this_operand].bitfield.imm32s = 1;
10577 i.types[this_operand].bitfield.imm64 = 1;
10578 i.types[this_operand] = operand_type_and (i.types[this_operand],
10579 types);
10580 }
10581
10582 return 1;
10583 }
10584
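/* Parse the scale factor in a memory operand and record its log2;
   e.g. the "4" in "(%ebx,%esi,4)" sets i.log2_scale_factor to 2.
   Return a pointer past the scale expression, or NULL on error. */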
10585 static char *
10586 i386_scale (char *scale)
10587 {
10588 offsetT val;
10589 char *save = input_line_pointer;
10590
10591 input_line_pointer = scale;
10592 val = get_absolute_expression ();
10593
10594 switch (val)
10595 {
10596 case 1:
10597 i.log2_scale_factor = 0;
10598 break;
10599 case 2:
10600 i.log2_scale_factor = 1;
10601 break;
10602 case 4:
10603 i.log2_scale_factor = 2;
10604 break;
10605 case 8:
10606 i.log2_scale_factor = 3;
10607 break;
10608 default:
10609 {
10610 char sep = *input_line_pointer;
10611
10612 *input_line_pointer = '\0';
10613 as_bad (_("expecting scale factor of 1, 2, 4, or 8: got `%s'"),
10614 scale);
10615 *input_line_pointer = sep;
10616 input_line_pointer = save;
10617 return NULL;
10618 }
10619 }
10620 if (i.log2_scale_factor != 0 && i.index_reg == 0)
10621 {
10622 as_warn (_("scale factor of %d without an index register"),
10623 1 << i.log2_scale_factor);
10624 i.log2_scale_factor = 0;
10625 }
10626 scale = input_line_pointer;
10627 input_line_pointer = save;
10628 return scale;
10629 }
10630
10631 static int
10632 i386_displacement (char *disp_start, char *disp_end)
10633 {
10634 expressionS *exp;
10635 segT exp_seg = 0;
10636 char *save_input_line_pointer;
10637 char *gotfree_input_line;
10638 int override;
10639 i386_operand_type bigdisp, types = anydisp;
10640 int ret;
10641
10642 if (i.disp_operands == MAX_MEMORY_OPERANDS)
10643 {
10644 as_bad (_("at most %d displacement operands are allowed"),
10645 MAX_MEMORY_OPERANDS);
10646 return 0;
10647 }
10648
10649 operand_type_set (&bigdisp, 0);
10650 if (i.jumpabsolute
10651 || i.types[this_operand].bitfield.baseindex
10652 || (current_templates->start->opcode_modifier.jump != JUMP
10653 && current_templates->start->opcode_modifier.jump != JUMP_DWORD))
10654 {
10655 i386_addressing_mode ();
10656 override = (i.prefix[ADDR_PREFIX] != 0);
10657 if (flag_code == CODE_64BIT)
10658 {
10659 if (!override)
10660 {
10661 bigdisp.bitfield.disp32s = 1;
10662 bigdisp.bitfield.disp64 = 1;
10663 }
10664 else
10665 bigdisp.bitfield.disp32 = 1;
10666 }
10667 else if ((flag_code == CODE_16BIT) ^ override)
10668 bigdisp.bitfield.disp16 = 1;
10669 else
10670 bigdisp.bitfield.disp32 = 1;
10671 }
10672 else
10673 {
10674 /* For PC-relative branches, the width of the displacement may be
10675 dependent upon data size, but is never dependent upon address size.
10676 Also make sure to not unintentionally match against a non-PC-relative
10677 branch template. */
10678 static templates aux_templates;
10679 const insn_template *t = current_templates->start;
10680 bfd_boolean has_intel64 = FALSE;
10681
10682 aux_templates.start = t;
10683 while (++t < current_templates->end)
10684 {
10685 if (t->opcode_modifier.jump
10686 != current_templates->start->opcode_modifier.jump)
10687 break;
10688 if ((t->opcode_modifier.isa64 >= INTEL64))
10689 has_intel64 = TRUE;
10690 }
10691 if (t < current_templates->end)
10692 {
10693 aux_templates.end = t;
10694 current_templates = &aux_templates;
10695 }
10696
10697 override = (i.prefix[DATA_PREFIX] != 0);
10698 if (flag_code == CODE_64BIT)
10699 {
10700 if ((override || i.suffix == WORD_MNEM_SUFFIX)
10701 && (!intel64 || !has_intel64))
10702 bigdisp.bitfield.disp16 = 1;
10703 else
10704 bigdisp.bitfield.disp32s = 1;
10705 }
10706 else
10707 {
10708 if (!override)
10709 override = (i.suffix == (flag_code != CODE_16BIT
10710 ? WORD_MNEM_SUFFIX
10711 : LONG_MNEM_SUFFIX));
10712 bigdisp.bitfield.disp32 = 1;
10713 if ((flag_code == CODE_16BIT) ^ override)
10714 {
10715 bigdisp.bitfield.disp32 = 0;
10716 bigdisp.bitfield.disp16 = 1;
10717 }
10718 }
10719 }
10720 i.types[this_operand] = operand_type_or (i.types[this_operand],
10721 bigdisp);
10722
10723 exp = &disp_expressions[i.disp_operands];
10724 i.op[this_operand].disps = exp;
10725 i.disp_operands++;
10726 save_input_line_pointer = input_line_pointer;
10727 input_line_pointer = disp_start;
10728 END_STRING_AND_SAVE (disp_end);
10729
10730 #ifndef GCC_ASM_O_HACK
10731 #define GCC_ASM_O_HACK 0
10732 #endif
10733 #if GCC_ASM_O_HACK
10734 END_STRING_AND_SAVE (disp_end + 1);
10735 if (i.types[this_operand].bitfield.baseIndex
10736 && displacement_string_end[-1] == '+')
10737 {
10738 /* This hack is to avoid a warning when using the "o"
10739 constraint within gcc asm statements.
10740 For instance:
10741
10742 #define _set_tssldt_desc(n,addr,limit,type) \
10743 __asm__ __volatile__ ( \
10744 "movw %w2,%0\n\t" \
10745 "movw %w1,2+%0\n\t" \
10746 "rorl $16,%1\n\t" \
10747 "movb %b1,4+%0\n\t" \
10748 "movb %4,5+%0\n\t" \
10749 "movb $0,6+%0\n\t" \
10750 "movb %h1,7+%0\n\t" \
10751 "rorl $16,%1" \
10752 : "=o"(*(n)) : "q" (addr), "ri"(limit), "i"(type))
10753
10754 This works great except that the assembler output ends
10755 up looking a bit weird if it turns out that there is
10756 no offset. You end up producing code that looks like:
10757
10758 #APP
10759 movw $235,(%eax)
10760 movw %dx,2+(%eax)
10761 rorl $16,%edx
10762 movb %dl,4+(%eax)
10763 movb $137,5+(%eax)
10764 movb $0,6+(%eax)
10765 movb %dh,7+(%eax)
10766 rorl $16,%edx
10767 #NO_APP
10768
10769 So here we provide the missing zero. */
10770
10771 *displacement_string_end = '0';
10772 }
10773 #endif
10774 gotfree_input_line = lex_got (&i.reloc[this_operand], NULL, &types);
10775 if (gotfree_input_line)
10776 input_line_pointer = gotfree_input_line;
10777
10778 exp_seg = expression (exp);
10779
10780 SKIP_WHITESPACE ();
10781 if (*input_line_pointer)
10782 as_bad (_("junk `%s' after expression"), input_line_pointer);
10783 #if GCC_ASM_O_HACK
10784 RESTORE_END_STRING (disp_end + 1);
10785 #endif
10786 input_line_pointer = save_input_line_pointer;
10787 if (gotfree_input_line)
10788 {
10789 free (gotfree_input_line);
10790
10791 if (exp->X_op == O_constant || exp->X_op == O_register)
10792 exp->X_op = O_illegal;
10793 }
10794
10795 ret = i386_finalize_displacement (exp_seg, exp, types, disp_start);
10796
10797 RESTORE_END_STRING (disp_end);
10798
10799 return ret;
10800 }
10801
10802 static int
10803 i386_finalize_displacement (segT exp_seg ATTRIBUTE_UNUSED, expressionS *exp,
10804 i386_operand_type types, const char *disp_start)
10805 {
10806 i386_operand_type bigdisp;
10807 int ret = 1;
10808
10809 /* We do this to make sure that the section symbol is in
10810 the symbol table. We will ultimately change the relocation
10811 to be relative to the beginning of the section. */
10812 if (i.reloc[this_operand] == BFD_RELOC_386_GOTOFF
10813 || i.reloc[this_operand] == BFD_RELOC_X86_64_GOTPCREL
10814 || i.reloc[this_operand] == BFD_RELOC_X86_64_GOTOFF64)
10815 {
10816 if (exp->X_op != O_symbol)
10817 goto inv_disp;
10818
10819 if (S_IS_LOCAL (exp->X_add_symbol)
10820 && S_GET_SEGMENT (exp->X_add_symbol) != undefined_section
10821 && S_GET_SEGMENT (exp->X_add_symbol) != expr_section)
10822 section_symbol (S_GET_SEGMENT (exp->X_add_symbol));
10823 exp->X_op = O_subtract;
10824 exp->X_op_symbol = GOT_symbol;
10825 if (i.reloc[this_operand] == BFD_RELOC_X86_64_GOTPCREL)
10826 i.reloc[this_operand] = BFD_RELOC_32_PCREL;
10827 else if (i.reloc[this_operand] == BFD_RELOC_X86_64_GOTOFF64)
10828 i.reloc[this_operand] = BFD_RELOC_64;
10829 else
10830 i.reloc[this_operand] = BFD_RELOC_32;
10831 }
10832
10833 else if (exp->X_op == O_absent
10834 || exp->X_op == O_illegal
10835 || exp->X_op == O_big)
10836 {
10837 inv_disp:
10838 as_bad (_("missing or invalid displacement expression `%s'"),
10839 disp_start);
10840 ret = 0;
10841 }
10842
10843 else if (flag_code == CODE_64BIT
10844 && !i.prefix[ADDR_PREFIX]
10845 && exp->X_op == O_constant)
10846 {
10847 /* Since the displacement is sign-extended to 64bit, don't allow
10848 disp32, and turn off disp32s if it is out of range. */
10849 i.types[this_operand].bitfield.disp32 = 0;
10850 if (!fits_in_signed_long (exp->X_add_number))
10851 {
10852 i.types[this_operand].bitfield.disp32s = 0;
10853 if (i.types[this_operand].bitfield.baseindex)
10854 {
10855 as_bad (_("0x%lx out range of signed 32bit displacement"),
10856 (long) exp->X_add_number);
10857 ret = 0;
10858 }
10859 }
10860 }
10861
10862 #if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
10863 else if (exp->X_op != O_constant
10864 && OUTPUT_FLAVOR == bfd_target_aout_flavour
10865 && exp_seg != absolute_section
10866 && exp_seg != text_section
10867 && exp_seg != data_section
10868 && exp_seg != bss_section
10869 && exp_seg != undefined_section
10870 && !bfd_is_com_section (exp_seg))
10871 {
10872 as_bad (_("unimplemented segment %s in operand"), exp_seg->name);
10873 ret = 0;
10874 }
10875 #endif
10876
10877 if (current_templates->start->opcode_modifier.jump == JUMP_BYTE
10878 /* Constants get taken care of by optimize_disp(). */
10879 && exp->X_op != O_constant)
10880 i.types[this_operand].bitfield.disp8 = 1;
10881
10882 /* Check if this is a displacement only operand. */
10883 bigdisp = i.types[this_operand];
10884 bigdisp.bitfield.disp8 = 0;
10885 bigdisp.bitfield.disp16 = 0;
10886 bigdisp.bitfield.disp32 = 0;
10887 bigdisp.bitfield.disp32s = 0;
10888 bigdisp.bitfield.disp64 = 0;
10889 if (operand_type_all_zero (&bigdisp))
10890 i.types[this_operand] = operand_type_and (i.types[this_operand],
10891 types);
10892
10893 return ret;
10894 }
10895
10896 /* Return the active addressing mode, taking address override and
10897 registers forming the address into consideration. Update the
10898 address override prefix if necessary. */
10899
10900 static enum flag_code
10901 i386_addressing_mode (void)
10902 {
10903 enum flag_code addr_mode;
10904
10905 if (i.prefix[ADDR_PREFIX])
10906 addr_mode = flag_code == CODE_32BIT ? CODE_16BIT : CODE_32BIT;
10907 else if (flag_code == CODE_16BIT
10908 && current_templates->start->cpu_flags.bitfield.cpumpx
10909 /* Avoid replacing the "16-bit addressing not allowed" diagnostic
10910 from md_assemble() by "is not a valid base/index expression"
10911 when there is a base and/or index. */
10912 && !i.types[this_operand].bitfield.baseindex)
10913 {
10914 /* MPX insn memory operands with neither base nor index must be forced
10915 to use 32-bit addressing in 16-bit mode. */
10916 addr_mode = CODE_32BIT;
10917 i.prefix[ADDR_PREFIX] = ADDR_PREFIX_OPCODE;
10918 ++i.prefixes;
10919 gas_assert (!i.types[this_operand].bitfield.disp16);
10920 gas_assert (!i.types[this_operand].bitfield.disp32);
10921 }
10922 else
10923 {
10924 addr_mode = flag_code;
10925
10926 #if INFER_ADDR_PREFIX
10927 if (i.mem_operands == 0)
10928 {
10929 /* Infer address prefix from the first memory operand. */
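/* E.g., "movl (%ebx), %eax" assembled in 64-bit mode selects
   CODE_32BIT here and gains the 0x67 address-size prefix. */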
10930 const reg_entry *addr_reg = i.base_reg;
10931
10932 if (addr_reg == NULL)
10933 addr_reg = i.index_reg;
10934
10935 if (addr_reg)
10936 {
10937 if (addr_reg->reg_type.bitfield.dword)
10938 addr_mode = CODE_32BIT;
10939 else if (flag_code != CODE_64BIT
10940 && addr_reg->reg_type.bitfield.word)
10941 addr_mode = CODE_16BIT;
10942
10943 if (addr_mode != flag_code)
10944 {
10945 i.prefix[ADDR_PREFIX] = ADDR_PREFIX_OPCODE;
10946 i.prefixes += 1;
10947 /* Change the size of any displacement too. At most one
10948 of Disp16 or Disp32 is set.
10949 FIXME. There doesn't seem to be any real need for
10950 separate Disp16 and Disp32 flags. The same goes for
10951 Imm16 and Imm32. Removing them would probably clean
10952 up the code quite a lot. */
10953 if (flag_code != CODE_64BIT
10954 && (i.types[this_operand].bitfield.disp16
10955 || i.types[this_operand].bitfield.disp32))
10956 i.types[this_operand]
10957 = operand_type_xor (i.types[this_operand], disp16_32);
10958 }
10959 }
10960 }
10961 #endif
10962 }
10963
10964 return addr_mode;
10965 }
10966
10967 /* Make sure the memory operand we've been dealt is valid.
10968 Return 1 on success, 0 on a failure. */
10969
10970 static int
10971 i386_index_check (const char *operand_string)
10972 {
10973 const char *kind = "base/index";
10974 enum flag_code addr_mode = i386_addressing_mode ();
10975
10976 if (current_templates->start->opcode_modifier.isstring
10977 && !current_templates->start->cpu_flags.bitfield.cpupadlock
10978 && (current_templates->end[-1].opcode_modifier.isstring
10979 || i.mem_operands))
10980 {
10981 /* Memory operands of string insns are special in that they only allow
10982 a single register (rDI, rSI, or rBX) as their memory address. */
10983 const reg_entry *expected_reg;
10984 static const char *di_si[][2] =
10985 {
10986 { "esi", "edi" },
10987 { "si", "di" },
10988 { "rsi", "rdi" }
10989 };
10990 static const char *bx[] = { "ebx", "bx", "rbx" };
10991
10992 kind = "string address";
10993
10994 if (current_templates->start->opcode_modifier.repprefixok)
10995 {
10996 int es_op = current_templates->end[-1].opcode_modifier.isstring
10997 - IS_STRING_ES_OP0;
10998 int op = 0;
10999
11000 if (!current_templates->end[-1].operand_types[0].bitfield.baseindex
11001 || ((!i.mem_operands != !intel_syntax)
11002 && current_templates->end[-1].operand_types[1]
11003 .bitfield.baseindex))
11004 op = 1;
11005 expected_reg
11006 = (const reg_entry *) str_hash_find (reg_hash,
11007 di_si[addr_mode][op == es_op]);
11008 }
11009 else
11010 expected_reg
11011 = (const reg_entry *)str_hash_find (reg_hash, bx[addr_mode]);
11012
11013 if (i.base_reg != expected_reg
11014 || i.index_reg
11015 || operand_type_check (i.types[this_operand], disp))
11016 {
11017 /* The second memory operand must have the same size as
11018 the first one. */
11019 if (i.mem_operands
11020 && i.base_reg
11021 && !((addr_mode == CODE_64BIT
11022 && i.base_reg->reg_type.bitfield.qword)
11023 || (addr_mode == CODE_32BIT
11024 ? i.base_reg->reg_type.bitfield.dword
11025 : i.base_reg->reg_type.bitfield.word)))
11026 goto bad_address;
11027
11028 as_warn (_("`%s' is not valid here (expected `%c%s%s%c')"),
11029 operand_string,
11030 intel_syntax ? '[' : '(',
11031 register_prefix,
11032 expected_reg->reg_name,
11033 intel_syntax ? ']' : ')');
11034 return 1;
11035 }
11036 else
11037 return 1;
11038
11039 bad_address:
11040 as_bad (_("`%s' is not a valid %s expression"),
11041 operand_string, kind);
11042 return 0;
11043 }
11044 else
11045 {
11046 if (addr_mode != CODE_16BIT)
11047 {
11048 /* 32-bit/64-bit checks. */
11049 if (i.disp_encoding == disp_encoding_16bit)
11050 {
11051 bad_disp:
11052 as_bad (_("invalid `%s' prefix"),
11053 addr_mode == CODE_16BIT ? "{disp32}" : "{disp16}");
11054 return 0;
11055 }
11056
11057 if ((i.base_reg
11058 && ((addr_mode == CODE_64BIT
11059 ? !i.base_reg->reg_type.bitfield.qword
11060 : !i.base_reg->reg_type.bitfield.dword)
11061 || (i.index_reg && i.base_reg->reg_num == RegIP)
11062 || i.base_reg->reg_num == RegIZ))
11063 || (i.index_reg
11064 && !i.index_reg->reg_type.bitfield.xmmword
11065 && !i.index_reg->reg_type.bitfield.ymmword
11066 && !i.index_reg->reg_type.bitfield.zmmword
11067 && ((addr_mode == CODE_64BIT
11068 ? !i.index_reg->reg_type.bitfield.qword
11069 : !i.index_reg->reg_type.bitfield.dword)
11070 || !i.index_reg->reg_type.bitfield.baseindex)))
11071 goto bad_address;
11072
11073 /* bndmk, bndldx, bndstx and mandatory non-vector SIB have special restrictions. */
11074 if (current_templates->start->base_opcode == 0xf30f1b
11075 || (current_templates->start->base_opcode & ~1) == 0x0f1a
11076 || current_templates->start->opcode_modifier.sib == SIBMEM)
11077 {
11078 /* They cannot use RIP-relative addressing. */
11079 if (i.base_reg && i.base_reg->reg_num == RegIP)
11080 {
11081 as_bad (_("`%s' cannot be used here"), operand_string);
11082 return 0;
11083 }
11084
11085 /* bndldx and bndstx ignore their scale factor. */
11086 if ((current_templates->start->base_opcode & ~1) == 0x0f1a
11087 && i.log2_scale_factor)
11088 as_warn (_("register scaling is being ignored here"));
11089 }
11090 }
11091 else
11092 {
11093 /* 16-bit checks. */
11094 if (i.disp_encoding == disp_encoding_32bit)
11095 goto bad_disp;
11096
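/* Valid 16-bit forms allow only BX or BP as base and SI or DI as
   index, with no scaling: e.g. "(%bx)", "(%bp,%si)", "4(%bx,%di)". */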
11097 if ((i.base_reg
11098 && (!i.base_reg->reg_type.bitfield.word
11099 || !i.base_reg->reg_type.bitfield.baseindex))
11100 || (i.index_reg
11101 && (!i.index_reg->reg_type.bitfield.word
11102 || !i.index_reg->reg_type.bitfield.baseindex
11103 || !(i.base_reg
11104 && i.base_reg->reg_num < 6
11105 && i.index_reg->reg_num >= 6
11106 && i.log2_scale_factor == 0))))
11107 goto bad_address;
11108 }
11109 }
11110 return 1;
11111 }
11112
11113 /* Handle vector immediates. */
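/* I.e., embedded rounding / SAE specifiers such as "{rn-sae}" or
   "{sae}", as in "vaddpd {rz-sae}, %zmm1, %zmm2, %zmm3". */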
11114
11115 static int
11116 RC_SAE_immediate (const char *imm_start)
11117 {
11118 unsigned int match_found, j;
11119 const char *pstr = imm_start;
11120 expressionS *exp;
11121
11122 if (*pstr != '{')
11123 return 0;
11124
11125 pstr++;
11126 match_found = 0;
11127 for (j = 0; j < ARRAY_SIZE (RC_NamesTable); j++)
11128 {
11129 if (!strncmp (pstr, RC_NamesTable[j].name, RC_NamesTable[j].len))
11130 {
11131 if (!i.rounding)
11132 {
11133 rc_op.type = RC_NamesTable[j].type;
11134 rc_op.operand = this_operand;
11135 i.rounding = &rc_op;
11136 }
11137 else
11138 {
11139 as_bad (_("duplicated `%s'"), imm_start);
11140 return 0;
11141 }
11142 pstr += RC_NamesTable[j].len;
11143 match_found = 1;
11144 break;
11145 }
11146 }
11147 if (!match_found)
11148 return 0;
11149
11150 if (*pstr++ != '}')
11151 {
11152 as_bad (_("Missing '}': '%s'"), imm_start);
11153 return 0;
11154 }
11155 /* RC/SAE immediate string should contain nothing more. */
11156 if (*pstr != 0)
11157 {
11158 as_bad (_("Junk after '}': '%s'"), imm_start);
11159 return 0;
11160 }
11161
11162 exp = &im_expressions[i.imm_operands++];
11163 i.op[this_operand].imms = exp;
11164
11165 exp->X_op = O_constant;
11166 exp->X_add_number = 0;
11167 exp->X_add_symbol = (symbolS *) 0;
11168 exp->X_op_symbol = (symbolS *) 0;
11169
11170 i.types[this_operand].bitfield.imm8 = 1;
11171 return 1;
11172 }
11173
11174 /* Only string instructions can have a second memory operand, so
11175 reduce current_templates to just those if it contains any. */
11176 static int
11177 maybe_adjust_templates (void)
11178 {
11179 const insn_template *t;
11180
11181 gas_assert (i.mem_operands == 1);
11182
11183 for (t = current_templates->start; t < current_templates->end; ++t)
11184 if (t->opcode_modifier.isstring)
11185 break;
11186
11187 if (t < current_templates->end)
11188 {
11189 static templates aux_templates;
11190 bfd_boolean recheck;
11191
11192 aux_templates.start = t;
11193 for (; t < current_templates->end; ++t)
11194 if (!t->opcode_modifier.isstring)
11195 break;
11196 aux_templates.end = t;
11197
11198 /* Determine whether to re-check the first memory operand. */
11199 recheck = (aux_templates.start != current_templates->start
11200 || t != current_templates->end);
11201
11202 current_templates = &aux_templates;
11203
11204 if (recheck)
11205 {
11206 i.mem_operands = 0;
11207 if (i.memop1_string != NULL
11208 && i386_index_check (i.memop1_string) == 0)
11209 return 0;
11210 i.mem_operands = 1;
11211 }
11212 }
11213
11214 return 1;
11215 }
11216
11217 /* Parse OPERAND_STRING into the i386_insn structure I. Returns zero
11218 on error. */
11219
11220 static int
11221 i386_att_operand (char *operand_string)
11222 {
11223 const reg_entry *r;
11224 char *end_op;
11225 char *op_string = operand_string;
11226
11227 if (is_space_char (*op_string))
11228 ++op_string;
11229
11230 /* We check for an absolute prefix (differentiating,
11231 for example, 'jmp pc_relative_label' from 'jmp *absolute_label'). */
11232 if (*op_string == ABSOLUTE_PREFIX)
11233 {
11234 ++op_string;
11235 if (is_space_char (*op_string))
11236 ++op_string;
11237 i.jumpabsolute = TRUE;
11238 }
11239
11240 /* Check if operand is a register. */
11241 if ((r = parse_register (op_string, &end_op)) != NULL)
11242 {
11243 i386_operand_type temp;
11244
11245 if (r == &bad_reg)
11246 return 0;
11247
11248 /* Check for a segment override by searching for ':' after a
11249 segment register. */
11250 op_string = end_op;
11251 if (is_space_char (*op_string))
11252 ++op_string;
11253 if (*op_string == ':' && r->reg_type.bitfield.class == SReg)
11254 {
11255 switch (r->reg_num)
11256 {
11257 case 0:
11258 i.seg[i.mem_operands] = &es;
11259 break;
11260 case 1:
11261 i.seg[i.mem_operands] = &cs;
11262 break;
11263 case 2:
11264 i.seg[i.mem_operands] = &ss;
11265 break;
11266 case 3:
11267 i.seg[i.mem_operands] = &ds;
11268 break;
11269 case 4:
11270 i.seg[i.mem_operands] = &fs;
11271 break;
11272 case 5:
11273 i.seg[i.mem_operands] = &gs;
11274 break;
11275 }
11276
11277 /* Skip the ':' and whitespace. */
11278 ++op_string;
11279 if (is_space_char (*op_string))
11280 ++op_string;
11281
11282 if (!is_digit_char (*op_string)
11283 && !is_identifier_char (*op_string)
11284 && *op_string != '('
11285 && *op_string != ABSOLUTE_PREFIX)
11286 {
11287 as_bad (_("bad memory operand `%s'"), op_string);
11288 return 0;
11289 }
11290 /* Handle case of %es:*foo. */
11291 if (*op_string == ABSOLUTE_PREFIX)
11292 {
11293 ++op_string;
11294 if (is_space_char (*op_string))
11295 ++op_string;
11296 i.jumpabsolute = TRUE;
11297 }
11298 goto do_memory_reference;
11299 }
11300
11301 /* Handle vector operations. */
11302 if (*op_string == '{')
11303 {
11304 op_string = check_VecOperations (op_string, NULL);
11305 if (op_string == NULL)
11306 return 0;
11307 }
11308
11309 if (*op_string)
11310 {
11311 as_bad (_("junk `%s' after register"), op_string);
11312 return 0;
11313 }
11314 temp = r->reg_type;
11315 temp.bitfield.baseindex = 0;
11316 i.types[this_operand] = operand_type_or (i.types[this_operand],
11317 temp);
11318 i.types[this_operand].bitfield.unspecified = 0;
11319 i.op[this_operand].regs = r;
11320 i.reg_operands++;
11321 }
11322 else if (*op_string == REGISTER_PREFIX)
11323 {
11324 as_bad (_("bad register name `%s'"), op_string);
11325 return 0;
11326 }
11327 else if (*op_string == IMMEDIATE_PREFIX)
11328 {
11329 ++op_string;
11330 if (i.jumpabsolute)
11331 {
11332 as_bad (_("immediate operand illegal with absolute jump"));
11333 return 0;
11334 }
11335 if (!i386_immediate (op_string))
11336 return 0;
11337 }
11338 else if (RC_SAE_immediate (operand_string))
11339 {
11340 /* If it is an RC or SAE immediate, do nothing. */
11341 ;
11342 }
11343 else if (is_digit_char (*op_string)
11344 || is_identifier_char (*op_string)
11345 || *op_string == '"'
11346 || *op_string == '(')
11347 {
11348 /* This is a memory reference of some sort. */
11349 char *base_string;
11350
11351 /* Start and end of displacement string expression (if found). */
11352 char *displacement_string_start;
11353 char *displacement_string_end;
11354 char *vop_start;
11355
11356 do_memory_reference:
11357 if (i.mem_operands == 1 && !maybe_adjust_templates ())
11358 return 0;
11359 if ((i.mem_operands == 1
11360 && !current_templates->start->opcode_modifier.isstring)
11361 || i.mem_operands == 2)
11362 {
11363 as_bad (_("too many memory references for `%s'"),
11364 current_templates->start->name);
11365 return 0;
11366 }
11367
11368 /* Check for base index form. We detect the base index form by
11369 looking for an ')' at the end of the operand, searching
11370 for the '(' matching it, and finding a REGISTER_PREFIX or ','
11371 after the '('. */
11372 base_string = op_string + strlen (op_string);
11373
11374 /* Handle vector operations. */
11375 vop_start = strchr (op_string, '{');
11376 if (vop_start && vop_start < base_string)
11377 {
11378 if (check_VecOperations (vop_start, base_string) == NULL)
11379 return 0;
11380 base_string = vop_start;
11381 }
11382
11383 --base_string;
11384 if (is_space_char (*base_string))
11385 --base_string;
11386
11387 /* If we only have a displacement, set up for it to be parsed later. */
11388 displacement_string_start = op_string;
11389 displacement_string_end = base_string + 1;
11390
11391 if (*base_string == ')')
11392 {
11393 char *temp_string;
11394 unsigned int parens_balanced = 1;
11395 /* We've already checked that the numbers of left & right ()'s are
11396 equal, so this loop will not be infinite. */
11397 do
11398 {
11399 base_string--;
11400 if (*base_string == ')')
11401 parens_balanced++;
11402 if (*base_string == '(')
11403 parens_balanced--;
11404 }
11405 while (parens_balanced);
11406
11407 temp_string = base_string;
11408
11409 /* Skip past '(' and whitespace. */
11410 ++base_string;
11411 if (is_space_char (*base_string))
11412 ++base_string;
11413
11414 if (*base_string == ','
11415 || ((i.base_reg = parse_register (base_string, &end_op))
11416 != NULL))
11417 {
11418 displacement_string_end = temp_string;
11419
11420 i.types[this_operand].bitfield.baseindex = 1;
11421
11422 if (i.base_reg)
11423 {
11424 if (i.base_reg == &bad_reg)
11425 return 0;
11426 base_string = end_op;
11427 if (is_space_char (*base_string))
11428 ++base_string;
11429 }
11430
11431 /* There may be an index reg or scale factor here. */
11432 if (*base_string == ',')
11433 {
11434 ++base_string;
11435 if (is_space_char (*base_string))
11436 ++base_string;
11437
11438 if ((i.index_reg = parse_register (base_string, &end_op))
11439 != NULL)
11440 {
11441 if (i.index_reg == &bad_reg)
11442 return 0;
11443 base_string = end_op;
11444 if (is_space_char (*base_string))
11445 ++base_string;
11446 if (*base_string == ',')
11447 {
11448 ++base_string;
11449 if (is_space_char (*base_string))
11450 ++base_string;
11451 }
11452 else if (*base_string != ')')
11453 {
11454 as_bad (_("expecting `,' or `)' "
11455 "after index register in `%s'"),
11456 operand_string);
11457 return 0;
11458 }
11459 }
11460 else if (*base_string == REGISTER_PREFIX)
11461 {
11462 end_op = strchr (base_string, ',');
11463 if (end_op)
11464 *end_op = '\0';
11465 as_bad (_("bad register name `%s'"), base_string);
11466 return 0;
11467 }
11468
11469 /* Check for scale factor. */
11470 if (*base_string != ')')
11471 {
11472 char *end_scale = i386_scale (base_string);
11473
11474 if (!end_scale)
11475 return 0;
11476
11477 base_string = end_scale;
11478 if (is_space_char (*base_string))
11479 ++base_string;
11480 if (*base_string != ')')
11481 {
11482 as_bad (_("expecting `)' "
11483 "after scale factor in `%s'"),
11484 operand_string);
11485 return 0;
11486 }
11487 }
11488 else if (!i.index_reg)
11489 {
11490 as_bad (_("expecting index register or scale factor "
11491 "after `,'; got '%c'"),
11492 *base_string);
11493 return 0;
11494 }
11495 }
11496 else if (*base_string != ')')
11497 {
11498 as_bad (_("expecting `,' or `)' "
11499 "after base register in `%s'"),
11500 operand_string);
11501 return 0;
11502 }
11503 }
11504 else if (*base_string == REGISTER_PREFIX)
11505 {
11506 end_op = strchr (base_string, ',');
11507 if (end_op)
11508 *end_op = '\0';
11509 as_bad (_("bad register name `%s'"), base_string);
11510 return 0;
11511 }
11512 }
11513
11514 /* If there's an expression beginning the operand, parse it,
11515 assuming displacement_string_start and
11516 displacement_string_end are meaningful. */
11517 if (displacement_string_start != displacement_string_end)
11518 {
11519 if (!i386_displacement (displacement_string_start,
11520 displacement_string_end))
11521 return 0;
11522 }
11523
11524 /* Special case for (%dx) while doing input/output op. */
11525 if (i.base_reg
11526 && i.base_reg->reg_type.bitfield.instance == RegD
11527 && i.base_reg->reg_type.bitfield.word
11528 && i.index_reg == 0
11529 && i.log2_scale_factor == 0
11530 && i.seg[i.mem_operands] == 0
11531 && !operand_type_check (i.types[this_operand], disp))
11532 {
11533 i.types[this_operand] = i.base_reg->reg_type;
11534 return 1;
11535 }
11536
11537 if (i386_index_check (operand_string) == 0)
11538 return 0;
11539 i.flags[this_operand] |= Operand_Mem;
11540 if (i.mem_operands == 0)
11541 i.memop1_string = xstrdup (operand_string);
11542 i.mem_operands++;
11543 }
11544 else
11545 {
11546 /* It's not a memory operand; argh! */
11547 as_bad (_("invalid char %s beginning operand %d `%s'"),
11548 output_invalid (*op_string),
11549 this_operand + 1,
11550 op_string);
11551 return 0;
11552 }
11553 return 1; /* Normal return. */
11554 }
11555 \f
11556 /* Calculate the maximum variable size (i.e., excluding fr_fix)
11557 that an rs_machine_dependent frag may reach. */
11558
11559 unsigned int
11560 i386_frag_max_var (fragS *frag)
11561 {
11562 /* The only relaxable frags are for jumps.
11563 Unconditional jumps can grow by 4 bytes and others by 5 bytes. */
11564 gas_assert (frag->fr_type == rs_machine_dependent);
11565 return TYPE_FROM_RELAX_STATE (frag->fr_subtype) == UNCOND_JUMP ? 4 : 5;
11566 }
11567
11568 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
11569 static int
11570 elf_symbol_resolved_in_segment_p (symbolS *fr_symbol, offsetT fr_var)
11571 {
11572 /* STT_GNU_IFUNC symbol must go through PLT. */
11573 if ((symbol_get_bfdsym (fr_symbol)->flags
11574 & BSF_GNU_INDIRECT_FUNCTION) != 0)
11575 return 0;
11576
11577 if (!S_IS_EXTERNAL (fr_symbol))
11578 /* Symbol may be weak or local. */
11579 return !S_IS_WEAK (fr_symbol);
11580
11581 /* Global symbols with non-default visibility can't be preempted. */
11582 if (ELF_ST_VISIBILITY (S_GET_OTHER (fr_symbol)) != STV_DEFAULT)
11583 return 1;
11584
11585 if (fr_var != NO_RELOC)
11586 switch ((enum bfd_reloc_code_real) fr_var)
11587 {
11588 case BFD_RELOC_386_PLT32:
11589 case BFD_RELOC_X86_64_PLT32:
11590 /* Symbol with PLT relocation may be preempted. */
11591 return 0;
11592 default:
11593 abort ();
11594 }
11595
11596 /* Global symbols with default visibility in a shared library may be
11597 preempted by another definition. */
11598 return !shared;
11599 }
11600 #endif
11601
11602 /* Table 3-2. Macro-Fusible Instructions in Haswell Microarchitecture
11603    Note: this also works for Skylake and Cascadelake.
11604 ---------------------------------------------------------------------
11605 | JCC | ADD/SUB/CMP | INC/DEC | TEST/AND |
11606 | ------ | ----------- | ------- | -------- |
11607 | Jo | N | N | Y |
11608 | Jno | N | N | Y |
11609 | Jc/Jb | Y | N | Y |
11610 | Jae/Jnb | Y | N | Y |
11611 | Je/Jz | Y | Y | Y |
11612 | Jne/Jnz | Y | Y | Y |
11613 | Jna/Jbe | Y | N | Y |
11614 | Ja/Jnbe | Y | N | Y |
11615 | Js | N | N | Y |
11616 | Jns | N | N | Y |
11617 | Jp/Jpe | N | N | Y |
11618 | Jnp/Jpo | N | N | Y |
11619 | Jl/Jnge | Y | Y | Y |
11620 | Jge/Jnl | Y | Y | Y |
11621 | Jle/Jng | Y | Y | Y |
11622 | Jg/Jnle | Y | Y | Y |
11623 --------------------------------------------------------------------- */
11624 static int
11625 i386_macro_fusible_p (enum mf_cmp_kind mf_cmp, enum mf_jcc_kind mf_jcc)
11626 {
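  /* Each mf_jcc_* value covers a Jcc condition together with its
     complement; the paired rows in the table above are identical.  */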
11627 if (mf_cmp == mf_cmp_alu_cmp)
11628 return ((mf_jcc >= mf_jcc_jc && mf_jcc <= mf_jcc_jna)
11629 || mf_jcc == mf_jcc_jl || mf_jcc == mf_jcc_jle);
11630 if (mf_cmp == mf_cmp_incdec)
11631 return (mf_jcc == mf_jcc_je || mf_jcc == mf_jcc_jl
11632 || mf_jcc == mf_jcc_jle);
11633 if (mf_cmp == mf_cmp_test_and)
11634 return 1;
11635 return 0;
11636 }
11637
11638 /* Return the next non-empty frag. */
11639
11640 static fragS *
11641 i386_next_non_empty_frag (fragS *fragP)
11642 {
11643 /* There may be a frag with a ".fill 0" when there is no room in
11644 the current frag for frag_grow in output_insn. */
11645 for (fragP = fragP->fr_next;
11646 (fragP != NULL
11647 && fragP->fr_type == rs_fill
11648 && fragP->fr_fix == 0);
11649 fragP = fragP->fr_next)
11650 ;
11651 return fragP;
11652 }
11653
11654 /* Return the fusible jcc frag following the BRANCH_PADDING frag, or NULL.  */
11655
11656 static fragS *
11657 i386_next_fusible_jcc_frag (fragS *maybe_cmp_fragP, fragS *pad_fragP)
11658 {
11659 fragS *branch_fragP;
11660 if (!pad_fragP)
11661 return NULL;
11662
11663 if (pad_fragP->fr_type == rs_machine_dependent
11664 && (TYPE_FROM_RELAX_STATE (pad_fragP->fr_subtype)
11665 == BRANCH_PADDING))
11666 {
11667 branch_fragP = i386_next_non_empty_frag (pad_fragP);
11668 if (branch_fragP->fr_type != rs_machine_dependent)
11669 return NULL;
11670 if (TYPE_FROM_RELAX_STATE (branch_fragP->fr_subtype) == COND_JUMP
11671 && i386_macro_fusible_p (maybe_cmp_fragP->tc_frag_data.mf_type,
11672 pad_fragP->tc_frag_data.mf_type))
11673 return branch_fragP;
11674 }
11675
11676 return NULL;
11677 }
11678
11679 /* Classify BRANCH_PADDING, BRANCH_PREFIX and FUSED_JCC_PADDING frags. */
11680
11681 static void
11682 i386_classify_machine_dependent_frag (fragS *fragP)
11683 {
11684 fragS *cmp_fragP;
11685 fragS *pad_fragP;
11686 fragS *branch_fragP;
11687 fragS *next_fragP;
11688 unsigned int max_prefix_length;
11689
11690 if (fragP->tc_frag_data.classified)
11691 return;
11692
11693 /* First scan for BRANCH_PADDING and FUSED_JCC_PADDING. Convert
11694 FUSED_JCC_PADDING and merge BRANCH_PADDING. */
11695 for (next_fragP = fragP;
11696 next_fragP != NULL;
11697 next_fragP = next_fragP->fr_next)
11698 {
11699 next_fragP->tc_frag_data.classified = 1;
11700 if (next_fragP->fr_type == rs_machine_dependent)
11701 switch (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype))
11702 {
11703 case BRANCH_PADDING:
11704 /* The BRANCH_PADDING frag must be followed by a branch
11705 frag. */
11706 branch_fragP = i386_next_non_empty_frag (next_fragP);
11707 next_fragP->tc_frag_data.u.branch_fragP = branch_fragP;
11708 break;
11709 case FUSED_JCC_PADDING:
11710 /* Check if this is a fused jcc:
11711 FUSED_JCC_PADDING
11712 CMP like instruction
11713 BRANCH_PADDING
11714 COND_JUMP
11715 */
11716 cmp_fragP = i386_next_non_empty_frag (next_fragP);
11717 pad_fragP = i386_next_non_empty_frag (cmp_fragP);
11718 branch_fragP = i386_next_fusible_jcc_frag (next_fragP, pad_fragP);
11719 if (branch_fragP)
11720 {
11721 /* The BRANCH_PADDING frag is merged with the
11722 FUSED_JCC_PADDING frag. */
11723 next_fragP->tc_frag_data.u.branch_fragP = branch_fragP;
11724 /* CMP like instruction size. */
11725 next_fragP->tc_frag_data.cmp_size = cmp_fragP->fr_fix;
11726 frag_wane (pad_fragP);
11727 /* Skip to branch_fragP. */
11728 next_fragP = branch_fragP;
11729 }
11730 else if (next_fragP->tc_frag_data.max_prefix_length)
11731 {
11732 /* Turn FUSED_JCC_PADDING into BRANCH_PREFIX if it isn't
11733 a fused jcc. */
11734 next_fragP->fr_subtype
11735 = ENCODE_RELAX_STATE (BRANCH_PREFIX, 0);
11736 next_fragP->tc_frag_data.max_bytes
11737 = next_fragP->tc_frag_data.max_prefix_length;
11738 /* This will be updated in the BRANCH_PREFIX scan. */
11739 next_fragP->tc_frag_data.max_prefix_length = 0;
11740 }
11741 else
11742 frag_wane (next_fragP);
11743 break;
11744 }
11745 }
11746
11747 /* Stop if there is no BRANCH_PREFIX. */
11748 if (!align_branch_prefix_size)
11749 return;
11750
11751 /* Scan for BRANCH_PREFIX. */
11752 for (; fragP != NULL; fragP = fragP->fr_next)
11753 {
11754 if (fragP->fr_type != rs_machine_dependent
11755 || (TYPE_FROM_RELAX_STATE (fragP->fr_subtype)
11756 != BRANCH_PREFIX))
11757 continue;
11758
11759       /* Count all BRANCH_PREFIX frags before BRANCH_PADDING and
11760 	 FUSED_JCC_PADDING.  */
11761 max_prefix_length = 0;
11762 for (next_fragP = fragP;
11763 next_fragP != NULL;
11764 next_fragP = next_fragP->fr_next)
11765 {
11766 if (next_fragP->fr_type == rs_fill)
11767 /* Skip rs_fill frags. */
11768 continue;
11769 else if (next_fragP->fr_type != rs_machine_dependent)
11770 /* Stop for all other frags. */
11771 break;
11772
11773 /* rs_machine_dependent frags. */
11774 if (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
11775 == BRANCH_PREFIX)
11776 {
11777 /* Count BRANCH_PREFIX frags. */
11778 if (max_prefix_length >= MAX_FUSED_JCC_PADDING_SIZE)
11779 {
11780 max_prefix_length = MAX_FUSED_JCC_PADDING_SIZE;
11781 frag_wane (next_fragP);
11782 }
11783 else
11784 max_prefix_length
11785 += next_fragP->tc_frag_data.max_bytes;
11786 }
11787 else if ((TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
11788 == BRANCH_PADDING)
11789 || (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
11790 == FUSED_JCC_PADDING))
11791 {
11792 /* Stop at BRANCH_PADDING and FUSED_JCC_PADDING. */
11793 fragP->tc_frag_data.u.padding_fragP = next_fragP;
11794 break;
11795 }
11796 else
11797 /* Stop for other rs_machine_dependent frags. */
11798 break;
11799 }
11800
11801 fragP->tc_frag_data.max_prefix_length = max_prefix_length;
11802
11803 /* Skip to the next frag. */
11804 fragP = next_fragP;
11805 }
11806 }
11807
11808 /* Compute padding size for
11809
11810 FUSED_JCC_PADDING
11811 CMP like instruction
11812 BRANCH_PADDING
11813 COND_JUMP/UNCOND_JUMP
11814
11815 or
11816
11817 BRANCH_PADDING
11818 COND_JUMP/UNCOND_JUMP
11819 */
11820
11821 static int
11822 i386_branch_padding_size (fragS *fragP, offsetT address)
11823 {
11824 unsigned int offset, size, padding_size;
11825 fragS *branch_fragP = fragP->tc_frag_data.u.branch_fragP;
11826
11827 /* The start address of the BRANCH_PADDING or FUSED_JCC_PADDING frag. */
11828 if (!address)
11829 address = fragP->fr_address;
11830 address += fragP->fr_fix;
11831
11832   /* CMP like instruction size.  */
11833 size = fragP->tc_frag_data.cmp_size;
11834
11835 /* The base size of the branch frag. */
11836 size += branch_fragP->fr_fix;
11837
11838 /* Add opcode and displacement bytes for the rs_machine_dependent
11839 branch frag. */
11840 if (branch_fragP->fr_type == rs_machine_dependent)
11841 size += md_relax_table[branch_fragP->fr_subtype].rlx_length;
11842
11843 /* Check if branch is within boundary and doesn't end at the last
11844 byte. */
11845 offset = address & ((1U << align_branch_power) - 1);
11846 if ((offset + size) >= (1U << align_branch_power))
11847 /* Padding needed to avoid crossing boundary. */
11848 padding_size = (1U << align_branch_power) - offset;
11849 else
11850 /* No padding needed. */
11851 padding_size = 0;
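  /* E.g. with align_branch_power == 5 (32-byte boundary), a 4-byte
     branch starting at offset 30 would cross the boundary, so
     padding_size = 32 - 30 = 2 moves it to the next boundary.  */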
11852
11853   /* The return value may be saved in tc_frag_data.length, which is
11854      an unsigned byte.  */
11855 if (!fits_in_unsigned_byte (padding_size))
11856 abort ();
11857
11858 return padding_size;
11859 }
11860
11861 /* i386_generic_table_relax_frag()
11862
11863 Handle BRANCH_PADDING, BRANCH_PREFIX and FUSED_JCC_PADDING frags to
11864 grow/shrink padding to align branch frags. Hand others to
11865 relax_frag(). */
11866
11867 long
11868 i386_generic_table_relax_frag (segT segment, fragS *fragP, long stretch)
11869 {
11870 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PADDING
11871 || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == FUSED_JCC_PADDING)
11872 {
11873 long padding_size = i386_branch_padding_size (fragP, 0);
11874 long grow = padding_size - fragP->tc_frag_data.length;
11875
11876 /* When the BRANCH_PREFIX frag is used, the computed address
11877 must match the actual address and there should be no padding. */
11878 if (fragP->tc_frag_data.padding_address
11879 && (fragP->tc_frag_data.padding_address != fragP->fr_address
11880 || padding_size))
11881 abort ();
11882
11883 /* Update the padding size. */
11884 if (grow)
11885 fragP->tc_frag_data.length = padding_size;
11886
11887 return grow;
11888 }
11889 else if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PREFIX)
11890 {
11891 fragS *padding_fragP, *next_fragP;
11892 long padding_size, left_size, last_size;
11893
11894 padding_fragP = fragP->tc_frag_data.u.padding_fragP;
11895 if (!padding_fragP)
11896 /* Use the padding set by the leading BRANCH_PREFIX frag. */
11897 return (fragP->tc_frag_data.length
11898 - fragP->tc_frag_data.last_length);
11899
11900       /* Compute the relative address of the padding frag the first
11901 	 time through, when the BRANCH_PREFIX frag sizes are zero.  */
11902 if (!fragP->tc_frag_data.padding_address)
11903 fragP->tc_frag_data.padding_address
11904 = padding_fragP->fr_address - (fragP->fr_address - stretch);
11905
11906       /* First update the last length from the previous iteration.  */
11907 left_size = fragP->tc_frag_data.prefix_length;
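      /* Hand the prefix bytes chosen last time out to the BRANCH_PREFIX
	 frags preceding the padding frag, each taking at most its
	 max_bytes share.  */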
11908 for (next_fragP = fragP;
11909 next_fragP != padding_fragP;
11910 next_fragP = next_fragP->fr_next)
11911 if (next_fragP->fr_type == rs_machine_dependent
11912 && (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
11913 == BRANCH_PREFIX))
11914 {
11915 if (left_size)
11916 {
11917 int max = next_fragP->tc_frag_data.max_bytes;
11918 if (max)
11919 {
11920 int size;
11921 if (max > left_size)
11922 size = left_size;
11923 else
11924 size = max;
11925 left_size -= size;
11926 next_fragP->tc_frag_data.last_length = size;
11927 }
11928 }
11929 else
11930 next_fragP->tc_frag_data.last_length = 0;
11931 }
11932
11933 /* Check the padding size for the padding frag. */
11934 padding_size = i386_branch_padding_size
11935 (padding_fragP, (fragP->fr_address
11936 + fragP->tc_frag_data.padding_address));
11937
11938 last_size = fragP->tc_frag_data.prefix_length;
11939       /* Check if there is a change from the last iteration.  */
11940 if (padding_size == last_size)
11941 {
11942 /* Update the expected address of the padding frag. */
11943 padding_fragP->tc_frag_data.padding_address
11944 = (fragP->fr_address + padding_size
11945 + fragP->tc_frag_data.padding_address);
11946 return 0;
11947 }
11948
11949 if (padding_size > fragP->tc_frag_data.max_prefix_length)
11950 {
11951 	  /* No padding if there is insufficient room.  Clear the
11952 	     expected address of the padding frag.  */
11953 padding_fragP->tc_frag_data.padding_address = 0;
11954 padding_size = 0;
11955 }
11956 else
11957 /* Store the expected address of the padding frag. */
11958 padding_fragP->tc_frag_data.padding_address
11959 = (fragP->fr_address + padding_size
11960 + fragP->tc_frag_data.padding_address);
11961
11962 fragP->tc_frag_data.prefix_length = padding_size;
11963
11964       /* Update the length for the current iteration.  */
11965 left_size = padding_size;
11966 for (next_fragP = fragP;
11967 next_fragP != padding_fragP;
11968 next_fragP = next_fragP->fr_next)
11969 if (next_fragP->fr_type == rs_machine_dependent
11970 && (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
11971 == BRANCH_PREFIX))
11972 {
11973 if (left_size)
11974 {
11975 int max = next_fragP->tc_frag_data.max_bytes;
11976 if (max)
11977 {
11978 int size;
11979 if (max > left_size)
11980 size = left_size;
11981 else
11982 size = max;
11983 left_size -= size;
11984 next_fragP->tc_frag_data.length = size;
11985 }
11986 }
11987 else
11988 next_fragP->tc_frag_data.length = 0;
11989 }
11990
11991 return (fragP->tc_frag_data.length
11992 - fragP->tc_frag_data.last_length);
11993 }
11994 return relax_frag (segment, fragP, stretch);
11995 }
11996
11997 /* md_estimate_size_before_relax()
11998
11999 Called just before relax() for rs_machine_dependent frags. The x86
12000 assembler uses these frags to handle variable size jump
12001 instructions.
12002
12003 Any symbol that is now undefined will not become defined.
12004 Return the correct fr_subtype in the frag.
12005 Return the initial "guess for variable size of frag" to caller.
12006 The guess is actually the growth beyond the fixed part. Whatever
12007 we do to grow the fixed or variable part contributes to our
12008 returned value. */
12009
12010 int
12011 md_estimate_size_before_relax (fragS *fragP, segT segment)
12012 {
12013 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PADDING
12014 || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PREFIX
12015 || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == FUSED_JCC_PADDING)
12016 {
12017 i386_classify_machine_dependent_frag (fragP);
12018 return fragP->tc_frag_data.length;
12019 }
12020
12021 /* We've already got fragP->fr_subtype right; all we have to do is
12022 check for un-relaxable symbols. On an ELF system, we can't relax
12023 an externally visible symbol, because it may be overridden by a
12024 shared library. */
12025 if (S_GET_SEGMENT (fragP->fr_symbol) != segment
12026 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12027 || (IS_ELF
12028 && !elf_symbol_resolved_in_segment_p (fragP->fr_symbol,
12029 fragP->fr_var))
12030 #endif
12031 #if defined (OBJ_COFF) && defined (TE_PE)
12032 || (OUTPUT_FLAVOR == bfd_target_coff_flavour
12033 && S_IS_WEAK (fragP->fr_symbol))
12034 #endif
12035 )
12036 {
12037 /* Symbol is undefined in this segment, or we need to keep a
12038 reloc so that weak symbols can be overridden. */
12039 int size = (fragP->fr_subtype & CODE16) ? 2 : 4;
12040 enum bfd_reloc_code_real reloc_type;
12041 unsigned char *opcode;
12042 int old_fr_fix;
12043
12044 if (fragP->fr_var != NO_RELOC)
12045 reloc_type = (enum bfd_reloc_code_real) fragP->fr_var;
12046 else if (size == 2)
12047 reloc_type = BFD_RELOC_16_PCREL;
12048 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12049 else if (need_plt32_p (fragP->fr_symbol))
12050 reloc_type = BFD_RELOC_X86_64_PLT32;
12051 #endif
12052 else
12053 reloc_type = BFD_RELOC_32_PCREL;
12054
12055 old_fr_fix = fragP->fr_fix;
12056 opcode = (unsigned char *) fragP->fr_opcode;
12057
12058 switch (TYPE_FROM_RELAX_STATE (fragP->fr_subtype))
12059 {
12060 case UNCOND_JUMP:
12061 /* Make jmp (0xeb) a (d)word displacement jump. */
12062 opcode[0] = 0xe9;
12063 fragP->fr_fix += size;
12064 fix_new (fragP, old_fr_fix, size,
12065 fragP->fr_symbol,
12066 fragP->fr_offset, 1,
12067 reloc_type);
12068 break;
12069
12070 case COND_JUMP86:
12071 if (size == 2
12072 && (!no_cond_jump_promotion || fragP->fr_var != NO_RELOC))
12073 {
12074 /* Negate the condition, and branch past an
12075 unconditional jump. */
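	      /* E.g. "je label" (0x74 disp8) becomes:
		   0x75 0x03    jne  .+3   (skip the 3-byte jmp below)
		   0xe9 rel16   jmp  label  */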
12076 opcode[0] ^= 1;
12077 opcode[1] = 3;
12078 /* Insert an unconditional jump. */
12079 opcode[2] = 0xe9;
12080 /* We added two extra opcode bytes, and have a two byte
12081 offset. */
12082 fragP->fr_fix += 2 + 2;
12083 fix_new (fragP, old_fr_fix + 2, 2,
12084 fragP->fr_symbol,
12085 fragP->fr_offset, 1,
12086 reloc_type);
12087 break;
12088 }
12089 /* Fall through. */
12090
12091 case COND_JUMP:
12092 if (no_cond_jump_promotion && fragP->fr_var == NO_RELOC)
12093 {
12094 fixS *fixP;
12095
12096 fragP->fr_fix += 1;
12097 fixP = fix_new (fragP, old_fr_fix, 1,
12098 fragP->fr_symbol,
12099 fragP->fr_offset, 1,
12100 BFD_RELOC_8_PCREL);
12101 fixP->fx_signed = 1;
12102 break;
12103 }
12104
12105 /* This changes the byte-displacement jump 0x7N
12106 to the (d)word-displacement jump 0x0f,0x8N. */
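	  /* E.g. "je" (0x74) becomes 0x0f 0x84 followed by the (d)word
	     displacement.  */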
12107 opcode[1] = opcode[0] + 0x10;
12108 opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
12109 /* We've added an opcode byte. */
12110 fragP->fr_fix += 1 + size;
12111 fix_new (fragP, old_fr_fix + 1, size,
12112 fragP->fr_symbol,
12113 fragP->fr_offset, 1,
12114 reloc_type);
12115 break;
12116
12117 default:
12118 BAD_CASE (fragP->fr_subtype);
12119 break;
12120 }
12121 frag_wane (fragP);
12122 return fragP->fr_fix - old_fr_fix;
12123 }
12124
12125 /* Guess size depending on current relax state. Initially the relax
12126 state will correspond to a short jump and we return 1, because
12127 the variable part of the frag (the branch offset) is one byte
12128 long. However, we can relax a section more than once and in that
12129 case we must either set fr_subtype back to the unrelaxed state,
12130 or return the value for the appropriate branch. */
12131 return md_relax_table[fragP->fr_subtype].rlx_length;
12132 }
12133
12134 /* Called after relax() is finished.
12135
12136 In: Address of frag.
12137 fr_type == rs_machine_dependent.
12138 fr_subtype is what the address relaxed to.
12139
12140 Out: Any fixSs and constants are set up.
12141 Caller will turn frag into a ".space 0". */
12142
12143 void
12144 md_convert_frag (bfd *abfd ATTRIBUTE_UNUSED, segT sec ATTRIBUTE_UNUSED,
12145 fragS *fragP)
12146 {
12147 unsigned char *opcode;
12148 unsigned char *where_to_put_displacement = NULL;
12149 offsetT target_address;
12150 offsetT opcode_address;
12151 unsigned int extension = 0;
12152 offsetT displacement_from_opcode_start;
12153
12154 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PADDING
12155 || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == FUSED_JCC_PADDING
12156 || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PREFIX)
12157 {
12158 /* Generate nop padding. */
12159 unsigned int size = fragP->tc_frag_data.length;
12160 if (size)
12161 {
12162 if (size > fragP->tc_frag_data.max_bytes)
12163 abort ();
12164
12165 if (flag_debug)
12166 {
12167 const char *msg;
12168 const char *branch = "branch";
12169 const char *prefix = "";
12170 fragS *padding_fragP;
12171 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype)
12172 == BRANCH_PREFIX)
12173 {
12174 padding_fragP = fragP->tc_frag_data.u.padding_fragP;
12175 switch (fragP->tc_frag_data.default_prefix)
12176 {
12177 default:
12178 abort ();
12179 break;
12180 case CS_PREFIX_OPCODE:
12181 prefix = " cs";
12182 break;
12183 case DS_PREFIX_OPCODE:
12184 prefix = " ds";
12185 break;
12186 case ES_PREFIX_OPCODE:
12187 prefix = " es";
12188 break;
12189 case FS_PREFIX_OPCODE:
12190 prefix = " fs";
12191 break;
12192 case GS_PREFIX_OPCODE:
12193 prefix = " gs";
12194 break;
12195 case SS_PREFIX_OPCODE:
12196 prefix = " ss";
12197 break;
12198 }
12199 if (padding_fragP)
12200 msg = _("%s:%u: add %d%s at 0x%llx to align "
12201 "%s within %d-byte boundary\n");
12202 else
12203 msg = _("%s:%u: add additional %d%s at 0x%llx to "
12204 "align %s within %d-byte boundary\n");
12205 }
12206 else
12207 {
12208 padding_fragP = fragP;
12209 msg = _("%s:%u: add %d%s-byte nop at 0x%llx to align "
12210 "%s within %d-byte boundary\n");
12211 }
12212
12213 if (padding_fragP)
12214 switch (padding_fragP->tc_frag_data.branch_type)
12215 {
12216 case align_branch_jcc:
12217 branch = "jcc";
12218 break;
12219 case align_branch_fused:
12220 branch = "fused jcc";
12221 break;
12222 case align_branch_jmp:
12223 branch = "jmp";
12224 break;
12225 case align_branch_call:
12226 branch = "call";
12227 break;
12228 case align_branch_indirect:
12229 		      branch = "indirect branch";
12230 break;
12231 case align_branch_ret:
12232 branch = "ret";
12233 break;
12234 default:
12235 break;
12236 }
12237
12238 fprintf (stdout, msg,
12239 fragP->fr_file, fragP->fr_line, size, prefix,
12240 (long long) fragP->fr_address, branch,
12241 1 << align_branch_power);
12242 }
12243 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PREFIX)
12244 memset (fragP->fr_opcode,
12245 fragP->tc_frag_data.default_prefix, size);
12246 else
12247 i386_generate_nops (fragP, (char *) fragP->fr_opcode,
12248 size, 0);
12249 fragP->fr_fix += size;
12250 }
12251 return;
12252 }
12253
12254 opcode = (unsigned char *) fragP->fr_opcode;
12255
12256 /* Address we want to reach in file space. */
12257 target_address = S_GET_VALUE (fragP->fr_symbol) + fragP->fr_offset;
12258
12259 /* Address opcode resides at in file space. */
12260 opcode_address = fragP->fr_address + fragP->fr_fix;
12261
12262 /* Displacement from opcode start to fill into instruction. */
12263 displacement_from_opcode_start = target_address - opcode_address;
12264
12265 if ((fragP->fr_subtype & BIG) == 0)
12266 {
12267 /* Don't have to change opcode. */
12268 extension = 1; /* 1 opcode + 1 displacement */
12269 where_to_put_displacement = &opcode[1];
12270 }
12271 else
12272 {
12273 if (no_cond_jump_promotion
12274 && TYPE_FROM_RELAX_STATE (fragP->fr_subtype) != UNCOND_JUMP)
12275 as_warn_where (fragP->fr_file, fragP->fr_line,
12276 _("long jump required"));
12277
12278 switch (fragP->fr_subtype)
12279 {
12280 case ENCODE_RELAX_STATE (UNCOND_JUMP, BIG):
12281 extension = 4; /* 1 opcode + 4 displacement */
12282 opcode[0] = 0xe9;
12283 where_to_put_displacement = &opcode[1];
12284 break;
12285
12286 case ENCODE_RELAX_STATE (UNCOND_JUMP, BIG16):
12287 extension = 2; /* 1 opcode + 2 displacement */
12288 opcode[0] = 0xe9;
12289 where_to_put_displacement = &opcode[1];
12290 break;
12291
12292 case ENCODE_RELAX_STATE (COND_JUMP, BIG):
12293 case ENCODE_RELAX_STATE (COND_JUMP86, BIG):
12294 extension = 5; /* 2 opcode + 4 displacement */
12295 opcode[1] = opcode[0] + 0x10;
12296 opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
12297 where_to_put_displacement = &opcode[2];
12298 break;
12299
12300 case ENCODE_RELAX_STATE (COND_JUMP, BIG16):
12301 extension = 3; /* 2 opcode + 2 displacement */
12302 opcode[1] = opcode[0] + 0x10;
12303 opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
12304 where_to_put_displacement = &opcode[2];
12305 break;
12306
12307 case ENCODE_RELAX_STATE (COND_JUMP86, BIG16):
12308 extension = 4;
12309 opcode[0] ^= 1;
12310 opcode[1] = 3;
12311 opcode[2] = 0xe9;
12312 where_to_put_displacement = &opcode[3];
12313 break;
12314
12315 default:
12316 BAD_CASE (fragP->fr_subtype);
12317 break;
12318 }
12319 }
12320
12321   /* If the size is less than four, we are sure that the operand fits,
12322      but if it is 4, the displacement could be larger than
12323      +/- 2GB.  */
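  /* Biasing by 1 << 31 maps the valid signed 32-bit range onto
     [0, 0xffffffff], so a single unsigned comparison checks both
     bounds.  */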
12324 if (DISP_SIZE_FROM_RELAX_STATE (fragP->fr_subtype) == 4
12325 && object_64bit
12326 && ((addressT) (displacement_from_opcode_start - extension
12327 + ((addressT) 1 << 31))
12328 > (((addressT) 2 << 31) - 1)))
12329 {
12330 as_bad_where (fragP->fr_file, fragP->fr_line,
12331 _("jump target out of range"));
12332 /* Make us emit 0. */
12333 displacement_from_opcode_start = extension;
12334 }
12335 /* Now put displacement after opcode. */
12336 md_number_to_chars ((char *) where_to_put_displacement,
12337 (valueT) (displacement_from_opcode_start - extension),
12338 DISP_SIZE_FROM_RELAX_STATE (fragP->fr_subtype));
12339 fragP->fr_fix += extension;
12340 }
12341 \f
12342 /* Apply a fixup (fixP) to segment data, once it has been determined
12343 by our caller that we have all the info we need to fix it up.
12344
12345 Parameter valP is the pointer to the value of the bits.
12346
12347 On the 386, immediates, displacements, and data pointers are all in
12348 the same (little-endian) format, so we don't need to care about which
12349 we are handling. */
12350
12351 void
12352 md_apply_fix (fixS *fixP, valueT *valP, segT seg ATTRIBUTE_UNUSED)
12353 {
12354 char *p = fixP->fx_where + fixP->fx_frag->fr_literal;
12355 valueT value = *valP;
12356
12357 #if !defined (TE_Mach)
12358 if (fixP->fx_pcrel)
12359 {
12360 switch (fixP->fx_r_type)
12361 {
12362 default:
12363 break;
12364
12365 case BFD_RELOC_64:
12366 fixP->fx_r_type = BFD_RELOC_64_PCREL;
12367 break;
12368 case BFD_RELOC_32:
12369 case BFD_RELOC_X86_64_32S:
12370 fixP->fx_r_type = BFD_RELOC_32_PCREL;
12371 break;
12372 case BFD_RELOC_16:
12373 fixP->fx_r_type = BFD_RELOC_16_PCREL;
12374 break;
12375 case BFD_RELOC_8:
12376 fixP->fx_r_type = BFD_RELOC_8_PCREL;
12377 break;
12378 }
12379 }
12380
12381 if (fixP->fx_addsy != NULL
12382 && (fixP->fx_r_type == BFD_RELOC_32_PCREL
12383 || fixP->fx_r_type == BFD_RELOC_64_PCREL
12384 || fixP->fx_r_type == BFD_RELOC_16_PCREL
12385 || fixP->fx_r_type == BFD_RELOC_8_PCREL)
12386 && !use_rela_relocations)
12387 {
12388 /* This is a hack. There should be a better way to handle this.
12389 This covers for the fact that bfd_install_relocation will
12390 subtract the current location (for partial_inplace, PC relative
12391 relocations); see more below. */
12392 #ifndef OBJ_AOUT
12393 if (IS_ELF
12394 #ifdef TE_PE
12395 || OUTPUT_FLAVOR == bfd_target_coff_flavour
12396 #endif
12397 )
12398 value += fixP->fx_where + fixP->fx_frag->fr_address;
12399 #endif
12400 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12401 if (IS_ELF)
12402 {
12403 segT sym_seg = S_GET_SEGMENT (fixP->fx_addsy);
12404
12405 if ((sym_seg == seg
12406 || (symbol_section_p (fixP->fx_addsy)
12407 && sym_seg != absolute_section))
12408 && !generic_force_reloc (fixP))
12409 {
12410 /* Yes, we add the values in twice. This is because
12411 bfd_install_relocation subtracts them out again. I think
12412 bfd_install_relocation is broken, but I don't dare change
12413 it. FIXME. */
12414 value += fixP->fx_where + fixP->fx_frag->fr_address;
12415 }
12416 }
12417 #endif
12418 #if defined (OBJ_COFF) && defined (TE_PE)
12419 /* For some reason, the PE format does not store a
12420 section address offset for a PC relative symbol. */
12421 if (S_GET_SEGMENT (fixP->fx_addsy) != seg
12422 || S_IS_WEAK (fixP->fx_addsy))
12423 value += md_pcrel_from (fixP);
12424 #endif
12425 }
12426 #if defined (OBJ_COFF) && defined (TE_PE)
12427 if (fixP->fx_addsy != NULL
12428 && S_IS_WEAK (fixP->fx_addsy)
12429 /* PR 16858: Do not modify weak function references. */
12430 && ! fixP->fx_pcrel)
12431 {
12432 #if !defined (TE_PEP)
12433 /* For x86 PE weak function symbols are neither PC-relative
12434 nor do they set S_IS_FUNCTION. So the only reliable way
12435 to detect them is to check the flags of their containing
12436 section. */
12437 if (S_GET_SEGMENT (fixP->fx_addsy) != NULL
12438 && S_GET_SEGMENT (fixP->fx_addsy)->flags & SEC_CODE)
12439 ;
12440 else
12441 #endif
12442 value -= S_GET_VALUE (fixP->fx_addsy);
12443 }
12444 #endif
12445
12446 /* Fix a few things - the dynamic linker expects certain values here,
12447 and we must not disappoint it. */
12448 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12449 if (IS_ELF && fixP->fx_addsy)
12450 switch (fixP->fx_r_type)
12451 {
12452 case BFD_RELOC_386_PLT32:
12453 case BFD_RELOC_X86_64_PLT32:
12454 /* Make the jump instruction point to the address of the operand.
12455 At runtime we merely add the offset to the actual PLT entry.
12456 NB: Subtract the offset size only for jump instructions. */
12457 if (fixP->fx_pcrel)
12458 value = -4;
12459 break;
12460
12461 case BFD_RELOC_386_TLS_GD:
12462 case BFD_RELOC_386_TLS_LDM:
12463 case BFD_RELOC_386_TLS_IE_32:
12464 case BFD_RELOC_386_TLS_IE:
12465 case BFD_RELOC_386_TLS_GOTIE:
12466 case BFD_RELOC_386_TLS_GOTDESC:
12467 case BFD_RELOC_X86_64_TLSGD:
12468 case BFD_RELOC_X86_64_TLSLD:
12469 case BFD_RELOC_X86_64_GOTTPOFF:
12470 case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
12471 value = 0; /* Fully resolved at runtime. No addend. */
12472 /* Fallthrough */
12473 case BFD_RELOC_386_TLS_LE:
12474 case BFD_RELOC_386_TLS_LDO_32:
12475 case BFD_RELOC_386_TLS_LE_32:
12476 case BFD_RELOC_X86_64_DTPOFF32:
12477 case BFD_RELOC_X86_64_DTPOFF64:
12478 case BFD_RELOC_X86_64_TPOFF32:
12479 case BFD_RELOC_X86_64_TPOFF64:
12480 S_SET_THREAD_LOCAL (fixP->fx_addsy);
12481 break;
12482
12483 case BFD_RELOC_386_TLS_DESC_CALL:
12484 case BFD_RELOC_X86_64_TLSDESC_CALL:
12485 value = 0; /* Fully resolved at runtime. No addend. */
12486 S_SET_THREAD_LOCAL (fixP->fx_addsy);
12487 fixP->fx_done = 0;
12488 return;
12489
12490 case BFD_RELOC_VTABLE_INHERIT:
12491 case BFD_RELOC_VTABLE_ENTRY:
12492 fixP->fx_done = 0;
12493 return;
12494
12495 default:
12496 break;
12497 }
12498 #endif /* defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) */
12499 *valP = value;
12500 #endif /* !defined (TE_Mach) */
12501
12502 /* Are we finished with this relocation now? */
12503 if (fixP->fx_addsy == NULL)
12504 fixP->fx_done = 1;
12505 #if defined (OBJ_COFF) && defined (TE_PE)
12506 else if (fixP->fx_addsy != NULL && S_IS_WEAK (fixP->fx_addsy))
12507 {
12508 fixP->fx_done = 0;
12509 /* Remember value for tc_gen_reloc. */
12510 fixP->fx_addnumber = value;
12511 /* Clear out the frag for now. */
12512 value = 0;
12513 }
12514 #endif
12515 else if (use_rela_relocations)
12516 {
12517 fixP->fx_no_overflow = 1;
12518 /* Remember value for tc_gen_reloc. */
12519 fixP->fx_addnumber = value;
12520 value = 0;
12521 }
12522
12523 md_number_to_chars (p, value, fixP->fx_size);
12524 }
12525 \f
12526 const char *
12527 md_atof (int type, char *litP, int *sizeP)
12528 {
12529   /* This outputs the LITTLENUMs in REVERSE order;
12530      in accord with the little-endian 386.  */
12531 return ieee_md_atof (type, litP, sizeP, FALSE);
12532 }
12533 \f
12534 static char output_invalid_buf[sizeof (unsigned char) * 2 + 6];
12535
12536 static char *
12537 output_invalid (int c)
12538 {
12539 if (ISPRINT (c))
12540 snprintf (output_invalid_buf, sizeof (output_invalid_buf),
12541 "'%c'", c);
12542 else
12543 snprintf (output_invalid_buf, sizeof (output_invalid_buf),
12544 "(0x%x)", (unsigned char) c);
12545 return output_invalid_buf;
12546 }
12547
12548 /* Verify that @r can be used in the current context. */
12549
12550 static bfd_boolean check_register (const reg_entry *r)
12551 {
12552 if (allow_pseudo_reg)
12553 return TRUE;
12554
12555 if (operand_type_all_zero (&r->reg_type))
12556 return FALSE;
12557
12558 if ((r->reg_type.bitfield.dword
12559 || (r->reg_type.bitfield.class == SReg && r->reg_num > 3)
12560 || r->reg_type.bitfield.class == RegCR
12561 || r->reg_type.bitfield.class == RegDR)
12562 && !cpu_arch_flags.bitfield.cpui386)
12563 return FALSE;
12564
12565 if (r->reg_type.bitfield.class == RegTR
12566 && (flag_code == CODE_64BIT
12567 || !cpu_arch_flags.bitfield.cpui386
12568 || cpu_arch_isa_flags.bitfield.cpui586
12569 || cpu_arch_isa_flags.bitfield.cpui686))
12570 return FALSE;
12571
12572 if (r->reg_type.bitfield.class == RegMMX && !cpu_arch_flags.bitfield.cpummx)
12573 return FALSE;
12574
12575 if (!cpu_arch_flags.bitfield.cpuavx512f)
12576 {
12577 if (r->reg_type.bitfield.zmmword
12578 || r->reg_type.bitfield.class == RegMask)
12579 return FALSE;
12580
12581 if (!cpu_arch_flags.bitfield.cpuavx)
12582 {
12583 if (r->reg_type.bitfield.ymmword)
12584 return FALSE;
12585
12586 if (!cpu_arch_flags.bitfield.cpusse && r->reg_type.bitfield.xmmword)
12587 return FALSE;
12588 }
12589 }
12590
12591 if (r->reg_type.bitfield.tmmword
12592 && (!cpu_arch_flags.bitfield.cpuamx_tile
12593 || flag_code != CODE_64BIT))
12594 return FALSE;
12595
12596 if (r->reg_type.bitfield.class == RegBND && !cpu_arch_flags.bitfield.cpumpx)
12597 return FALSE;
12598
12599   /* Don't allow the fake index register unless allow_index_reg is non-zero.  */
12600 if (!allow_index_reg && r->reg_num == RegIZ)
12601 return FALSE;
12602
12603 /* Upper 16 vector registers are only available with VREX in 64bit
12604 mode, and require EVEX encoding. */
12605 if (r->reg_flags & RegVRex)
12606 {
12607 if (!cpu_arch_flags.bitfield.cpuavx512f
12608 || flag_code != CODE_64BIT)
12609 return FALSE;
12610
12611 if (i.vec_encoding == vex_encoding_default)
12612 i.vec_encoding = vex_encoding_evex;
12613 else if (i.vec_encoding != vex_encoding_evex)
12614 i.vec_encoding = vex_encoding_error;
12615 }
12616
12617 if (((r->reg_flags & (RegRex64 | RegRex)) || r->reg_type.bitfield.qword)
12618 && (!cpu_arch_flags.bitfield.cpulm || r->reg_type.bitfield.class != RegCR)
12619 && flag_code != CODE_64BIT)
12620 return FALSE;
12621
12622 if (r->reg_type.bitfield.class == SReg && r->reg_num == RegFlat
12623 && !intel_syntax)
12624 return FALSE;
12625
12626 return TRUE;
12627 }
12628
12629 /* REG_STRING starts *before* REGISTER_PREFIX. */
12630
12631 static const reg_entry *
12632 parse_real_register (char *reg_string, char **end_op)
12633 {
12634 char *s = reg_string;
12635 char *p;
12636 char reg_name_given[MAX_REG_NAME_SIZE + 1];
12637 const reg_entry *r;
12638
12639 /* Skip possible REGISTER_PREFIX and possible whitespace. */
12640 if (*s == REGISTER_PREFIX)
12641 ++s;
12642
12643 if (is_space_char (*s))
12644 ++s;
12645
12646 p = reg_name_given;
12647 while ((*p++ = register_chars[(unsigned char) *s]) != '\0')
12648 {
12649 if (p >= reg_name_given + MAX_REG_NAME_SIZE)
12650 return (const reg_entry *) NULL;
12651 s++;
12652 }
12653
12654 /* For naked regs, make sure that we are not dealing with an identifier.
12655 This prevents confusing an identifier like `eax_var' with register
12656 `eax'. */
12657 if (allow_naked_reg && identifier_chars[(unsigned char) *s])
12658 return (const reg_entry *) NULL;
12659
12660 *end_op = s;
12661
12662 r = (const reg_entry *) str_hash_find (reg_hash, reg_name_given);
12663
12664 /* Handle floating point regs, allowing spaces in the (i) part. */
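  /* E.g. "%st ( 3 )" is accepted and resolves to st(3).  */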
12665 if (r == i386_regtab /* %st is first entry of table */)
12666 {
12667 if (!cpu_arch_flags.bitfield.cpu8087
12668 && !cpu_arch_flags.bitfield.cpu287
12669 && !cpu_arch_flags.bitfield.cpu387
12670 && !allow_pseudo_reg)
12671 return (const reg_entry *) NULL;
12672
12673 if (is_space_char (*s))
12674 ++s;
12675 if (*s == '(')
12676 {
12677 ++s;
12678 if (is_space_char (*s))
12679 ++s;
12680 if (*s >= '0' && *s <= '7')
12681 {
12682 int fpr = *s - '0';
12683 ++s;
12684 if (is_space_char (*s))
12685 ++s;
12686 if (*s == ')')
12687 {
12688 *end_op = s + 1;
12689 r = (const reg_entry *) str_hash_find (reg_hash, "st(0)");
12690 know (r);
12691 return r + fpr;
12692 }
12693 }
12694 /* We have "%st(" then garbage. */
12695 return (const reg_entry *) NULL;
12696 }
12697 }
12698
12699 return r && check_register (r) ? r : NULL;
12700 }
12701
12702 /* REG_STRING starts *before* REGISTER_PREFIX. */
12703
12704 static const reg_entry *
12705 parse_register (char *reg_string, char **end_op)
12706 {
12707 const reg_entry *r;
12708
12709 if (*reg_string == REGISTER_PREFIX || allow_naked_reg)
12710 r = parse_real_register (reg_string, end_op);
12711 else
12712 r = NULL;
12713 if (!r)
12714 {
12715 char *save = input_line_pointer;
12716 char c;
12717 symbolS *symbolP;
12718
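      /* The name may be a symbol equated to a register (e.g. via
	 ".set myreg, %eax"); such symbols live in reg_section with an
	 O_register value, so look the name up in the symbol table.  */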
12719 input_line_pointer = reg_string;
12720 c = get_symbol_name (&reg_string);
12721 symbolP = symbol_find (reg_string);
12722 if (symbolP && S_GET_SEGMENT (symbolP) == reg_section)
12723 {
12724 const expressionS *e = symbol_get_value_expression (symbolP);
12725
12726 know (e->X_op == O_register);
12727 know (e->X_add_number >= 0
12728 && (valueT) e->X_add_number < i386_regtab_size);
12729 r = i386_regtab + e->X_add_number;
12730 if (!check_register (r))
12731 {
12732 as_bad (_("register '%s%s' cannot be used here"),
12733 register_prefix, r->reg_name);
12734 r = &bad_reg;
12735 }
12736 *end_op = input_line_pointer;
12737 }
12738 *input_line_pointer = c;
12739 input_line_pointer = save;
12740 }
12741 return r;
12742 }
12743
12744 int
12745 i386_parse_name (char *name, expressionS *e, char *nextcharP)
12746 {
12747 const reg_entry *r;
12748 char *end = input_line_pointer;
12749
12750 *end = *nextcharP;
12751 r = parse_register (name, &input_line_pointer);
12752 if (r && end <= input_line_pointer)
12753 {
12754 *nextcharP = *input_line_pointer;
12755 *input_line_pointer = 0;
12756 if (r != &bad_reg)
12757 {
12758 e->X_op = O_register;
12759 e->X_add_number = r - i386_regtab;
12760 }
12761 else
12762 e->X_op = O_illegal;
12763 return 1;
12764 }
12765 input_line_pointer = end;
12766 *end = 0;
12767 return intel_syntax ? i386_intel_parse_name (name, e) : 0;
12768 }
12769
12770 void
12771 md_operand (expressionS *e)
12772 {
12773 char *end;
12774 const reg_entry *r;
12775
12776 switch (*input_line_pointer)
12777 {
12778 case REGISTER_PREFIX:
12779 r = parse_real_register (input_line_pointer, &end);
12780 if (r)
12781 {
12782 e->X_op = O_register;
12783 e->X_add_number = r - i386_regtab;
12784 input_line_pointer = end;
12785 }
12786 break;
12787
12788 case '[':
12789 gas_assert (intel_syntax);
12790 end = input_line_pointer++;
12791 expression (e);
12792 if (*input_line_pointer == ']')
12793 {
12794 ++input_line_pointer;
12795 e->X_op_symbol = make_expr_symbol (e);
12796 e->X_add_symbol = NULL;
12797 e->X_add_number = 0;
12798 e->X_op = O_index;
12799 }
12800 else
12801 {
12802 e->X_op = O_absent;
12803 input_line_pointer = end;
12804 }
12805 break;
12806 }
12807 }
12808
12809 \f
12810 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12811 const char *md_shortopts = "kVQ:sqnO::";
12812 #else
12813 const char *md_shortopts = "qnO::";
12814 #endif
12815
12816 #define OPTION_32 (OPTION_MD_BASE + 0)
12817 #define OPTION_64 (OPTION_MD_BASE + 1)
12818 #define OPTION_DIVIDE (OPTION_MD_BASE + 2)
12819 #define OPTION_MARCH (OPTION_MD_BASE + 3)
12820 #define OPTION_MTUNE (OPTION_MD_BASE + 4)
12821 #define OPTION_MMNEMONIC (OPTION_MD_BASE + 5)
12822 #define OPTION_MSYNTAX (OPTION_MD_BASE + 6)
12823 #define OPTION_MINDEX_REG (OPTION_MD_BASE + 7)
12824 #define OPTION_MNAKED_REG (OPTION_MD_BASE + 8)
12825 #define OPTION_MRELAX_RELOCATIONS (OPTION_MD_BASE + 9)
12826 #define OPTION_MSSE2AVX (OPTION_MD_BASE + 10)
12827 #define OPTION_MSSE_CHECK (OPTION_MD_BASE + 11)
12828 #define OPTION_MOPERAND_CHECK (OPTION_MD_BASE + 12)
12829 #define OPTION_MAVXSCALAR (OPTION_MD_BASE + 13)
12830 #define OPTION_X32 (OPTION_MD_BASE + 14)
12831 #define OPTION_MADD_BND_PREFIX (OPTION_MD_BASE + 15)
12832 #define OPTION_MEVEXLIG (OPTION_MD_BASE + 16)
12833 #define OPTION_MEVEXWIG (OPTION_MD_BASE + 17)
12834 #define OPTION_MBIG_OBJ (OPTION_MD_BASE + 18)
12835 #define OPTION_MOMIT_LOCK_PREFIX (OPTION_MD_BASE + 19)
12836 #define OPTION_MEVEXRCIG (OPTION_MD_BASE + 20)
12837 #define OPTION_MSHARED (OPTION_MD_BASE + 21)
12838 #define OPTION_MAMD64 (OPTION_MD_BASE + 22)
12839 #define OPTION_MINTEL64 (OPTION_MD_BASE + 23)
12840 #define OPTION_MFENCE_AS_LOCK_ADD (OPTION_MD_BASE + 24)
12841 #define OPTION_X86_USED_NOTE (OPTION_MD_BASE + 25)
12842 #define OPTION_MVEXWIG (OPTION_MD_BASE + 26)
12843 #define OPTION_MALIGN_BRANCH_BOUNDARY (OPTION_MD_BASE + 27)
12844 #define OPTION_MALIGN_BRANCH_PREFIX_SIZE (OPTION_MD_BASE + 28)
12845 #define OPTION_MALIGN_BRANCH (OPTION_MD_BASE + 29)
12846 #define OPTION_MBRANCHES_WITH_32B_BOUNDARIES (OPTION_MD_BASE + 30)
12847 #define OPTION_MLFENCE_AFTER_LOAD (OPTION_MD_BASE + 31)
12848 #define OPTION_MLFENCE_BEFORE_INDIRECT_BRANCH (OPTION_MD_BASE + 32)
12849 #define OPTION_MLFENCE_BEFORE_RET (OPTION_MD_BASE + 33)
12850
12851 struct option md_longopts[] =
12852 {
12853 {"32", no_argument, NULL, OPTION_32},
12854 #if (defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
12855 || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
12856 {"64", no_argument, NULL, OPTION_64},
12857 #endif
12858 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12859 {"x32", no_argument, NULL, OPTION_X32},
12860 {"mshared", no_argument, NULL, OPTION_MSHARED},
12861 {"mx86-used-note", required_argument, NULL, OPTION_X86_USED_NOTE},
12862 #endif
12863 {"divide", no_argument, NULL, OPTION_DIVIDE},
12864 {"march", required_argument, NULL, OPTION_MARCH},
12865 {"mtune", required_argument, NULL, OPTION_MTUNE},
12866 {"mmnemonic", required_argument, NULL, OPTION_MMNEMONIC},
12867 {"msyntax", required_argument, NULL, OPTION_MSYNTAX},
12868 {"mindex-reg", no_argument, NULL, OPTION_MINDEX_REG},
12869 {"mnaked-reg", no_argument, NULL, OPTION_MNAKED_REG},
12870 {"msse2avx", no_argument, NULL, OPTION_MSSE2AVX},
12871 {"msse-check", required_argument, NULL, OPTION_MSSE_CHECK},
12872 {"moperand-check", required_argument, NULL, OPTION_MOPERAND_CHECK},
12873 {"mavxscalar", required_argument, NULL, OPTION_MAVXSCALAR},
12874 {"mvexwig", required_argument, NULL, OPTION_MVEXWIG},
12875 {"madd-bnd-prefix", no_argument, NULL, OPTION_MADD_BND_PREFIX},
12876 {"mevexlig", required_argument, NULL, OPTION_MEVEXLIG},
12877 {"mevexwig", required_argument, NULL, OPTION_MEVEXWIG},
12878 # if defined (TE_PE) || defined (TE_PEP)
12879 {"mbig-obj", no_argument, NULL, OPTION_MBIG_OBJ},
12880 #endif
12881 {"momit-lock-prefix", required_argument, NULL, OPTION_MOMIT_LOCK_PREFIX},
12882 {"mfence-as-lock-add", required_argument, NULL, OPTION_MFENCE_AS_LOCK_ADD},
12883 {"mrelax-relocations", required_argument, NULL, OPTION_MRELAX_RELOCATIONS},
12884 {"mevexrcig", required_argument, NULL, OPTION_MEVEXRCIG},
12885 {"malign-branch-boundary", required_argument, NULL, OPTION_MALIGN_BRANCH_BOUNDARY},
12886 {"malign-branch-prefix-size", required_argument, NULL, OPTION_MALIGN_BRANCH_PREFIX_SIZE},
12887 {"malign-branch", required_argument, NULL, OPTION_MALIGN_BRANCH},
12888 {"mbranches-within-32B-boundaries", no_argument, NULL, OPTION_MBRANCHES_WITH_32B_BOUNDARIES},
12889 {"mlfence-after-load", required_argument, NULL, OPTION_MLFENCE_AFTER_LOAD},
12890 {"mlfence-before-indirect-branch", required_argument, NULL,
12891 OPTION_MLFENCE_BEFORE_INDIRECT_BRANCH},
12892 {"mlfence-before-ret", required_argument, NULL, OPTION_MLFENCE_BEFORE_RET},
12893 {"mamd64", no_argument, NULL, OPTION_MAMD64},
12894 {"mintel64", no_argument, NULL, OPTION_MINTEL64},
12895 {NULL, no_argument, NULL, 0}
12896 };
12897 size_t md_longopts_size = sizeof (md_longopts);
12898
12899 int
12900 md_parse_option (int c, const char *arg)
12901 {
12902 unsigned int j;
12903 char *arch, *next, *saved, *type;
12904
12905 switch (c)
12906 {
12907 case 'n':
12908 optimize_align_code = 0;
12909 break;
12910
12911 case 'q':
12912 quiet_warnings = 1;
12913 break;
12914
12915 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12916 /* -Qy, -Qn: SVR4 arguments controlling whether a .comment section
12917 should be emitted or not. FIXME: Not implemented. */
12918 case 'Q':
12919 if ((arg[0] != 'y' && arg[0] != 'n') || arg[1])
12920 return 0;
12921 break;
12922
12923 /* -V: SVR4 argument to print version ID. */
12924 case 'V':
12925 print_version_id ();
12926 break;
12927
12928 /* -k: Ignore for FreeBSD compatibility. */
12929 case 'k':
12930 break;
12931
12932 case 's':
12933 /* -s: On i386 Solaris, this tells the native assembler to use
12934 .stab instead of .stab.excl. We always use .stab anyhow. */
12935 break;
12936
12937 case OPTION_MSHARED:
12938 shared = 1;
12939 break;
12940
12941 case OPTION_X86_USED_NOTE:
12942 if (strcasecmp (arg, "yes") == 0)
12943 x86_used_note = 1;
12944 else if (strcasecmp (arg, "no") == 0)
12945 x86_used_note = 0;
12946 else
12947 as_fatal (_("invalid -mx86-used-note= option: `%s'"), arg);
12948 break;
12949
12951 #endif
12952 #if (defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
12953 || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
12954 case OPTION_64:
12955 {
12956 const char **list, **l;
12957
12958 list = bfd_target_list ();
12959 for (l = list; *l != NULL; l++)
12960 if (CONST_STRNEQ (*l, "elf64-x86-64")
12961 || strcmp (*l, "coff-x86-64") == 0
12962 || strcmp (*l, "pe-x86-64") == 0
12963 || strcmp (*l, "pei-x86-64") == 0
12964 || strcmp (*l, "mach-o-x86-64") == 0)
12965 {
12966 default_arch = "x86_64";
12967 break;
12968 }
12969 if (*l == NULL)
12970 as_fatal (_("no compiled in support for x86_64"));
12971 free (list);
12972 }
12973 break;
12974 #endif
12975
12976 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12977 case OPTION_X32:
12978 if (IS_ELF)
12979 {
12980 const char **list, **l;
12981
12982 list = bfd_target_list ();
12983 for (l = list; *l != NULL; l++)
12984 if (CONST_STRNEQ (*l, "elf32-x86-64"))
12985 {
12986 default_arch = "x86_64:32";
12987 break;
12988 }
12989 if (*l == NULL)
12990 as_fatal (_("no compiled in support for 32bit x86_64"));
12991 free (list);
12992 }
12993 else
12994 as_fatal (_("32bit x86_64 is only supported for ELF"));
12995 break;
12996 #endif
12997
12998 case OPTION_32:
12999 default_arch = "i386";
13000 break;
13001
13002 case OPTION_DIVIDE:
13003 #ifdef SVR4_COMMENT_CHARS
13004 {
13005 char *n, *t;
13006 const char *s;
13007
13008 n = XNEWVEC (char, strlen (i386_comment_chars) + 1);
13009 t = n;
13010 for (s = i386_comment_chars; *s != '\0'; s++)
13011 if (*s != '/')
13012 *t++ = *s;
13013 *t = '\0';
13014 i386_comment_chars = n;
13015 }
13016 #endif
13017 break;
13018
13019 case OPTION_MARCH:
13020 saved = xstrdup (arg);
13021 arch = saved;
13022 /* Allow -march=+nosse. */
13023 if (*arch == '+')
13024 arch++;
13025 do
13026 {
13027 if (*arch == '.')
13028 as_fatal (_("invalid -march= option: `%s'"), arg);
13029 next = strchr (arch, '+');
13030 if (next)
13031 *next++ = '\0';
13032 for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
13033 {
13034 if (strcmp (arch, cpu_arch [j].name) == 0)
13035 {
13036 /* Processor. */
13037 if (! cpu_arch[j].flags.bitfield.cpui386)
13038 continue;
13039
13040 cpu_arch_name = cpu_arch[j].name;
13041 cpu_sub_arch_name = NULL;
13042 cpu_arch_flags = cpu_arch[j].flags;
13043 cpu_arch_isa = cpu_arch[j].type;
13044 cpu_arch_isa_flags = cpu_arch[j].flags;
13045 if (!cpu_arch_tune_set)
13046 {
13047 cpu_arch_tune = cpu_arch_isa;
13048 cpu_arch_tune_flags = cpu_arch_isa_flags;
13049 }
13050 break;
13051 }
13052 else if (*cpu_arch [j].name == '.'
13053 && strcmp (arch, cpu_arch [j].name + 1) == 0)
13054 {
13055 /* ISA extension. */
13056 i386_cpu_flags flags;
13057
13058 flags = cpu_flags_or (cpu_arch_flags,
13059 cpu_arch[j].flags);
13060
13061 if (!cpu_flags_equal (&flags, &cpu_arch_flags))
13062 {
13063 if (cpu_sub_arch_name)
13064 {
13065 char *name = cpu_sub_arch_name;
13066 cpu_sub_arch_name = concat (name,
13067 cpu_arch[j].name,
13068 (const char *) NULL);
13069 free (name);
13070 }
13071 else
13072 cpu_sub_arch_name = xstrdup (cpu_arch[j].name);
13073 cpu_arch_flags = flags;
13074 cpu_arch_isa_flags = flags;
13075 }
13076 else
13077 cpu_arch_isa_flags
13078 = cpu_flags_or (cpu_arch_isa_flags,
13079 cpu_arch[j].flags);
13080 break;
13081 }
13082 }
13083
13084 if (j >= ARRAY_SIZE (cpu_arch))
13085 {
13086 /* Disable an ISA extension. */
13087 for (j = 0; j < ARRAY_SIZE (cpu_noarch); j++)
13088 if (strcmp (arch, cpu_noarch [j].name) == 0)
13089 {
13090 i386_cpu_flags flags;
13091
13092 flags = cpu_flags_and_not (cpu_arch_flags,
13093 cpu_noarch[j].flags);
13094 if (!cpu_flags_equal (&flags, &cpu_arch_flags))
13095 {
13096 if (cpu_sub_arch_name)
13097 {
13098 char *name = cpu_sub_arch_name;
13099 		      cpu_sub_arch_name = concat (name, arch,
13100 						  (const char *) NULL);
13101 free (name);
13102 }
13103 else
13104 cpu_sub_arch_name = xstrdup (arch);
13105 cpu_arch_flags = flags;
13106 cpu_arch_isa_flags = flags;
13107 }
13108 break;
13109 }
13110
13111 if (j >= ARRAY_SIZE (cpu_noarch))
13112 j = ARRAY_SIZE (cpu_arch);
13113 }
13114
13115 if (j >= ARRAY_SIZE (cpu_arch))
13116 as_fatal (_("invalid -march= option: `%s'"), arg);
13117
13118 arch = next;
13119 }
13120 while (next != NULL);
13121 free (saved);
13122 break;
13123
13124 case OPTION_MTUNE:
13125 if (*arg == '.')
13126 as_fatal (_("invalid -mtune= option: `%s'"), arg);
13127 for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
13128 {
13129 if (strcmp (arg, cpu_arch [j].name) == 0)
13130 {
13131 cpu_arch_tune_set = 1;
13132 cpu_arch_tune = cpu_arch [j].type;
13133 cpu_arch_tune_flags = cpu_arch[j].flags;
13134 break;
13135 }
13136 }
13137 if (j >= ARRAY_SIZE (cpu_arch))
13138 as_fatal (_("invalid -mtune= option: `%s'"), arg);
13139 break;
13140
13141 case OPTION_MMNEMONIC:
13142 if (strcasecmp (arg, "att") == 0)
13143 intel_mnemonic = 0;
13144 else if (strcasecmp (arg, "intel") == 0)
13145 intel_mnemonic = 1;
13146 else
13147 as_fatal (_("invalid -mmnemonic= option: `%s'"), arg);
13148 break;
13149
13150 case OPTION_MSYNTAX:
13151 if (strcasecmp (arg, "att") == 0)
13152 intel_syntax = 0;
13153 else if (strcasecmp (arg, "intel") == 0)
13154 intel_syntax = 1;
13155 else
13156 as_fatal (_("invalid -msyntax= option: `%s'"), arg);
13157 break;
13158
13159 case OPTION_MINDEX_REG:
13160 allow_index_reg = 1;
13161 break;
13162
13163 case OPTION_MNAKED_REG:
13164 allow_naked_reg = 1;
13165 break;
13166
13167 case OPTION_MSSE2AVX:
13168 sse2avx = 1;
13169 break;
13170
13171 case OPTION_MSSE_CHECK:
13172 if (strcasecmp (arg, "error") == 0)
13173 sse_check = check_error;
13174 else if (strcasecmp (arg, "warning") == 0)
13175 sse_check = check_warning;
13176 else if (strcasecmp (arg, "none") == 0)
13177 sse_check = check_none;
13178 else
13179 as_fatal (_("invalid -msse-check= option: `%s'"), arg);
13180 break;
13181
13182 case OPTION_MOPERAND_CHECK:
13183 if (strcasecmp (arg, "error") == 0)
13184 operand_check = check_error;
13185 else if (strcasecmp (arg, "warning") == 0)
13186 operand_check = check_warning;
13187 else if (strcasecmp (arg, "none") == 0)
13188 operand_check = check_none;
13189 else
13190 as_fatal (_("invalid -moperand-check= option: `%s'"), arg);
13191 break;
13192
13193 case OPTION_MAVXSCALAR:
13194 if (strcasecmp (arg, "128") == 0)
13195 avxscalar = vex128;
13196 else if (strcasecmp (arg, "256") == 0)
13197 avxscalar = vex256;
13198 else
13199 as_fatal (_("invalid -mavxscalar= option: `%s'"), arg);
13200 break;
13201
13202 case OPTION_MVEXWIG:
13203 if (strcmp (arg, "0") == 0)
13204 vexwig = vexw0;
13205 else if (strcmp (arg, "1") == 0)
13206 vexwig = vexw1;
13207 else
13208 as_fatal (_("invalid -mvexwig= option: `%s'"), arg);
13209 break;
13210
13211 case OPTION_MADD_BND_PREFIX:
13212 add_bnd_prefix = 1;
13213 break;
13214
13215 case OPTION_MEVEXLIG:
13216 if (strcmp (arg, "128") == 0)
13217 evexlig = evexl128;
13218 else if (strcmp (arg, "256") == 0)
13219 evexlig = evexl256;
13220 else if (strcmp (arg, "512") == 0)
13221 evexlig = evexl512;
13222 else
13223 as_fatal (_("invalid -mevexlig= option: `%s'"), arg);
13224 break;
13225
13226 case OPTION_MEVEXRCIG:
13227 if (strcmp (arg, "rne") == 0)
13228 evexrcig = rne;
13229 else if (strcmp (arg, "rd") == 0)
13230 evexrcig = rd;
13231 else if (strcmp (arg, "ru") == 0)
13232 evexrcig = ru;
13233 else if (strcmp (arg, "rz") == 0)
13234 evexrcig = rz;
13235 else
13236 as_fatal (_("invalid -mevexrcig= option: `%s'"), arg);
13237 break;
13238
13239 case OPTION_MEVEXWIG:
13240 if (strcmp (arg, "0") == 0)
13241 evexwig = evexw0;
13242 else if (strcmp (arg, "1") == 0)
13243 evexwig = evexw1;
13244 else
13245 as_fatal (_("invalid -mevexwig= option: `%s'"), arg);
13246 break;
13247
13248 # if defined (TE_PE) || defined (TE_PEP)
13249 case OPTION_MBIG_OBJ:
13250 use_big_obj = 1;
13251 break;
13252 #endif
13253
13254 case OPTION_MOMIT_LOCK_PREFIX:
13255 if (strcasecmp (arg, "yes") == 0)
13256 omit_lock_prefix = 1;
13257 else if (strcasecmp (arg, "no") == 0)
13258 omit_lock_prefix = 0;
13259 else
13260 as_fatal (_("invalid -momit-lock-prefix= option: `%s'"), arg);
13261 break;
13262
13263 case OPTION_MFENCE_AS_LOCK_ADD:
13264 if (strcasecmp (arg, "yes") == 0)
13265 avoid_fence = 1;
13266 else if (strcasecmp (arg, "no") == 0)
13267 avoid_fence = 0;
13268 else
13269 as_fatal (_("invalid -mfence-as-lock-add= option: `%s'"), arg);
13270 break;
13271
13272 case OPTION_MLFENCE_AFTER_LOAD:
13273 if (strcasecmp (arg, "yes") == 0)
13274 lfence_after_load = 1;
13275 else if (strcasecmp (arg, "no") == 0)
13276 lfence_after_load = 0;
13277 else
13278 as_fatal (_("invalid -mlfence-after-load= option: `%s'"), arg);
13279 break;
13280
13281 case OPTION_MLFENCE_BEFORE_INDIRECT_BRANCH:
13282 if (strcasecmp (arg, "all") == 0)
13283 {
13284 lfence_before_indirect_branch = lfence_branch_all;
13285 if (lfence_before_ret == lfence_before_ret_none)
13286 lfence_before_ret = lfence_before_ret_shl;
13287 }
13288 else if (strcasecmp (arg, "memory") == 0)
13289 lfence_before_indirect_branch = lfence_branch_memory;
13290 else if (strcasecmp (arg, "register") == 0)
13291 lfence_before_indirect_branch = lfence_branch_register;
13292 else if (strcasecmp (arg, "none") == 0)
13293 lfence_before_indirect_branch = lfence_branch_none;
13294 else
13295 as_fatal (_("invalid -mlfence-before-indirect-branch= option: `%s'"),
13296 arg);
13297 break;
13298
13299 case OPTION_MLFENCE_BEFORE_RET:
13300 if (strcasecmp (arg, "or") == 0)
13301 lfence_before_ret = lfence_before_ret_or;
13302 else if (strcasecmp (arg, "not") == 0)
13303 lfence_before_ret = lfence_before_ret_not;
13304 else if (strcasecmp (arg, "shl") == 0 || strcasecmp (arg, "yes") == 0)
13305 lfence_before_ret = lfence_before_ret_shl;
13306 else if (strcasecmp (arg, "none") == 0)
13307 lfence_before_ret = lfence_before_ret_none;
13308 else
13309 as_fatal (_("invalid -mlfence-before-ret= option: `%s'"),
13310 arg);
13311 break;
13312
13313 case OPTION_MRELAX_RELOCATIONS:
13314 if (strcasecmp (arg, "yes") == 0)
13315 generate_relax_relocations = 1;
13316 else if (strcasecmp (arg, "no") == 0)
13317 generate_relax_relocations = 0;
13318 else
13319 as_fatal (_("invalid -mrelax-relocations= option: `%s'"), arg);
13320 break;
13321
13322 case OPTION_MALIGN_BRANCH_BOUNDARY:
13323 {
13324 char *end;
13325 long int align = strtoul (arg, &end, 0);
13326 if (*end == '\0')
13327 {
13328 if (align == 0)
13329 {
13330 align_branch_power = 0;
13331 break;
13332 }
13333 else if (align >= 16)
13334 {
13335 int align_power;
13336 for (align_power = 0;
13337 (align & 1) == 0;
13338 align >>= 1, align_power++)
13339 continue;
13340 /* Limit alignment power to 31. */
13341 if (align == 1 && align_power < 32)
13342 {
13343 align_branch_power = align_power;
13344 break;
13345 }
13346 }
13347 }
13348 as_fatal (_("invalid -malign-branch-boundary= value: %s"), arg);
13349 }
13350 break;
13351
13352 case OPTION_MALIGN_BRANCH_PREFIX_SIZE:
13353 {
13354 char *end;
13355 int align = strtoul (arg, &end, 0);
13356 /* Some processors only support 5 prefixes. */
13357 if (*end == '\0' && align >= 0 && align < 6)
13358 {
13359 align_branch_prefix_size = align;
13360 break;
13361 }
13362 as_fatal (_("invalid -malign-branch-prefix-size= value: %s"),
13363 arg);
13364 }
13365 break;
13366
13367 case OPTION_MALIGN_BRANCH:
13368 align_branch = 0;
13369 saved = xstrdup (arg);
13370 type = saved;
13371 do
13372 {
13373 next = strchr (type, '+');
13374 if (next)
13375 *next++ = '\0';
13376 if (strcasecmp (type, "jcc") == 0)
13377 align_branch |= align_branch_jcc_bit;
13378 else if (strcasecmp (type, "fused") == 0)
13379 align_branch |= align_branch_fused_bit;
13380 else if (strcasecmp (type, "jmp") == 0)
13381 align_branch |= align_branch_jmp_bit;
13382 else if (strcasecmp (type, "call") == 0)
13383 align_branch |= align_branch_call_bit;
13384 else if (strcasecmp (type, "ret") == 0)
13385 align_branch |= align_branch_ret_bit;
13386 else if (strcasecmp (type, "indirect") == 0)
13387 align_branch |= align_branch_indirect_bit;
13388 else
13389 as_fatal (_("invalid -malign-branch= option: `%s'"), arg);
13390 type = next;
13391 }
13392 while (next != NULL);
13393 free (saved);
13394 break;
13395
13396 case OPTION_MBRANCHES_WITH_32B_BOUNDARIES:
13397 align_branch_power = 5;
13398 align_branch_prefix_size = 5;
13399 align_branch = (align_branch_jcc_bit
13400 | align_branch_fused_bit
13401 | align_branch_jmp_bit);
13402 break;
13403
13404 case OPTION_MAMD64:
13405 isa64 = amd64;
13406 break;
13407
13408 case OPTION_MINTEL64:
13409 isa64 = intel64;
13410 break;
13411
13412 case 'O':
13413 if (arg == NULL)
13414 {
13415 optimize = 1;
13416 /* Turn off -Os. */
13417 optimize_for_space = 0;
13418 }
13419 else if (*arg == 's')
13420 {
13421 optimize_for_space = 1;
13422 /* Turn on all encoding optimizations. */
13423 optimize = INT_MAX;
13424 }
13425 else
13426 {
13427 optimize = atoi (arg);
13428 /* Turn off -Os. */
13429 optimize_for_space = 0;
13430 }
13431 break;
13432
13433 default:
13434 return 0;
13435 }
13436 return 1;
13437 }
13438
13439 #define MESSAGE_TEMPLATE \
13440 " "
13441
13442 static char *
13443 output_message (FILE *stream, char *p, char *message, char *start,
13444 int *left_p, const char *name, int len)
13445 {
13446 int size = sizeof (MESSAGE_TEMPLATE);
13447 int left = *left_p;
13448
13449 /* Reserve 2 spaces for ", " or ",\0" */
13450 left -= len + 2;
13451
13452 /* Check if there is any room. */
13453 if (left >= 0)
13454 {
13455 if (p != start)
13456 {
13457 *p++ = ',';
13458 *p++ = ' ';
13459 }
13460 p = mempcpy (p, name, len);
13461 }
13462 else
13463 {
13464 /* Output the current message now and start a new one. */
13465 *p++ = ',';
13466 *p = '\0';
13467 fprintf (stream, "%s\n", message);
13468 p = start;
13469 left = size - (start - message) - len - 2;
13470
13471 gas_assert (left >= 0);
13472
13473 p = mempcpy (p, name, len);
13474 }
13475
13476 *left_p = left;
13477 return p;
13478 }
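/* Usage sketch (editorial illustration mirroring show_arch below):
   names are appended to MESSAGE separated by ", "; once fewer than
   LEN + 2 columns remain, the full line is flushed to STREAM and a
   new one starts at START.  */
#if 0
  p = start;
  left = sizeof (MESSAGE_TEMPLATE) - (start - message);
  p = output_message (stream, p, message, start, &left, "i386", 4);
  p = output_message (stream, p, message, start, &left, "i486", 4);
  *p = '\0';
  fprintf (stream, "%s\n", message);
#endif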
13479
13480 static void
13481 show_arch (FILE *stream, int ext, int check)
13482 {
13483 static char message[] = MESSAGE_TEMPLATE;
13484 char *start = message + 27;
13485 char *p;
13486 int size = sizeof (MESSAGE_TEMPLATE);
13487 int left;
13488 const char *name;
13489 int len;
13490 unsigned int j;
13491
13492 p = start;
13493 left = size - (start - message);
13494 for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
13495 {
13496 /* Should it be skipped? */
13497 if (cpu_arch [j].skip)
13498 continue;
13499
13500 name = cpu_arch [j].name;
13501 len = cpu_arch [j].len;
13502 if (*name == '.')
13503 {
13504 /* It is an extension. Skip if we aren't asked to show it. */
13505 if (ext)
13506 {
13507 name++;
13508 len--;
13509 }
13510 else
13511 continue;
13512 }
13513 else if (ext)
13514 {
13515 /* It is a processor. Skip if we only show extensions. */
13516 continue;
13517 }
13518 else if (check && ! cpu_arch[j].flags.bitfield.cpui386)
13519 {
13520 /* This processor cannot be used here - skip it. */
13521 continue;
13522 }
13523
13524 p = output_message (stream, p, message, start, &left, name, len);
13525 }
13526
13527 /* Display disabled extensions. */
13528 if (ext)
13529 for (j = 0; j < ARRAY_SIZE (cpu_noarch); j++)
13530 {
13531 name = cpu_noarch [j].name;
13532 len = cpu_noarch [j].len;
13533 p = output_message (stream, p, message, start, &left, name,
13534 len);
13535 }
13536
13537 *p = '\0';
13538 fprintf (stream, "%s\n", message);
13539 }
13540
13541 void
13542 md_show_usage (FILE *stream)
13543 {
13544 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13545 fprintf (stream, _("\
13546 -Qy, -Qn ignored\n\
13547 -V print assembler version number\n\
13548 -k ignored\n"));
13549 #endif
13550 fprintf (stream, _("\
13551 -n Do not optimize code alignment\n\
13552 -q quieten some warnings\n"));
13553 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13554 fprintf (stream, _("\
13555 -s ignored\n"));
13556 #endif
13557 #if defined BFD64 && (defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
13558 || defined (TE_PE) || defined (TE_PEP))
13559 fprintf (stream, _("\
13560 --32/--64/--x32 generate 32bit/64bit/x32 code\n"));
13561 #endif
13562 #ifdef SVR4_COMMENT_CHARS
13563 fprintf (stream, _("\
13564 --divide do not treat `/' as a comment character\n"));
13565 #else
13566 fprintf (stream, _("\
13567 --divide ignored\n"));
13568 #endif
13569 fprintf (stream, _("\
13570 -march=CPU[,+EXTENSION...]\n\
13571 generate code for CPU and EXTENSION, where CPU is one of:\n"));
13572 show_arch (stream, 0, 1);
13573 fprintf (stream, _("\
13574 EXTENSION is a combination of:\n"));
13575 show_arch (stream, 1, 0);
13576 fprintf (stream, _("\
13577 -mtune=CPU optimize for CPU, CPU is one of:\n"));
13578 show_arch (stream, 0, 0);
13579 fprintf (stream, _("\
13580 -msse2avx encode SSE instructions with VEX prefix\n"));
13581 fprintf (stream, _("\
13582 -msse-check=[none|error|warning] (default: warning)\n\
13583 check SSE instructions\n"));
13584 fprintf (stream, _("\
13585 -moperand-check=[none|error|warning] (default: warning)\n\
13586 check operand combinations for validity\n"));
13587 fprintf (stream, _("\
13588 -mavxscalar=[128|256] (default: 128)\n\
13589 encode scalar AVX instructions with specific vector\n\
13590 length\n"));
13591 fprintf (stream, _("\
13592 -mvexwig=[0|1] (default: 0)\n\
13593 encode VEX instructions with specific VEX.W value\n\
13594 for VEX.W bit ignored instructions\n"));
13595 fprintf (stream, _("\
13596 -mevexlig=[128|256|512] (default: 128)\n\
13597 encode scalar EVEX instructions with specific vector\n\
13598 length\n"));
13599 fprintf (stream, _("\
13600 -mevexwig=[0|1] (default: 0)\n\
13601 encode EVEX instructions with specific EVEX.W value\n\
13602 for EVEX.W bit ignored instructions\n"));
13603 fprintf (stream, _("\
13604 -mevexrcig=[rne|rd|ru|rz] (default: rne)\n\
13605 encode EVEX instructions with specific EVEX.RC value\n\
13606 for SAE-only ignored instructions\n"));
13607 fprintf (stream, _("\
13608 -mmnemonic=[att|intel] "));
13609 if (SYSV386_COMPAT)
13610 fprintf (stream, _("(default: att)\n"));
13611 else
13612 fprintf (stream, _("(default: intel)\n"));
13613 fprintf (stream, _("\
13614 use AT&T/Intel mnemonic\n"));
13615 fprintf (stream, _("\
13616 -msyntax=[att|intel] (default: att)\n\
13617 use AT&T/Intel syntax\n"));
13618 fprintf (stream, _("\
13619 -mindex-reg support pseudo index registers\n"));
13620 fprintf (stream, _("\
13621 -mnaked-reg don't require `%%' prefix for registers\n"));
13622 fprintf (stream, _("\
13623 -madd-bnd-prefix add BND prefix for all valid branches\n"));
13624 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13625 fprintf (stream, _("\
13626 -mshared disable branch optimization for shared code\n"));
13627 fprintf (stream, _("\
13628 -mx86-used-note=[no|yes] "));
13629 if (DEFAULT_X86_USED_NOTE)
13630 fprintf (stream, _("(default: yes)\n"));
13631 else
13632 fprintf (stream, _("(default: no)\n"));
13633 fprintf (stream, _("\
13634 generate x86 used ISA and feature properties\n"));
13635 #endif
13636 #if defined (TE_PE) || defined (TE_PEP)
13637 fprintf (stream, _("\
13638 -mbig-obj generate big object files\n"));
13639 #endif
13640 fprintf (stream, _("\
13641 -momit-lock-prefix=[no|yes] (default: no)\n\
13642 strip all lock prefixes\n"));
13643 fprintf (stream, _("\
13644 -mfence-as-lock-add=[no|yes] (default: no)\n\
13645 encode lfence, mfence and sfence as\n\
13646 lock addl $0x0, (%%{re}sp)\n"));
13647 fprintf (stream, _("\
13648 -mrelax-relocations=[no|yes] "));
13649 if (DEFAULT_GENERATE_X86_RELAX_RELOCATIONS)
13650 fprintf (stream, _("(default: yes)\n"));
13651 else
13652 fprintf (stream, _("(default: no)\n"));
13653 fprintf (stream, _("\
13654 generate relax relocations\n"));
13655 fprintf (stream, _("\
13656 -malign-branch-boundary=NUM (default: 0)\n\
13657 align branches within NUM byte boundary\n"));
13658 fprintf (stream, _("\
13659 -malign-branch=TYPE[+TYPE...] (default: jcc+fused+jmp)\n\
13660 TYPE is a combination of jcc, fused, jmp, call, ret,\n\
13661 indirect\n\
13662 specify types of branches to align\n"));
13663 fprintf (stream, _("\
13664 -malign-branch-prefix-size=NUM (default: 5)\n\
13665 align branches with NUM prefixes per instruction\n"));
13666 fprintf (stream, _("\
13667 -mbranches-within-32B-boundaries\n\
13668 align branches within 32 byte boundary\n"));
13669 fprintf (stream, _("\
13670 -mlfence-after-load=[no|yes] (default: no)\n\
13671 generate lfence after load\n"));
13672 fprintf (stream, _("\
13673 -mlfence-before-indirect-branch=[none|all|register|memory] (default: none)\n\
13674 generate lfence before indirect near branch\n"));
13675 fprintf (stream, _("\
13676 -mlfence-before-ret=[none|or|not|shl|yes] (default: none)\n\
13677 generate lfence before ret\n"));
13678 fprintf (stream, _("\
13679 -mamd64 accept only AMD64 ISA [default]\n"));
13680 fprintf (stream, _("\
13681 -mintel64 accept only Intel64 ISA\n"));
13682 }
13683
13684 #if ((defined (OBJ_MAYBE_COFF) && defined (OBJ_MAYBE_AOUT)) \
13685 || defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
13686 || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
13687
13688 /* Pick the target format to use. */
13689
13690 const char *
13691 i386_target_format (void)
13692 {
13693 if (!strncmp (default_arch, "x86_64", 6))
13694 {
13695 update_code_flag (CODE_64BIT, 1);
13696 if (default_arch[6] == '\0')
13697 x86_elf_abi = X86_64_ABI;
13698 else
13699 x86_elf_abi = X86_64_X32_ABI;
13700 }
13701 else if (!strcmp (default_arch, "i386"))
13702 update_code_flag (CODE_32BIT, 1);
13703 else if (!strcmp (default_arch, "iamcu"))
13704 {
13705 update_code_flag (CODE_32BIT, 1);
13706 if (cpu_arch_isa == PROCESSOR_UNKNOWN)
13707 {
13708 static const i386_cpu_flags iamcu_flags = CPU_IAMCU_FLAGS;
13709 cpu_arch_name = "iamcu";
13710 cpu_sub_arch_name = NULL;
13711 cpu_arch_flags = iamcu_flags;
13712 cpu_arch_isa = PROCESSOR_IAMCU;
13713 cpu_arch_isa_flags = iamcu_flags;
13714 if (!cpu_arch_tune_set)
13715 {
13716 cpu_arch_tune = cpu_arch_isa;
13717 cpu_arch_tune_flags = cpu_arch_isa_flags;
13718 }
13719 }
13720 else if (cpu_arch_isa != PROCESSOR_IAMCU)
13721 as_fatal (_("Intel MCU doesn't support `%s' architecture"),
13722 cpu_arch_name);
13723 }
13724 else
13725 as_fatal (_("unknown architecture"));
13726
13727 if (cpu_flags_all_zero (&cpu_arch_isa_flags))
13728 cpu_arch_isa_flags = cpu_arch[flag_code == CODE_64BIT].flags;
13729 if (cpu_flags_all_zero (&cpu_arch_tune_flags))
13730 cpu_arch_tune_flags = cpu_arch[flag_code == CODE_64BIT].flags;
13731
13732 switch (OUTPUT_FLAVOR)
13733 {
13734 #if defined (OBJ_MAYBE_AOUT) || defined (OBJ_AOUT)
13735 case bfd_target_aout_flavour:
13736 return AOUT_TARGET_FORMAT;
13737 #endif
13738 #if defined (OBJ_MAYBE_COFF) || defined (OBJ_COFF)
13739 # if defined (TE_PE) || defined (TE_PEP)
13740 case bfd_target_coff_flavour:
13741 if (flag_code == CODE_64BIT)
13742 return use_big_obj ? "pe-bigobj-x86-64" : "pe-x86-64";
13743 else
13744 return use_big_obj ? "pe-bigobj-i386" : "pe-i386";
13745 # elif defined (TE_GO32)
13746 case bfd_target_coff_flavour:
13747 return "coff-go32";
13748 # else
13749 case bfd_target_coff_flavour:
13750 return "coff-i386";
13751 # endif
13752 #endif
13753 #if defined (OBJ_MAYBE_ELF) || defined (OBJ_ELF)
13754 case bfd_target_elf_flavour:
13755 {
13756 const char *format;
13757
13758 switch (x86_elf_abi)
13759 {
13760 default:
13761 format = ELF_TARGET_FORMAT;
13762 #ifndef TE_SOLARIS
13763 tls_get_addr = "___tls_get_addr";
13764 #endif
13765 break;
13766 case X86_64_ABI:
13767 use_rela_relocations = 1;
13768 object_64bit = 1;
13769 #ifndef TE_SOLARIS
13770 tls_get_addr = "__tls_get_addr";
13771 #endif
13772 format = ELF_TARGET_FORMAT64;
13773 break;
13774 case X86_64_X32_ABI:
13775 use_rela_relocations = 1;
13776 object_64bit = 1;
13777 #ifndef TE_SOLARIS
13778 tls_get_addr = "__tls_get_addr";
13779 #endif
13780 disallow_64bit_reloc = 1;
13781 format = ELF_TARGET_FORMAT32;
13782 break;
13783 }
13784 if (cpu_arch_isa == PROCESSOR_L1OM)
13785 {
13786 if (x86_elf_abi != X86_64_ABI)
13787 as_fatal (_("Intel L1OM is 64bit only"));
13788 return ELF_TARGET_L1OM_FORMAT;
13789 }
13790 else if (cpu_arch_isa == PROCESSOR_K1OM)
13791 {
13792 if (x86_elf_abi != X86_64_ABI)
13793 as_fatal (_("Intel K1OM is 64bit only"));
13794 return ELF_TARGET_K1OM_FORMAT;
13795 }
13796 else if (cpu_arch_isa == PROCESSOR_IAMCU)
13797 {
13798 if (x86_elf_abi != I386_ABI)
13799 as_fatal (_("Intel MCU is 32bit only"));
13800 return ELF_TARGET_IAMCU_FORMAT;
13801 }
13802 else
13803 return format;
13804 }
13805 #endif
13806 #if defined (OBJ_MACH_O)
13807 case bfd_target_mach_o_flavour:
13808 if (flag_code == CODE_64BIT)
13809 {
13810 use_rela_relocations = 1;
13811 object_64bit = 1;
13812 return "mach-o-x86-64";
13813 }
13814 else
13815 return "mach-o-i386";
13816 #endif
13817 default:
13818 abort ();
13819 return NULL;
13820 }
13821 }
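/* For reference (editorial note; the exact strings depend on the BFD
   configuration): on a typical ELF/Linux build, --32 selects
   elf32-i386 via ELF_TARGET_FORMAT, --64 selects elf64-x86-64 via
   ELF_TARGET_FORMAT64, and --x32 selects elf32-x86-64 via
   ELF_TARGET_FORMAT32.  */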
13822
13823 #endif /* OBJ_MAYBE_ more than one */
13824 \f
13825 symbolS *
13826 md_undefined_symbol (char *name)
13827 {
13828 if (name[0] == GLOBAL_OFFSET_TABLE_NAME[0]
13829 && name[1] == GLOBAL_OFFSET_TABLE_NAME[1]
13830 && name[2] == GLOBAL_OFFSET_TABLE_NAME[2]
13831 && strcmp (name, GLOBAL_OFFSET_TABLE_NAME) == 0)
13832 {
13833 if (!GOT_symbol)
13834 {
13835 if (symbol_find (name))
13836 as_bad (_("GOT already in symbol table"));
13837 GOT_symbol = symbol_new (name, undefined_section,
13838 &zero_address_frag, 0);
13839 }
13840 return GOT_symbol;
13841 }
13842 return 0;
13843 }
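/* Example (editorial note): the classic i386 PIC prologue

	call	__x86.get_pc_thunk.bx
	addl	$_GLOBAL_OFFSET_TABLE_, %ebx

   references _GLOBAL_OFFSET_TABLE_ without defining it; this hook is
   what materializes GOT_symbol for such references.  */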
13844
13845 /* Round up a section size to the appropriate boundary. */
13846
13847 valueT
13848 md_section_align (segT segment ATTRIBUTE_UNUSED, valueT size)
13849 {
13850 #if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
13851 if (OUTPUT_FLAVOR == bfd_target_aout_flavour)
13852 {
13853 /* For a.out, force the section size to be aligned. If we don't do
13854 this, BFD will align it for us, but it will not write out the
13855 final bytes of the section. This may be a bug in BFD, but it is
13856 easier to fix it here since that is how the other a.out targets
13857 work. */
13858 int align;
13859
13860 align = bfd_section_alignment (segment);
13861 size = ((size + (1 << align) - 1) & (-((valueT) 1 << align)));
13862 }
13863 #endif
13864
13865 return size;
13866 }
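/* Worked example (editorial note): with a section alignment power of
   4, i.e. 16-byte alignment, a size of 0x1234 rounds up to
   (0x1234 + 15) & ~(valueT) 15 == 0x1240.  */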
13867
13868 /* On the i386, PC-relative offsets are relative to the start of the
13869 next instruction. That is, the address of the offset, plus its
13870 size, since the offset is always the last part of the insn. */
13871
13872 long
13873 md_pcrel_from (fixS *fixP)
13874 {
13875 return fixP->fx_size + fixP->fx_where + fixP->fx_frag->fr_address;
13876 }
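/* Example (editorial note): for a jump with a 4-byte displacement the
   fixup lives at fr_address + fx_where and fx_size is 4, so the value
   returned is the address of the first byte after the instruction -
   exactly the base the CPU uses for the relative branch.  */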
13877
13878 #ifndef I386COFF
13879
13880 static void
13881 s_bss (int ignore ATTRIBUTE_UNUSED)
13882 {
13883 int temp;
13884
13885 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13886 if (IS_ELF)
13887 obj_elf_section_change_hook ();
13888 #endif
13889 temp = get_absolute_expression ();
13890 subseg_set (bss_section, (subsegT) temp);
13891 demand_empty_rest_of_line ();
13892 }
13893
13894 #endif
13895
13896 /* Remember constant directive. */
13897
13898 void
13899 i386_cons_align (int ignore ATTRIBUTE_UNUSED)
13900 {
13901 if (last_insn.kind != last_insn_directive
13902 && (bfd_section_flags (now_seg) & SEC_CODE))
13903 {
13904 last_insn.seg = now_seg;
13905 last_insn.kind = last_insn_directive;
13906 last_insn.name = "constant directive";
13907 last_insn.file = as_where (&last_insn.line);
13908 if (lfence_before_ret != lfence_before_ret_none)
13909 {
13910 if (lfence_before_indirect_branch != lfence_branch_none)
13911 as_warn (_("constant directive skips -mlfence-before-ret "
13912 "and -mlfence-before-indirect-branch"));
13913 else
13914 as_warn (_("constant directive skips -mlfence-before-ret"));
13915 }
13916 else if (lfence_before_indirect_branch != lfence_branch_none)
13917 as_warn (_("constant directive skips -mlfence-before-indirect-branch"));
13918 }
13919 }
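/* Example (editorial note): a directive such as

	.long	0x12345678

   in an executable section is recorded here as a "constant directive",
   so the branch-alignment and lfence machinery know a non-instruction
   item intervened - hence the warnings above.  */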
13920
13921 void
13922 i386_validate_fix (fixS *fixp)
13923 {
13924 if (fixp->fx_subsy)
13925 {
13926 if (fixp->fx_subsy == GOT_symbol)
13927 {
13928 if (fixp->fx_r_type == BFD_RELOC_32_PCREL)
13929 {
13930 if (!object_64bit)
13931 abort ();
13932 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13933 if (fixp->fx_tcbit2)
13934 fixp->fx_r_type = (fixp->fx_tcbit
13935 ? BFD_RELOC_X86_64_REX_GOTPCRELX
13936 : BFD_RELOC_X86_64_GOTPCRELX);
13937 else
13938 #endif
13939 fixp->fx_r_type = BFD_RELOC_X86_64_GOTPCREL;
13940 }
13941 else
13942 {
13943 if (!object_64bit)
13944 fixp->fx_r_type = BFD_RELOC_386_GOTOFF;
13945 else
13946 fixp->fx_r_type = BFD_RELOC_X86_64_GOTOFF64;
13947 }
13948 fixp->fx_subsy = 0;
13949 }
13950 }
13951 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13952 else
13953 {
13954 /* NB: Commit 292676c1 resolved PLT32 relocs against local symbols
13955 to their sections. Since PLT32 relocations must be against
13956 symbols, turn such PLT32 relocations into PC32 relocations. */
13957 if (fixp->fx_addsy
13958 && (fixp->fx_r_type == BFD_RELOC_386_PLT32
13959 || fixp->fx_r_type == BFD_RELOC_X86_64_PLT32)
13960 && symbol_section_p (fixp->fx_addsy))
13961 fixp->fx_r_type = BFD_RELOC_32_PCREL;
13962 if (!object_64bit)
13963 {
13964 if (fixp->fx_r_type == BFD_RELOC_386_GOT32
13965 && fixp->fx_tcbit2)
13966 fixp->fx_r_type = BFD_RELOC_386_GOT32X;
13967 }
13968 }
13969 #endif
13970 }
13971
13972 arelent *
13973 tc_gen_reloc (asection *section ATTRIBUTE_UNUSED, fixS *fixp)
13974 {
13975 arelent *rel;
13976 bfd_reloc_code_real_type code;
13977
13978 switch (fixp->fx_r_type)
13979 {
13980 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13981 case BFD_RELOC_SIZE32:
13982 case BFD_RELOC_SIZE64:
13983 if (S_IS_DEFINED (fixp->fx_addsy)
13984 && !S_IS_EXTERNAL (fixp->fx_addsy))
13985 {
13986 /* Resolve size relocation against local symbol to size of
13987 the symbol plus addend. */
13988 valueT value = S_GET_SIZE (fixp->fx_addsy) + fixp->fx_offset;
13989 if (fixp->fx_r_type == BFD_RELOC_SIZE32
13990 && !fits_in_unsigned_long (value))
13991 as_bad_where (fixp->fx_file, fixp->fx_line,
13992 _("symbol size computation overflow"));
13993 fixp->fx_addsy = NULL;
13994 fixp->fx_subsy = NULL;
13995 md_apply_fix (fixp, (valueT *) &value, NULL);
13996 return NULL;
13997 }
13998 #endif
13999 /* Fall through. */
14000
14001 case BFD_RELOC_X86_64_PLT32:
14002 case BFD_RELOC_X86_64_GOT32:
14003 case BFD_RELOC_X86_64_GOTPCREL:
14004 case BFD_RELOC_X86_64_GOTPCRELX:
14005 case BFD_RELOC_X86_64_REX_GOTPCRELX:
14006 case BFD_RELOC_386_PLT32:
14007 case BFD_RELOC_386_GOT32:
14008 case BFD_RELOC_386_GOT32X:
14009 case BFD_RELOC_386_GOTOFF:
14010 case BFD_RELOC_386_GOTPC:
14011 case BFD_RELOC_386_TLS_GD:
14012 case BFD_RELOC_386_TLS_LDM:
14013 case BFD_RELOC_386_TLS_LDO_32:
14014 case BFD_RELOC_386_TLS_IE_32:
14015 case BFD_RELOC_386_TLS_IE:
14016 case BFD_RELOC_386_TLS_GOTIE:
14017 case BFD_RELOC_386_TLS_LE_32:
14018 case BFD_RELOC_386_TLS_LE:
14019 case BFD_RELOC_386_TLS_GOTDESC:
14020 case BFD_RELOC_386_TLS_DESC_CALL:
14021 case BFD_RELOC_X86_64_TLSGD:
14022 case BFD_RELOC_X86_64_TLSLD:
14023 case BFD_RELOC_X86_64_DTPOFF32:
14024 case BFD_RELOC_X86_64_DTPOFF64:
14025 case BFD_RELOC_X86_64_GOTTPOFF:
14026 case BFD_RELOC_X86_64_TPOFF32:
14027 case BFD_RELOC_X86_64_TPOFF64:
14028 case BFD_RELOC_X86_64_GOTOFF64:
14029 case BFD_RELOC_X86_64_GOTPC32:
14030 case BFD_RELOC_X86_64_GOT64:
14031 case BFD_RELOC_X86_64_GOTPCREL64:
14032 case BFD_RELOC_X86_64_GOTPC64:
14033 case BFD_RELOC_X86_64_GOTPLT64:
14034 case BFD_RELOC_X86_64_PLTOFF64:
14035 case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
14036 case BFD_RELOC_X86_64_TLSDESC_CALL:
14037 case BFD_RELOC_RVA:
14038 case BFD_RELOC_VTABLE_ENTRY:
14039 case BFD_RELOC_VTABLE_INHERIT:
14040 #ifdef TE_PE
14041 case BFD_RELOC_32_SECREL:
14042 #endif
14043 code = fixp->fx_r_type;
14044 break;
14045 case BFD_RELOC_X86_64_32S:
14046 if (!fixp->fx_pcrel)
14047 {
14048 /* Don't turn BFD_RELOC_X86_64_32S into BFD_RELOC_32. */
14049 code = fixp->fx_r_type;
14050 break;
14051 }
14052 /* Fall through. */
14053 default:
14054 if (fixp->fx_pcrel)
14055 {
14056 switch (fixp->fx_size)
14057 {
14058 default:
14059 as_bad_where (fixp->fx_file, fixp->fx_line,
14060 _("can not do %d byte pc-relative relocation"),
14061 fixp->fx_size);
14062 code = BFD_RELOC_32_PCREL;
14063 break;
14064 case 1: code = BFD_RELOC_8_PCREL; break;
14065 case 2: code = BFD_RELOC_16_PCREL; break;
14066 case 4: code = BFD_RELOC_32_PCREL; break;
14067 #ifdef BFD64
14068 case 8: code = BFD_RELOC_64_PCREL; break;
14069 #endif
14070 }
14071 }
14072 else
14073 {
14074 switch (fixp->fx_size)
14075 {
14076 default:
14077 as_bad_where (fixp->fx_file, fixp->fx_line,
14078 _("can not do %d byte relocation"),
14079 fixp->fx_size);
14080 code = BFD_RELOC_32;
14081 break;
14082 case 1: code = BFD_RELOC_8; break;
14083 case 2: code = BFD_RELOC_16; break;
14084 case 4: code = BFD_RELOC_32; break;
14085 #ifdef BFD64
14086 case 8: code = BFD_RELOC_64; break;
14087 #endif
14088 }
14089 }
14090 break;
14091 }
14092
14093 if ((code == BFD_RELOC_32
14094 || code == BFD_RELOC_32_PCREL
14095 || code == BFD_RELOC_X86_64_32S)
14096 && GOT_symbol
14097 && fixp->fx_addsy == GOT_symbol)
14098 {
14099 if (!object_64bit)
14100 code = BFD_RELOC_386_GOTPC;
14101 else
14102 code = BFD_RELOC_X86_64_GOTPC32;
14103 }
14104 if ((code == BFD_RELOC_64 || code == BFD_RELOC_64_PCREL)
14105 && GOT_symbol
14106 && fixp->fx_addsy == GOT_symbol)
14107 {
14108 code = BFD_RELOC_X86_64_GOTPC64;
14109 }
14110
14111 rel = XNEW (arelent);
14112 rel->sym_ptr_ptr = XNEW (asymbol *);
14113 *rel->sym_ptr_ptr = symbol_get_bfdsym (fixp->fx_addsy);
14114
14115 rel->address = fixp->fx_frag->fr_address + fixp->fx_where;
14116
14117 if (!use_rela_relocations)
14118 {
14119 /* HACK: Since i386 ELF uses Rel instead of Rela, encode the
14120 vtable entry to be used in the relocation's section offset. */
14121 if (fixp->fx_r_type == BFD_RELOC_VTABLE_ENTRY)
14122 rel->address = fixp->fx_offset;
14123 #if defined (OBJ_COFF) && defined (TE_PE)
14124 else if (fixp->fx_addsy && S_IS_WEAK (fixp->fx_addsy))
14125 rel->addend = fixp->fx_addnumber - (S_GET_VALUE (fixp->fx_addsy) * 2);
14126 else
14127 #endif
14128 rel->addend = 0;
14129 }
14130 /* Use rela relocations in 64-bit mode. */
14131 else
14132 {
14133 if (disallow_64bit_reloc)
14134 switch (code)
14135 {
14136 case BFD_RELOC_X86_64_DTPOFF64:
14137 case BFD_RELOC_X86_64_TPOFF64:
14138 case BFD_RELOC_64_PCREL:
14139 case BFD_RELOC_X86_64_GOTOFF64:
14140 case BFD_RELOC_X86_64_GOT64:
14141 case BFD_RELOC_X86_64_GOTPCREL64:
14142 case BFD_RELOC_X86_64_GOTPC64:
14143 case BFD_RELOC_X86_64_GOTPLT64:
14144 case BFD_RELOC_X86_64_PLTOFF64:
14145 as_bad_where (fixp->fx_file, fixp->fx_line,
14146 _("cannot represent relocation type %s in x32 mode"),
14147 bfd_get_reloc_code_name (code));
14148 break;
14149 default:
14150 break;
14151 }
14152
14153 if (!fixp->fx_pcrel)
14154 rel->addend = fixp->fx_offset;
14155 else
14156 switch (code)
14157 {
14158 case BFD_RELOC_X86_64_PLT32:
14159 case BFD_RELOC_X86_64_GOT32:
14160 case BFD_RELOC_X86_64_GOTPCREL:
14161 case BFD_RELOC_X86_64_GOTPCRELX:
14162 case BFD_RELOC_X86_64_REX_GOTPCRELX:
14163 case BFD_RELOC_X86_64_TLSGD:
14164 case BFD_RELOC_X86_64_TLSLD:
14165 case BFD_RELOC_X86_64_GOTTPOFF:
14166 case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
14167 case BFD_RELOC_X86_64_TLSDESC_CALL:
14168 rel->addend = fixp->fx_offset - fixp->fx_size;
14169 break;
14170 default:
14171 rel->addend = (section->vma
14172 - fixp->fx_size
14173 + fixp->fx_addnumber
14174 + md_pcrel_from (fixp));
14175 break;
14176 }
14177 }
14178
14179 rel->howto = bfd_reloc_type_lookup (stdoutput, code);
14180 if (rel->howto == NULL)
14181 {
14182 as_bad_where (fixp->fx_file, fixp->fx_line,
14183 _("cannot represent relocation type %s"),
14184 bfd_get_reloc_code_name (code));
14185 /* Set howto to a garbage value so that we can keep going. */
14186 rel->howto = bfd_reloc_type_lookup (stdoutput, BFD_RELOC_32);
14187 gas_assert (rel->howto != NULL);
14188 }
14189
14190 return rel;
14191 }
14192
14193 #include "tc-i386-intel.c"
14194
14195 void
14196 tc_x86_parse_to_dw2regnum (expressionS *exp)
14197 {
14198 int saved_naked_reg;
14199 char saved_register_dot;
14200
14201 saved_naked_reg = allow_naked_reg;
14202 allow_naked_reg = 1;
14203 saved_register_dot = register_chars['.'];
14204 register_chars['.'] = '.';
14205 allow_pseudo_reg = 1;
14206 expression_and_evaluate (exp);
14207 allow_pseudo_reg = 0;
14208 register_chars['.'] = saved_register_dot;
14209 allow_naked_reg = saved_naked_reg;
14210
14211 if (exp->X_op == O_register && exp->X_add_number >= 0)
14212 {
14213 if ((addressT) exp->X_add_number < i386_regtab_size)
14214 {
14215 exp->X_op = O_constant;
14216 exp->X_add_number = i386_regtab[exp->X_add_number]
14217 .dw2_regnum[flag_code >> 1];
14218 }
14219 else
14220 exp->X_op = O_illegal;
14221 }
14222 }
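/* Example (editorial note): parsing "rsp" in 64-bit mode yields
   O_constant 7 and "esp" in 32-bit mode yields 4, matching the DWARF
   register numbers used by the .cfi_* directives.  */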
14223
14224 void
14225 tc_x86_frame_initial_instructions (void)
14226 {
14227 static unsigned int sp_regno[2];
14228
14229 if (!sp_regno[flag_code >> 1])
14230 {
14231 char *saved_input = input_line_pointer;
14232 char sp[][4] = {"esp", "rsp"};
14233 expressionS exp;
14234
14235 input_line_pointer = sp[flag_code >> 1];
14236 tc_x86_parse_to_dw2regnum (&exp);
14237 gas_assert (exp.X_op == O_constant);
14238 sp_regno[flag_code >> 1] = exp.X_add_number;
14239 input_line_pointer = saved_input;
14240 }
14241
14242 cfi_add_CFA_def_cfa (sp_regno[flag_code >> 1], -x86_cie_data_alignment);
14243 cfi_add_CFA_offset (x86_dwarf2_return_column, x86_cie_data_alignment);
14244 }
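/* Editorial note: assuming the usual x86_cie_data_alignment of -8 in
   64-bit mode (-4 in 32-bit mode), this emits the standard initial
   CFI state; for x86-64 that is CFA = rsp + 8 with the return address
   saved at CFA - 8.  */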
14245
14246 int
14247 x86_dwarf2_addr_size (void)
14248 {
14249 #if defined (OBJ_MAYBE_ELF) || defined (OBJ_ELF)
14250 if (x86_elf_abi == X86_64_X32_ABI)
14251 return 4;
14252 #endif
14253 return bfd_arch_bits_per_address (stdoutput) / 8;
14254 }
14255
14256 int
14257 i386_elf_section_type (const char *str, size_t len)
14258 {
14259 if (flag_code == CODE_64BIT
14260 && len == sizeof ("unwind") - 1
14261 && strncmp (str, "unwind", 6) == 0)
14262 return SHT_X86_64_UNWIND;
14263
14264 return -1;
14265 }
14266
14267 #ifdef TE_SOLARIS
14268 void
14269 i386_solaris_fix_up_eh_frame (segT sec)
14270 {
14271 if (flag_code == CODE_64BIT)
14272 elf_section_type (sec) = SHT_X86_64_UNWIND;
14273 }
14274 #endif
14275
14276 #ifdef TE_PE
14277 void
14278 tc_pe_dwarf2_emit_offset (symbolS *symbol, unsigned int size)
14279 {
14280 expressionS exp;
14281
14282 exp.X_op = O_secrel;
14283 exp.X_add_symbol = symbol;
14284 exp.X_add_number = 0;
14285 emit_expr (&exp, size);
14286 }
14287 #endif
14288
14289 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
14290 /* For ELF on x86-64, add support for SHF_X86_64_LARGE. */
14291
14292 bfd_vma
14293 x86_64_section_letter (int letter, const char **ptr_msg)
14294 {
14295 if (flag_code == CODE_64BIT)
14296 {
14297 if (letter == 'l')
14298 return SHF_X86_64_LARGE;
14299
14300 *ptr_msg = _("bad .section directive: want a,l,w,x,M,S,G,T in string");
14301 }
14302 else
14303 *ptr_msg = _("bad .section directive: want a,w,x,M,S,G,T in string");
14304 return -1;
14305 }
14306
14307 bfd_vma
14308 x86_64_section_word (char *str, size_t len)
14309 {
14310 if (len == 5 && flag_code == CODE_64BIT && CONST_STRNEQ (str, "large"))
14311 return SHF_X86_64_LARGE;
14312
14313 return -1;
14314 }
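/* Example (editorial note): in 64-bit mode

	.section .ldata,"awl",@progbits

   sets SHF_X86_64_LARGE on .ldata via the 'l' flag letter handled
   above; x86_64_section_word accepts the spelled-out word "large" for
   the same flag.  */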
14315
14316 static void
14317 handle_large_common (int small ATTRIBUTE_UNUSED)
14318 {
14319 if (flag_code != CODE_64BIT)
14320 {
14321 s_comm_internal (0, elf_common_parse);
14322 as_warn (_(".largecomm supported only in 64bit mode, producing .comm"));
14323 }
14324 else
14325 {
14326 static segT lbss_section;
14327 asection *saved_com_section_ptr = elf_com_section_ptr;
14328 asection *saved_bss_section = bss_section;
14329
14330 if (lbss_section == NULL)
14331 {
14332 flagword applicable;
14333 segT seg = now_seg;
14334 subsegT subseg = now_subseg;
14335
14336 /* The .lbss section is for local .largecomm symbols. */
14337 lbss_section = subseg_new (".lbss", 0);
14338 applicable = bfd_applicable_section_flags (stdoutput);
14339 bfd_set_section_flags (lbss_section, applicable & SEC_ALLOC);
14340 seg_info (lbss_section)->bss = 1;
14341
14342 subseg_set (seg, subseg);
14343 }
14344
14345 elf_com_section_ptr = &_bfd_elf_large_com_section;
14346 bss_section = lbss_section;
14347
14348 s_comm_internal (0, elf_common_parse);
14349
14350 elf_com_section_ptr = saved_com_section_ptr;
14351 bss_section = saved_bss_section;
14352 }
14353 }
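/* Usage sketch (editorial note; the operands follow .comm):

	.largecomm	big_array, 0x100000, 32

   allocates a large-model common symbol.  In 64-bit mode it is placed
   in .lbss or the large common section; otherwise it degrades to a
   plain .comm with a warning.  */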
14354 #endif /* OBJ_ELF || OBJ_MAYBE_ELF */