x86: fix CMPXCHG8B special case when disallowing q suffix outside of 64-bit mode
[binutils-gdb.git] / gas / config / tc-i386.c
1 /* tc-i386.c -- Assemble code for the Intel 80386
2 Copyright (C) 1989-2021 Free Software Foundation, Inc.
3
4 This file is part of GAS, the GNU Assembler.
5
6 GAS is free software; you can redistribute it and/or modify
7 it under the terms of the GNU General Public License as published by
8 the Free Software Foundation; either version 3, or (at your option)
9 any later version.
10
11 GAS is distributed in the hope that it will be useful,
12 but WITHOUT ANY WARRANTY; without even the implied warranty of
13 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
14 GNU General Public License for more details.
15
16 You should have received a copy of the GNU General Public License
17 along with GAS; see the file COPYING. If not, write to the Free
18 Software Foundation, 51 Franklin Street - Fifth Floor, Boston, MA
19 02110-1301, USA. */
20
21 /* Intel 80386 machine specific gas.
22 Written by Eliot Dresselhaus (eliot@mgm.mit.edu).
23 x86_64 support by Jan Hubicka (jh@suse.cz)
24 VIA PadLock support by Michal Ludvig (mludvig@suse.cz)
25 Bugs & suggestions are completely welcome. This is free software.
26 Please help us make it better. */
27
28 #include "as.h"
29 #include "safe-ctype.h"
30 #include "subsegs.h"
31 #include "dwarf2dbg.h"
32 #include "dw2gencfi.h"
33 #include "elf/x86-64.h"
34 #include "opcodes/i386-init.h"
35
36 #ifdef HAVE_LIMITS_H
37 #include <limits.h>
38 #else
39 #ifdef HAVE_SYS_PARAM_H
40 #include <sys/param.h>
41 #endif
42 #ifndef INT_MAX
43 #define INT_MAX (int) (((unsigned) (-1)) >> 1)
44 #endif
45 #endif
46
47 #ifndef INFER_ADDR_PREFIX
48 #define INFER_ADDR_PREFIX 1
49 #endif
50
51 #ifndef DEFAULT_ARCH
52 #define DEFAULT_ARCH "i386"
53 #endif
54
55 #ifndef INLINE
56 #if __GNUC__ >= 2
57 #define INLINE __inline__
58 #else
59 #define INLINE
60 #endif
61 #endif
62
63 /* Prefixes will be emitted in the order defined below.
64 WAIT_PREFIX must be the first prefix since FWAIT is really is an
65 instruction, and so must come before any prefixes.
66 The preferred prefix order is SEG_PREFIX, ADDR_PREFIX, DATA_PREFIX,
67 REP_PREFIX/HLE_PREFIX, LOCK_PREFIX. */
68 #define WAIT_PREFIX 0
69 #define SEG_PREFIX 1
70 #define ADDR_PREFIX 2
71 #define DATA_PREFIX 3
72 #define REP_PREFIX 4
73 #define HLE_PREFIX REP_PREFIX
74 #define BND_PREFIX REP_PREFIX
75 #define LOCK_PREFIX 5
76 #define REX_PREFIX 6 /* must come last. */
77 #define MAX_PREFIXES 7 /* max prefixes per opcode */
78
79 /* we define the syntax here (modulo base,index,scale syntax) */
80 #define REGISTER_PREFIX '%'
81 #define IMMEDIATE_PREFIX '$'
82 #define ABSOLUTE_PREFIX '*'
83
84 /* these are the instruction mnemonic suffixes in AT&T syntax or
85 memory operand size in Intel syntax. */
86 #define WORD_MNEM_SUFFIX 'w'
87 #define BYTE_MNEM_SUFFIX 'b'
88 #define SHORT_MNEM_SUFFIX 's'
89 #define LONG_MNEM_SUFFIX 'l'
90 #define QWORD_MNEM_SUFFIX 'q'
91 /* Intel Syntax. Use a non-ascii letter since since it never appears
92 in instructions. */
93 #define LONG_DOUBLE_MNEM_SUFFIX '\1'
94
95 #define END_OF_INSN '\0'
96
97 /* This matches the C -> StaticRounding alias in the opcode table. */
98 #define commutative staticrounding
99
100 /*
101 'templates' is for grouping together 'template' structures for opcodes
102 of the same name. This is only used for storing the insns in the grand
103 ole hash table of insns.
104 The templates themselves start at START and range up to (but not including)
105 END.
106 */
107 typedef struct
108 {
109 const insn_template *start;
110 const insn_template *end;
111 }
112 templates;
113
114 /* 386 operand encoding bytes: see 386 book for details of this. */
115 typedef struct
116 {
117 unsigned int regmem; /* codes register or memory operand */
118 unsigned int reg; /* codes register operand (or extended opcode) */
119 unsigned int mode; /* how to interpret regmem & reg */
120 }
121 modrm_byte;
122
123 /* x86-64 extension prefix. */
124 typedef int rex_byte;
125
126 /* 386 opcode byte to code indirect addressing. */
127 typedef struct
128 {
129 unsigned base;
130 unsigned index;
131 unsigned scale;
132 }
133 sib_byte;
134
135 /* x86 arch names, types and features */
136 typedef struct
137 {
138 const char *name; /* arch name */
139 unsigned int len; /* arch string length */
140 enum processor_type type; /* arch type */
141 i386_cpu_flags flags; /* cpu feature flags */
142 unsigned int skip; /* show_arch should skip this. */
143 }
144 arch_entry;
145
146 /* Used to turn off indicated flags. */
147 typedef struct
148 {
149 const char *name; /* arch name */
150 unsigned int len; /* arch string length */
151 i386_cpu_flags flags; /* cpu feature flags */
152 }
153 noarch_entry;
154
155 static void update_code_flag (int, int);
156 static void set_code_flag (int);
157 static void set_16bit_gcc_code_flag (int);
158 static void set_intel_syntax (int);
159 static void set_intel_mnemonic (int);
160 static void set_allow_index_reg (int);
161 static void set_check (int);
162 static void set_cpu_arch (int);
163 #ifdef TE_PE
164 static void pe_directive_secrel (int);
165 #endif
166 static void signed_cons (int);
167 static char *output_invalid (int c);
168 static int i386_finalize_immediate (segT, expressionS *, i386_operand_type,
169 const char *);
170 static int i386_finalize_displacement (segT, expressionS *, i386_operand_type,
171 const char *);
172 static int i386_att_operand (char *);
173 static int i386_intel_operand (char *, int);
174 static int i386_intel_simplify (expressionS *);
175 static int i386_intel_parse_name (const char *, expressionS *);
176 static const reg_entry *parse_register (char *, char **);
177 static char *parse_insn (char *, char *);
178 static char *parse_operands (char *, const char *);
179 static void swap_operands (void);
180 static void swap_2_operands (int, int);
181 static enum flag_code i386_addressing_mode (void);
182 static void optimize_imm (void);
183 static void optimize_disp (void);
184 static const insn_template *match_template (char);
185 static int check_string (void);
186 static int process_suffix (void);
187 static int check_byte_reg (void);
188 static int check_long_reg (void);
189 static int check_qword_reg (void);
190 static int check_word_reg (void);
191 static int finalize_imm (void);
192 static int process_operands (void);
193 static const seg_entry *build_modrm_byte (void);
194 static void output_insn (void);
195 static void output_imm (fragS *, offsetT);
196 static void output_disp (fragS *, offsetT);
197 #ifndef I386COFF
198 static void s_bss (int);
199 #endif
200 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
201 static void handle_large_common (int small ATTRIBUTE_UNUSED);
202
203 /* GNU_PROPERTY_X86_ISA_1_USED. */
204 static unsigned int x86_isa_1_used;
205 /* GNU_PROPERTY_X86_FEATURE_2_USED. */
206 static unsigned int x86_feature_2_used;
207 /* Generate x86 used ISA and feature properties. */
208 static unsigned int x86_used_note = DEFAULT_X86_USED_NOTE;
209 #endif
210
211 static const char *default_arch = DEFAULT_ARCH;
212
213 /* parse_register() returns this when a register alias cannot be used. */
214 static const reg_entry bad_reg = { "<bad>", OPERAND_TYPE_NONE, 0, 0,
215 { Dw2Inval, Dw2Inval } };
216
217 /* This struct describes rounding control and SAE in the instruction. */
218 struct RC_Operation
219 {
220 enum rc_type
221 {
222 rne = 0,
223 rd,
224 ru,
225 rz,
226 saeonly
227 } type;
228 int operand;
229 };
230
231 static struct RC_Operation rc_op;
232
233 /* The struct describes masking, applied to OPERAND in the instruction.
234 MASK is a pointer to the corresponding mask register. ZEROING tells
235 whether merging or zeroing mask is used. */
236 struct Mask_Operation
237 {
238 const reg_entry *mask;
239 unsigned int zeroing;
240 /* The operand where this operation is associated. */
241 int operand;
242 };
243
244 static struct Mask_Operation mask_op;
245
246 /* The struct describes broadcasting, applied to OPERAND. FACTOR is
247 broadcast factor. */
248 struct Broadcast_Operation
249 {
250 /* Type of broadcast: {1to2}, {1to4}, {1to8}, or {1to16}. */
251 int type;
252
253 /* Index of broadcasted operand. */
254 int operand;
255
256 /* Number of bytes to broadcast. */
257 int bytes;
258 };
259
260 static struct Broadcast_Operation broadcast_op;
261
262 /* VEX prefix. */
263 typedef struct
264 {
265 /* VEX prefix is either 2 byte or 3 byte. EVEX is 4 byte. */
266 unsigned char bytes[4];
267 unsigned int length;
268 /* Destination or source register specifier. */
269 const reg_entry *register_specifier;
270 } vex_prefix;
271
272 /* 'md_assemble ()' gathers together information and puts it into a
273 i386_insn. */
274
275 union i386_op
276 {
277 expressionS *disps;
278 expressionS *imms;
279 const reg_entry *regs;
280 };
281
282 enum i386_error
283 {
284 operand_size_mismatch,
285 operand_type_mismatch,
286 register_type_mismatch,
287 number_of_operands_mismatch,
288 invalid_instruction_suffix,
289 bad_imm4,
290 unsupported_with_intel_mnemonic,
291 unsupported_syntax,
292 unsupported,
293 invalid_sib_address,
294 invalid_vsib_address,
295 invalid_vector_register_set,
296 invalid_tmm_register_set,
297 unsupported_vector_index_register,
298 unsupported_broadcast,
299 broadcast_needed,
300 unsupported_masking,
301 mask_not_on_destination,
302 no_default_mask,
303 unsupported_rc_sae,
304 rc_sae_operand_not_last_imm,
305 invalid_register_operand,
306 };
307
308 struct _i386_insn
309 {
310 /* TM holds the template for the insn were currently assembling. */
311 insn_template tm;
312
313 /* SUFFIX holds the instruction size suffix for byte, word, dword
314 or qword, if given. */
315 char suffix;
316
317 /* OPCODE_LENGTH holds the number of base opcode bytes. */
318 unsigned char opcode_length;
319
320 /* OPERANDS gives the number of given operands. */
321 unsigned int operands;
322
323 /* REG_OPERANDS, DISP_OPERANDS, MEM_OPERANDS, IMM_OPERANDS give the number
324 of given register, displacement, memory operands and immediate
325 operands. */
326 unsigned int reg_operands, disp_operands, mem_operands, imm_operands;
327
328 /* TYPES [i] is the type (see above #defines) which tells us how to
329 use OP[i] for the corresponding operand. */
330 i386_operand_type types[MAX_OPERANDS];
331
332 /* Displacement expression, immediate expression, or register for each
333 operand. */
334 union i386_op op[MAX_OPERANDS];
335
336 /* Flags for operands. */
337 unsigned int flags[MAX_OPERANDS];
338 #define Operand_PCrel 1
339 #define Operand_Mem 2
340
341 /* Relocation type for operand */
342 enum bfd_reloc_code_real reloc[MAX_OPERANDS];
343
344 /* BASE_REG, INDEX_REG, and LOG2_SCALE_FACTOR are used to encode
345 the base index byte below. */
346 const reg_entry *base_reg;
347 const reg_entry *index_reg;
348 unsigned int log2_scale_factor;
349
350 /* SEG gives the seg_entries of this insn. They are zero unless
351 explicit segment overrides are given. */
352 const seg_entry *seg[2];
353
354 /* Copied first memory operand string, for re-checking. */
355 char *memop1_string;
356
357 /* PREFIX holds all the given prefix opcodes (usually null).
358 PREFIXES is the number of prefix opcodes. */
359 unsigned int prefixes;
360 unsigned char prefix[MAX_PREFIXES];
361
362 /* Register is in low 3 bits of opcode. */
363 bfd_boolean short_form;
364
365 /* The operand to a branch insn indicates an absolute branch. */
366 bfd_boolean jumpabsolute;
367
368 /* Extended states. */
369 enum
370 {
371 /* Use MMX state. */
372 xstate_mmx = 1 << 0,
373 /* Use XMM state. */
374 xstate_xmm = 1 << 1,
375 /* Use YMM state. */
376 xstate_ymm = 1 << 2 | xstate_xmm,
377 /* Use ZMM state. */
378 xstate_zmm = 1 << 3 | xstate_ymm,
379 /* Use TMM state. */
380 xstate_tmm = 1 << 4,
381 /* Use MASK state. */
382 xstate_mask = 1 << 5
383 } xstate;
384
385 /* Has GOTPC or TLS relocation. */
386 bfd_boolean has_gotpc_tls_reloc;
387
388 /* RM and SIB are the modrm byte and the sib byte where the
389 addressing modes of this insn are encoded. */
390 modrm_byte rm;
391 rex_byte rex;
392 rex_byte vrex;
393 sib_byte sib;
394 vex_prefix vex;
395
396 /* Masking attributes. */
397 struct Mask_Operation *mask;
398
399 /* Rounding control and SAE attributes. */
400 struct RC_Operation *rounding;
401
402 /* Broadcasting attributes. */
403 struct Broadcast_Operation *broadcast;
404
405 /* Compressed disp8*N attribute. */
406 unsigned int memshift;
407
408 /* Prefer load or store in encoding. */
409 enum
410 {
411 dir_encoding_default = 0,
412 dir_encoding_load,
413 dir_encoding_store,
414 dir_encoding_swap
415 } dir_encoding;
416
417 /* Prefer 8bit, 16bit, 32bit displacement in encoding. */
418 enum
419 {
420 disp_encoding_default = 0,
421 disp_encoding_8bit,
422 disp_encoding_16bit,
423 disp_encoding_32bit
424 } disp_encoding;
425
426 /* Prefer the REX byte in encoding. */
427 bfd_boolean rex_encoding;
428
429 /* Disable instruction size optimization. */
430 bfd_boolean no_optimize;
431
432 /* How to encode vector instructions. */
433 enum
434 {
435 vex_encoding_default = 0,
436 vex_encoding_vex,
437 vex_encoding_vex3,
438 vex_encoding_evex,
439 vex_encoding_error
440 } vec_encoding;
441
442 /* REP prefix. */
443 const char *rep_prefix;
444
445 /* HLE prefix. */
446 const char *hle_prefix;
447
448 /* Have BND prefix. */
449 const char *bnd_prefix;
450
451 /* Have NOTRACK prefix. */
452 const char *notrack_prefix;
453
454 /* Error message. */
455 enum i386_error error;
456 };
457
458 typedef struct _i386_insn i386_insn;
459
460 /* Link RC type with corresponding string, that'll be looked for in
461 asm. */
462 struct RC_name
463 {
464 enum rc_type type;
465 const char *name;
466 unsigned int len;
467 };
468
469 static const struct RC_name RC_NamesTable[] =
470 {
471 { rne, STRING_COMMA_LEN ("rn-sae") },
472 { rd, STRING_COMMA_LEN ("rd-sae") },
473 { ru, STRING_COMMA_LEN ("ru-sae") },
474 { rz, STRING_COMMA_LEN ("rz-sae") },
475 { saeonly, STRING_COMMA_LEN ("sae") },
476 };
477
478 /* List of chars besides those in app.c:symbol_chars that can start an
479 operand. Used to prevent the scrubber eating vital white-space. */
480 const char extra_symbol_chars[] = "*%-([{}"
481 #ifdef LEX_AT
482 "@"
483 #endif
484 #ifdef LEX_QM
485 "?"
486 #endif
487 ;
488
489 #if ((defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)) \
490 && !defined (TE_GNU) \
491 && !defined (TE_LINUX) \
492 && !defined (TE_FreeBSD) \
493 && !defined (TE_DragonFly) \
494 && !defined (TE_NetBSD))
495 /* This array holds the chars that always start a comment. If the
496 pre-processor is disabled, these aren't very useful. The option
497 --divide will remove '/' from this list. */
498 const char *i386_comment_chars = "#/";
499 #define SVR4_COMMENT_CHARS 1
500 #define PREFIX_SEPARATOR '\\'
501
502 #else
503 const char *i386_comment_chars = "#";
504 #define PREFIX_SEPARATOR '/'
505 #endif
506
507 /* This array holds the chars that only start a comment at the beginning of
508 a line. If the line seems to have the form '# 123 filename'
509 .line and .file directives will appear in the pre-processed output.
510 Note that input_file.c hand checks for '#' at the beginning of the
511 first line of the input file. This is because the compiler outputs
512 #NO_APP at the beginning of its output.
513 Also note that comments started like this one will always work if
514 '/' isn't otherwise defined. */
515 const char line_comment_chars[] = "#/";
516
517 const char line_separator_chars[] = ";";
518
519 /* Chars that can be used to separate mant from exp in floating point
520 nums. */
521 const char EXP_CHARS[] = "eE";
522
523 /* Chars that mean this number is a floating point constant
524 As in 0f12.456
525 or 0d1.2345e12. */
526 const char FLT_CHARS[] = "fFdDxX";
527
528 /* Tables for lexical analysis. */
529 static char mnemonic_chars[256];
530 static char register_chars[256];
531 static char operand_chars[256];
532 static char identifier_chars[256];
533 static char digit_chars[256];
534
535 /* Lexical macros. */
536 #define is_mnemonic_char(x) (mnemonic_chars[(unsigned char) x])
537 #define is_operand_char(x) (operand_chars[(unsigned char) x])
538 #define is_register_char(x) (register_chars[(unsigned char) x])
539 #define is_space_char(x) ((x) == ' ')
540 #define is_identifier_char(x) (identifier_chars[(unsigned char) x])
541 #define is_digit_char(x) (digit_chars[(unsigned char) x])
542
543 /* All non-digit non-letter characters that may occur in an operand. */
544 static char operand_special_chars[] = "%$-+(,)*._~/<>|&^!:[@]";
545
546 /* md_assemble() always leaves the strings it's passed unaltered. To
547 effect this we maintain a stack of saved characters that we've smashed
548 with '\0's (indicating end of strings for various sub-fields of the
549 assembler instruction). */
550 static char save_stack[32];
551 static char *save_stack_p;
552 #define END_STRING_AND_SAVE(s) \
553 do { *save_stack_p++ = *(s); *(s) = '\0'; } while (0)
554 #define RESTORE_END_STRING(s) \
555 do { *(s) = *--save_stack_p; } while (0)
556
557 /* The instruction we're assembling. */
558 static i386_insn i;
559
560 /* Possible templates for current insn. */
561 static const templates *current_templates;
562
563 /* Per instruction expressionS buffers: max displacements & immediates. */
564 static expressionS disp_expressions[MAX_MEMORY_OPERANDS];
565 static expressionS im_expressions[MAX_IMMEDIATE_OPERANDS];
566
567 /* Current operand we are working on. */
568 static int this_operand = -1;
569
570 /* We support four different modes. FLAG_CODE variable is used to distinguish
571 these. */
572
573 enum flag_code {
574 CODE_32BIT,
575 CODE_16BIT,
576 CODE_64BIT };
577
578 static enum flag_code flag_code;
579 static unsigned int object_64bit;
580 static unsigned int disallow_64bit_reloc;
581 static int use_rela_relocations = 0;
582 /* __tls_get_addr/___tls_get_addr symbol for TLS. */
583 static const char *tls_get_addr;
584
585 #if ((defined (OBJ_MAYBE_COFF) && defined (OBJ_MAYBE_AOUT)) \
586 || defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
587 || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
588
589 /* The ELF ABI to use. */
590 enum x86_elf_abi
591 {
592 I386_ABI,
593 X86_64_ABI,
594 X86_64_X32_ABI
595 };
596
597 static enum x86_elf_abi x86_elf_abi = I386_ABI;
598 #endif
599
600 #if defined (TE_PE) || defined (TE_PEP)
601 /* Use big object file format. */
602 static int use_big_obj = 0;
603 #endif
604
605 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
606 /* 1 if generating code for a shared library. */
607 static int shared = 0;
608 #endif
609
610 /* 1 for intel syntax,
611 0 if att syntax. */
612 static int intel_syntax = 0;
613
614 static enum x86_64_isa
615 {
616 amd64 = 1, /* AMD64 ISA. */
617 intel64 /* Intel64 ISA. */
618 } isa64;
619
620 /* 1 for intel mnemonic,
621 0 if att mnemonic. */
622 static int intel_mnemonic = !SYSV386_COMPAT;
623
624 /* 1 if pseudo registers are permitted. */
625 static int allow_pseudo_reg = 0;
626
627 /* 1 if register prefix % not required. */
628 static int allow_naked_reg = 0;
629
630 /* 1 if the assembler should add BND prefix for all control-transferring
631 instructions supporting it, even if this prefix wasn't specified
632 explicitly. */
633 static int add_bnd_prefix = 0;
634
635 /* 1 if pseudo index register, eiz/riz, is allowed . */
636 static int allow_index_reg = 0;
637
638 /* 1 if the assembler should ignore LOCK prefix, even if it was
639 specified explicitly. */
640 static int omit_lock_prefix = 0;
641
642 /* 1 if the assembler should encode lfence, mfence, and sfence as
643 "lock addl $0, (%{re}sp)". */
644 static int avoid_fence = 0;
645
646 /* 1 if lfence should be inserted after every load. */
647 static int lfence_after_load = 0;
648
649 /* Non-zero if lfence should be inserted before indirect branch. */
650 static enum lfence_before_indirect_branch_kind
651 {
652 lfence_branch_none = 0,
653 lfence_branch_register,
654 lfence_branch_memory,
655 lfence_branch_all
656 }
657 lfence_before_indirect_branch;
658
659 /* Non-zero if lfence should be inserted before ret. */
660 static enum lfence_before_ret_kind
661 {
662 lfence_before_ret_none = 0,
663 lfence_before_ret_not,
664 lfence_before_ret_or,
665 lfence_before_ret_shl
666 }
667 lfence_before_ret;
668
669 /* Types of previous instruction is .byte or prefix. */
670 static struct
671 {
672 segT seg;
673 const char *file;
674 const char *name;
675 unsigned int line;
676 enum last_insn_kind
677 {
678 last_insn_other = 0,
679 last_insn_directive,
680 last_insn_prefix
681 } kind;
682 } last_insn;
683
684 /* 1 if the assembler should generate relax relocations. */
685
686 static int generate_relax_relocations
687 = DEFAULT_GENERATE_X86_RELAX_RELOCATIONS;
688
689 static enum check_kind
690 {
691 check_none = 0,
692 check_warning,
693 check_error
694 }
695 sse_check, operand_check = check_warning;
696
697 /* Non-zero if branches should be aligned within power of 2 boundary. */
698 static int align_branch_power = 0;
699
700 /* Types of branches to align. */
701 enum align_branch_kind
702 {
703 align_branch_none = 0,
704 align_branch_jcc = 1,
705 align_branch_fused = 2,
706 align_branch_jmp = 3,
707 align_branch_call = 4,
708 align_branch_indirect = 5,
709 align_branch_ret = 6
710 };
711
712 /* Type bits of branches to align. */
713 enum align_branch_bit
714 {
715 align_branch_jcc_bit = 1 << align_branch_jcc,
716 align_branch_fused_bit = 1 << align_branch_fused,
717 align_branch_jmp_bit = 1 << align_branch_jmp,
718 align_branch_call_bit = 1 << align_branch_call,
719 align_branch_indirect_bit = 1 << align_branch_indirect,
720 align_branch_ret_bit = 1 << align_branch_ret
721 };
722
723 static unsigned int align_branch = (align_branch_jcc_bit
724 | align_branch_fused_bit
725 | align_branch_jmp_bit);
726
727 /* Types of condition jump used by macro-fusion. */
728 enum mf_jcc_kind
729 {
730 mf_jcc_jo = 0, /* base opcode 0x70 */
731 mf_jcc_jc, /* base opcode 0x72 */
732 mf_jcc_je, /* base opcode 0x74 */
733 mf_jcc_jna, /* base opcode 0x76 */
734 mf_jcc_js, /* base opcode 0x78 */
735 mf_jcc_jp, /* base opcode 0x7a */
736 mf_jcc_jl, /* base opcode 0x7c */
737 mf_jcc_jle, /* base opcode 0x7e */
738 };
739
740 /* Types of compare flag-modifying insntructions used by macro-fusion. */
741 enum mf_cmp_kind
742 {
743 mf_cmp_test_and, /* test/cmp */
744 mf_cmp_alu_cmp, /* add/sub/cmp */
745 mf_cmp_incdec /* inc/dec */
746 };
747
748 /* The maximum padding size for fused jcc. CMP like instruction can
749 be 9 bytes and jcc can be 6 bytes. Leave room just in case for
750 prefixes. */
751 #define MAX_FUSED_JCC_PADDING_SIZE 20
752
753 /* The maximum number of prefixes added for an instruction. */
754 static unsigned int align_branch_prefix_size = 5;
755
756 /* Optimization:
757 1. Clear the REX_W bit with register operand if possible.
758 2. Above plus use 128bit vector instruction to clear the full vector
759 register.
760 */
761 static int optimize = 0;
762
763 /* Optimization:
764 1. Clear the REX_W bit with register operand if possible.
765 2. Above plus use 128bit vector instruction to clear the full vector
766 register.
767 3. Above plus optimize "test{q,l,w} $imm8,%r{64,32,16}" to
768 "testb $imm7,%r8".
769 */
770 static int optimize_for_space = 0;
771
772 /* Register prefix used for error message. */
773 static const char *register_prefix = "%";
774
775 /* Used in 16 bit gcc mode to add an l suffix to call, ret, enter,
776 leave, push, and pop instructions so that gcc has the same stack
777 frame as in 32 bit mode. */
778 static char stackop_size = '\0';
779
780 /* Non-zero to optimize code alignment. */
781 int optimize_align_code = 1;
782
783 /* Non-zero to quieten some warnings. */
784 static int quiet_warnings = 0;
785
786 /* CPU name. */
787 static const char *cpu_arch_name = NULL;
788 static char *cpu_sub_arch_name = NULL;
789
790 /* CPU feature flags. */
791 static i386_cpu_flags cpu_arch_flags = CPU_UNKNOWN_FLAGS;
792
793 /* If we have selected a cpu we are generating instructions for. */
794 static int cpu_arch_tune_set = 0;
795
796 /* Cpu we are generating instructions for. */
797 enum processor_type cpu_arch_tune = PROCESSOR_UNKNOWN;
798
799 /* CPU feature flags of cpu we are generating instructions for. */
800 static i386_cpu_flags cpu_arch_tune_flags;
801
802 /* CPU instruction set architecture used. */
803 enum processor_type cpu_arch_isa = PROCESSOR_UNKNOWN;
804
805 /* CPU feature flags of instruction set architecture used. */
806 i386_cpu_flags cpu_arch_isa_flags;
807
808 /* If set, conditional jumps are not automatically promoted to handle
809 larger than a byte offset. */
810 static unsigned int no_cond_jump_promotion = 0;
811
812 /* Encode SSE instructions with VEX prefix. */
813 static unsigned int sse2avx;
814
815 /* Encode scalar AVX instructions with specific vector length. */
816 static enum
817 {
818 vex128 = 0,
819 vex256
820 } avxscalar;
821
822 /* Encode VEX WIG instructions with specific vex.w. */
823 static enum
824 {
825 vexw0 = 0,
826 vexw1
827 } vexwig;
828
829 /* Encode scalar EVEX LIG instructions with specific vector length. */
830 static enum
831 {
832 evexl128 = 0,
833 evexl256,
834 evexl512
835 } evexlig;
836
837 /* Encode EVEX WIG instructions with specific evex.w. */
838 static enum
839 {
840 evexw0 = 0,
841 evexw1
842 } evexwig;
843
844 /* Value to encode in EVEX RC bits, for SAE-only instructions. */
845 static enum rc_type evexrcig = rne;
846
847 /* Pre-defined "_GLOBAL_OFFSET_TABLE_". */
848 static symbolS *GOT_symbol;
849
850 /* The dwarf2 return column, adjusted for 32 or 64 bit. */
851 unsigned int x86_dwarf2_return_column;
852
853 /* The dwarf2 data alignment, adjusted for 32 or 64 bit. */
854 int x86_cie_data_alignment;
855
856 /* Interface to relax_segment.
857 There are 3 major relax states for 386 jump insns because the
858 different types of jumps add different sizes to frags when we're
859 figuring out what sort of jump to choose to reach a given label.
860
861 BRANCH_PADDING, BRANCH_PREFIX and FUSED_JCC_PADDING are used to align
862 branches which are handled by md_estimate_size_before_relax() and
863 i386_generic_table_relax_frag(). */
864
865 /* Types. */
866 #define UNCOND_JUMP 0
867 #define COND_JUMP 1
868 #define COND_JUMP86 2
869 #define BRANCH_PADDING 3
870 #define BRANCH_PREFIX 4
871 #define FUSED_JCC_PADDING 5
872
873 /* Sizes. */
874 #define CODE16 1
875 #define SMALL 0
876 #define SMALL16 (SMALL | CODE16)
877 #define BIG 2
878 #define BIG16 (BIG | CODE16)
879
880 #ifndef INLINE
881 #ifdef __GNUC__
882 #define INLINE __inline__
883 #else
884 #define INLINE
885 #endif
886 #endif
887
888 #define ENCODE_RELAX_STATE(type, size) \
889 ((relax_substateT) (((type) << 2) | (size)))
890 #define TYPE_FROM_RELAX_STATE(s) \
891 ((s) >> 2)
892 #define DISP_SIZE_FROM_RELAX_STATE(s) \
893 ((((s) & 3) == BIG ? 4 : (((s) & 3) == BIG16 ? 2 : 1)))
894
895 /* This table is used by relax_frag to promote short jumps to long
896 ones where necessary. SMALL (short) jumps may be promoted to BIG
897 (32 bit long) ones, and SMALL16 jumps to BIG16 (16 bit long). We
898 don't allow a short jump in a 32 bit code segment to be promoted to
899 a 16 bit offset jump because it's slower (requires data size
900 prefix), and doesn't work, unless the destination is in the bottom
901 64k of the code segment (The top 16 bits of eip are zeroed). */
902
903 const relax_typeS md_relax_table[] =
904 {
905 /* The fields are:
906 1) most positive reach of this state,
907 2) most negative reach of this state,
908 3) how many bytes this mode will have in the variable part of the frag
909 4) which index into the table to try if we can't fit into this one. */
910
911 /* UNCOND_JUMP states. */
912 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (UNCOND_JUMP, BIG)},
913 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (UNCOND_JUMP, BIG16)},
914 /* dword jmp adds 4 bytes to frag:
915 0 extra opcode bytes, 4 displacement bytes. */
916 {0, 0, 4, 0},
917 /* word jmp adds 2 byte2 to frag:
918 0 extra opcode bytes, 2 displacement bytes. */
919 {0, 0, 2, 0},
920
921 /* COND_JUMP states. */
922 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP, BIG)},
923 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP, BIG16)},
924 /* dword conditionals adds 5 bytes to frag:
925 1 extra opcode byte, 4 displacement bytes. */
926 {0, 0, 5, 0},
927 /* word conditionals add 3 bytes to frag:
928 1 extra opcode byte, 2 displacement bytes. */
929 {0, 0, 3, 0},
930
931 /* COND_JUMP86 states. */
932 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP86, BIG)},
933 {127 + 1, -128 + 1, 1, ENCODE_RELAX_STATE (COND_JUMP86, BIG16)},
934 /* dword conditionals adds 5 bytes to frag:
935 1 extra opcode byte, 4 displacement bytes. */
936 {0, 0, 5, 0},
937 /* word conditionals add 4 bytes to frag:
938 1 displacement byte and a 3 byte long branch insn. */
939 {0, 0, 4, 0}
940 };
941
942 static const arch_entry cpu_arch[] =
943 {
944 /* Do not replace the first two entries - i386_target_format()
945 relies on them being there in this order. */
946 { STRING_COMMA_LEN ("generic32"), PROCESSOR_GENERIC32,
947 CPU_GENERIC32_FLAGS, 0 },
948 { STRING_COMMA_LEN ("generic64"), PROCESSOR_GENERIC64,
949 CPU_GENERIC64_FLAGS, 0 },
950 { STRING_COMMA_LEN ("i8086"), PROCESSOR_UNKNOWN,
951 CPU_NONE_FLAGS, 0 },
952 { STRING_COMMA_LEN ("i186"), PROCESSOR_UNKNOWN,
953 CPU_I186_FLAGS, 0 },
954 { STRING_COMMA_LEN ("i286"), PROCESSOR_UNKNOWN,
955 CPU_I286_FLAGS, 0 },
956 { STRING_COMMA_LEN ("i386"), PROCESSOR_I386,
957 CPU_I386_FLAGS, 0 },
958 { STRING_COMMA_LEN ("i486"), PROCESSOR_I486,
959 CPU_I486_FLAGS, 0 },
960 { STRING_COMMA_LEN ("i586"), PROCESSOR_PENTIUM,
961 CPU_I586_FLAGS, 0 },
962 { STRING_COMMA_LEN ("i686"), PROCESSOR_PENTIUMPRO,
963 CPU_I686_FLAGS, 0 },
964 { STRING_COMMA_LEN ("pentium"), PROCESSOR_PENTIUM,
965 CPU_I586_FLAGS, 0 },
966 { STRING_COMMA_LEN ("pentiumpro"), PROCESSOR_PENTIUMPRO,
967 CPU_PENTIUMPRO_FLAGS, 0 },
968 { STRING_COMMA_LEN ("pentiumii"), PROCESSOR_PENTIUMPRO,
969 CPU_P2_FLAGS, 0 },
970 { STRING_COMMA_LEN ("pentiumiii"),PROCESSOR_PENTIUMPRO,
971 CPU_P3_FLAGS, 0 },
972 { STRING_COMMA_LEN ("pentium4"), PROCESSOR_PENTIUM4,
973 CPU_P4_FLAGS, 0 },
974 { STRING_COMMA_LEN ("prescott"), PROCESSOR_NOCONA,
975 CPU_CORE_FLAGS, 0 },
976 { STRING_COMMA_LEN ("nocona"), PROCESSOR_NOCONA,
977 CPU_NOCONA_FLAGS, 0 },
978 { STRING_COMMA_LEN ("yonah"), PROCESSOR_CORE,
979 CPU_CORE_FLAGS, 1 },
980 { STRING_COMMA_LEN ("core"), PROCESSOR_CORE,
981 CPU_CORE_FLAGS, 0 },
982 { STRING_COMMA_LEN ("merom"), PROCESSOR_CORE2,
983 CPU_CORE2_FLAGS, 1 },
984 { STRING_COMMA_LEN ("core2"), PROCESSOR_CORE2,
985 CPU_CORE2_FLAGS, 0 },
986 { STRING_COMMA_LEN ("corei7"), PROCESSOR_COREI7,
987 CPU_COREI7_FLAGS, 0 },
988 { STRING_COMMA_LEN ("l1om"), PROCESSOR_L1OM,
989 CPU_L1OM_FLAGS, 0 },
990 { STRING_COMMA_LEN ("k1om"), PROCESSOR_K1OM,
991 CPU_K1OM_FLAGS, 0 },
992 { STRING_COMMA_LEN ("iamcu"), PROCESSOR_IAMCU,
993 CPU_IAMCU_FLAGS, 0 },
994 { STRING_COMMA_LEN ("k6"), PROCESSOR_K6,
995 CPU_K6_FLAGS, 0 },
996 { STRING_COMMA_LEN ("k6_2"), PROCESSOR_K6,
997 CPU_K6_2_FLAGS, 0 },
998 { STRING_COMMA_LEN ("athlon"), PROCESSOR_ATHLON,
999 CPU_ATHLON_FLAGS, 0 },
1000 { STRING_COMMA_LEN ("sledgehammer"), PROCESSOR_K8,
1001 CPU_K8_FLAGS, 1 },
1002 { STRING_COMMA_LEN ("opteron"), PROCESSOR_K8,
1003 CPU_K8_FLAGS, 0 },
1004 { STRING_COMMA_LEN ("k8"), PROCESSOR_K8,
1005 CPU_K8_FLAGS, 0 },
1006 { STRING_COMMA_LEN ("amdfam10"), PROCESSOR_AMDFAM10,
1007 CPU_AMDFAM10_FLAGS, 0 },
1008 { STRING_COMMA_LEN ("bdver1"), PROCESSOR_BD,
1009 CPU_BDVER1_FLAGS, 0 },
1010 { STRING_COMMA_LEN ("bdver2"), PROCESSOR_BD,
1011 CPU_BDVER2_FLAGS, 0 },
1012 { STRING_COMMA_LEN ("bdver3"), PROCESSOR_BD,
1013 CPU_BDVER3_FLAGS, 0 },
1014 { STRING_COMMA_LEN ("bdver4"), PROCESSOR_BD,
1015 CPU_BDVER4_FLAGS, 0 },
1016 { STRING_COMMA_LEN ("znver1"), PROCESSOR_ZNVER,
1017 CPU_ZNVER1_FLAGS, 0 },
1018 { STRING_COMMA_LEN ("znver2"), PROCESSOR_ZNVER,
1019 CPU_ZNVER2_FLAGS, 0 },
1020 { STRING_COMMA_LEN ("znver3"), PROCESSOR_ZNVER,
1021 CPU_ZNVER3_FLAGS, 0 },
1022 { STRING_COMMA_LEN ("btver1"), PROCESSOR_BT,
1023 CPU_BTVER1_FLAGS, 0 },
1024 { STRING_COMMA_LEN ("btver2"), PROCESSOR_BT,
1025 CPU_BTVER2_FLAGS, 0 },
1026 { STRING_COMMA_LEN (".8087"), PROCESSOR_UNKNOWN,
1027 CPU_8087_FLAGS, 0 },
1028 { STRING_COMMA_LEN (".287"), PROCESSOR_UNKNOWN,
1029 CPU_287_FLAGS, 0 },
1030 { STRING_COMMA_LEN (".387"), PROCESSOR_UNKNOWN,
1031 CPU_387_FLAGS, 0 },
1032 { STRING_COMMA_LEN (".687"), PROCESSOR_UNKNOWN,
1033 CPU_687_FLAGS, 0 },
1034 { STRING_COMMA_LEN (".cmov"), PROCESSOR_UNKNOWN,
1035 CPU_CMOV_FLAGS, 0 },
1036 { STRING_COMMA_LEN (".fxsr"), PROCESSOR_UNKNOWN,
1037 CPU_FXSR_FLAGS, 0 },
1038 { STRING_COMMA_LEN (".mmx"), PROCESSOR_UNKNOWN,
1039 CPU_MMX_FLAGS, 0 },
1040 { STRING_COMMA_LEN (".sse"), PROCESSOR_UNKNOWN,
1041 CPU_SSE_FLAGS, 0 },
1042 { STRING_COMMA_LEN (".sse2"), PROCESSOR_UNKNOWN,
1043 CPU_SSE2_FLAGS, 0 },
1044 { STRING_COMMA_LEN (".sse3"), PROCESSOR_UNKNOWN,
1045 CPU_SSE3_FLAGS, 0 },
1046 { STRING_COMMA_LEN (".sse4a"), PROCESSOR_UNKNOWN,
1047 CPU_SSE4A_FLAGS, 0 },
1048 { STRING_COMMA_LEN (".ssse3"), PROCESSOR_UNKNOWN,
1049 CPU_SSSE3_FLAGS, 0 },
1050 { STRING_COMMA_LEN (".sse4.1"), PROCESSOR_UNKNOWN,
1051 CPU_SSE4_1_FLAGS, 0 },
1052 { STRING_COMMA_LEN (".sse4.2"), PROCESSOR_UNKNOWN,
1053 CPU_SSE4_2_FLAGS, 0 },
1054 { STRING_COMMA_LEN (".sse4"), PROCESSOR_UNKNOWN,
1055 CPU_SSE4_2_FLAGS, 0 },
1056 { STRING_COMMA_LEN (".avx"), PROCESSOR_UNKNOWN,
1057 CPU_AVX_FLAGS, 0 },
1058 { STRING_COMMA_LEN (".avx2"), PROCESSOR_UNKNOWN,
1059 CPU_AVX2_FLAGS, 0 },
1060 { STRING_COMMA_LEN (".avx512f"), PROCESSOR_UNKNOWN,
1061 CPU_AVX512F_FLAGS, 0 },
1062 { STRING_COMMA_LEN (".avx512cd"), PROCESSOR_UNKNOWN,
1063 CPU_AVX512CD_FLAGS, 0 },
1064 { STRING_COMMA_LEN (".avx512er"), PROCESSOR_UNKNOWN,
1065 CPU_AVX512ER_FLAGS, 0 },
1066 { STRING_COMMA_LEN (".avx512pf"), PROCESSOR_UNKNOWN,
1067 CPU_AVX512PF_FLAGS, 0 },
1068 { STRING_COMMA_LEN (".avx512dq"), PROCESSOR_UNKNOWN,
1069 CPU_AVX512DQ_FLAGS, 0 },
1070 { STRING_COMMA_LEN (".avx512bw"), PROCESSOR_UNKNOWN,
1071 CPU_AVX512BW_FLAGS, 0 },
1072 { STRING_COMMA_LEN (".avx512vl"), PROCESSOR_UNKNOWN,
1073 CPU_AVX512VL_FLAGS, 0 },
1074 { STRING_COMMA_LEN (".vmx"), PROCESSOR_UNKNOWN,
1075 CPU_VMX_FLAGS, 0 },
1076 { STRING_COMMA_LEN (".vmfunc"), PROCESSOR_UNKNOWN,
1077 CPU_VMFUNC_FLAGS, 0 },
1078 { STRING_COMMA_LEN (".smx"), PROCESSOR_UNKNOWN,
1079 CPU_SMX_FLAGS, 0 },
1080 { STRING_COMMA_LEN (".xsave"), PROCESSOR_UNKNOWN,
1081 CPU_XSAVE_FLAGS, 0 },
1082 { STRING_COMMA_LEN (".xsaveopt"), PROCESSOR_UNKNOWN,
1083 CPU_XSAVEOPT_FLAGS, 0 },
1084 { STRING_COMMA_LEN (".xsavec"), PROCESSOR_UNKNOWN,
1085 CPU_XSAVEC_FLAGS, 0 },
1086 { STRING_COMMA_LEN (".xsaves"), PROCESSOR_UNKNOWN,
1087 CPU_XSAVES_FLAGS, 0 },
1088 { STRING_COMMA_LEN (".aes"), PROCESSOR_UNKNOWN,
1089 CPU_AES_FLAGS, 0 },
1090 { STRING_COMMA_LEN (".pclmul"), PROCESSOR_UNKNOWN,
1091 CPU_PCLMUL_FLAGS, 0 },
1092 { STRING_COMMA_LEN (".clmul"), PROCESSOR_UNKNOWN,
1093 CPU_PCLMUL_FLAGS, 1 },
1094 { STRING_COMMA_LEN (".fsgsbase"), PROCESSOR_UNKNOWN,
1095 CPU_FSGSBASE_FLAGS, 0 },
1096 { STRING_COMMA_LEN (".rdrnd"), PROCESSOR_UNKNOWN,
1097 CPU_RDRND_FLAGS, 0 },
1098 { STRING_COMMA_LEN (".f16c"), PROCESSOR_UNKNOWN,
1099 CPU_F16C_FLAGS, 0 },
1100 { STRING_COMMA_LEN (".bmi2"), PROCESSOR_UNKNOWN,
1101 CPU_BMI2_FLAGS, 0 },
1102 { STRING_COMMA_LEN (".fma"), PROCESSOR_UNKNOWN,
1103 CPU_FMA_FLAGS, 0 },
1104 { STRING_COMMA_LEN (".fma4"), PROCESSOR_UNKNOWN,
1105 CPU_FMA4_FLAGS, 0 },
1106 { STRING_COMMA_LEN (".xop"), PROCESSOR_UNKNOWN,
1107 CPU_XOP_FLAGS, 0 },
1108 { STRING_COMMA_LEN (".lwp"), PROCESSOR_UNKNOWN,
1109 CPU_LWP_FLAGS, 0 },
1110 { STRING_COMMA_LEN (".movbe"), PROCESSOR_UNKNOWN,
1111 CPU_MOVBE_FLAGS, 0 },
1112 { STRING_COMMA_LEN (".cx16"), PROCESSOR_UNKNOWN,
1113 CPU_CX16_FLAGS, 0 },
1114 { STRING_COMMA_LEN (".ept"), PROCESSOR_UNKNOWN,
1115 CPU_EPT_FLAGS, 0 },
1116 { STRING_COMMA_LEN (".lzcnt"), PROCESSOR_UNKNOWN,
1117 CPU_LZCNT_FLAGS, 0 },
1118 { STRING_COMMA_LEN (".popcnt"), PROCESSOR_UNKNOWN,
1119 CPU_POPCNT_FLAGS, 0 },
1120 { STRING_COMMA_LEN (".hle"), PROCESSOR_UNKNOWN,
1121 CPU_HLE_FLAGS, 0 },
1122 { STRING_COMMA_LEN (".rtm"), PROCESSOR_UNKNOWN,
1123 CPU_RTM_FLAGS, 0 },
1124 { STRING_COMMA_LEN (".invpcid"), PROCESSOR_UNKNOWN,
1125 CPU_INVPCID_FLAGS, 0 },
1126 { STRING_COMMA_LEN (".clflush"), PROCESSOR_UNKNOWN,
1127 CPU_CLFLUSH_FLAGS, 0 },
1128 { STRING_COMMA_LEN (".nop"), PROCESSOR_UNKNOWN,
1129 CPU_NOP_FLAGS, 0 },
1130 { STRING_COMMA_LEN (".syscall"), PROCESSOR_UNKNOWN,
1131 CPU_SYSCALL_FLAGS, 0 },
1132 { STRING_COMMA_LEN (".rdtscp"), PROCESSOR_UNKNOWN,
1133 CPU_RDTSCP_FLAGS, 0 },
1134 { STRING_COMMA_LEN (".3dnow"), PROCESSOR_UNKNOWN,
1135 CPU_3DNOW_FLAGS, 0 },
1136 { STRING_COMMA_LEN (".3dnowa"), PROCESSOR_UNKNOWN,
1137 CPU_3DNOWA_FLAGS, 0 },
1138 { STRING_COMMA_LEN (".padlock"), PROCESSOR_UNKNOWN,
1139 CPU_PADLOCK_FLAGS, 0 },
1140 { STRING_COMMA_LEN (".pacifica"), PROCESSOR_UNKNOWN,
1141 CPU_SVME_FLAGS, 1 },
1142 { STRING_COMMA_LEN (".svme"), PROCESSOR_UNKNOWN,
1143 CPU_SVME_FLAGS, 0 },
1144 { STRING_COMMA_LEN (".sse4a"), PROCESSOR_UNKNOWN,
1145 CPU_SSE4A_FLAGS, 0 },
1146 { STRING_COMMA_LEN (".abm"), PROCESSOR_UNKNOWN,
1147 CPU_ABM_FLAGS, 0 },
1148 { STRING_COMMA_LEN (".bmi"), PROCESSOR_UNKNOWN,
1149 CPU_BMI_FLAGS, 0 },
1150 { STRING_COMMA_LEN (".tbm"), PROCESSOR_UNKNOWN,
1151 CPU_TBM_FLAGS, 0 },
1152 { STRING_COMMA_LEN (".adx"), PROCESSOR_UNKNOWN,
1153 CPU_ADX_FLAGS, 0 },
1154 { STRING_COMMA_LEN (".rdseed"), PROCESSOR_UNKNOWN,
1155 CPU_RDSEED_FLAGS, 0 },
1156 { STRING_COMMA_LEN (".prfchw"), PROCESSOR_UNKNOWN,
1157 CPU_PRFCHW_FLAGS, 0 },
1158 { STRING_COMMA_LEN (".smap"), PROCESSOR_UNKNOWN,
1159 CPU_SMAP_FLAGS, 0 },
1160 { STRING_COMMA_LEN (".mpx"), PROCESSOR_UNKNOWN,
1161 CPU_MPX_FLAGS, 0 },
1162 { STRING_COMMA_LEN (".sha"), PROCESSOR_UNKNOWN,
1163 CPU_SHA_FLAGS, 0 },
1164 { STRING_COMMA_LEN (".clflushopt"), PROCESSOR_UNKNOWN,
1165 CPU_CLFLUSHOPT_FLAGS, 0 },
1166 { STRING_COMMA_LEN (".prefetchwt1"), PROCESSOR_UNKNOWN,
1167 CPU_PREFETCHWT1_FLAGS, 0 },
1168 { STRING_COMMA_LEN (".se1"), PROCESSOR_UNKNOWN,
1169 CPU_SE1_FLAGS, 0 },
1170 { STRING_COMMA_LEN (".clwb"), PROCESSOR_UNKNOWN,
1171 CPU_CLWB_FLAGS, 0 },
1172 { STRING_COMMA_LEN (".avx512ifma"), PROCESSOR_UNKNOWN,
1173 CPU_AVX512IFMA_FLAGS, 0 },
1174 { STRING_COMMA_LEN (".avx512vbmi"), PROCESSOR_UNKNOWN,
1175 CPU_AVX512VBMI_FLAGS, 0 },
1176 { STRING_COMMA_LEN (".avx512_4fmaps"), PROCESSOR_UNKNOWN,
1177 CPU_AVX512_4FMAPS_FLAGS, 0 },
1178 { STRING_COMMA_LEN (".avx512_4vnniw"), PROCESSOR_UNKNOWN,
1179 CPU_AVX512_4VNNIW_FLAGS, 0 },
1180 { STRING_COMMA_LEN (".avx512_vpopcntdq"), PROCESSOR_UNKNOWN,
1181 CPU_AVX512_VPOPCNTDQ_FLAGS, 0 },
1182 { STRING_COMMA_LEN (".avx512_vbmi2"), PROCESSOR_UNKNOWN,
1183 CPU_AVX512_VBMI2_FLAGS, 0 },
1184 { STRING_COMMA_LEN (".avx512_vnni"), PROCESSOR_UNKNOWN,
1185 CPU_AVX512_VNNI_FLAGS, 0 },
1186 { STRING_COMMA_LEN (".avx512_bitalg"), PROCESSOR_UNKNOWN,
1187 CPU_AVX512_BITALG_FLAGS, 0 },
1188 { STRING_COMMA_LEN (".avx_vnni"), PROCESSOR_UNKNOWN,
1189 CPU_AVX_VNNI_FLAGS, 0 },
1190 { STRING_COMMA_LEN (".clzero"), PROCESSOR_UNKNOWN,
1191 CPU_CLZERO_FLAGS, 0 },
1192 { STRING_COMMA_LEN (".mwaitx"), PROCESSOR_UNKNOWN,
1193 CPU_MWAITX_FLAGS, 0 },
1194 { STRING_COMMA_LEN (".ospke"), PROCESSOR_UNKNOWN,
1195 CPU_OSPKE_FLAGS, 0 },
1196 { STRING_COMMA_LEN (".rdpid"), PROCESSOR_UNKNOWN,
1197 CPU_RDPID_FLAGS, 0 },
1198 { STRING_COMMA_LEN (".ptwrite"), PROCESSOR_UNKNOWN,
1199 CPU_PTWRITE_FLAGS, 0 },
1200 { STRING_COMMA_LEN (".ibt"), PROCESSOR_UNKNOWN,
1201 CPU_IBT_FLAGS, 0 },
1202 { STRING_COMMA_LEN (".shstk"), PROCESSOR_UNKNOWN,
1203 CPU_SHSTK_FLAGS, 0 },
1204 { STRING_COMMA_LEN (".gfni"), PROCESSOR_UNKNOWN,
1205 CPU_GFNI_FLAGS, 0 },
1206 { STRING_COMMA_LEN (".vaes"), PROCESSOR_UNKNOWN,
1207 CPU_VAES_FLAGS, 0 },
1208 { STRING_COMMA_LEN (".vpclmulqdq"), PROCESSOR_UNKNOWN,
1209 CPU_VPCLMULQDQ_FLAGS, 0 },
1210 { STRING_COMMA_LEN (".wbnoinvd"), PROCESSOR_UNKNOWN,
1211 CPU_WBNOINVD_FLAGS, 0 },
1212 { STRING_COMMA_LEN (".pconfig"), PROCESSOR_UNKNOWN,
1213 CPU_PCONFIG_FLAGS, 0 },
1214 { STRING_COMMA_LEN (".waitpkg"), PROCESSOR_UNKNOWN,
1215 CPU_WAITPKG_FLAGS, 0 },
1216 { STRING_COMMA_LEN (".cldemote"), PROCESSOR_UNKNOWN,
1217 CPU_CLDEMOTE_FLAGS, 0 },
1218 { STRING_COMMA_LEN (".amx_int8"), PROCESSOR_UNKNOWN,
1219 CPU_AMX_INT8_FLAGS, 0 },
1220 { STRING_COMMA_LEN (".amx_bf16"), PROCESSOR_UNKNOWN,
1221 CPU_AMX_BF16_FLAGS, 0 },
1222 { STRING_COMMA_LEN (".amx_tile"), PROCESSOR_UNKNOWN,
1223 CPU_AMX_TILE_FLAGS, 0 },
1224 { STRING_COMMA_LEN (".movdiri"), PROCESSOR_UNKNOWN,
1225 CPU_MOVDIRI_FLAGS, 0 },
1226 { STRING_COMMA_LEN (".movdir64b"), PROCESSOR_UNKNOWN,
1227 CPU_MOVDIR64B_FLAGS, 0 },
1228 { STRING_COMMA_LEN (".avx512_bf16"), PROCESSOR_UNKNOWN,
1229 CPU_AVX512_BF16_FLAGS, 0 },
1230 { STRING_COMMA_LEN (".avx512_vp2intersect"), PROCESSOR_UNKNOWN,
1231 CPU_AVX512_VP2INTERSECT_FLAGS, 0 },
1232 { STRING_COMMA_LEN (".tdx"), PROCESSOR_UNKNOWN,
1233 CPU_TDX_FLAGS, 0 },
1234 { STRING_COMMA_LEN (".enqcmd"), PROCESSOR_UNKNOWN,
1235 CPU_ENQCMD_FLAGS, 0 },
1236 { STRING_COMMA_LEN (".serialize"), PROCESSOR_UNKNOWN,
1237 CPU_SERIALIZE_FLAGS, 0 },
1238 { STRING_COMMA_LEN (".rdpru"), PROCESSOR_UNKNOWN,
1239 CPU_RDPRU_FLAGS, 0 },
1240 { STRING_COMMA_LEN (".mcommit"), PROCESSOR_UNKNOWN,
1241 CPU_MCOMMIT_FLAGS, 0 },
1242 { STRING_COMMA_LEN (".sev_es"), PROCESSOR_UNKNOWN,
1243 CPU_SEV_ES_FLAGS, 0 },
1244 { STRING_COMMA_LEN (".tsxldtrk"), PROCESSOR_UNKNOWN,
1245 CPU_TSXLDTRK_FLAGS, 0 },
1246 { STRING_COMMA_LEN (".kl"), PROCESSOR_UNKNOWN,
1247 CPU_KL_FLAGS, 0 },
1248 { STRING_COMMA_LEN (".widekl"), PROCESSOR_UNKNOWN,
1249 CPU_WIDEKL_FLAGS, 0 },
1250 { STRING_COMMA_LEN (".uintr"), PROCESSOR_UNKNOWN,
1251 CPU_UINTR_FLAGS, 0 },
1252 { STRING_COMMA_LEN (".hreset"), PROCESSOR_UNKNOWN,
1253 CPU_HRESET_FLAGS, 0 },
1254 };
1255
1256 static const noarch_entry cpu_noarch[] =
1257 {
1258 { STRING_COMMA_LEN ("no87"), CPU_ANY_X87_FLAGS },
1259 { STRING_COMMA_LEN ("no287"), CPU_ANY_287_FLAGS },
1260 { STRING_COMMA_LEN ("no387"), CPU_ANY_387_FLAGS },
1261 { STRING_COMMA_LEN ("no687"), CPU_ANY_687_FLAGS },
1262 { STRING_COMMA_LEN ("nocmov"), CPU_ANY_CMOV_FLAGS },
1263 { STRING_COMMA_LEN ("nofxsr"), CPU_ANY_FXSR_FLAGS },
1264 { STRING_COMMA_LEN ("nommx"), CPU_ANY_MMX_FLAGS },
1265 { STRING_COMMA_LEN ("nosse"), CPU_ANY_SSE_FLAGS },
1266 { STRING_COMMA_LEN ("nosse2"), CPU_ANY_SSE2_FLAGS },
1267 { STRING_COMMA_LEN ("nosse3"), CPU_ANY_SSE3_FLAGS },
1268 { STRING_COMMA_LEN ("nosse4a"), CPU_ANY_SSE4A_FLAGS },
1269 { STRING_COMMA_LEN ("nossse3"), CPU_ANY_SSSE3_FLAGS },
1270 { STRING_COMMA_LEN ("nosse4.1"), CPU_ANY_SSE4_1_FLAGS },
1271 { STRING_COMMA_LEN ("nosse4.2"), CPU_ANY_SSE4_2_FLAGS },
1272 { STRING_COMMA_LEN ("nosse4"), CPU_ANY_SSE4_1_FLAGS },
1273 { STRING_COMMA_LEN ("noavx"), CPU_ANY_AVX_FLAGS },
1274 { STRING_COMMA_LEN ("noavx2"), CPU_ANY_AVX2_FLAGS },
1275 { STRING_COMMA_LEN ("noavx512f"), CPU_ANY_AVX512F_FLAGS },
1276 { STRING_COMMA_LEN ("noavx512cd"), CPU_ANY_AVX512CD_FLAGS },
1277 { STRING_COMMA_LEN ("noavx512er"), CPU_ANY_AVX512ER_FLAGS },
1278 { STRING_COMMA_LEN ("noavx512pf"), CPU_ANY_AVX512PF_FLAGS },
1279 { STRING_COMMA_LEN ("noavx512dq"), CPU_ANY_AVX512DQ_FLAGS },
1280 { STRING_COMMA_LEN ("noavx512bw"), CPU_ANY_AVX512BW_FLAGS },
1281 { STRING_COMMA_LEN ("noavx512vl"), CPU_ANY_AVX512VL_FLAGS },
1282 { STRING_COMMA_LEN ("noavx512ifma"), CPU_ANY_AVX512IFMA_FLAGS },
1283 { STRING_COMMA_LEN ("noavx512vbmi"), CPU_ANY_AVX512VBMI_FLAGS },
1284 { STRING_COMMA_LEN ("noavx512_4fmaps"), CPU_ANY_AVX512_4FMAPS_FLAGS },
1285 { STRING_COMMA_LEN ("noavx512_4vnniw"), CPU_ANY_AVX512_4VNNIW_FLAGS },
1286 { STRING_COMMA_LEN ("noavx512_vpopcntdq"), CPU_ANY_AVX512_VPOPCNTDQ_FLAGS },
1287 { STRING_COMMA_LEN ("noavx512_vbmi2"), CPU_ANY_AVX512_VBMI2_FLAGS },
1288 { STRING_COMMA_LEN ("noavx512_vnni"), CPU_ANY_AVX512_VNNI_FLAGS },
1289 { STRING_COMMA_LEN ("noavx512_bitalg"), CPU_ANY_AVX512_BITALG_FLAGS },
1290 { STRING_COMMA_LEN ("noavx_vnni"), CPU_ANY_AVX_VNNI_FLAGS },
1291 { STRING_COMMA_LEN ("noibt"), CPU_ANY_IBT_FLAGS },
1292 { STRING_COMMA_LEN ("noshstk"), CPU_ANY_SHSTK_FLAGS },
1293 { STRING_COMMA_LEN ("noamx_int8"), CPU_ANY_AMX_INT8_FLAGS },
1294 { STRING_COMMA_LEN ("noamx_bf16"), CPU_ANY_AMX_BF16_FLAGS },
1295 { STRING_COMMA_LEN ("noamx_tile"), CPU_ANY_AMX_TILE_FLAGS },
1296 { STRING_COMMA_LEN ("nomovdiri"), CPU_ANY_MOVDIRI_FLAGS },
1297 { STRING_COMMA_LEN ("nomovdir64b"), CPU_ANY_MOVDIR64B_FLAGS },
1298 { STRING_COMMA_LEN ("noavx512_bf16"), CPU_ANY_AVX512_BF16_FLAGS },
1299 { STRING_COMMA_LEN ("noavx512_vp2intersect"),
1300 CPU_ANY_AVX512_VP2INTERSECT_FLAGS },
1301 { STRING_COMMA_LEN ("notdx"), CPU_ANY_TDX_FLAGS },
1302 { STRING_COMMA_LEN ("noenqcmd"), CPU_ANY_ENQCMD_FLAGS },
1303 { STRING_COMMA_LEN ("noserialize"), CPU_ANY_SERIALIZE_FLAGS },
1304 { STRING_COMMA_LEN ("notsxldtrk"), CPU_ANY_TSXLDTRK_FLAGS },
1305 { STRING_COMMA_LEN ("nokl"), CPU_ANY_KL_FLAGS },
1306 { STRING_COMMA_LEN ("nowidekl"), CPU_ANY_WIDEKL_FLAGS },
1307 { STRING_COMMA_LEN ("nouintr"), CPU_ANY_UINTR_FLAGS },
1308 { STRING_COMMA_LEN ("nohreset"), CPU_ANY_HRESET_FLAGS },
1309 };
1310
1311 #ifdef I386COFF
1312 /* Like s_lcomm_internal in gas/read.c but the alignment string
1313 is allowed to be optional. */
1314
1315 static symbolS *
1316 pe_lcomm_internal (int needs_align, symbolS *symbolP, addressT size)
1317 {
1318 addressT align = 0;
1319
1320 SKIP_WHITESPACE ();
1321
1322 if (needs_align
1323 && *input_line_pointer == ',')
1324 {
1325 align = parse_align (needs_align - 1);
1326
1327 if (align == (addressT) -1)
1328 return NULL;
1329 }
1330 else
1331 {
1332 if (size >= 8)
1333 align = 3;
1334 else if (size >= 4)
1335 align = 2;
1336 else if (size >= 2)
1337 align = 1;
1338 else
1339 align = 0;
1340 }
1341
1342 bss_alloc (symbolP, size, align);
1343 return symbolP;
1344 }
1345
1346 static void
1347 pe_lcomm (int needs_align)
1348 {
1349 s_comm_internal (needs_align * 2, pe_lcomm_internal);
1350 }
1351 #endif
1352
1353 const pseudo_typeS md_pseudo_table[] =
1354 {
1355 #if !defined(OBJ_AOUT) && !defined(USE_ALIGN_PTWO)
1356 {"align", s_align_bytes, 0},
1357 #else
1358 {"align", s_align_ptwo, 0},
1359 #endif
1360 {"arch", set_cpu_arch, 0},
1361 #ifndef I386COFF
1362 {"bss", s_bss, 0},
1363 #else
1364 {"lcomm", pe_lcomm, 1},
1365 #endif
1366 {"ffloat", float_cons, 'f'},
1367 {"dfloat", float_cons, 'd'},
1368 {"tfloat", float_cons, 'x'},
1369 {"value", cons, 2},
1370 {"slong", signed_cons, 4},
1371 {"noopt", s_ignore, 0},
1372 {"optim", s_ignore, 0},
1373 {"code16gcc", set_16bit_gcc_code_flag, CODE_16BIT},
1374 {"code16", set_code_flag, CODE_16BIT},
1375 {"code32", set_code_flag, CODE_32BIT},
1376 #ifdef BFD64
1377 {"code64", set_code_flag, CODE_64BIT},
1378 #endif
1379 {"intel_syntax", set_intel_syntax, 1},
1380 {"att_syntax", set_intel_syntax, 0},
1381 {"intel_mnemonic", set_intel_mnemonic, 1},
1382 {"att_mnemonic", set_intel_mnemonic, 0},
1383 {"allow_index_reg", set_allow_index_reg, 1},
1384 {"disallow_index_reg", set_allow_index_reg, 0},
1385 {"sse_check", set_check, 0},
1386 {"operand_check", set_check, 1},
1387 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
1388 {"largecomm", handle_large_common, 0},
1389 #else
1390 {"file", dwarf2_directive_file, 0},
1391 {"loc", dwarf2_directive_loc, 0},
1392 {"loc_mark_labels", dwarf2_directive_loc_mark_labels, 0},
1393 #endif
1394 #ifdef TE_PE
1395 {"secrel32", pe_directive_secrel, 0},
1396 #endif
1397 {0, 0, 0}
1398 };
1399
1400 /* For interface with expression (). */
1401 extern char *input_line_pointer;
1402
1403 /* Hash table for instruction mnemonic lookup. */
1404 static htab_t op_hash;
1405
1406 /* Hash table for register lookup. */
1407 static htab_t reg_hash;
1408 \f
1409 /* Various efficient no-op patterns for aligning code labels.
1410 Note: Don't try to assemble the instructions in the comments.
1411 0L and 0w are not legal. */
1412 static const unsigned char f32_1[] =
1413 {0x90}; /* nop */
1414 static const unsigned char f32_2[] =
1415 {0x66,0x90}; /* xchg %ax,%ax */
1416 static const unsigned char f32_3[] =
1417 {0x8d,0x76,0x00}; /* leal 0(%esi),%esi */
1418 static const unsigned char f32_4[] =
1419 {0x8d,0x74,0x26,0x00}; /* leal 0(%esi,1),%esi */
1420 static const unsigned char f32_6[] =
1421 {0x8d,0xb6,0x00,0x00,0x00,0x00}; /* leal 0L(%esi),%esi */
1422 static const unsigned char f32_7[] =
1423 {0x8d,0xb4,0x26,0x00,0x00,0x00,0x00}; /* leal 0L(%esi,1),%esi */
1424 static const unsigned char f16_3[] =
1425 {0x8d,0x74,0x00}; /* lea 0(%si),%si */
1426 static const unsigned char f16_4[] =
1427 {0x8d,0xb4,0x00,0x00}; /* lea 0W(%si),%si */
1428 static const unsigned char jump_disp8[] =
1429 {0xeb}; /* jmp disp8 */
1430 static const unsigned char jump32_disp32[] =
1431 {0xe9}; /* jmp disp32 */
1432 static const unsigned char jump16_disp32[] =
1433 {0x66,0xe9}; /* jmp disp32 */
1434 /* 32-bit NOPs patterns. */
1435 static const unsigned char *const f32_patt[] = {
1436 f32_1, f32_2, f32_3, f32_4, NULL, f32_6, f32_7
1437 };
1438 /* 16-bit NOPs patterns. */
1439 static const unsigned char *const f16_patt[] = {
1440 f32_1, f32_2, f16_3, f16_4
1441 };
1442 /* nopl (%[re]ax) */
1443 static const unsigned char alt_3[] =
1444 {0x0f,0x1f,0x00};
1445 /* nopl 0(%[re]ax) */
1446 static const unsigned char alt_4[] =
1447 {0x0f,0x1f,0x40,0x00};
1448 /* nopl 0(%[re]ax,%[re]ax,1) */
1449 static const unsigned char alt_5[] =
1450 {0x0f,0x1f,0x44,0x00,0x00};
1451 /* nopw 0(%[re]ax,%[re]ax,1) */
1452 static const unsigned char alt_6[] =
1453 {0x66,0x0f,0x1f,0x44,0x00,0x00};
1454 /* nopl 0L(%[re]ax) */
1455 static const unsigned char alt_7[] =
1456 {0x0f,0x1f,0x80,0x00,0x00,0x00,0x00};
1457 /* nopl 0L(%[re]ax,%[re]ax,1) */
1458 static const unsigned char alt_8[] =
1459 {0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1460 /* nopw 0L(%[re]ax,%[re]ax,1) */
1461 static const unsigned char alt_9[] =
1462 {0x66,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1463 /* nopw %cs:0L(%[re]ax,%[re]ax,1) */
1464 static const unsigned char alt_10[] =
1465 {0x66,0x2e,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1466 /* data16 nopw %cs:0L(%eax,%eax,1) */
1467 static const unsigned char alt_11[] =
1468 {0x66,0x66,0x2e,0x0f,0x1f,0x84,0x00,0x00,0x00,0x00,0x00};
1469 /* 32-bit and 64-bit NOPs patterns. */
1470 static const unsigned char *const alt_patt[] = {
1471 f32_1, f32_2, alt_3, alt_4, alt_5, alt_6, alt_7, alt_8,
1472 alt_9, alt_10, alt_11
1473 };
1474
1475 /* Genenerate COUNT bytes of NOPs to WHERE from PATT with the maximum
1476 size of a single NOP instruction MAX_SINGLE_NOP_SIZE. */
1477
1478 static void
1479 i386_output_nops (char *where, const unsigned char *const *patt,
1480 int count, int max_single_nop_size)
1481
1482 {
1483 /* Place the longer NOP first. */
1484 int last;
1485 int offset;
1486 const unsigned char *nops;
1487
1488 if (max_single_nop_size < 1)
1489 {
1490 as_fatal (_("i386_output_nops called to generate nops of at most %d bytes!"),
1491 max_single_nop_size);
1492 return;
1493 }
1494
1495 nops = patt[max_single_nop_size - 1];
1496
1497 /* Use the smaller one if the requsted one isn't available. */
1498 if (nops == NULL)
1499 {
1500 max_single_nop_size--;
1501 nops = patt[max_single_nop_size - 1];
1502 }
1503
1504 last = count % max_single_nop_size;
1505
1506 count -= last;
1507 for (offset = 0; offset < count; offset += max_single_nop_size)
1508 memcpy (where + offset, nops, max_single_nop_size);
1509
1510 if (last)
1511 {
1512 nops = patt[last - 1];
1513 if (nops == NULL)
1514 {
1515 /* Use the smaller one plus one-byte NOP if the needed one
1516 isn't available. */
1517 last--;
1518 nops = patt[last - 1];
1519 memcpy (where + offset, nops, last);
1520 where[offset + last] = *patt[0];
1521 }
1522 else
1523 memcpy (where + offset, nops, last);
1524 }
1525 }
1526
1527 static INLINE int
1528 fits_in_imm7 (offsetT num)
1529 {
1530 return (num & 0x7f) == num;
1531 }
1532
1533 static INLINE int
1534 fits_in_imm31 (offsetT num)
1535 {
1536 return (num & 0x7fffffff) == num;
1537 }
1538
1539 /* Genenerate COUNT bytes of NOPs to WHERE with the maximum size of a
1540 single NOP instruction LIMIT. */
1541
1542 void
1543 i386_generate_nops (fragS *fragP, char *where, offsetT count, int limit)
1544 {
1545 const unsigned char *const *patt = NULL;
1546 int max_single_nop_size;
1547 /* Maximum number of NOPs before switching to jump over NOPs. */
1548 int max_number_of_nops;
1549
1550 switch (fragP->fr_type)
1551 {
1552 case rs_fill_nop:
1553 case rs_align_code:
1554 break;
1555 case rs_machine_dependent:
1556 /* Allow NOP padding for jumps and calls. */
1557 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PADDING
1558 || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == FUSED_JCC_PADDING)
1559 break;
1560 /* Fall through. */
1561 default:
1562 return;
1563 }
1564
1565 /* We need to decide which NOP sequence to use for 32bit and
1566 64bit. When -mtune= is used:
1567
1568 1. For PROCESSOR_I386, PROCESSOR_I486, PROCESSOR_PENTIUM and
1569 PROCESSOR_GENERIC32, f32_patt will be used.
1570 2. For the rest, alt_patt will be used.
1571
1572 When -mtune= isn't used, alt_patt will be used if
1573 cpu_arch_isa_flags has CpuNop. Otherwise, f32_patt will
1574 be used.
1575
1576 When -march= or .arch is used, we can't use anything beyond
1577 cpu_arch_isa_flags. */
1578
1579 if (flag_code == CODE_16BIT)
1580 {
1581 patt = f16_patt;
1582 max_single_nop_size = sizeof (f16_patt) / sizeof (f16_patt[0]);
1583 /* Limit number of NOPs to 2 in 16-bit mode. */
1584 max_number_of_nops = 2;
1585 }
1586 else
1587 {
1588 if (fragP->tc_frag_data.isa == PROCESSOR_UNKNOWN)
1589 {
1590 /* PROCESSOR_UNKNOWN means that all ISAs may be used. */
1591 switch (cpu_arch_tune)
1592 {
1593 case PROCESSOR_UNKNOWN:
1594 /* We use cpu_arch_isa_flags to check if we SHOULD
1595 optimize with nops. */
1596 if (fragP->tc_frag_data.isa_flags.bitfield.cpunop)
1597 patt = alt_patt;
1598 else
1599 patt = f32_patt;
1600 break;
1601 case PROCESSOR_PENTIUM4:
1602 case PROCESSOR_NOCONA:
1603 case PROCESSOR_CORE:
1604 case PROCESSOR_CORE2:
1605 case PROCESSOR_COREI7:
1606 case PROCESSOR_L1OM:
1607 case PROCESSOR_K1OM:
1608 case PROCESSOR_GENERIC64:
1609 case PROCESSOR_K6:
1610 case PROCESSOR_ATHLON:
1611 case PROCESSOR_K8:
1612 case PROCESSOR_AMDFAM10:
1613 case PROCESSOR_BD:
1614 case PROCESSOR_ZNVER:
1615 case PROCESSOR_BT:
1616 patt = alt_patt;
1617 break;
1618 case PROCESSOR_I386:
1619 case PROCESSOR_I486:
1620 case PROCESSOR_PENTIUM:
1621 case PROCESSOR_PENTIUMPRO:
1622 case PROCESSOR_IAMCU:
1623 case PROCESSOR_GENERIC32:
1624 patt = f32_patt;
1625 break;
1626 }
1627 }
1628 else
1629 {
1630 switch (fragP->tc_frag_data.tune)
1631 {
1632 case PROCESSOR_UNKNOWN:
1633 /* When cpu_arch_isa is set, cpu_arch_tune shouldn't be
1634 PROCESSOR_UNKNOWN. */
1635 abort ();
1636 break;
1637
1638 case PROCESSOR_I386:
1639 case PROCESSOR_I486:
1640 case PROCESSOR_PENTIUM:
1641 case PROCESSOR_IAMCU:
1642 case PROCESSOR_K6:
1643 case PROCESSOR_ATHLON:
1644 case PROCESSOR_K8:
1645 case PROCESSOR_AMDFAM10:
1646 case PROCESSOR_BD:
1647 case PROCESSOR_ZNVER:
1648 case PROCESSOR_BT:
1649 case PROCESSOR_GENERIC32:
1650 /* We use cpu_arch_isa_flags to check if we CAN optimize
1651 with nops. */
1652 if (fragP->tc_frag_data.isa_flags.bitfield.cpunop)
1653 patt = alt_patt;
1654 else
1655 patt = f32_patt;
1656 break;
1657 case PROCESSOR_PENTIUMPRO:
1658 case PROCESSOR_PENTIUM4:
1659 case PROCESSOR_NOCONA:
1660 case PROCESSOR_CORE:
1661 case PROCESSOR_CORE2:
1662 case PROCESSOR_COREI7:
1663 case PROCESSOR_L1OM:
1664 case PROCESSOR_K1OM:
1665 if (fragP->tc_frag_data.isa_flags.bitfield.cpunop)
1666 patt = alt_patt;
1667 else
1668 patt = f32_patt;
1669 break;
1670 case PROCESSOR_GENERIC64:
1671 patt = alt_patt;
1672 break;
1673 }
1674 }
1675
1676 if (patt == f32_patt)
1677 {
1678 max_single_nop_size = sizeof (f32_patt) / sizeof (f32_patt[0]);
1679 /* Limit number of NOPs to 2 for older processors. */
1680 max_number_of_nops = 2;
1681 }
1682 else
1683 {
1684 max_single_nop_size = sizeof (alt_patt) / sizeof (alt_patt[0]);
1685 /* Limit number of NOPs to 7 for newer processors. */
1686 max_number_of_nops = 7;
1687 }
1688 }
1689
1690 if (limit == 0)
1691 limit = max_single_nop_size;
1692
1693 if (fragP->fr_type == rs_fill_nop)
1694 {
1695 /* Output NOPs for .nop directive. */
1696 if (limit > max_single_nop_size)
1697 {
1698 as_bad_where (fragP->fr_file, fragP->fr_line,
1699 _("invalid single nop size: %d "
1700 "(expect within [0, %d])"),
1701 limit, max_single_nop_size);
1702 return;
1703 }
1704 }
1705 else if (fragP->fr_type != rs_machine_dependent)
1706 fragP->fr_var = count;
1707
1708 if ((count / max_single_nop_size) > max_number_of_nops)
1709 {
1710 /* Generate jump over NOPs. */
1711 offsetT disp = count - 2;
1712 if (fits_in_imm7 (disp))
1713 {
1714 /* Use "jmp disp8" if possible. */
1715 count = disp;
1716 where[0] = jump_disp8[0];
1717 where[1] = count;
1718 where += 2;
1719 }
1720 else
1721 {
1722 unsigned int size_of_jump;
1723
1724 if (flag_code == CODE_16BIT)
1725 {
1726 where[0] = jump16_disp32[0];
1727 where[1] = jump16_disp32[1];
1728 size_of_jump = 2;
1729 }
1730 else
1731 {
1732 where[0] = jump32_disp32[0];
1733 size_of_jump = 1;
1734 }
1735
1736 count -= size_of_jump + 4;
1737 if (!fits_in_imm31 (count))
1738 {
1739 as_bad_where (fragP->fr_file, fragP->fr_line,
1740 _("jump over nop padding out of range"));
1741 return;
1742 }
1743
1744 md_number_to_chars (where + size_of_jump, count, 4);
1745 where += size_of_jump + 4;
1746 }
1747 }
1748
1749 /* Generate multiple NOPs. */
1750 i386_output_nops (where, patt, count, limit);
1751 }
1752
1753 static INLINE int
1754 operand_type_all_zero (const union i386_operand_type *x)
1755 {
1756 switch (ARRAY_SIZE(x->array))
1757 {
1758 case 3:
1759 if (x->array[2])
1760 return 0;
1761 /* Fall through. */
1762 case 2:
1763 if (x->array[1])
1764 return 0;
1765 /* Fall through. */
1766 case 1:
1767 return !x->array[0];
1768 default:
1769 abort ();
1770 }
1771 }
1772
1773 static INLINE void
1774 operand_type_set (union i386_operand_type *x, unsigned int v)
1775 {
1776 switch (ARRAY_SIZE(x->array))
1777 {
1778 case 3:
1779 x->array[2] = v;
1780 /* Fall through. */
1781 case 2:
1782 x->array[1] = v;
1783 /* Fall through. */
1784 case 1:
1785 x->array[0] = v;
1786 /* Fall through. */
1787 break;
1788 default:
1789 abort ();
1790 }
1791
1792 x->bitfield.class = ClassNone;
1793 x->bitfield.instance = InstanceNone;
1794 }
1795
1796 static INLINE int
1797 operand_type_equal (const union i386_operand_type *x,
1798 const union i386_operand_type *y)
1799 {
1800 switch (ARRAY_SIZE(x->array))
1801 {
1802 case 3:
1803 if (x->array[2] != y->array[2])
1804 return 0;
1805 /* Fall through. */
1806 case 2:
1807 if (x->array[1] != y->array[1])
1808 return 0;
1809 /* Fall through. */
1810 case 1:
1811 return x->array[0] == y->array[0];
1812 break;
1813 default:
1814 abort ();
1815 }
1816 }
1817
1818 static INLINE int
1819 cpu_flags_all_zero (const union i386_cpu_flags *x)
1820 {
1821 switch (ARRAY_SIZE(x->array))
1822 {
1823 case 4:
1824 if (x->array[3])
1825 return 0;
1826 /* Fall through. */
1827 case 3:
1828 if (x->array[2])
1829 return 0;
1830 /* Fall through. */
1831 case 2:
1832 if (x->array[1])
1833 return 0;
1834 /* Fall through. */
1835 case 1:
1836 return !x->array[0];
1837 default:
1838 abort ();
1839 }
1840 }
1841
1842 static INLINE int
1843 cpu_flags_equal (const union i386_cpu_flags *x,
1844 const union i386_cpu_flags *y)
1845 {
1846 switch (ARRAY_SIZE(x->array))
1847 {
1848 case 4:
1849 if (x->array[3] != y->array[3])
1850 return 0;
1851 /* Fall through. */
1852 case 3:
1853 if (x->array[2] != y->array[2])
1854 return 0;
1855 /* Fall through. */
1856 case 2:
1857 if (x->array[1] != y->array[1])
1858 return 0;
1859 /* Fall through. */
1860 case 1:
1861 return x->array[0] == y->array[0];
1862 break;
1863 default:
1864 abort ();
1865 }
1866 }
1867
1868 static INLINE int
1869 cpu_flags_check_cpu64 (i386_cpu_flags f)
1870 {
1871 return !((flag_code == CODE_64BIT && f.bitfield.cpuno64)
1872 || (flag_code != CODE_64BIT && f.bitfield.cpu64));
1873 }
1874
1875 static INLINE i386_cpu_flags
1876 cpu_flags_and (i386_cpu_flags x, i386_cpu_flags y)
1877 {
1878 switch (ARRAY_SIZE (x.array))
1879 {
1880 case 4:
1881 x.array [3] &= y.array [3];
1882 /* Fall through. */
1883 case 3:
1884 x.array [2] &= y.array [2];
1885 /* Fall through. */
1886 case 2:
1887 x.array [1] &= y.array [1];
1888 /* Fall through. */
1889 case 1:
1890 x.array [0] &= y.array [0];
1891 break;
1892 default:
1893 abort ();
1894 }
1895 return x;
1896 }
1897
1898 static INLINE i386_cpu_flags
1899 cpu_flags_or (i386_cpu_flags x, i386_cpu_flags y)
1900 {
1901 switch (ARRAY_SIZE (x.array))
1902 {
1903 case 4:
1904 x.array [3] |= y.array [3];
1905 /* Fall through. */
1906 case 3:
1907 x.array [2] |= y.array [2];
1908 /* Fall through. */
1909 case 2:
1910 x.array [1] |= y.array [1];
1911 /* Fall through. */
1912 case 1:
1913 x.array [0] |= y.array [0];
1914 break;
1915 default:
1916 abort ();
1917 }
1918 return x;
1919 }
1920
1921 static INLINE i386_cpu_flags
1922 cpu_flags_and_not (i386_cpu_flags x, i386_cpu_flags y)
1923 {
1924 switch (ARRAY_SIZE (x.array))
1925 {
1926 case 4:
1927 x.array [3] &= ~y.array [3];
1928 /* Fall through. */
1929 case 3:
1930 x.array [2] &= ~y.array [2];
1931 /* Fall through. */
1932 case 2:
1933 x.array [1] &= ~y.array [1];
1934 /* Fall through. */
1935 case 1:
1936 x.array [0] &= ~y.array [0];
1937 break;
1938 default:
1939 abort ();
1940 }
1941 return x;
1942 }
1943
1944 static const i386_cpu_flags avx512 = CPU_ANY_AVX512F_FLAGS;
1945
1946 #define CPU_FLAGS_ARCH_MATCH 0x1
1947 #define CPU_FLAGS_64BIT_MATCH 0x2
1948
1949 #define CPU_FLAGS_PERFECT_MATCH \
1950 (CPU_FLAGS_ARCH_MATCH | CPU_FLAGS_64BIT_MATCH)
1951
1952 /* Return CPU flags match bits. */
1953
1954 static int
1955 cpu_flags_match (const insn_template *t)
1956 {
1957 i386_cpu_flags x = t->cpu_flags;
1958 int match = cpu_flags_check_cpu64 (x) ? CPU_FLAGS_64BIT_MATCH : 0;
1959
1960 x.bitfield.cpu64 = 0;
1961 x.bitfield.cpuno64 = 0;
1962
1963 if (cpu_flags_all_zero (&x))
1964 {
1965 /* This instruction is available on all archs. */
1966 match |= CPU_FLAGS_ARCH_MATCH;
1967 }
1968 else
1969 {
1970 /* This instruction is available only on some archs. */
1971 i386_cpu_flags cpu = cpu_arch_flags;
1972
1973 /* AVX512VL is no standalone feature - match it and then strip it. */
1974 if (x.bitfield.cpuavx512vl && !cpu.bitfield.cpuavx512vl)
1975 return match;
1976 x.bitfield.cpuavx512vl = 0;
1977
1978 cpu = cpu_flags_and (x, cpu);
1979 if (!cpu_flags_all_zero (&cpu))
1980 {
1981 if (x.bitfield.cpuavx)
1982 {
1983 /* We need to check a few extra flags with AVX. */
1984 if (cpu.bitfield.cpuavx
1985 && (!t->opcode_modifier.sse2avx
1986 || (sse2avx && !i.prefix[DATA_PREFIX]))
1987 && (!x.bitfield.cpuaes || cpu.bitfield.cpuaes)
1988 && (!x.bitfield.cpugfni || cpu.bitfield.cpugfni)
1989 && (!x.bitfield.cpupclmul || cpu.bitfield.cpupclmul))
1990 match |= CPU_FLAGS_ARCH_MATCH;
1991 }
1992 else if (x.bitfield.cpuavx512f)
1993 {
1994 /* We need to check a few extra flags with AVX512F. */
1995 if (cpu.bitfield.cpuavx512f
1996 && (!x.bitfield.cpugfni || cpu.bitfield.cpugfni)
1997 && (!x.bitfield.cpuvaes || cpu.bitfield.cpuvaes)
1998 && (!x.bitfield.cpuvpclmulqdq || cpu.bitfield.cpuvpclmulqdq))
1999 match |= CPU_FLAGS_ARCH_MATCH;
2000 }
2001 else
2002 match |= CPU_FLAGS_ARCH_MATCH;
2003 }
2004 }
2005 return match;
2006 }
2007
2008 static INLINE i386_operand_type
2009 operand_type_and (i386_operand_type x, i386_operand_type y)
2010 {
2011 if (x.bitfield.class != y.bitfield.class)
2012 x.bitfield.class = ClassNone;
2013 if (x.bitfield.instance != y.bitfield.instance)
2014 x.bitfield.instance = InstanceNone;
2015
2016 switch (ARRAY_SIZE (x.array))
2017 {
2018 case 3:
2019 x.array [2] &= y.array [2];
2020 /* Fall through. */
2021 case 2:
2022 x.array [1] &= y.array [1];
2023 /* Fall through. */
2024 case 1:
2025 x.array [0] &= y.array [0];
2026 break;
2027 default:
2028 abort ();
2029 }
2030 return x;
2031 }
2032
2033 static INLINE i386_operand_type
2034 operand_type_and_not (i386_operand_type x, i386_operand_type y)
2035 {
2036 gas_assert (y.bitfield.class == ClassNone);
2037 gas_assert (y.bitfield.instance == InstanceNone);
2038
2039 switch (ARRAY_SIZE (x.array))
2040 {
2041 case 3:
2042 x.array [2] &= ~y.array [2];
2043 /* Fall through. */
2044 case 2:
2045 x.array [1] &= ~y.array [1];
2046 /* Fall through. */
2047 case 1:
2048 x.array [0] &= ~y.array [0];
2049 break;
2050 default:
2051 abort ();
2052 }
2053 return x;
2054 }
2055
2056 static INLINE i386_operand_type
2057 operand_type_or (i386_operand_type x, i386_operand_type y)
2058 {
2059 gas_assert (x.bitfield.class == ClassNone ||
2060 y.bitfield.class == ClassNone ||
2061 x.bitfield.class == y.bitfield.class);
2062 gas_assert (x.bitfield.instance == InstanceNone ||
2063 y.bitfield.instance == InstanceNone ||
2064 x.bitfield.instance == y.bitfield.instance);
2065
2066 switch (ARRAY_SIZE (x.array))
2067 {
2068 case 3:
2069 x.array [2] |= y.array [2];
2070 /* Fall through. */
2071 case 2:
2072 x.array [1] |= y.array [1];
2073 /* Fall through. */
2074 case 1:
2075 x.array [0] |= y.array [0];
2076 break;
2077 default:
2078 abort ();
2079 }
2080 return x;
2081 }
2082
2083 static INLINE i386_operand_type
2084 operand_type_xor (i386_operand_type x, i386_operand_type y)
2085 {
2086 gas_assert (y.bitfield.class == ClassNone);
2087 gas_assert (y.bitfield.instance == InstanceNone);
2088
2089 switch (ARRAY_SIZE (x.array))
2090 {
2091 case 3:
2092 x.array [2] ^= y.array [2];
2093 /* Fall through. */
2094 case 2:
2095 x.array [1] ^= y.array [1];
2096 /* Fall through. */
2097 case 1:
2098 x.array [0] ^= y.array [0];
2099 break;
2100 default:
2101 abort ();
2102 }
2103 return x;
2104 }
2105
2106 static const i386_operand_type disp16 = OPERAND_TYPE_DISP16;
2107 static const i386_operand_type disp32 = OPERAND_TYPE_DISP32;
2108 static const i386_operand_type disp32s = OPERAND_TYPE_DISP32S;
2109 static const i386_operand_type disp16_32 = OPERAND_TYPE_DISP16_32;
2110 static const i386_operand_type anydisp = OPERAND_TYPE_ANYDISP;
2111 static const i386_operand_type anyimm = OPERAND_TYPE_ANYIMM;
2112 static const i386_operand_type regxmm = OPERAND_TYPE_REGXMM;
2113 static const i386_operand_type regmask = OPERAND_TYPE_REGMASK;
2114 static const i386_operand_type imm8 = OPERAND_TYPE_IMM8;
2115 static const i386_operand_type imm8s = OPERAND_TYPE_IMM8S;
2116 static const i386_operand_type imm16 = OPERAND_TYPE_IMM16;
2117 static const i386_operand_type imm32 = OPERAND_TYPE_IMM32;
2118 static const i386_operand_type imm32s = OPERAND_TYPE_IMM32S;
2119 static const i386_operand_type imm64 = OPERAND_TYPE_IMM64;
2120 static const i386_operand_type imm16_32 = OPERAND_TYPE_IMM16_32;
2121 static const i386_operand_type imm16_32s = OPERAND_TYPE_IMM16_32S;
2122 static const i386_operand_type imm16_32_32s = OPERAND_TYPE_IMM16_32_32S;
2123
2124 enum operand_type
2125 {
2126 reg,
2127 imm,
2128 disp,
2129 anymem
2130 };
2131
2132 static INLINE int
2133 operand_type_check (i386_operand_type t, enum operand_type c)
2134 {
2135 switch (c)
2136 {
2137 case reg:
2138 return t.bitfield.class == Reg;
2139
2140 case imm:
2141 return (t.bitfield.imm8
2142 || t.bitfield.imm8s
2143 || t.bitfield.imm16
2144 || t.bitfield.imm32
2145 || t.bitfield.imm32s
2146 || t.bitfield.imm64);
2147
2148 case disp:
2149 return (t.bitfield.disp8
2150 || t.bitfield.disp16
2151 || t.bitfield.disp32
2152 || t.bitfield.disp32s
2153 || t.bitfield.disp64);
2154
2155 case anymem:
2156 return (t.bitfield.disp8
2157 || t.bitfield.disp16
2158 || t.bitfield.disp32
2159 || t.bitfield.disp32s
2160 || t.bitfield.disp64
2161 || t.bitfield.baseindex);
2162
2163 default:
2164 abort ();
2165 }
2166
2167 return 0;
2168 }
2169
2170 /* Return 1 if there is no conflict in 8bit/16bit/32bit/64bit/80bit size
2171 between operand GIVEN and opeand WANTED for instruction template T. */
2172
2173 static INLINE int
2174 match_operand_size (const insn_template *t, unsigned int wanted,
2175 unsigned int given)
2176 {
2177 return !((i.types[given].bitfield.byte
2178 && !t->operand_types[wanted].bitfield.byte)
2179 || (i.types[given].bitfield.word
2180 && !t->operand_types[wanted].bitfield.word)
2181 || (i.types[given].bitfield.dword
2182 && !t->operand_types[wanted].bitfield.dword)
2183 || (i.types[given].bitfield.qword
2184 && !t->operand_types[wanted].bitfield.qword)
2185 || (i.types[given].bitfield.tbyte
2186 && !t->operand_types[wanted].bitfield.tbyte));
2187 }
2188
2189 /* Return 1 if there is no conflict in SIMD register between operand
2190 GIVEN and opeand WANTED for instruction template T. */
2191
2192 static INLINE int
2193 match_simd_size (const insn_template *t, unsigned int wanted,
2194 unsigned int given)
2195 {
2196 return !((i.types[given].bitfield.xmmword
2197 && !t->operand_types[wanted].bitfield.xmmword)
2198 || (i.types[given].bitfield.ymmword
2199 && !t->operand_types[wanted].bitfield.ymmword)
2200 || (i.types[given].bitfield.zmmword
2201 && !t->operand_types[wanted].bitfield.zmmword)
2202 || (i.types[given].bitfield.tmmword
2203 && !t->operand_types[wanted].bitfield.tmmword));
2204 }
2205
2206 /* Return 1 if there is no conflict in any size between operand GIVEN
2207 and opeand WANTED for instruction template T. */
2208
2209 static INLINE int
2210 match_mem_size (const insn_template *t, unsigned int wanted,
2211 unsigned int given)
2212 {
2213 return (match_operand_size (t, wanted, given)
2214 && !((i.types[given].bitfield.unspecified
2215 && !i.broadcast
2216 && !t->operand_types[wanted].bitfield.unspecified)
2217 || (i.types[given].bitfield.fword
2218 && !t->operand_types[wanted].bitfield.fword)
2219 /* For scalar opcode templates to allow register and memory
2220 operands at the same time, some special casing is needed
2221 here. Also for v{,p}broadcast*, {,v}pmov{s,z}*, and
2222 down-conversion vpmov*. */
2223 || ((t->operand_types[wanted].bitfield.class == RegSIMD
2224 && t->operand_types[wanted].bitfield.byte
2225 + t->operand_types[wanted].bitfield.word
2226 + t->operand_types[wanted].bitfield.dword
2227 + t->operand_types[wanted].bitfield.qword
2228 > !!t->opcode_modifier.broadcast)
2229 ? (i.types[given].bitfield.xmmword
2230 || i.types[given].bitfield.ymmword
2231 || i.types[given].bitfield.zmmword)
2232 : !match_simd_size(t, wanted, given))));
2233 }
2234
2235 /* Return value has MATCH_STRAIGHT set if there is no size conflict on any
2236 operands for instruction template T, and it has MATCH_REVERSE set if there
2237 is no size conflict on any operands for the template with operands reversed
2238 (and the template allows for reversing in the first place). */
2239
2240 #define MATCH_STRAIGHT 1
2241 #define MATCH_REVERSE 2
2242
2243 static INLINE unsigned int
2244 operand_size_match (const insn_template *t)
2245 {
2246 unsigned int j, match = MATCH_STRAIGHT;
2247
2248 /* Don't check non-absolute jump instructions. */
2249 if (t->opcode_modifier.jump
2250 && t->opcode_modifier.jump != JUMP_ABSOLUTE)
2251 return match;
2252
2253 /* Check memory and accumulator operand size. */
2254 for (j = 0; j < i.operands; j++)
2255 {
2256 if (i.types[j].bitfield.class != Reg
2257 && i.types[j].bitfield.class != RegSIMD
2258 && t->opcode_modifier.anysize)
2259 continue;
2260
2261 if (t->operand_types[j].bitfield.class == Reg
2262 && !match_operand_size (t, j, j))
2263 {
2264 match = 0;
2265 break;
2266 }
2267
2268 if (t->operand_types[j].bitfield.class == RegSIMD
2269 && !match_simd_size (t, j, j))
2270 {
2271 match = 0;
2272 break;
2273 }
2274
2275 if (t->operand_types[j].bitfield.instance == Accum
2276 && (!match_operand_size (t, j, j) || !match_simd_size (t, j, j)))
2277 {
2278 match = 0;
2279 break;
2280 }
2281
2282 if ((i.flags[j] & Operand_Mem) && !match_mem_size (t, j, j))
2283 {
2284 match = 0;
2285 break;
2286 }
2287 }
2288
2289 if (!t->opcode_modifier.d)
2290 {
2291 mismatch:
2292 if (!match)
2293 i.error = operand_size_mismatch;
2294 return match;
2295 }
2296
2297 /* Check reverse. */
2298 gas_assert (i.operands >= 2 && i.operands <= 3);
2299
2300 for (j = 0; j < i.operands; j++)
2301 {
2302 unsigned int given = i.operands - j - 1;
2303
2304 if (t->operand_types[j].bitfield.class == Reg
2305 && !match_operand_size (t, j, given))
2306 goto mismatch;
2307
2308 if (t->operand_types[j].bitfield.class == RegSIMD
2309 && !match_simd_size (t, j, given))
2310 goto mismatch;
2311
2312 if (t->operand_types[j].bitfield.instance == Accum
2313 && (!match_operand_size (t, j, given)
2314 || !match_simd_size (t, j, given)))
2315 goto mismatch;
2316
2317 if ((i.flags[given] & Operand_Mem) && !match_mem_size (t, j, given))
2318 goto mismatch;
2319 }
2320
2321 return match | MATCH_REVERSE;
2322 }
2323
2324 static INLINE int
2325 operand_type_match (i386_operand_type overlap,
2326 i386_operand_type given)
2327 {
2328 i386_operand_type temp = overlap;
2329
2330 temp.bitfield.unspecified = 0;
2331 temp.bitfield.byte = 0;
2332 temp.bitfield.word = 0;
2333 temp.bitfield.dword = 0;
2334 temp.bitfield.fword = 0;
2335 temp.bitfield.qword = 0;
2336 temp.bitfield.tbyte = 0;
2337 temp.bitfield.xmmword = 0;
2338 temp.bitfield.ymmword = 0;
2339 temp.bitfield.zmmword = 0;
2340 temp.bitfield.tmmword = 0;
2341 if (operand_type_all_zero (&temp))
2342 goto mismatch;
2343
2344 if (given.bitfield.baseindex == overlap.bitfield.baseindex)
2345 return 1;
2346
2347 mismatch:
2348 i.error = operand_type_mismatch;
2349 return 0;
2350 }
2351
2352 /* If given types g0 and g1 are registers they must be of the same type
2353 unless the expected operand type register overlap is null.
2354 Some Intel syntax memory operand size checking also happens here. */
2355
2356 static INLINE int
2357 operand_type_register_match (i386_operand_type g0,
2358 i386_operand_type t0,
2359 i386_operand_type g1,
2360 i386_operand_type t1)
2361 {
2362 if (g0.bitfield.class != Reg
2363 && g0.bitfield.class != RegSIMD
2364 && (!operand_type_check (g0, anymem)
2365 || g0.bitfield.unspecified
2366 || (t0.bitfield.class != Reg
2367 && t0.bitfield.class != RegSIMD)))
2368 return 1;
2369
2370 if (g1.bitfield.class != Reg
2371 && g1.bitfield.class != RegSIMD
2372 && (!operand_type_check (g1, anymem)
2373 || g1.bitfield.unspecified
2374 || (t1.bitfield.class != Reg
2375 && t1.bitfield.class != RegSIMD)))
2376 return 1;
2377
2378 if (g0.bitfield.byte == g1.bitfield.byte
2379 && g0.bitfield.word == g1.bitfield.word
2380 && g0.bitfield.dword == g1.bitfield.dword
2381 && g0.bitfield.qword == g1.bitfield.qword
2382 && g0.bitfield.xmmword == g1.bitfield.xmmword
2383 && g0.bitfield.ymmword == g1.bitfield.ymmword
2384 && g0.bitfield.zmmword == g1.bitfield.zmmword)
2385 return 1;
2386
2387 if (!(t0.bitfield.byte & t1.bitfield.byte)
2388 && !(t0.bitfield.word & t1.bitfield.word)
2389 && !(t0.bitfield.dword & t1.bitfield.dword)
2390 && !(t0.bitfield.qword & t1.bitfield.qword)
2391 && !(t0.bitfield.xmmword & t1.bitfield.xmmword)
2392 && !(t0.bitfield.ymmword & t1.bitfield.ymmword)
2393 && !(t0.bitfield.zmmword & t1.bitfield.zmmword))
2394 return 1;
2395
2396 i.error = register_type_mismatch;
2397
2398 return 0;
2399 }
2400
2401 static INLINE unsigned int
2402 register_number (const reg_entry *r)
2403 {
2404 unsigned int nr = r->reg_num;
2405
2406 if (r->reg_flags & RegRex)
2407 nr += 8;
2408
2409 if (r->reg_flags & RegVRex)
2410 nr += 16;
2411
2412 return nr;
2413 }
2414
2415 static INLINE unsigned int
2416 mode_from_disp_size (i386_operand_type t)
2417 {
2418 if (t.bitfield.disp8)
2419 return 1;
2420 else if (t.bitfield.disp16
2421 || t.bitfield.disp32
2422 || t.bitfield.disp32s)
2423 return 2;
2424 else
2425 return 0;
2426 }
2427
2428 static INLINE int
2429 fits_in_signed_byte (addressT num)
2430 {
2431 return num + 0x80 <= 0xff;
2432 }
2433
2434 static INLINE int
2435 fits_in_unsigned_byte (addressT num)
2436 {
2437 return num <= 0xff;
2438 }
2439
2440 static INLINE int
2441 fits_in_unsigned_word (addressT num)
2442 {
2443 return num <= 0xffff;
2444 }
2445
2446 static INLINE int
2447 fits_in_signed_word (addressT num)
2448 {
2449 return num + 0x8000 <= 0xffff;
2450 }
2451
2452 static INLINE int
2453 fits_in_signed_long (addressT num ATTRIBUTE_UNUSED)
2454 {
2455 #ifndef BFD64
2456 return 1;
2457 #else
2458 return num + 0x80000000 <= 0xffffffff;
2459 #endif
2460 } /* fits_in_signed_long() */
2461
2462 static INLINE int
2463 fits_in_unsigned_long (addressT num ATTRIBUTE_UNUSED)
2464 {
2465 #ifndef BFD64
2466 return 1;
2467 #else
2468 return num <= 0xffffffff;
2469 #endif
2470 } /* fits_in_unsigned_long() */
2471
2472 static INLINE int
2473 fits_in_disp8 (offsetT num)
2474 {
2475 int shift = i.memshift;
2476 unsigned int mask;
2477
2478 if (shift == -1)
2479 abort ();
2480
2481 mask = (1 << shift) - 1;
2482
2483 /* Return 0 if NUM isn't properly aligned. */
2484 if ((num & mask))
2485 return 0;
2486
2487 /* Check if NUM will fit in 8bit after shift. */
2488 return fits_in_signed_byte (num >> shift);
2489 }
2490
2491 static INLINE int
2492 fits_in_imm4 (offsetT num)
2493 {
2494 return (num & 0xf) == num;
2495 }
2496
2497 static i386_operand_type
2498 smallest_imm_type (offsetT num)
2499 {
2500 i386_operand_type t;
2501
2502 operand_type_set (&t, 0);
2503 t.bitfield.imm64 = 1;
2504
2505 if (cpu_arch_tune != PROCESSOR_I486 && num == 1)
2506 {
2507 /* This code is disabled on the 486 because all the Imm1 forms
2508 in the opcode table are slower on the i486. They're the
2509 versions with the implicitly specified single-position
2510 displacement, which has another syntax if you really want to
2511 use that form. */
2512 t.bitfield.imm1 = 1;
2513 t.bitfield.imm8 = 1;
2514 t.bitfield.imm8s = 1;
2515 t.bitfield.imm16 = 1;
2516 t.bitfield.imm32 = 1;
2517 t.bitfield.imm32s = 1;
2518 }
2519 else if (fits_in_signed_byte (num))
2520 {
2521 t.bitfield.imm8 = 1;
2522 t.bitfield.imm8s = 1;
2523 t.bitfield.imm16 = 1;
2524 t.bitfield.imm32 = 1;
2525 t.bitfield.imm32s = 1;
2526 }
2527 else if (fits_in_unsigned_byte (num))
2528 {
2529 t.bitfield.imm8 = 1;
2530 t.bitfield.imm16 = 1;
2531 t.bitfield.imm32 = 1;
2532 t.bitfield.imm32s = 1;
2533 }
2534 else if (fits_in_signed_word (num) || fits_in_unsigned_word (num))
2535 {
2536 t.bitfield.imm16 = 1;
2537 t.bitfield.imm32 = 1;
2538 t.bitfield.imm32s = 1;
2539 }
2540 else if (fits_in_signed_long (num))
2541 {
2542 t.bitfield.imm32 = 1;
2543 t.bitfield.imm32s = 1;
2544 }
2545 else if (fits_in_unsigned_long (num))
2546 t.bitfield.imm32 = 1;
2547
2548 return t;
2549 }
2550
2551 static offsetT
2552 offset_in_range (offsetT val, int size)
2553 {
2554 addressT mask;
2555
2556 switch (size)
2557 {
2558 case 1: mask = ((addressT) 1 << 8) - 1; break;
2559 case 2: mask = ((addressT) 1 << 16) - 1; break;
2560 case 4: mask = ((addressT) 2 << 31) - 1; break;
2561 #ifdef BFD64
2562 case 8: mask = ((addressT) 2 << 63) - 1; break;
2563 #endif
2564 default: abort ();
2565 }
2566
2567 if ((val & ~mask) != 0 && (val & ~mask) != ~mask)
2568 {
2569 char buf1[40], buf2[40];
2570
2571 sprint_value (buf1, val);
2572 sprint_value (buf2, val & mask);
2573 as_warn (_("%s shortened to %s"), buf1, buf2);
2574 }
2575 return val & mask;
2576 }
2577
2578 enum PREFIX_GROUP
2579 {
2580 PREFIX_EXIST = 0,
2581 PREFIX_LOCK,
2582 PREFIX_REP,
2583 PREFIX_DS,
2584 PREFIX_OTHER
2585 };
2586
2587 /* Returns
2588 a. PREFIX_EXIST if attempting to add a prefix where one from the
2589 same class already exists.
2590 b. PREFIX_LOCK if lock prefix is added.
2591 c. PREFIX_REP if rep/repne prefix is added.
2592 d. PREFIX_DS if ds prefix is added.
2593 e. PREFIX_OTHER if other prefix is added.
2594 */
2595
2596 static enum PREFIX_GROUP
2597 add_prefix (unsigned int prefix)
2598 {
2599 enum PREFIX_GROUP ret = PREFIX_OTHER;
2600 unsigned int q;
2601
2602 if (prefix >= REX_OPCODE && prefix < REX_OPCODE + 16
2603 && flag_code == CODE_64BIT)
2604 {
2605 if ((i.prefix[REX_PREFIX] & prefix & REX_W)
2606 || (i.prefix[REX_PREFIX] & prefix & REX_R)
2607 || (i.prefix[REX_PREFIX] & prefix & REX_X)
2608 || (i.prefix[REX_PREFIX] & prefix & REX_B))
2609 ret = PREFIX_EXIST;
2610 q = REX_PREFIX;
2611 }
2612 else
2613 {
2614 switch (prefix)
2615 {
2616 default:
2617 abort ();
2618
2619 case DS_PREFIX_OPCODE:
2620 ret = PREFIX_DS;
2621 /* Fall through. */
2622 case CS_PREFIX_OPCODE:
2623 case ES_PREFIX_OPCODE:
2624 case FS_PREFIX_OPCODE:
2625 case GS_PREFIX_OPCODE:
2626 case SS_PREFIX_OPCODE:
2627 q = SEG_PREFIX;
2628 break;
2629
2630 case REPNE_PREFIX_OPCODE:
2631 case REPE_PREFIX_OPCODE:
2632 q = REP_PREFIX;
2633 ret = PREFIX_REP;
2634 break;
2635
2636 case LOCK_PREFIX_OPCODE:
2637 q = LOCK_PREFIX;
2638 ret = PREFIX_LOCK;
2639 break;
2640
2641 case FWAIT_OPCODE:
2642 q = WAIT_PREFIX;
2643 break;
2644
2645 case ADDR_PREFIX_OPCODE:
2646 q = ADDR_PREFIX;
2647 break;
2648
2649 case DATA_PREFIX_OPCODE:
2650 q = DATA_PREFIX;
2651 break;
2652 }
2653 if (i.prefix[q] != 0)
2654 ret = PREFIX_EXIST;
2655 }
2656
2657 if (ret)
2658 {
2659 if (!i.prefix[q])
2660 ++i.prefixes;
2661 i.prefix[q] |= prefix;
2662 }
2663 else
2664 as_bad (_("same type of prefix used twice"));
2665
2666 return ret;
2667 }
2668
2669 static void
2670 update_code_flag (int value, int check)
2671 {
2672 PRINTF_LIKE ((*as_error));
2673
2674 flag_code = (enum flag_code) value;
2675 if (flag_code == CODE_64BIT)
2676 {
2677 cpu_arch_flags.bitfield.cpu64 = 1;
2678 cpu_arch_flags.bitfield.cpuno64 = 0;
2679 }
2680 else
2681 {
2682 cpu_arch_flags.bitfield.cpu64 = 0;
2683 cpu_arch_flags.bitfield.cpuno64 = 1;
2684 }
2685 if (value == CODE_64BIT && !cpu_arch_flags.bitfield.cpulm )
2686 {
2687 if (check)
2688 as_error = as_fatal;
2689 else
2690 as_error = as_bad;
2691 (*as_error) (_("64bit mode not supported on `%s'."),
2692 cpu_arch_name ? cpu_arch_name : default_arch);
2693 }
2694 if (value == CODE_32BIT && !cpu_arch_flags.bitfield.cpui386)
2695 {
2696 if (check)
2697 as_error = as_fatal;
2698 else
2699 as_error = as_bad;
2700 (*as_error) (_("32bit mode not supported on `%s'."),
2701 cpu_arch_name ? cpu_arch_name : default_arch);
2702 }
2703 stackop_size = '\0';
2704 }
2705
2706 static void
2707 set_code_flag (int value)
2708 {
2709 update_code_flag (value, 0);
2710 }
2711
2712 static void
2713 set_16bit_gcc_code_flag (int new_code_flag)
2714 {
2715 flag_code = (enum flag_code) new_code_flag;
2716 if (flag_code != CODE_16BIT)
2717 abort ();
2718 cpu_arch_flags.bitfield.cpu64 = 0;
2719 cpu_arch_flags.bitfield.cpuno64 = 1;
2720 stackop_size = LONG_MNEM_SUFFIX;
2721 }
2722
2723 static void
2724 set_intel_syntax (int syntax_flag)
2725 {
2726 /* Find out if register prefixing is specified. */
2727 int ask_naked_reg = 0;
2728
2729 SKIP_WHITESPACE ();
2730 if (!is_end_of_line[(unsigned char) *input_line_pointer])
2731 {
2732 char *string;
2733 int e = get_symbol_name (&string);
2734
2735 if (strcmp (string, "prefix") == 0)
2736 ask_naked_reg = 1;
2737 else if (strcmp (string, "noprefix") == 0)
2738 ask_naked_reg = -1;
2739 else
2740 as_bad (_("bad argument to syntax directive."));
2741 (void) restore_line_pointer (e);
2742 }
2743 demand_empty_rest_of_line ();
2744
2745 intel_syntax = syntax_flag;
2746
2747 if (ask_naked_reg == 0)
2748 allow_naked_reg = (intel_syntax
2749 && (bfd_get_symbol_leading_char (stdoutput) != '\0'));
2750 else
2751 allow_naked_reg = (ask_naked_reg < 0);
2752
2753 expr_set_rank (O_full_ptr, syntax_flag ? 10 : 0);
2754
2755 identifier_chars['%'] = intel_syntax && allow_naked_reg ? '%' : 0;
2756 identifier_chars['$'] = intel_syntax ? '$' : 0;
2757 register_prefix = allow_naked_reg ? "" : "%";
2758 }
2759
2760 static void
2761 set_intel_mnemonic (int mnemonic_flag)
2762 {
2763 intel_mnemonic = mnemonic_flag;
2764 }
2765
2766 static void
2767 set_allow_index_reg (int flag)
2768 {
2769 allow_index_reg = flag;
2770 }
2771
2772 static void
2773 set_check (int what)
2774 {
2775 enum check_kind *kind;
2776 const char *str;
2777
2778 if (what)
2779 {
2780 kind = &operand_check;
2781 str = "operand";
2782 }
2783 else
2784 {
2785 kind = &sse_check;
2786 str = "sse";
2787 }
2788
2789 SKIP_WHITESPACE ();
2790
2791 if (!is_end_of_line[(unsigned char) *input_line_pointer])
2792 {
2793 char *string;
2794 int e = get_symbol_name (&string);
2795
2796 if (strcmp (string, "none") == 0)
2797 *kind = check_none;
2798 else if (strcmp (string, "warning") == 0)
2799 *kind = check_warning;
2800 else if (strcmp (string, "error") == 0)
2801 *kind = check_error;
2802 else
2803 as_bad (_("bad argument to %s_check directive."), str);
2804 (void) restore_line_pointer (e);
2805 }
2806 else
2807 as_bad (_("missing argument for %s_check directive"), str);
2808
2809 demand_empty_rest_of_line ();
2810 }
2811
2812 static void
2813 check_cpu_arch_compatible (const char *name ATTRIBUTE_UNUSED,
2814 i386_cpu_flags new_flag ATTRIBUTE_UNUSED)
2815 {
2816 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
2817 static const char *arch;
2818
2819 /* Intel LIOM is only supported on ELF. */
2820 if (!IS_ELF)
2821 return;
2822
2823 if (!arch)
2824 {
2825 /* Use cpu_arch_name if it is set in md_parse_option. Otherwise
2826 use default_arch. */
2827 arch = cpu_arch_name;
2828 if (!arch)
2829 arch = default_arch;
2830 }
2831
2832 /* If we are targeting Intel MCU, we must enable it. */
2833 if (get_elf_backend_data (stdoutput)->elf_machine_code != EM_IAMCU
2834 || new_flag.bitfield.cpuiamcu)
2835 return;
2836
2837 /* If we are targeting Intel L1OM, we must enable it. */
2838 if (get_elf_backend_data (stdoutput)->elf_machine_code != EM_L1OM
2839 || new_flag.bitfield.cpul1om)
2840 return;
2841
2842 /* If we are targeting Intel K1OM, we must enable it. */
2843 if (get_elf_backend_data (stdoutput)->elf_machine_code != EM_K1OM
2844 || new_flag.bitfield.cpuk1om)
2845 return;
2846
2847 as_bad (_("`%s' is not supported on `%s'"), name, arch);
2848 #endif
2849 }
2850
2851 static void
2852 set_cpu_arch (int dummy ATTRIBUTE_UNUSED)
2853 {
2854 SKIP_WHITESPACE ();
2855
2856 if (!is_end_of_line[(unsigned char) *input_line_pointer])
2857 {
2858 char *string;
2859 int e = get_symbol_name (&string);
2860 unsigned int j;
2861 i386_cpu_flags flags;
2862
2863 for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
2864 {
2865 if (strcmp (string, cpu_arch[j].name) == 0)
2866 {
2867 check_cpu_arch_compatible (string, cpu_arch[j].flags);
2868
2869 if (*string != '.')
2870 {
2871 cpu_arch_name = cpu_arch[j].name;
2872 cpu_sub_arch_name = NULL;
2873 cpu_arch_flags = cpu_arch[j].flags;
2874 if (flag_code == CODE_64BIT)
2875 {
2876 cpu_arch_flags.bitfield.cpu64 = 1;
2877 cpu_arch_flags.bitfield.cpuno64 = 0;
2878 }
2879 else
2880 {
2881 cpu_arch_flags.bitfield.cpu64 = 0;
2882 cpu_arch_flags.bitfield.cpuno64 = 1;
2883 }
2884 cpu_arch_isa = cpu_arch[j].type;
2885 cpu_arch_isa_flags = cpu_arch[j].flags;
2886 if (!cpu_arch_tune_set)
2887 {
2888 cpu_arch_tune = cpu_arch_isa;
2889 cpu_arch_tune_flags = cpu_arch_isa_flags;
2890 }
2891 break;
2892 }
2893
2894 flags = cpu_flags_or (cpu_arch_flags,
2895 cpu_arch[j].flags);
2896
2897 if (!cpu_flags_equal (&flags, &cpu_arch_flags))
2898 {
2899 if (cpu_sub_arch_name)
2900 {
2901 char *name = cpu_sub_arch_name;
2902 cpu_sub_arch_name = concat (name,
2903 cpu_arch[j].name,
2904 (const char *) NULL);
2905 free (name);
2906 }
2907 else
2908 cpu_sub_arch_name = xstrdup (cpu_arch[j].name);
2909 cpu_arch_flags = flags;
2910 cpu_arch_isa_flags = flags;
2911 }
2912 else
2913 cpu_arch_isa_flags
2914 = cpu_flags_or (cpu_arch_isa_flags,
2915 cpu_arch[j].flags);
2916 (void) restore_line_pointer (e);
2917 demand_empty_rest_of_line ();
2918 return;
2919 }
2920 }
2921
2922 if (*string == '.' && j >= ARRAY_SIZE (cpu_arch))
2923 {
2924 /* Disable an ISA extension. */
2925 for (j = 0; j < ARRAY_SIZE (cpu_noarch); j++)
2926 if (strcmp (string + 1, cpu_noarch [j].name) == 0)
2927 {
2928 flags = cpu_flags_and_not (cpu_arch_flags,
2929 cpu_noarch[j].flags);
2930 if (!cpu_flags_equal (&flags, &cpu_arch_flags))
2931 {
2932 if (cpu_sub_arch_name)
2933 {
2934 char *name = cpu_sub_arch_name;
2935 cpu_sub_arch_name = concat (name, string,
2936 (const char *) NULL);
2937 free (name);
2938 }
2939 else
2940 cpu_sub_arch_name = xstrdup (string);
2941 cpu_arch_flags = flags;
2942 cpu_arch_isa_flags = flags;
2943 }
2944 (void) restore_line_pointer (e);
2945 demand_empty_rest_of_line ();
2946 return;
2947 }
2948
2949 j = ARRAY_SIZE (cpu_arch);
2950 }
2951
2952 if (j >= ARRAY_SIZE (cpu_arch))
2953 as_bad (_("no such architecture: `%s'"), string);
2954
2955 *input_line_pointer = e;
2956 }
2957 else
2958 as_bad (_("missing cpu architecture"));
2959
2960 no_cond_jump_promotion = 0;
2961 if (*input_line_pointer == ','
2962 && !is_end_of_line[(unsigned char) input_line_pointer[1]])
2963 {
2964 char *string;
2965 char e;
2966
2967 ++input_line_pointer;
2968 e = get_symbol_name (&string);
2969
2970 if (strcmp (string, "nojumps") == 0)
2971 no_cond_jump_promotion = 1;
2972 else if (strcmp (string, "jumps") == 0)
2973 ;
2974 else
2975 as_bad (_("no such architecture modifier: `%s'"), string);
2976
2977 (void) restore_line_pointer (e);
2978 }
2979
2980 demand_empty_rest_of_line ();
2981 }
2982
2983 enum bfd_architecture
2984 i386_arch (void)
2985 {
2986 if (cpu_arch_isa == PROCESSOR_L1OM)
2987 {
2988 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2989 || flag_code != CODE_64BIT)
2990 as_fatal (_("Intel L1OM is 64bit ELF only"));
2991 return bfd_arch_l1om;
2992 }
2993 else if (cpu_arch_isa == PROCESSOR_K1OM)
2994 {
2995 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
2996 || flag_code != CODE_64BIT)
2997 as_fatal (_("Intel K1OM is 64bit ELF only"));
2998 return bfd_arch_k1om;
2999 }
3000 else if (cpu_arch_isa == PROCESSOR_IAMCU)
3001 {
3002 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
3003 || flag_code == CODE_64BIT)
3004 as_fatal (_("Intel MCU is 32bit ELF only"));
3005 return bfd_arch_iamcu;
3006 }
3007 else
3008 return bfd_arch_i386;
3009 }
3010
3011 unsigned long
3012 i386_mach (void)
3013 {
3014 if (!strncmp (default_arch, "x86_64", 6))
3015 {
3016 if (cpu_arch_isa == PROCESSOR_L1OM)
3017 {
3018 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
3019 || default_arch[6] != '\0')
3020 as_fatal (_("Intel L1OM is 64bit ELF only"));
3021 return bfd_mach_l1om;
3022 }
3023 else if (cpu_arch_isa == PROCESSOR_K1OM)
3024 {
3025 if (OUTPUT_FLAVOR != bfd_target_elf_flavour
3026 || default_arch[6] != '\0')
3027 as_fatal (_("Intel K1OM is 64bit ELF only"));
3028 return bfd_mach_k1om;
3029 }
3030 else if (default_arch[6] == '\0')
3031 return bfd_mach_x86_64;
3032 else
3033 return bfd_mach_x64_32;
3034 }
3035 else if (!strcmp (default_arch, "i386")
3036 || !strcmp (default_arch, "iamcu"))
3037 {
3038 if (cpu_arch_isa == PROCESSOR_IAMCU)
3039 {
3040 if (OUTPUT_FLAVOR != bfd_target_elf_flavour)
3041 as_fatal (_("Intel MCU is 32bit ELF only"));
3042 return bfd_mach_i386_iamcu;
3043 }
3044 else
3045 return bfd_mach_i386_i386;
3046 }
3047 else
3048 as_fatal (_("unknown architecture"));
3049 }
3050 \f
3051 void
3052 md_begin (void)
3053 {
3054 /* Support pseudo prefixes like {disp32}. */
3055 lex_type ['{'] = LEX_BEGIN_NAME;
3056
3057 /* Initialize op_hash hash table. */
3058 op_hash = str_htab_create ();
3059
3060 {
3061 const insn_template *optab;
3062 templates *core_optab;
3063
3064 /* Setup for loop. */
3065 optab = i386_optab;
3066 core_optab = XNEW (templates);
3067 core_optab->start = optab;
3068
3069 while (1)
3070 {
3071 ++optab;
3072 if (optab->name == NULL
3073 || strcmp (optab->name, (optab - 1)->name) != 0)
3074 {
3075 /* different name --> ship out current template list;
3076 add to hash table; & begin anew. */
3077 core_optab->end = optab;
3078 if (str_hash_insert (op_hash, (optab - 1)->name, core_optab, 0))
3079 as_fatal (_("duplicate %s"), (optab - 1)->name);
3080
3081 if (optab->name == NULL)
3082 break;
3083 core_optab = XNEW (templates);
3084 core_optab->start = optab;
3085 }
3086 }
3087 }
3088
3089 /* Initialize reg_hash hash table. */
3090 reg_hash = str_htab_create ();
3091 {
3092 const reg_entry *regtab;
3093 unsigned int regtab_size = i386_regtab_size;
3094
3095 for (regtab = i386_regtab; regtab_size--; regtab++)
3096 if (str_hash_insert (reg_hash, regtab->reg_name, regtab, 0) != NULL)
3097 as_fatal (_("duplicate %s"), regtab->reg_name);
3098 }
3099
3100 /* Fill in lexical tables: mnemonic_chars, operand_chars. */
3101 {
3102 int c;
3103 char *p;
3104
3105 for (c = 0; c < 256; c++)
3106 {
3107 if (ISDIGIT (c))
3108 {
3109 digit_chars[c] = c;
3110 mnemonic_chars[c] = c;
3111 register_chars[c] = c;
3112 operand_chars[c] = c;
3113 }
3114 else if (ISLOWER (c))
3115 {
3116 mnemonic_chars[c] = c;
3117 register_chars[c] = c;
3118 operand_chars[c] = c;
3119 }
3120 else if (ISUPPER (c))
3121 {
3122 mnemonic_chars[c] = TOLOWER (c);
3123 register_chars[c] = mnemonic_chars[c];
3124 operand_chars[c] = c;
3125 }
3126 else if (c == '{' || c == '}')
3127 {
3128 mnemonic_chars[c] = c;
3129 operand_chars[c] = c;
3130 }
3131 #ifdef SVR4_COMMENT_CHARS
3132 else if (c == '\\' && strchr (i386_comment_chars, '/'))
3133 operand_chars[c] = c;
3134 #endif
3135
3136 if (ISALPHA (c) || ISDIGIT (c))
3137 identifier_chars[c] = c;
3138 else if (c >= 128)
3139 {
3140 identifier_chars[c] = c;
3141 operand_chars[c] = c;
3142 }
3143 }
3144
3145 #ifdef LEX_AT
3146 identifier_chars['@'] = '@';
3147 #endif
3148 #ifdef LEX_QM
3149 identifier_chars['?'] = '?';
3150 operand_chars['?'] = '?';
3151 #endif
3152 digit_chars['-'] = '-';
3153 mnemonic_chars['_'] = '_';
3154 mnemonic_chars['-'] = '-';
3155 mnemonic_chars['.'] = '.';
3156 identifier_chars['_'] = '_';
3157 identifier_chars['.'] = '.';
3158
3159 for (p = operand_special_chars; *p != '\0'; p++)
3160 operand_chars[(unsigned char) *p] = *p;
3161 }
3162
3163 if (flag_code == CODE_64BIT)
3164 {
3165 #if defined (OBJ_COFF) && defined (TE_PE)
3166 x86_dwarf2_return_column = (OUTPUT_FLAVOR == bfd_target_coff_flavour
3167 ? 32 : 16);
3168 #else
3169 x86_dwarf2_return_column = 16;
3170 #endif
3171 x86_cie_data_alignment = -8;
3172 }
3173 else
3174 {
3175 x86_dwarf2_return_column = 8;
3176 x86_cie_data_alignment = -4;
3177 }
3178
3179 /* NB: FUSED_JCC_PADDING frag must have sufficient room so that it
3180 can be turned into BRANCH_PREFIX frag. */
3181 if (align_branch_prefix_size > MAX_FUSED_JCC_PADDING_SIZE)
3182 abort ();
3183 }
3184
3185 void
3186 i386_print_statistics (FILE *file)
3187 {
3188 htab_print_statistics (file, "i386 opcode", op_hash);
3189 htab_print_statistics (file, "i386 register", reg_hash);
3190 }
3191 \f
3192 #ifdef DEBUG386
3193
3194 /* Debugging routines for md_assemble. */
3195 static void pte (insn_template *);
3196 static void pt (i386_operand_type);
3197 static void pe (expressionS *);
3198 static void ps (symbolS *);
3199
3200 static void
3201 pi (const char *line, i386_insn *x)
3202 {
3203 unsigned int j;
3204
3205 fprintf (stdout, "%s: template ", line);
3206 pte (&x->tm);
3207 fprintf (stdout, " address: base %s index %s scale %x\n",
3208 x->base_reg ? x->base_reg->reg_name : "none",
3209 x->index_reg ? x->index_reg->reg_name : "none",
3210 x->log2_scale_factor);
3211 fprintf (stdout, " modrm: mode %x reg %x reg/mem %x\n",
3212 x->rm.mode, x->rm.reg, x->rm.regmem);
3213 fprintf (stdout, " sib: base %x index %x scale %x\n",
3214 x->sib.base, x->sib.index, x->sib.scale);
3215 fprintf (stdout, " rex: 64bit %x extX %x extY %x extZ %x\n",
3216 (x->rex & REX_W) != 0,
3217 (x->rex & REX_R) != 0,
3218 (x->rex & REX_X) != 0,
3219 (x->rex & REX_B) != 0);
3220 for (j = 0; j < x->operands; j++)
3221 {
3222 fprintf (stdout, " #%d: ", j + 1);
3223 pt (x->types[j]);
3224 fprintf (stdout, "\n");
3225 if (x->types[j].bitfield.class == Reg
3226 || x->types[j].bitfield.class == RegMMX
3227 || x->types[j].bitfield.class == RegSIMD
3228 || x->types[j].bitfield.class == RegMask
3229 || x->types[j].bitfield.class == SReg
3230 || x->types[j].bitfield.class == RegCR
3231 || x->types[j].bitfield.class == RegDR
3232 || x->types[j].bitfield.class == RegTR
3233 || x->types[j].bitfield.class == RegBND)
3234 fprintf (stdout, "%s\n", x->op[j].regs->reg_name);
3235 if (operand_type_check (x->types[j], imm))
3236 pe (x->op[j].imms);
3237 if (operand_type_check (x->types[j], disp))
3238 pe (x->op[j].disps);
3239 }
3240 }
3241
3242 static void
3243 pte (insn_template *t)
3244 {
3245 static const unsigned char opc_pfx[] = { 0, 0x66, 0xf3, 0xf2 };
3246 static const char *const opc_spc[] = {
3247 NULL, "0f", "0f38", "0f3a", NULL, NULL, NULL, NULL,
3248 "XOP08", "XOP09", "XOP0A",
3249 };
3250 unsigned int j;
3251
3252 fprintf (stdout, " %d operands ", t->operands);
3253 if (opc_pfx[t->opcode_modifier.opcodeprefix])
3254 fprintf (stdout, "pfx %x ", opc_pfx[t->opcode_modifier.opcodeprefix]);
3255 if (opc_spc[t->opcode_modifier.opcodespace])
3256 fprintf (stdout, "space %s ", opc_spc[t->opcode_modifier.opcodespace]);
3257 fprintf (stdout, "opcode %x ", t->base_opcode);
3258 if (t->extension_opcode != None)
3259 fprintf (stdout, "ext %x ", t->extension_opcode);
3260 if (t->opcode_modifier.d)
3261 fprintf (stdout, "D");
3262 if (t->opcode_modifier.w)
3263 fprintf (stdout, "W");
3264 fprintf (stdout, "\n");
3265 for (j = 0; j < t->operands; j++)
3266 {
3267 fprintf (stdout, " #%d type ", j + 1);
3268 pt (t->operand_types[j]);
3269 fprintf (stdout, "\n");
3270 }
3271 }
3272
3273 static void
3274 pe (expressionS *e)
3275 {
3276 fprintf (stdout, " operation %d\n", e->X_op);
3277 fprintf (stdout, " add_number %ld (%lx)\n",
3278 (long) e->X_add_number, (long) e->X_add_number);
3279 if (e->X_add_symbol)
3280 {
3281 fprintf (stdout, " add_symbol ");
3282 ps (e->X_add_symbol);
3283 fprintf (stdout, "\n");
3284 }
3285 if (e->X_op_symbol)
3286 {
3287 fprintf (stdout, " op_symbol ");
3288 ps (e->X_op_symbol);
3289 fprintf (stdout, "\n");
3290 }
3291 }
3292
3293 static void
3294 ps (symbolS *s)
3295 {
3296 fprintf (stdout, "%s type %s%s",
3297 S_GET_NAME (s),
3298 S_IS_EXTERNAL (s) ? "EXTERNAL " : "",
3299 segment_name (S_GET_SEGMENT (s)));
3300 }
3301
3302 static struct type_name
3303 {
3304 i386_operand_type mask;
3305 const char *name;
3306 }
3307 const type_names[] =
3308 {
3309 { OPERAND_TYPE_REG8, "r8" },
3310 { OPERAND_TYPE_REG16, "r16" },
3311 { OPERAND_TYPE_REG32, "r32" },
3312 { OPERAND_TYPE_REG64, "r64" },
3313 { OPERAND_TYPE_ACC8, "acc8" },
3314 { OPERAND_TYPE_ACC16, "acc16" },
3315 { OPERAND_TYPE_ACC32, "acc32" },
3316 { OPERAND_TYPE_ACC64, "acc64" },
3317 { OPERAND_TYPE_IMM8, "i8" },
3318 { OPERAND_TYPE_IMM8, "i8s" },
3319 { OPERAND_TYPE_IMM16, "i16" },
3320 { OPERAND_TYPE_IMM32, "i32" },
3321 { OPERAND_TYPE_IMM32S, "i32s" },
3322 { OPERAND_TYPE_IMM64, "i64" },
3323 { OPERAND_TYPE_IMM1, "i1" },
3324 { OPERAND_TYPE_BASEINDEX, "BaseIndex" },
3325 { OPERAND_TYPE_DISP8, "d8" },
3326 { OPERAND_TYPE_DISP16, "d16" },
3327 { OPERAND_TYPE_DISP32, "d32" },
3328 { OPERAND_TYPE_DISP32S, "d32s" },
3329 { OPERAND_TYPE_DISP64, "d64" },
3330 { OPERAND_TYPE_INOUTPORTREG, "InOutPortReg" },
3331 { OPERAND_TYPE_SHIFTCOUNT, "ShiftCount" },
3332 { OPERAND_TYPE_CONTROL, "control reg" },
3333 { OPERAND_TYPE_TEST, "test reg" },
3334 { OPERAND_TYPE_DEBUG, "debug reg" },
3335 { OPERAND_TYPE_FLOATREG, "FReg" },
3336 { OPERAND_TYPE_FLOATACC, "FAcc" },
3337 { OPERAND_TYPE_SREG, "SReg" },
3338 { OPERAND_TYPE_REGMMX, "rMMX" },
3339 { OPERAND_TYPE_REGXMM, "rXMM" },
3340 { OPERAND_TYPE_REGYMM, "rYMM" },
3341 { OPERAND_TYPE_REGZMM, "rZMM" },
3342 { OPERAND_TYPE_REGTMM, "rTMM" },
3343 { OPERAND_TYPE_REGMASK, "Mask reg" },
3344 };
3345
3346 static void
3347 pt (i386_operand_type t)
3348 {
3349 unsigned int j;
3350 i386_operand_type a;
3351
3352 for (j = 0; j < ARRAY_SIZE (type_names); j++)
3353 {
3354 a = operand_type_and (t, type_names[j].mask);
3355 if (operand_type_equal (&a, &type_names[j].mask))
3356 fprintf (stdout, "%s, ", type_names[j].name);
3357 }
3358 fflush (stdout);
3359 }
3360
3361 #endif /* DEBUG386 */
3362 \f
3363 static bfd_reloc_code_real_type
3364 reloc (unsigned int size,
3365 int pcrel,
3366 int sign,
3367 bfd_reloc_code_real_type other)
3368 {
3369 if (other != NO_RELOC)
3370 {
3371 reloc_howto_type *rel;
3372
3373 if (size == 8)
3374 switch (other)
3375 {
3376 case BFD_RELOC_X86_64_GOT32:
3377 return BFD_RELOC_X86_64_GOT64;
3378 break;
3379 case BFD_RELOC_X86_64_GOTPLT64:
3380 return BFD_RELOC_X86_64_GOTPLT64;
3381 break;
3382 case BFD_RELOC_X86_64_PLTOFF64:
3383 return BFD_RELOC_X86_64_PLTOFF64;
3384 break;
3385 case BFD_RELOC_X86_64_GOTPC32:
3386 other = BFD_RELOC_X86_64_GOTPC64;
3387 break;
3388 case BFD_RELOC_X86_64_GOTPCREL:
3389 other = BFD_RELOC_X86_64_GOTPCREL64;
3390 break;
3391 case BFD_RELOC_X86_64_TPOFF32:
3392 other = BFD_RELOC_X86_64_TPOFF64;
3393 break;
3394 case BFD_RELOC_X86_64_DTPOFF32:
3395 other = BFD_RELOC_X86_64_DTPOFF64;
3396 break;
3397 default:
3398 break;
3399 }
3400
3401 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
3402 if (other == BFD_RELOC_SIZE32)
3403 {
3404 if (size == 8)
3405 other = BFD_RELOC_SIZE64;
3406 if (pcrel)
3407 {
3408 as_bad (_("there are no pc-relative size relocations"));
3409 return NO_RELOC;
3410 }
3411 }
3412 #endif
3413
3414 /* Sign-checking 4-byte relocations in 16-/32-bit code is pointless. */
3415 if (size == 4 && (flag_code != CODE_64BIT || disallow_64bit_reloc))
3416 sign = -1;
3417
3418 rel = bfd_reloc_type_lookup (stdoutput, other);
3419 if (!rel)
3420 as_bad (_("unknown relocation (%u)"), other);
3421 else if (size != bfd_get_reloc_size (rel))
3422 as_bad (_("%u-byte relocation cannot be applied to %u-byte field"),
3423 bfd_get_reloc_size (rel),
3424 size);
3425 else if (pcrel && !rel->pc_relative)
3426 as_bad (_("non-pc-relative relocation for pc-relative field"));
3427 else if ((rel->complain_on_overflow == complain_overflow_signed
3428 && !sign)
3429 || (rel->complain_on_overflow == complain_overflow_unsigned
3430 && sign > 0))
3431 as_bad (_("relocated field and relocation type differ in signedness"));
3432 else
3433 return other;
3434 return NO_RELOC;
3435 }
3436
3437 if (pcrel)
3438 {
3439 if (!sign)
3440 as_bad (_("there are no unsigned pc-relative relocations"));
3441 switch (size)
3442 {
3443 case 1: return BFD_RELOC_8_PCREL;
3444 case 2: return BFD_RELOC_16_PCREL;
3445 case 4: return BFD_RELOC_32_PCREL;
3446 case 8: return BFD_RELOC_64_PCREL;
3447 }
3448 as_bad (_("cannot do %u byte pc-relative relocation"), size);
3449 }
3450 else
3451 {
3452 if (sign > 0)
3453 switch (size)
3454 {
3455 case 4: return BFD_RELOC_X86_64_32S;
3456 }
3457 else
3458 switch (size)
3459 {
3460 case 1: return BFD_RELOC_8;
3461 case 2: return BFD_RELOC_16;
3462 case 4: return BFD_RELOC_32;
3463 case 8: return BFD_RELOC_64;
3464 }
3465 as_bad (_("cannot do %s %u byte relocation"),
3466 sign > 0 ? "signed" : "unsigned", size);
3467 }
3468
3469 return NO_RELOC;
3470 }
3471
3472 /* Here we decide which fixups can be adjusted to make them relative to
3473 the beginning of the section instead of the symbol. Basically we need
3474 to make sure that the dynamic relocations are done correctly, so in
3475 some cases we force the original symbol to be used. */
3476
3477 int
3478 tc_i386_fix_adjustable (fixS *fixP ATTRIBUTE_UNUSED)
3479 {
3480 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
3481 if (!IS_ELF)
3482 return 1;
3483
3484 /* Don't adjust pc-relative references to merge sections in 64-bit
3485 mode. */
3486 if (use_rela_relocations
3487 && (S_GET_SEGMENT (fixP->fx_addsy)->flags & SEC_MERGE) != 0
3488 && fixP->fx_pcrel)
3489 return 0;
3490
3491 /* The x86_64 GOTPCREL are represented as 32bit PCrel relocations
3492 and changed later by validate_fix. */
3493 if (GOT_symbol && fixP->fx_subsy == GOT_symbol
3494 && fixP->fx_r_type == BFD_RELOC_32_PCREL)
3495 return 0;
3496
3497 /* Adjust_reloc_syms doesn't know about the GOT. Need to keep symbol
3498 for size relocations. */
3499 if (fixP->fx_r_type == BFD_RELOC_SIZE32
3500 || fixP->fx_r_type == BFD_RELOC_SIZE64
3501 || fixP->fx_r_type == BFD_RELOC_386_GOTOFF
3502 || fixP->fx_r_type == BFD_RELOC_386_GOT32
3503 || fixP->fx_r_type == BFD_RELOC_386_GOT32X
3504 || fixP->fx_r_type == BFD_RELOC_386_TLS_GD
3505 || fixP->fx_r_type == BFD_RELOC_386_TLS_LDM
3506 || fixP->fx_r_type == BFD_RELOC_386_TLS_LDO_32
3507 || fixP->fx_r_type == BFD_RELOC_386_TLS_IE_32
3508 || fixP->fx_r_type == BFD_RELOC_386_TLS_IE
3509 || fixP->fx_r_type == BFD_RELOC_386_TLS_GOTIE
3510 || fixP->fx_r_type == BFD_RELOC_386_TLS_LE_32
3511 || fixP->fx_r_type == BFD_RELOC_386_TLS_LE
3512 || fixP->fx_r_type == BFD_RELOC_386_TLS_GOTDESC
3513 || fixP->fx_r_type == BFD_RELOC_386_TLS_DESC_CALL
3514 || fixP->fx_r_type == BFD_RELOC_X86_64_GOT32
3515 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTPCREL
3516 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTPCRELX
3517 || fixP->fx_r_type == BFD_RELOC_X86_64_REX_GOTPCRELX
3518 || fixP->fx_r_type == BFD_RELOC_X86_64_TLSGD
3519 || fixP->fx_r_type == BFD_RELOC_X86_64_TLSLD
3520 || fixP->fx_r_type == BFD_RELOC_X86_64_DTPOFF32
3521 || fixP->fx_r_type == BFD_RELOC_X86_64_DTPOFF64
3522 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTTPOFF
3523 || fixP->fx_r_type == BFD_RELOC_X86_64_TPOFF32
3524 || fixP->fx_r_type == BFD_RELOC_X86_64_TPOFF64
3525 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTOFF64
3526 || fixP->fx_r_type == BFD_RELOC_X86_64_GOTPC32_TLSDESC
3527 || fixP->fx_r_type == BFD_RELOC_X86_64_TLSDESC_CALL
3528 || fixP->fx_r_type == BFD_RELOC_VTABLE_INHERIT
3529 || fixP->fx_r_type == BFD_RELOC_VTABLE_ENTRY)
3530 return 0;
3531 #endif
3532 return 1;
3533 }
3534
3535 static int
3536 intel_float_operand (const char *mnemonic)
3537 {
3538 /* Note that the value returned is meaningful only for opcodes with (memory)
3539 operands, hence the code here is free to improperly handle opcodes that
3540 have no operands (for better performance and smaller code). */
3541
3542 if (mnemonic[0] != 'f')
3543 return 0; /* non-math */
3544
3545 switch (mnemonic[1])
3546 {
3547 /* fclex, fdecstp, fdisi, femms, feni, fincstp, finit, fsetpm, and
3548 the fs segment override prefix not currently handled because no
3549 call path can make opcodes without operands get here */
3550 case 'i':
3551 return 2 /* integer op */;
3552 case 'l':
3553 if (mnemonic[2] == 'd' && (mnemonic[3] == 'c' || mnemonic[3] == 'e'))
3554 return 3; /* fldcw/fldenv */
3555 break;
3556 case 'n':
3557 if (mnemonic[2] != 'o' /* fnop */)
3558 return 3; /* non-waiting control op */
3559 break;
3560 case 'r':
3561 if (mnemonic[2] == 's')
3562 return 3; /* frstor/frstpm */
3563 break;
3564 case 's':
3565 if (mnemonic[2] == 'a')
3566 return 3; /* fsave */
3567 if (mnemonic[2] == 't')
3568 {
3569 switch (mnemonic[3])
3570 {
3571 case 'c': /* fstcw */
3572 case 'd': /* fstdw */
3573 case 'e': /* fstenv */
3574 case 's': /* fsts[gw] */
3575 return 3;
3576 }
3577 }
3578 break;
3579 case 'x':
3580 if (mnemonic[2] == 'r' || mnemonic[2] == 's')
3581 return 0; /* fxsave/fxrstor are not really math ops */
3582 break;
3583 }
3584
3585 return 1;
3586 }
3587
3588 static INLINE void
3589 install_template (const insn_template *t)
3590 {
3591 unsigned int l;
3592
3593 i.tm = *t;
3594
3595 /* Note that for pseudo prefixes this produces a length of 1. But for them
3596 the length isn't interesting at all. */
3597 for (l = 1; l < 4; ++l)
3598 if (!(t->base_opcode >> (8 * l)))
3599 break;
3600
3601 i.opcode_length = l;
3602 }
3603
3604 /* Build the VEX prefix. */
3605
3606 static void
3607 build_vex_prefix (const insn_template *t)
3608 {
3609 unsigned int register_specifier;
3610 unsigned int vector_length;
3611 unsigned int w;
3612
3613 /* Check register specifier. */
3614 if (i.vex.register_specifier)
3615 {
3616 register_specifier =
3617 ~register_number (i.vex.register_specifier) & 0xf;
3618 gas_assert ((i.vex.register_specifier->reg_flags & RegVRex) == 0);
3619 }
3620 else
3621 register_specifier = 0xf;
3622
3623 /* Use 2-byte VEX prefix by swapping destination and source operand
3624 if there are more than 1 register operand. */
3625 if (i.reg_operands > 1
3626 && i.vec_encoding != vex_encoding_vex3
3627 && i.dir_encoding == dir_encoding_default
3628 && i.operands == i.reg_operands
3629 && operand_type_equal (&i.types[0], &i.types[i.operands - 1])
3630 && i.tm.opcode_modifier.opcodespace == SPACE_0F
3631 && (i.tm.opcode_modifier.load || i.tm.opcode_modifier.d)
3632 && i.rex == REX_B)
3633 {
3634 unsigned int xchg = i.operands - 1;
3635 union i386_op temp_op;
3636 i386_operand_type temp_type;
3637
3638 temp_type = i.types[xchg];
3639 i.types[xchg] = i.types[0];
3640 i.types[0] = temp_type;
3641 temp_op = i.op[xchg];
3642 i.op[xchg] = i.op[0];
3643 i.op[0] = temp_op;
3644
3645 gas_assert (i.rm.mode == 3);
3646
3647 i.rex = REX_R;
3648 xchg = i.rm.regmem;
3649 i.rm.regmem = i.rm.reg;
3650 i.rm.reg = xchg;
3651
3652 if (i.tm.opcode_modifier.d)
3653 i.tm.base_opcode ^= (i.tm.base_opcode & 0xee) != 0x6e
3654 ? Opcode_SIMD_FloatD : Opcode_SIMD_IntD;
3655 else /* Use the next insn. */
3656 install_template (&t[1]);
3657 }
3658
3659 /* Use 2-byte VEX prefix by swapping commutative source operands if there
3660 are no memory operands and at least 3 register ones. */
3661 if (i.reg_operands >= 3
3662 && i.vec_encoding != vex_encoding_vex3
3663 && i.reg_operands == i.operands - i.imm_operands
3664 && i.tm.opcode_modifier.vex
3665 && i.tm.opcode_modifier.commutative
3666 && (i.tm.opcode_modifier.sse2avx || optimize > 1)
3667 && i.rex == REX_B
3668 && i.vex.register_specifier
3669 && !(i.vex.register_specifier->reg_flags & RegRex))
3670 {
3671 unsigned int xchg = i.operands - i.reg_operands;
3672 union i386_op temp_op;
3673 i386_operand_type temp_type;
3674
3675 gas_assert (i.tm.opcode_modifier.opcodespace == SPACE_0F);
3676 gas_assert (!i.tm.opcode_modifier.sae);
3677 gas_assert (operand_type_equal (&i.types[i.operands - 2],
3678 &i.types[i.operands - 3]));
3679 gas_assert (i.rm.mode == 3);
3680
3681 temp_type = i.types[xchg];
3682 i.types[xchg] = i.types[xchg + 1];
3683 i.types[xchg + 1] = temp_type;
3684 temp_op = i.op[xchg];
3685 i.op[xchg] = i.op[xchg + 1];
3686 i.op[xchg + 1] = temp_op;
3687
3688 i.rex = 0;
3689 xchg = i.rm.regmem | 8;
3690 i.rm.regmem = ~register_specifier & 0xf;
3691 gas_assert (!(i.rm.regmem & 8));
3692 i.vex.register_specifier += xchg - i.rm.regmem;
3693 register_specifier = ~xchg & 0xf;
3694 }
3695
3696 if (i.tm.opcode_modifier.vex == VEXScalar)
3697 vector_length = avxscalar;
3698 else if (i.tm.opcode_modifier.vex == VEX256)
3699 vector_length = 1;
3700 else
3701 {
3702 unsigned int op;
3703
3704 /* Determine vector length from the last multi-length vector
3705 operand. */
3706 vector_length = 0;
3707 for (op = t->operands; op--;)
3708 if (t->operand_types[op].bitfield.xmmword
3709 && t->operand_types[op].bitfield.ymmword
3710 && i.types[op].bitfield.ymmword)
3711 {
3712 vector_length = 1;
3713 break;
3714 }
3715 }
3716
3717 /* Check the REX.W bit and VEXW. */
3718 if (i.tm.opcode_modifier.vexw == VEXWIG)
3719 w = (vexwig == vexw1 || (i.rex & REX_W)) ? 1 : 0;
3720 else if (i.tm.opcode_modifier.vexw)
3721 w = i.tm.opcode_modifier.vexw == VEXW1 ? 1 : 0;
3722 else
3723 w = (flag_code == CODE_64BIT ? i.rex & REX_W : vexwig == vexw1) ? 1 : 0;
3724
3725 /* Use 2-byte VEX prefix if possible. */
3726 if (w == 0
3727 && i.vec_encoding != vex_encoding_vex3
3728 && i.tm.opcode_modifier.opcodespace == SPACE_0F
3729 && (i.rex & (REX_W | REX_X | REX_B)) == 0)
3730 {
3731 /* 2-byte VEX prefix. */
3732 unsigned int r;
3733
3734 i.vex.length = 2;
3735 i.vex.bytes[0] = 0xc5;
3736
3737 /* Check the REX.R bit. */
3738 r = (i.rex & REX_R) ? 0 : 1;
3739 i.vex.bytes[1] = (r << 7
3740 | register_specifier << 3
3741 | vector_length << 2
3742 | i.tm.opcode_modifier.opcodeprefix);
3743 }
3744 else
3745 {
3746 /* 3-byte VEX prefix. */
3747 i.vex.length = 3;
3748
3749 switch (i.tm.opcode_modifier.opcodespace)
3750 {
3751 case SPACE_0F:
3752 case SPACE_0F38:
3753 case SPACE_0F3A:
3754 i.vex.bytes[0] = 0xc4;
3755 break;
3756 case SPACE_XOP08:
3757 case SPACE_XOP09:
3758 case SPACE_XOP0A:
3759 i.vex.bytes[0] = 0x8f;
3760 break;
3761 default:
3762 abort ();
3763 }
3764
3765 /* The high 3 bits of the second VEX byte are 1's compliment
3766 of RXB bits from REX. */
3767 i.vex.bytes[1] = (~i.rex & 0x7) << 5 | i.tm.opcode_modifier.opcodespace;
3768
3769 i.vex.bytes[2] = (w << 7
3770 | register_specifier << 3
3771 | vector_length << 2
3772 | i.tm.opcode_modifier.opcodeprefix);
3773 }
3774 }
3775
3776 static INLINE bfd_boolean
3777 is_evex_encoding (const insn_template *t)
3778 {
3779 return t->opcode_modifier.evex || t->opcode_modifier.disp8memshift
3780 || t->opcode_modifier.broadcast || t->opcode_modifier.masking
3781 || t->opcode_modifier.sae;
3782 }
3783
3784 static INLINE bfd_boolean
3785 is_any_vex_encoding (const insn_template *t)
3786 {
3787 return t->opcode_modifier.vex || is_evex_encoding (t);
3788 }
3789
3790 /* Build the EVEX prefix. */
3791
3792 static void
3793 build_evex_prefix (void)
3794 {
3795 unsigned int register_specifier, w;
3796 rex_byte vrex_used = 0;
3797
3798 /* Check register specifier. */
3799 if (i.vex.register_specifier)
3800 {
3801 gas_assert ((i.vrex & REX_X) == 0);
3802
3803 register_specifier = i.vex.register_specifier->reg_num;
3804 if ((i.vex.register_specifier->reg_flags & RegRex))
3805 register_specifier += 8;
3806 /* The upper 16 registers are encoded in the fourth byte of the
3807 EVEX prefix. */
3808 if (!(i.vex.register_specifier->reg_flags & RegVRex))
3809 i.vex.bytes[3] = 0x8;
3810 register_specifier = ~register_specifier & 0xf;
3811 }
3812 else
3813 {
3814 register_specifier = 0xf;
3815
3816 /* Encode upper 16 vector index register in the fourth byte of
3817 the EVEX prefix. */
3818 if (!(i.vrex & REX_X))
3819 i.vex.bytes[3] = 0x8;
3820 else
3821 vrex_used |= REX_X;
3822 }
3823
3824 /* 4 byte EVEX prefix. */
3825 i.vex.length = 4;
3826 i.vex.bytes[0] = 0x62;
3827
3828 /* The high 3 bits of the second EVEX byte are 1's compliment of RXB
3829 bits from REX. */
3830 gas_assert (i.tm.opcode_modifier.opcodespace >= SPACE_0F);
3831 gas_assert (i.tm.opcode_modifier.opcodespace <= SPACE_0F3A);
3832 i.vex.bytes[1] = (~i.rex & 0x7) << 5 | i.tm.opcode_modifier.opcodespace;
3833
3834 /* The fifth bit of the second EVEX byte is 1's compliment of the
3835 REX_R bit in VREX. */
3836 if (!(i.vrex & REX_R))
3837 i.vex.bytes[1] |= 0x10;
3838 else
3839 vrex_used |= REX_R;
3840
3841 if ((i.reg_operands + i.imm_operands) == i.operands)
3842 {
3843 /* When all operands are registers, the REX_X bit in REX is not
3844 used. We reuse it to encode the upper 16 registers, which is
3845 indicated by the REX_B bit in VREX. The REX_X bit is encoded
3846 as 1's compliment. */
3847 if ((i.vrex & REX_B))
3848 {
3849 vrex_used |= REX_B;
3850 i.vex.bytes[1] &= ~0x40;
3851 }
3852 }
3853
3854 /* EVEX instructions shouldn't need the REX prefix. */
3855 i.vrex &= ~vrex_used;
3856 gas_assert (i.vrex == 0);
3857
3858 /* Check the REX.W bit and VEXW. */
3859 if (i.tm.opcode_modifier.vexw == VEXWIG)
3860 w = (evexwig == evexw1 || (i.rex & REX_W)) ? 1 : 0;
3861 else if (i.tm.opcode_modifier.vexw)
3862 w = i.tm.opcode_modifier.vexw == VEXW1 ? 1 : 0;
3863 else
3864 w = (flag_code == CODE_64BIT ? i.rex & REX_W : evexwig == evexw1) ? 1 : 0;
3865
3866 /* The third byte of the EVEX prefix. */
3867 i.vex.bytes[2] = ((w << 7)
3868 | (register_specifier << 3)
3869 | 4 /* Encode the U bit. */
3870 | i.tm.opcode_modifier.opcodeprefix);
3871
3872 /* The fourth byte of the EVEX prefix. */
3873 /* The zeroing-masking bit. */
3874 if (i.mask && i.mask->zeroing)
3875 i.vex.bytes[3] |= 0x80;
3876
3877 /* Don't always set the broadcast bit if there is no RC. */
3878 if (!i.rounding)
3879 {
3880 /* Encode the vector length. */
3881 unsigned int vec_length;
3882
3883 if (!i.tm.opcode_modifier.evex
3884 || i.tm.opcode_modifier.evex == EVEXDYN)
3885 {
3886 unsigned int op;
3887
3888 /* Determine vector length from the last multi-length vector
3889 operand. */
3890 for (op = i.operands; op--;)
3891 if (i.tm.operand_types[op].bitfield.xmmword
3892 + i.tm.operand_types[op].bitfield.ymmword
3893 + i.tm.operand_types[op].bitfield.zmmword > 1)
3894 {
3895 if (i.types[op].bitfield.zmmword)
3896 {
3897 i.tm.opcode_modifier.evex = EVEX512;
3898 break;
3899 }
3900 else if (i.types[op].bitfield.ymmword)
3901 {
3902 i.tm.opcode_modifier.evex = EVEX256;
3903 break;
3904 }
3905 else if (i.types[op].bitfield.xmmword)
3906 {
3907 i.tm.opcode_modifier.evex = EVEX128;
3908 break;
3909 }
3910 else if (i.broadcast && (int) op == i.broadcast->operand)
3911 {
3912 switch (i.broadcast->bytes)
3913 {
3914 case 64:
3915 i.tm.opcode_modifier.evex = EVEX512;
3916 break;
3917 case 32:
3918 i.tm.opcode_modifier.evex = EVEX256;
3919 break;
3920 case 16:
3921 i.tm.opcode_modifier.evex = EVEX128;
3922 break;
3923 default:
3924 abort ();
3925 }
3926 break;
3927 }
3928 }
3929
3930 if (op >= MAX_OPERANDS)
3931 abort ();
3932 }
3933
3934 switch (i.tm.opcode_modifier.evex)
3935 {
3936 case EVEXLIG: /* LL' is ignored */
3937 vec_length = evexlig << 5;
3938 break;
3939 case EVEX128:
3940 vec_length = 0 << 5;
3941 break;
3942 case EVEX256:
3943 vec_length = 1 << 5;
3944 break;
3945 case EVEX512:
3946 vec_length = 2 << 5;
3947 break;
3948 default:
3949 abort ();
3950 break;
3951 }
3952 i.vex.bytes[3] |= vec_length;
3953 /* Encode the broadcast bit. */
3954 if (i.broadcast)
3955 i.vex.bytes[3] |= 0x10;
3956 }
3957 else
3958 {
3959 if (i.rounding->type != saeonly)
3960 i.vex.bytes[3] |= 0x10 | (i.rounding->type << 5);
3961 else
3962 i.vex.bytes[3] |= 0x10 | (evexrcig << 5);
3963 }
3964
3965 if (i.mask && i.mask->mask)
3966 i.vex.bytes[3] |= i.mask->mask->reg_num;
3967 }
3968
3969 static void
3970 process_immext (void)
3971 {
3972 expressionS *exp;
3973
3974 /* These AMD 3DNow! and SSE2 instructions have an opcode suffix
3975 which is coded in the same place as an 8-bit immediate field
3976 would be. Here we fake an 8-bit immediate operand from the
3977 opcode suffix stored in tm.extension_opcode.
3978
3979 AVX instructions also use this encoding, for some of
3980 3 argument instructions. */
3981
3982 gas_assert (i.imm_operands <= 1
3983 && (i.operands <= 2
3984 || (is_any_vex_encoding (&i.tm)
3985 && i.operands <= 4)));
3986
3987 exp = &im_expressions[i.imm_operands++];
3988 i.op[i.operands].imms = exp;
3989 i.types[i.operands] = imm8;
3990 i.operands++;
3991 exp->X_op = O_constant;
3992 exp->X_add_number = i.tm.extension_opcode;
3993 i.tm.extension_opcode = None;
3994 }
3995
3996
3997 static int
3998 check_hle (void)
3999 {
4000 switch (i.tm.opcode_modifier.prefixok)
4001 {
4002 default:
4003 abort ();
4004 case PrefixLock:
4005 case PrefixNone:
4006 case PrefixNoTrack:
4007 case PrefixRep:
4008 as_bad (_("invalid instruction `%s' after `%s'"),
4009 i.tm.name, i.hle_prefix);
4010 return 0;
4011 case PrefixHLELock:
4012 if (i.prefix[LOCK_PREFIX])
4013 return 1;
4014 as_bad (_("missing `lock' with `%s'"), i.hle_prefix);
4015 return 0;
4016 case PrefixHLEAny:
4017 return 1;
4018 case PrefixHLERelease:
4019 if (i.prefix[HLE_PREFIX] != XRELEASE_PREFIX_OPCODE)
4020 {
4021 as_bad (_("instruction `%s' after `xacquire' not allowed"),
4022 i.tm.name);
4023 return 0;
4024 }
4025 if (i.mem_operands == 0 || !(i.flags[i.operands - 1] & Operand_Mem))
4026 {
4027 as_bad (_("memory destination needed for instruction `%s'"
4028 " after `xrelease'"), i.tm.name);
4029 return 0;
4030 }
4031 return 1;
4032 }
4033 }
4034
4035 /* Try the shortest encoding by shortening operand size. */
4036
4037 static void
4038 optimize_encoding (void)
4039 {
4040 unsigned int j;
4041
4042 if (optimize_for_space
4043 && !is_any_vex_encoding (&i.tm)
4044 && i.reg_operands == 1
4045 && i.imm_operands == 1
4046 && !i.types[1].bitfield.byte
4047 && i.op[0].imms->X_op == O_constant
4048 && fits_in_imm7 (i.op[0].imms->X_add_number)
4049 && (i.tm.base_opcode == 0xa8
4050 || (i.tm.base_opcode == 0xf6
4051 && i.tm.extension_opcode == 0x0)))
4052 {
4053 /* Optimize: -Os:
4054 test $imm7, %r64/%r32/%r16 -> test $imm7, %r8
4055 */
4056 unsigned int base_regnum = i.op[1].regs->reg_num;
4057 if (flag_code == CODE_64BIT || base_regnum < 4)
4058 {
4059 i.types[1].bitfield.byte = 1;
4060 /* Ignore the suffix. */
4061 i.suffix = 0;
4062 /* Convert to byte registers. */
4063 if (i.types[1].bitfield.word)
4064 j = 16;
4065 else if (i.types[1].bitfield.dword)
4066 j = 32;
4067 else
4068 j = 48;
4069 if (!(i.op[1].regs->reg_flags & RegRex) && base_regnum < 4)
4070 j += 8;
4071 i.op[1].regs -= j;
4072 }
4073 }
4074 else if (flag_code == CODE_64BIT
4075 && !is_any_vex_encoding (&i.tm)
4076 && ((i.types[1].bitfield.qword
4077 && i.reg_operands == 1
4078 && i.imm_operands == 1
4079 && i.op[0].imms->X_op == O_constant
4080 && ((i.tm.base_opcode == 0xb8
4081 && i.tm.extension_opcode == None
4082 && fits_in_unsigned_long (i.op[0].imms->X_add_number))
4083 || (fits_in_imm31 (i.op[0].imms->X_add_number)
4084 && ((i.tm.base_opcode == 0x24
4085 || i.tm.base_opcode == 0xa8)
4086 || (i.tm.base_opcode == 0x80
4087 && i.tm.extension_opcode == 0x4)
4088 || ((i.tm.base_opcode == 0xf6
4089 || (i.tm.base_opcode | 1) == 0xc7)
4090 && i.tm.extension_opcode == 0x0)))
4091 || (fits_in_imm7 (i.op[0].imms->X_add_number)
4092 && i.tm.base_opcode == 0x83
4093 && i.tm.extension_opcode == 0x4)))
4094 || (i.types[0].bitfield.qword
4095 && ((i.reg_operands == 2
4096 && i.op[0].regs == i.op[1].regs
4097 && (i.tm.base_opcode == 0x30
4098 || i.tm.base_opcode == 0x28))
4099 || (i.reg_operands == 1
4100 && i.operands == 1
4101 && i.tm.base_opcode == 0x30)))))
4102 {
4103 /* Optimize: -O:
4104 andq $imm31, %r64 -> andl $imm31, %r32
4105 andq $imm7, %r64 -> andl $imm7, %r32
4106 testq $imm31, %r64 -> testl $imm31, %r32
4107 xorq %r64, %r64 -> xorl %r32, %r32
4108 subq %r64, %r64 -> subl %r32, %r32
4109 movq $imm31, %r64 -> movl $imm31, %r32
4110 movq $imm32, %r64 -> movl $imm32, %r32
4111 */
4112 i.tm.opcode_modifier.norex64 = 1;
4113 if (i.tm.base_opcode == 0xb8 || (i.tm.base_opcode | 1) == 0xc7)
4114 {
4115 /* Handle
4116 movq $imm31, %r64 -> movl $imm31, %r32
4117 movq $imm32, %r64 -> movl $imm32, %r32
4118 */
4119 i.tm.operand_types[0].bitfield.imm32 = 1;
4120 i.tm.operand_types[0].bitfield.imm32s = 0;
4121 i.tm.operand_types[0].bitfield.imm64 = 0;
4122 i.types[0].bitfield.imm32 = 1;
4123 i.types[0].bitfield.imm32s = 0;
4124 i.types[0].bitfield.imm64 = 0;
4125 i.types[1].bitfield.dword = 1;
4126 i.types[1].bitfield.qword = 0;
4127 if ((i.tm.base_opcode | 1) == 0xc7)
4128 {
4129 /* Handle
4130 movq $imm31, %r64 -> movl $imm31, %r32
4131 */
4132 i.tm.base_opcode = 0xb8;
4133 i.tm.extension_opcode = None;
4134 i.tm.opcode_modifier.w = 0;
4135 i.tm.opcode_modifier.modrm = 0;
4136 }
4137 }
4138 }
4139 else if (optimize > 1
4140 && !optimize_for_space
4141 && !is_any_vex_encoding (&i.tm)
4142 && i.reg_operands == 2
4143 && i.op[0].regs == i.op[1].regs
4144 && ((i.tm.base_opcode & ~(Opcode_D | 1)) == 0x8
4145 || (i.tm.base_opcode & ~(Opcode_D | 1)) == 0x20)
4146 && (flag_code != CODE_64BIT || !i.types[0].bitfield.dword))
4147 {
4148 /* Optimize: -O2:
4149 andb %rN, %rN -> testb %rN, %rN
4150 andw %rN, %rN -> testw %rN, %rN
4151 andq %rN, %rN -> testq %rN, %rN
4152 orb %rN, %rN -> testb %rN, %rN
4153 orw %rN, %rN -> testw %rN, %rN
4154 orq %rN, %rN -> testq %rN, %rN
4155
4156 and outside of 64-bit mode
4157
4158 andl %rN, %rN -> testl %rN, %rN
4159 orl %rN, %rN -> testl %rN, %rN
4160 */
4161 i.tm.base_opcode = 0x84 | (i.tm.base_opcode & 1);
4162 }
4163 else if (i.reg_operands == 3
4164 && i.op[0].regs == i.op[1].regs
4165 && !i.types[2].bitfield.xmmword
4166 && (i.tm.opcode_modifier.vex
4167 || ((!i.mask || i.mask->zeroing)
4168 && !i.rounding
4169 && is_evex_encoding (&i.tm)
4170 && (i.vec_encoding != vex_encoding_evex
4171 || cpu_arch_isa_flags.bitfield.cpuavx512vl
4172 || i.tm.cpu_flags.bitfield.cpuavx512vl
4173 || (i.tm.operand_types[2].bitfield.zmmword
4174 && i.types[2].bitfield.ymmword))))
4175 && ((i.tm.base_opcode == 0x55
4176 || i.tm.base_opcode == 0x57
4177 || i.tm.base_opcode == 0xdf
4178 || i.tm.base_opcode == 0xef
4179 || i.tm.base_opcode == 0xf8
4180 || i.tm.base_opcode == 0xf9
4181 || i.tm.base_opcode == 0xfa
4182 || i.tm.base_opcode == 0xfb
4183 || i.tm.base_opcode == 0x42
4184 || i.tm.base_opcode == 0x47)
4185 && i.tm.extension_opcode == None))
4186 {
4187 /* Optimize: -O1:
4188 VOP, one of vandnps, vandnpd, vxorps, vxorpd, vpsubb, vpsubd,
4189 vpsubq and vpsubw:
4190 EVEX VOP %zmmM, %zmmM, %zmmN
4191 -> VEX VOP %xmmM, %xmmM, %xmmN (M and N < 16)
4192 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4193 EVEX VOP %ymmM, %ymmM, %ymmN
4194 -> VEX VOP %xmmM, %xmmM, %xmmN (M and N < 16)
4195 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4196 VEX VOP %ymmM, %ymmM, %ymmN
4197 -> VEX VOP %xmmM, %xmmM, %xmmN
4198 VOP, one of vpandn and vpxor:
4199 VEX VOP %ymmM, %ymmM, %ymmN
4200 -> VEX VOP %xmmM, %xmmM, %xmmN
4201 VOP, one of vpandnd and vpandnq:
4202 EVEX VOP %zmmM, %zmmM, %zmmN
4203 -> VEX vpandn %xmmM, %xmmM, %xmmN (M and N < 16)
4204 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4205 EVEX VOP %ymmM, %ymmM, %ymmN
4206 -> VEX vpandn %xmmM, %xmmM, %xmmN (M and N < 16)
4207 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4208 VOP, one of vpxord and vpxorq:
4209 EVEX VOP %zmmM, %zmmM, %zmmN
4210 -> VEX vpxor %xmmM, %xmmM, %xmmN (M and N < 16)
4211 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4212 EVEX VOP %ymmM, %ymmM, %ymmN
4213 -> VEX vpxor %xmmM, %xmmM, %xmmN (M and N < 16)
4214 -> EVEX VOP %xmmM, %xmmM, %xmmN (M || N >= 16) (-O2)
4215 VOP, one of kxord and kxorq:
4216 VEX VOP %kM, %kM, %kN
4217 -> VEX kxorw %kM, %kM, %kN
4218 VOP, one of kandnd and kandnq:
4219 VEX VOP %kM, %kM, %kN
4220 -> VEX kandnw %kM, %kM, %kN
4221 */
4222 if (is_evex_encoding (&i.tm))
4223 {
4224 if (i.vec_encoding != vex_encoding_evex)
4225 {
4226 i.tm.opcode_modifier.vex = VEX128;
4227 i.tm.opcode_modifier.vexw = VEXW0;
4228 i.tm.opcode_modifier.evex = 0;
4229 }
4230 else if (optimize > 1)
4231 i.tm.opcode_modifier.evex = EVEX128;
4232 else
4233 return;
4234 }
4235 else if (i.tm.operand_types[0].bitfield.class == RegMask)
4236 {
4237 i.tm.opcode_modifier.opcodeprefix = PREFIX_NONE;
4238 i.tm.opcode_modifier.vexw = VEXW0;
4239 }
4240 else
4241 i.tm.opcode_modifier.vex = VEX128;
4242
4243 if (i.tm.opcode_modifier.vex)
4244 for (j = 0; j < 3; j++)
4245 {
4246 i.types[j].bitfield.xmmword = 1;
4247 i.types[j].bitfield.ymmword = 0;
4248 }
4249 }
4250 else if (i.vec_encoding != vex_encoding_evex
4251 && !i.types[0].bitfield.zmmword
4252 && !i.types[1].bitfield.zmmword
4253 && !i.mask
4254 && !i.broadcast
4255 && is_evex_encoding (&i.tm)
4256 && ((i.tm.base_opcode & ~Opcode_SIMD_IntD) == 0x6f
4257 || (i.tm.base_opcode & ~4) == 0xdb
4258 || (i.tm.base_opcode & ~4) == 0xeb)
4259 && i.tm.extension_opcode == None)
4260 {
4261 /* Optimize: -O1:
4262 VOP, one of vmovdqa32, vmovdqa64, vmovdqu8, vmovdqu16,
4263 vmovdqu32 and vmovdqu64:
4264 EVEX VOP %xmmM, %xmmN
4265 -> VEX vmovdqa|vmovdqu %xmmM, %xmmN (M and N < 16)
4266 EVEX VOP %ymmM, %ymmN
4267 -> VEX vmovdqa|vmovdqu %ymmM, %ymmN (M and N < 16)
4268 EVEX VOP %xmmM, mem
4269 -> VEX vmovdqa|vmovdqu %xmmM, mem (M < 16)
4270 EVEX VOP %ymmM, mem
4271 -> VEX vmovdqa|vmovdqu %ymmM, mem (M < 16)
4272 EVEX VOP mem, %xmmN
4273 -> VEX mvmovdqa|vmovdquem, %xmmN (N < 16)
4274 EVEX VOP mem, %ymmN
4275 -> VEX vmovdqa|vmovdqu mem, %ymmN (N < 16)
4276 VOP, one of vpand, vpandn, vpor, vpxor:
4277 EVEX VOP{d,q} %xmmL, %xmmM, %xmmN
4278 -> VEX VOP %xmmL, %xmmM, %xmmN (L, M, and N < 16)
4279 EVEX VOP{d,q} %ymmL, %ymmM, %ymmN
4280 -> VEX VOP %ymmL, %ymmM, %ymmN (L, M, and N < 16)
4281 EVEX VOP{d,q} mem, %xmmM, %xmmN
4282 -> VEX VOP mem, %xmmM, %xmmN (M and N < 16)
4283 EVEX VOP{d,q} mem, %ymmM, %ymmN
4284 -> VEX VOP mem, %ymmM, %ymmN (M and N < 16)
4285 */
4286 for (j = 0; j < i.operands; j++)
4287 if (operand_type_check (i.types[j], disp)
4288 && i.op[j].disps->X_op == O_constant)
4289 {
4290 /* Since the VEX prefix has 2 or 3 bytes, the EVEX prefix
4291 has 4 bytes, EVEX Disp8 has 1 byte and VEX Disp32 has 4
4292 bytes, we choose EVEX Disp8 over VEX Disp32. */
4293 int evex_disp8, vex_disp8;
4294 unsigned int memshift = i.memshift;
4295 offsetT n = i.op[j].disps->X_add_number;
4296
4297 evex_disp8 = fits_in_disp8 (n);
4298 i.memshift = 0;
4299 vex_disp8 = fits_in_disp8 (n);
4300 if (evex_disp8 != vex_disp8)
4301 {
4302 i.memshift = memshift;
4303 return;
4304 }
4305
4306 i.types[j].bitfield.disp8 = vex_disp8;
4307 break;
4308 }
4309 if ((i.tm.base_opcode & ~Opcode_SIMD_IntD) == 0x6f
4310 && i.tm.opcode_modifier.opcodeprefix == PREFIX_0XF2)
4311 i.tm.opcode_modifier.opcodeprefix = PREFIX_0XF3;
4312 i.tm.opcode_modifier.vex
4313 = i.types[0].bitfield.ymmword ? VEX256 : VEX128;
4314 i.tm.opcode_modifier.vexw = VEXW0;
4315 /* VPAND, VPOR, and VPXOR are commutative. */
4316 if (i.reg_operands == 3 && i.tm.base_opcode != 0xdf)
4317 i.tm.opcode_modifier.commutative = 1;
4318 i.tm.opcode_modifier.evex = 0;
4319 i.tm.opcode_modifier.masking = 0;
4320 i.tm.opcode_modifier.broadcast = 0;
4321 i.tm.opcode_modifier.disp8memshift = 0;
4322 i.memshift = 0;
4323 if (j < i.operands)
4324 i.types[j].bitfield.disp8
4325 = fits_in_disp8 (i.op[j].disps->X_add_number);
4326 }
4327 }
4328
4329 /* Return non-zero for load instruction. */
4330
4331 static int
4332 load_insn_p (void)
4333 {
4334 unsigned int dest;
4335 int any_vex_p = is_any_vex_encoding (&i.tm);
4336 unsigned int base_opcode = i.tm.base_opcode | 1;
4337
4338 if (!any_vex_p)
4339 {
4340 /* Anysize insns: lea, invlpg, clflush, prefetchnta, prefetcht0,
4341 prefetcht1, prefetcht2, prefetchtw, bndmk, bndcl, bndcu, bndcn,
4342 bndstx, bndldx, prefetchwt1, clflushopt, clwb, cldemote. */
4343 if (i.tm.opcode_modifier.anysize)
4344 return 0;
4345
4346 /* pop, popf, popa. */
4347 if (strcmp (i.tm.name, "pop") == 0
4348 || i.tm.base_opcode == 0x9d
4349 || i.tm.base_opcode == 0x61)
4350 return 1;
4351
4352 /* movs, cmps, lods, scas. */
4353 if ((i.tm.base_opcode | 0xb) == 0xaf)
4354 return 1;
4355
4356 /* outs, xlatb. */
4357 if (base_opcode == 0x6f
4358 || i.tm.base_opcode == 0xd7)
4359 return 1;
4360 /* NB: For AMD-specific insns with implicit memory operands,
4361 they're intentionally not covered. */
4362 }
4363
4364 /* No memory operand. */
4365 if (!i.mem_operands)
4366 return 0;
4367
4368 if (any_vex_p)
4369 {
4370 /* vldmxcsr. */
4371 if (i.tm.base_opcode == 0xae
4372 && i.tm.opcode_modifier.vex
4373 && i.tm.opcode_modifier.opcodespace == SPACE_0F
4374 && i.tm.opcode_modifier.opcodeprefix == PREFIX_NONE
4375 && i.tm.extension_opcode == 2)
4376 return 1;
4377 }
4378 else
4379 {
4380 /* test, not, neg, mul, imul, div, idiv. */
4381 if ((i.tm.base_opcode == 0xf6 || i.tm.base_opcode == 0xf7)
4382 && i.tm.extension_opcode != 1)
4383 return 1;
4384
4385 /* inc, dec. */
4386 if (base_opcode == 0xff && i.tm.extension_opcode <= 1)
4387 return 1;
4388
4389 /* add, or, adc, sbb, and, sub, xor, cmp. */
4390 if (i.tm.base_opcode >= 0x80 && i.tm.base_opcode <= 0x83)
4391 return 1;
4392
4393 /* bt, bts, btr, btc. */
4394 if (i.tm.base_opcode == 0xfba
4395 && (i.tm.extension_opcode >= 4 && i.tm.extension_opcode <= 7))
4396 return 1;
4397
4398 /* rol, ror, rcl, rcr, shl/sal, shr, sar. */
4399 if ((base_opcode == 0xc1
4400 || (i.tm.base_opcode >= 0xd0 && i.tm.base_opcode <= 0xd3))
4401 && i.tm.extension_opcode != 6)
4402 return 1;
4403
4404 /* cmpxchg8b, cmpxchg16b, xrstors, vmptrld. */
4405 if (i.tm.base_opcode == 0xfc7
4406 && i.tm.opcode_modifier.opcodeprefix == PREFIX_NONE
4407 && (i.tm.extension_opcode == 1 || i.tm.extension_opcode == 3
4408 || i.tm.extension_opcode == 6))
4409 return 1;
4410
4411 /* fxrstor, ldmxcsr, xrstor. */
4412 if (i.tm.base_opcode == 0xfae
4413 && (i.tm.extension_opcode == 1
4414 || i.tm.extension_opcode == 2
4415 || i.tm.extension_opcode == 5))
4416 return 1;
4417
4418 /* lgdt, lidt, lmsw. */
4419 if (i.tm.base_opcode == 0xf01
4420 && (i.tm.extension_opcode == 2
4421 || i.tm.extension_opcode == 3
4422 || i.tm.extension_opcode == 6))
4423 return 1;
4424
4425 /* Check for x87 instructions. */
4426 if (i.tm.base_opcode >= 0xd8 && i.tm.base_opcode <= 0xdf)
4427 {
4428 /* Skip fst, fstp, fstenv, fstcw. */
4429 if (i.tm.base_opcode == 0xd9
4430 && (i.tm.extension_opcode == 2
4431 || i.tm.extension_opcode == 3
4432 || i.tm.extension_opcode == 6
4433 || i.tm.extension_opcode == 7))
4434 return 0;
4435
4436 /* Skip fisttp, fist, fistp, fstp. */
4437 if (i.tm.base_opcode == 0xdb
4438 && (i.tm.extension_opcode == 1
4439 || i.tm.extension_opcode == 2
4440 || i.tm.extension_opcode == 3
4441 || i.tm.extension_opcode == 7))
4442 return 0;
4443
4444 /* Skip fisttp, fst, fstp, fsave, fstsw. */
4445 if (i.tm.base_opcode == 0xdd
4446 && (i.tm.extension_opcode == 1
4447 || i.tm.extension_opcode == 2
4448 || i.tm.extension_opcode == 3
4449 || i.tm.extension_opcode == 6
4450 || i.tm.extension_opcode == 7))
4451 return 0;
4452
4453 /* Skip fisttp, fist, fistp, fbstp, fistp. */
4454 if (i.tm.base_opcode == 0xdf
4455 && (i.tm.extension_opcode == 1
4456 || i.tm.extension_opcode == 2
4457 || i.tm.extension_opcode == 3
4458 || i.tm.extension_opcode == 6
4459 || i.tm.extension_opcode == 7))
4460 return 0;
4461
4462 return 1;
4463 }
4464 }
4465
4466 dest = i.operands - 1;
4467
4468 /* Check fake imm8 operand and 3 source operands. */
4469 if ((i.tm.opcode_modifier.immext
4470 || i.tm.opcode_modifier.vexsources == VEX3SOURCES)
4471 && i.types[dest].bitfield.imm8)
4472 dest--;
4473
4474 /* add, or, adc, sbb, and, sub, xor, cmp, test, xchg, xadd */
4475 if (!any_vex_p
4476 && (base_opcode == 0x1
4477 || base_opcode == 0x9
4478 || base_opcode == 0x11
4479 || base_opcode == 0x19
4480 || base_opcode == 0x21
4481 || base_opcode == 0x29
4482 || base_opcode == 0x31
4483 || base_opcode == 0x39
4484 || (i.tm.base_opcode >= 0x84 && i.tm.base_opcode <= 0x87)
4485 || base_opcode == 0xfc1))
4486 return 1;
4487
4488 /* Check for load instruction. */
4489 return (i.types[dest].bitfield.class != ClassNone
4490 || i.types[dest].bitfield.instance == Accum);
4491 }
4492
4493 /* Output lfence, 0xfaee8, after instruction. */
4494
4495 static void
4496 insert_lfence_after (void)
4497 {
4498 if (lfence_after_load && load_insn_p ())
4499 {
4500 /* There are also two REP string instructions that require
4501 special treatment. Specifically, the compare string (CMPS)
4502 and scan string (SCAS) instructions set EFLAGS in a manner
4503 that depends on the data being compared/scanned. When used
4504 with a REP prefix, the number of iterations may therefore
4505 vary depending on this data. If the data is a program secret
4506 chosen by the adversary using an LVI method,
4507 then this data-dependent behavior may leak some aspect
4508 of the secret. */
4509 if (((i.tm.base_opcode | 0x1) == 0xa7
4510 || (i.tm.base_opcode | 0x1) == 0xaf)
4511 && i.prefix[REP_PREFIX])
4512 {
4513 as_warn (_("`%s` changes flags which would affect control flow behavior"),
4514 i.tm.name);
4515 }
4516 char *p = frag_more (3);
4517 *p++ = 0xf;
4518 *p++ = 0xae;
4519 *p = 0xe8;
4520 }
4521 }
4522
4523 /* Output lfence, 0xfaee8, before instruction. */
4524
4525 static void
4526 insert_lfence_before (void)
4527 {
4528 char *p;
4529
4530 if (is_any_vex_encoding (&i.tm))
4531 return;
4532
4533 if (i.tm.base_opcode == 0xff
4534 && (i.tm.extension_opcode == 2 || i.tm.extension_opcode == 4))
4535 {
4536 /* Insert lfence before indirect branch if needed. */
4537
4538 if (lfence_before_indirect_branch == lfence_branch_none)
4539 return;
4540
4541 if (i.operands != 1)
4542 abort ();
4543
4544 if (i.reg_operands == 1)
4545 {
4546 /* Indirect branch via register. Don't insert lfence with
4547 -mlfence-after-load=yes. */
4548 if (lfence_after_load
4549 || lfence_before_indirect_branch == lfence_branch_memory)
4550 return;
4551 }
4552 else if (i.mem_operands == 1
4553 && lfence_before_indirect_branch != lfence_branch_register)
4554 {
4555 as_warn (_("indirect `%s` with memory operand should be avoided"),
4556 i.tm.name);
4557 return;
4558 }
4559 else
4560 return;
4561
4562 if (last_insn.kind != last_insn_other
4563 && last_insn.seg == now_seg)
4564 {
4565 as_warn_where (last_insn.file, last_insn.line,
4566 _("`%s` skips -mlfence-before-indirect-branch on `%s`"),
4567 last_insn.name, i.tm.name);
4568 return;
4569 }
4570
4571 p = frag_more (3);
4572 *p++ = 0xf;
4573 *p++ = 0xae;
4574 *p = 0xe8;
4575 return;
4576 }
4577
4578 /* Output or/not/shl and lfence before near ret. */
4579 if (lfence_before_ret != lfence_before_ret_none
4580 && (i.tm.base_opcode == 0xc2
4581 || i.tm.base_opcode == 0xc3))
4582 {
4583 if (last_insn.kind != last_insn_other
4584 && last_insn.seg == now_seg)
4585 {
4586 as_warn_where (last_insn.file, last_insn.line,
4587 _("`%s` skips -mlfence-before-ret on `%s`"),
4588 last_insn.name, i.tm.name);
4589 return;
4590 }
4591
4592 /* Near ret ingore operand size override under CPU64. */
4593 char prefix = flag_code == CODE_64BIT
4594 ? 0x48
4595 : i.prefix[DATA_PREFIX] ? 0x66 : 0x0;
4596
4597 if (lfence_before_ret == lfence_before_ret_not)
4598 {
4599 /* not: 0xf71424, may add prefix
4600 for operand size override or 64-bit code. */
4601 p = frag_more ((prefix ? 2 : 0) + 6 + 3);
4602 if (prefix)
4603 *p++ = prefix;
4604 *p++ = 0xf7;
4605 *p++ = 0x14;
4606 *p++ = 0x24;
4607 if (prefix)
4608 *p++ = prefix;
4609 *p++ = 0xf7;
4610 *p++ = 0x14;
4611 *p++ = 0x24;
4612 }
4613 else
4614 {
4615 p = frag_more ((prefix ? 1 : 0) + 4 + 3);
4616 if (prefix)
4617 *p++ = prefix;
4618 if (lfence_before_ret == lfence_before_ret_or)
4619 {
4620 /* or: 0x830c2400, may add prefix
4621 for operand size override or 64-bit code. */
4622 *p++ = 0x83;
4623 *p++ = 0x0c;
4624 }
4625 else
4626 {
4627 /* shl: 0xc1242400, may add prefix
4628 for operand size override or 64-bit code. */
4629 *p++ = 0xc1;
4630 *p++ = 0x24;
4631 }
4632
4633 *p++ = 0x24;
4634 *p++ = 0x0;
4635 }
4636
4637 *p++ = 0xf;
4638 *p++ = 0xae;
4639 *p = 0xe8;
4640 }
4641 }
4642
4643 /* This is the guts of the machine-dependent assembler. LINE points to a
4644 machine dependent instruction. This function is supposed to emit
4645 the frags/bytes it assembles to. */
4646
4647 void
4648 md_assemble (char *line)
4649 {
4650 unsigned int j;
4651 char mnemonic[MAX_MNEM_SIZE], mnem_suffix;
4652 const insn_template *t;
4653
4654 /* Initialize globals. */
4655 memset (&i, '\0', sizeof (i));
4656 for (j = 0; j < MAX_OPERANDS; j++)
4657 i.reloc[j] = NO_RELOC;
4658 memset (disp_expressions, '\0', sizeof (disp_expressions));
4659 memset (im_expressions, '\0', sizeof (im_expressions));
4660 save_stack_p = save_stack;
4661
4662 /* First parse an instruction mnemonic & call i386_operand for the operands.
4663 We assume that the scrubber has arranged it so that line[0] is the valid
4664 start of a (possibly prefixed) mnemonic. */
4665
4666 line = parse_insn (line, mnemonic);
4667 if (line == NULL)
4668 return;
4669 mnem_suffix = i.suffix;
4670
4671 line = parse_operands (line, mnemonic);
4672 this_operand = -1;
4673 xfree (i.memop1_string);
4674 i.memop1_string = NULL;
4675 if (line == NULL)
4676 return;
4677
4678 /* Now we've parsed the mnemonic into a set of templates, and have the
4679 operands at hand. */
4680
4681 /* All Intel opcodes have reversed operands except for "bound", "enter",
4682 "invlpg*", "monitor*", "mwait*", "tpause", "umwait", "pvalidate",
4683 "rmpadjust", and "rmpupdate". We also don't reverse intersegment "jmp"
4684 and "call" instructions with 2 immediate operands so that the immediate
4685 segment precedes the offset consistently in Intel and AT&T modes. */
4686 if (intel_syntax
4687 && i.operands > 1
4688 && (strcmp (mnemonic, "bound") != 0)
4689 && (strncmp (mnemonic, "invlpg", 6) != 0)
4690 && (strncmp (mnemonic, "monitor", 7) != 0)
4691 && (strncmp (mnemonic, "mwait", 5) != 0)
4692 && (strcmp (mnemonic, "pvalidate") != 0)
4693 && (strncmp (mnemonic, "rmp", 3) != 0)
4694 && (strcmp (mnemonic, "tpause") != 0)
4695 && (strcmp (mnemonic, "umwait") != 0)
4696 && !(operand_type_check (i.types[0], imm)
4697 && operand_type_check (i.types[1], imm)))
4698 swap_operands ();
4699
4700 /* The order of the immediates should be reversed
4701 for 2 immediates extrq and insertq instructions */
4702 if (i.imm_operands == 2
4703 && (strcmp (mnemonic, "extrq") == 0
4704 || strcmp (mnemonic, "insertq") == 0))
4705 swap_2_operands (0, 1);
4706
4707 if (i.imm_operands)
4708 optimize_imm ();
4709
4710 /* Don't optimize displacement for movabs since it only takes 64bit
4711 displacement. */
4712 if (i.disp_operands
4713 && i.disp_encoding != disp_encoding_32bit
4714 && (flag_code != CODE_64BIT
4715 || strcmp (mnemonic, "movabs") != 0))
4716 optimize_disp ();
4717
4718 /* Next, we find a template that matches the given insn,
4719 making sure the overlap of the given operands types is consistent
4720 with the template operand types. */
4721
4722 if (!(t = match_template (mnem_suffix)))
4723 return;
4724
4725 if (sse_check != check_none
4726 && !i.tm.opcode_modifier.noavx
4727 && !i.tm.cpu_flags.bitfield.cpuavx
4728 && !i.tm.cpu_flags.bitfield.cpuavx512f
4729 && (i.tm.cpu_flags.bitfield.cpusse
4730 || i.tm.cpu_flags.bitfield.cpusse2
4731 || i.tm.cpu_flags.bitfield.cpusse3
4732 || i.tm.cpu_flags.bitfield.cpussse3
4733 || i.tm.cpu_flags.bitfield.cpusse4_1
4734 || i.tm.cpu_flags.bitfield.cpusse4_2
4735 || i.tm.cpu_flags.bitfield.cpupclmul
4736 || i.tm.cpu_flags.bitfield.cpuaes
4737 || i.tm.cpu_flags.bitfield.cpusha
4738 || i.tm.cpu_flags.bitfield.cpugfni))
4739 {
4740 (sse_check == check_warning
4741 ? as_warn
4742 : as_bad) (_("SSE instruction `%s' is used"), i.tm.name);
4743 }
4744
4745 if (i.tm.opcode_modifier.fwait)
4746 if (!add_prefix (FWAIT_OPCODE))
4747 return;
4748
4749 /* Check if REP prefix is OK. */
4750 if (i.rep_prefix && i.tm.opcode_modifier.prefixok != PrefixRep)
4751 {
4752 as_bad (_("invalid instruction `%s' after `%s'"),
4753 i.tm.name, i.rep_prefix);
4754 return;
4755 }
4756
4757 /* Check for lock without a lockable instruction. Destination operand
4758 must be memory unless it is xchg (0x86). */
4759 if (i.prefix[LOCK_PREFIX]
4760 && (i.tm.opcode_modifier.prefixok < PrefixLock
4761 || i.mem_operands == 0
4762 || (i.tm.base_opcode != 0x86
4763 && !(i.flags[i.operands - 1] & Operand_Mem))))
4764 {
4765 as_bad (_("expecting lockable instruction after `lock'"));
4766 return;
4767 }
4768
4769 /* Check for data size prefix on VEX/XOP/EVEX encoded and SIMD insns. */
4770 if (i.prefix[DATA_PREFIX]
4771 && (is_any_vex_encoding (&i.tm)
4772 || i.tm.operand_types[i.imm_operands].bitfield.class >= RegMMX
4773 || i.tm.operand_types[i.imm_operands + 1].bitfield.class >= RegMMX))
4774 {
4775 as_bad (_("data size prefix invalid with `%s'"), i.tm.name);
4776 return;
4777 }
4778
4779 /* Check if HLE prefix is OK. */
4780 if (i.hle_prefix && !check_hle ())
4781 return;
4782
4783 /* Check BND prefix. */
4784 if (i.bnd_prefix && !i.tm.opcode_modifier.bndprefixok)
4785 as_bad (_("expecting valid branch instruction after `bnd'"));
4786
4787 /* Check NOTRACK prefix. */
4788 if (i.notrack_prefix && i.tm.opcode_modifier.prefixok != PrefixNoTrack)
4789 as_bad (_("expecting indirect branch instruction after `notrack'"));
4790
4791 if (i.tm.cpu_flags.bitfield.cpumpx)
4792 {
4793 if (flag_code == CODE_64BIT && i.prefix[ADDR_PREFIX])
4794 as_bad (_("32-bit address isn't allowed in 64-bit MPX instructions."));
4795 else if (flag_code != CODE_16BIT
4796 ? i.prefix[ADDR_PREFIX]
4797 : i.mem_operands && !i.prefix[ADDR_PREFIX])
4798 as_bad (_("16-bit address isn't allowed in MPX instructions"));
4799 }
4800
4801 /* Insert BND prefix. */
4802 if (add_bnd_prefix && i.tm.opcode_modifier.bndprefixok)
4803 {
4804 if (!i.prefix[BND_PREFIX])
4805 add_prefix (BND_PREFIX_OPCODE);
4806 else if (i.prefix[BND_PREFIX] != BND_PREFIX_OPCODE)
4807 {
4808 as_warn (_("replacing `rep'/`repe' prefix by `bnd'"));
4809 i.prefix[BND_PREFIX] = BND_PREFIX_OPCODE;
4810 }
4811 }
4812
4813 /* Check string instruction segment overrides. */
4814 if (i.tm.opcode_modifier.isstring >= IS_STRING_ES_OP0)
4815 {
4816 gas_assert (i.mem_operands);
4817 if (!check_string ())
4818 return;
4819 i.disp_operands = 0;
4820 }
4821
4822 if (optimize && !i.no_optimize && i.tm.opcode_modifier.optimize)
4823 optimize_encoding ();
4824
4825 if (!process_suffix ())
4826 return;
4827
4828 /* Update operand types and check extended states. */
4829 for (j = 0; j < i.operands; j++)
4830 {
4831 i.types[j] = operand_type_and (i.types[j], i.tm.operand_types[j]);
4832 switch (i.tm.operand_types[j].bitfield.class)
4833 {
4834 default:
4835 break;
4836 case RegMMX:
4837 i.xstate |= xstate_mmx;
4838 break;
4839 case RegMask:
4840 i.xstate |= xstate_mask;
4841 break;
4842 case RegSIMD:
4843 if (i.tm.operand_types[j].bitfield.tmmword)
4844 i.xstate |= xstate_tmm;
4845 else if (i.tm.operand_types[j].bitfield.zmmword)
4846 i.xstate |= xstate_zmm;
4847 else if (i.tm.operand_types[j].bitfield.ymmword)
4848 i.xstate |= xstate_ymm;
4849 else if (i.tm.operand_types[j].bitfield.xmmword)
4850 i.xstate |= xstate_xmm;
4851 break;
4852 }
4853 }
4854
4855 /* Make still unresolved immediate matches conform to size of immediate
4856 given in i.suffix. */
4857 if (!finalize_imm ())
4858 return;
4859
4860 if (i.types[0].bitfield.imm1)
4861 i.imm_operands = 0; /* kludge for shift insns. */
4862
4863 /* We only need to check those implicit registers for instructions
4864 with 3 operands or less. */
4865 if (i.operands <= 3)
4866 for (j = 0; j < i.operands; j++)
4867 if (i.types[j].bitfield.instance != InstanceNone
4868 && !i.types[j].bitfield.xmmword)
4869 i.reg_operands--;
4870
4871 /* For insns with operands there are more diddles to do to the opcode. */
4872 if (i.operands)
4873 {
4874 if (!process_operands ())
4875 return;
4876 }
4877 else if (!quiet_warnings && i.tm.opcode_modifier.ugh)
4878 {
4879 /* UnixWare fsub no args is alias for fsubp, fadd -> faddp, etc. */
4880 as_warn (_("translating to `%sp'"), i.tm.name);
4881 }
4882
4883 if (is_any_vex_encoding (&i.tm))
4884 {
4885 if (!cpu_arch_flags.bitfield.cpui286)
4886 {
4887 as_bad (_("instruction `%s' isn't supported outside of protected mode."),
4888 i.tm.name);
4889 return;
4890 }
4891
4892 /* Check for explicit REX prefix. */
4893 if (i.prefix[REX_PREFIX] || i.rex_encoding)
4894 {
4895 as_bad (_("REX prefix invalid with `%s'"), i.tm.name);
4896 return;
4897 }
4898
4899 if (i.tm.opcode_modifier.vex)
4900 build_vex_prefix (t);
4901 else
4902 build_evex_prefix ();
4903
4904 /* The individual REX.RXBW bits got consumed. */
4905 i.rex &= REX_OPCODE;
4906 }
4907
4908 /* Handle conversion of 'int $3' --> special int3 insn. XOP or FMA4
4909 instructions may define INT_OPCODE as well, so avoid this corner
4910 case for those instructions that use MODRM. */
4911 if (i.tm.base_opcode == INT_OPCODE
4912 && !i.tm.opcode_modifier.modrm
4913 && i.op[0].imms->X_add_number == 3)
4914 {
4915 i.tm.base_opcode = INT3_OPCODE;
4916 i.imm_operands = 0;
4917 }
4918
4919 if ((i.tm.opcode_modifier.jump == JUMP
4920 || i.tm.opcode_modifier.jump == JUMP_BYTE
4921 || i.tm.opcode_modifier.jump == JUMP_DWORD)
4922 && i.op[0].disps->X_op == O_constant)
4923 {
4924 /* Convert "jmp constant" (and "call constant") to a jump (call) to
4925 the absolute address given by the constant. Since ix86 jumps and
4926 calls are pc relative, we need to generate a reloc. */
4927 i.op[0].disps->X_add_symbol = &abs_symbol;
4928 i.op[0].disps->X_op = O_symbol;
4929 }
4930
4931 /* For 8 bit registers we need an empty rex prefix. Also if the
4932 instruction already has a prefix, we need to convert old
4933 registers to new ones. */
4934
4935 if ((i.types[0].bitfield.class == Reg && i.types[0].bitfield.byte
4936 && (i.op[0].regs->reg_flags & RegRex64) != 0)
4937 || (i.types[1].bitfield.class == Reg && i.types[1].bitfield.byte
4938 && (i.op[1].regs->reg_flags & RegRex64) != 0)
4939 || (((i.types[0].bitfield.class == Reg && i.types[0].bitfield.byte)
4940 || (i.types[1].bitfield.class == Reg && i.types[1].bitfield.byte))
4941 && i.rex != 0))
4942 {
4943 int x;
4944
4945 i.rex |= REX_OPCODE;
4946 for (x = 0; x < 2; x++)
4947 {
4948 /* Look for 8 bit operand that uses old registers. */
4949 if (i.types[x].bitfield.class == Reg && i.types[x].bitfield.byte
4950 && (i.op[x].regs->reg_flags & RegRex64) == 0)
4951 {
4952 gas_assert (!(i.op[x].regs->reg_flags & RegRex));
4953 /* In case it is "hi" register, give up. */
4954 if (i.op[x].regs->reg_num > 3)
4955 as_bad (_("can't encode register '%s%s' in an "
4956 "instruction requiring REX prefix."),
4957 register_prefix, i.op[x].regs->reg_name);
4958
4959 /* Otherwise it is equivalent to the extended register.
4960 Since the encoding doesn't change this is merely
4961 cosmetic cleanup for debug output. */
4962
4963 i.op[x].regs = i.op[x].regs + 8;
4964 }
4965 }
4966 }
4967
4968 if (i.rex == 0 && i.rex_encoding)
4969 {
4970 /* Check if we can add a REX_OPCODE byte. Look for 8 bit operand
4971 that uses legacy register. If it is "hi" register, don't add
4972 the REX_OPCODE byte. */
4973 int x;
4974 for (x = 0; x < 2; x++)
4975 if (i.types[x].bitfield.class == Reg
4976 && i.types[x].bitfield.byte
4977 && (i.op[x].regs->reg_flags & RegRex64) == 0
4978 && i.op[x].regs->reg_num > 3)
4979 {
4980 gas_assert (!(i.op[x].regs->reg_flags & RegRex));
4981 i.rex_encoding = FALSE;
4982 break;
4983 }
4984
4985 if (i.rex_encoding)
4986 i.rex = REX_OPCODE;
4987 }
4988
4989 if (i.rex != 0)
4990 add_prefix (REX_OPCODE | i.rex);
4991
4992 insert_lfence_before ();
4993
4994 /* We are ready to output the insn. */
4995 output_insn ();
4996
4997 insert_lfence_after ();
4998
4999 last_insn.seg = now_seg;
5000
5001 if (i.tm.opcode_modifier.isprefix)
5002 {
5003 last_insn.kind = last_insn_prefix;
5004 last_insn.name = i.tm.name;
5005 last_insn.file = as_where (&last_insn.line);
5006 }
5007 else
5008 last_insn.kind = last_insn_other;
5009 }
5010
5011 static char *
5012 parse_insn (char *line, char *mnemonic)
5013 {
5014 char *l = line;
5015 char *token_start = l;
5016 char *mnem_p;
5017 int supported;
5018 const insn_template *t;
5019 char *dot_p = NULL;
5020
5021 while (1)
5022 {
5023 mnem_p = mnemonic;
5024 while ((*mnem_p = mnemonic_chars[(unsigned char) *l]) != 0)
5025 {
5026 if (*mnem_p == '.')
5027 dot_p = mnem_p;
5028 mnem_p++;
5029 if (mnem_p >= mnemonic + MAX_MNEM_SIZE)
5030 {
5031 as_bad (_("no such instruction: `%s'"), token_start);
5032 return NULL;
5033 }
5034 l++;
5035 }
5036 if (!is_space_char (*l)
5037 && *l != END_OF_INSN
5038 && (intel_syntax
5039 || (*l != PREFIX_SEPARATOR
5040 && *l != ',')))
5041 {
5042 as_bad (_("invalid character %s in mnemonic"),
5043 output_invalid (*l));
5044 return NULL;
5045 }
5046 if (token_start == l)
5047 {
5048 if (!intel_syntax && *l == PREFIX_SEPARATOR)
5049 as_bad (_("expecting prefix; got nothing"));
5050 else
5051 as_bad (_("expecting mnemonic; got nothing"));
5052 return NULL;
5053 }
5054
5055 /* Look up instruction (or prefix) via hash table. */
5056 current_templates = (const templates *) str_hash_find (op_hash, mnemonic);
5057
5058 if (*l != END_OF_INSN
5059 && (!is_space_char (*l) || l[1] != END_OF_INSN)
5060 && current_templates
5061 && current_templates->start->opcode_modifier.isprefix)
5062 {
5063 if (!cpu_flags_check_cpu64 (current_templates->start->cpu_flags))
5064 {
5065 as_bad ((flag_code != CODE_64BIT
5066 ? _("`%s' is only supported in 64-bit mode")
5067 : _("`%s' is not supported in 64-bit mode")),
5068 current_templates->start->name);
5069 return NULL;
5070 }
5071 /* If we are in 16-bit mode, do not allow addr16 or data16.
5072 Similarly, in 32-bit mode, do not allow addr32 or data32. */
5073 if ((current_templates->start->opcode_modifier.size == SIZE16
5074 || current_templates->start->opcode_modifier.size == SIZE32)
5075 && flag_code != CODE_64BIT
5076 && ((current_templates->start->opcode_modifier.size == SIZE32)
5077 ^ (flag_code == CODE_16BIT)))
5078 {
5079 as_bad (_("redundant %s prefix"),
5080 current_templates->start->name);
5081 return NULL;
5082 }
5083
5084 if (current_templates->start->base_opcode == PSEUDO_PREFIX)
5085 {
5086 /* Handle pseudo prefixes. */
5087 switch (current_templates->start->extension_opcode)
5088 {
5089 case Prefix_Disp8:
5090 /* {disp8} */
5091 i.disp_encoding = disp_encoding_8bit;
5092 break;
5093 case Prefix_Disp16:
5094 /* {disp16} */
5095 i.disp_encoding = disp_encoding_16bit;
5096 break;
5097 case Prefix_Disp32:
5098 /* {disp32} */
5099 i.disp_encoding = disp_encoding_32bit;
5100 break;
5101 case Prefix_Load:
5102 /* {load} */
5103 i.dir_encoding = dir_encoding_load;
5104 break;
5105 case Prefix_Store:
5106 /* {store} */
5107 i.dir_encoding = dir_encoding_store;
5108 break;
5109 case Prefix_VEX:
5110 /* {vex} */
5111 i.vec_encoding = vex_encoding_vex;
5112 break;
5113 case Prefix_VEX3:
5114 /* {vex3} */
5115 i.vec_encoding = vex_encoding_vex3;
5116 break;
5117 case Prefix_EVEX:
5118 /* {evex} */
5119 i.vec_encoding = vex_encoding_evex;
5120 break;
5121 case Prefix_REX:
5122 /* {rex} */
5123 i.rex_encoding = TRUE;
5124 break;
5125 case Prefix_NoOptimize:
5126 /* {nooptimize} */
5127 i.no_optimize = TRUE;
5128 break;
5129 default:
5130 abort ();
5131 }
5132 }
5133 else
5134 {
5135 /* Add prefix, checking for repeated prefixes. */
5136 switch (add_prefix (current_templates->start->base_opcode))
5137 {
5138 case PREFIX_EXIST:
5139 return NULL;
5140 case PREFIX_DS:
5141 if (current_templates->start->cpu_flags.bitfield.cpuibt)
5142 i.notrack_prefix = current_templates->start->name;
5143 break;
5144 case PREFIX_REP:
5145 if (current_templates->start->cpu_flags.bitfield.cpuhle)
5146 i.hle_prefix = current_templates->start->name;
5147 else if (current_templates->start->cpu_flags.bitfield.cpumpx)
5148 i.bnd_prefix = current_templates->start->name;
5149 else
5150 i.rep_prefix = current_templates->start->name;
5151 break;
5152 default:
5153 break;
5154 }
5155 }
5156 /* Skip past PREFIX_SEPARATOR and reset token_start. */
5157 token_start = ++l;
5158 }
5159 else
5160 break;
5161 }
5162
5163 if (!current_templates)
5164 {
5165 /* Deprecated functionality (new code should use pseudo-prefixes instead):
5166 Check if we should swap operand or force 32bit displacement in
5167 encoding. */
5168 if (mnem_p - 2 == dot_p && dot_p[1] == 's')
5169 i.dir_encoding = dir_encoding_swap;
5170 else if (mnem_p - 3 == dot_p
5171 && dot_p[1] == 'd'
5172 && dot_p[2] == '8')
5173 i.disp_encoding = disp_encoding_8bit;
5174 else if (mnem_p - 4 == dot_p
5175 && dot_p[1] == 'd'
5176 && dot_p[2] == '3'
5177 && dot_p[3] == '2')
5178 i.disp_encoding = disp_encoding_32bit;
5179 else
5180 goto check_suffix;
5181 mnem_p = dot_p;
5182 *dot_p = '\0';
5183 current_templates = (const templates *) str_hash_find (op_hash, mnemonic);
5184 }
5185
5186 if (!current_templates)
5187 {
5188 check_suffix:
5189 if (mnem_p > mnemonic)
5190 {
5191 /* See if we can get a match by trimming off a suffix. */
5192 switch (mnem_p[-1])
5193 {
5194 case WORD_MNEM_SUFFIX:
5195 if (intel_syntax && (intel_float_operand (mnemonic) & 2))
5196 i.suffix = SHORT_MNEM_SUFFIX;
5197 else
5198 /* Fall through. */
5199 case BYTE_MNEM_SUFFIX:
5200 case QWORD_MNEM_SUFFIX:
5201 i.suffix = mnem_p[-1];
5202 mnem_p[-1] = '\0';
5203 current_templates
5204 = (const templates *) str_hash_find (op_hash, mnemonic);
5205 break;
5206 case SHORT_MNEM_SUFFIX:
5207 case LONG_MNEM_SUFFIX:
5208 if (!intel_syntax)
5209 {
5210 i.suffix = mnem_p[-1];
5211 mnem_p[-1] = '\0';
5212 current_templates
5213 = (const templates *) str_hash_find (op_hash, mnemonic);
5214 }
5215 break;
5216
5217 /* Intel Syntax. */
5218 case 'd':
5219 if (intel_syntax)
5220 {
5221 if (intel_float_operand (mnemonic) == 1)
5222 i.suffix = SHORT_MNEM_SUFFIX;
5223 else
5224 i.suffix = LONG_MNEM_SUFFIX;
5225 mnem_p[-1] = '\0';
5226 current_templates
5227 = (const templates *) str_hash_find (op_hash, mnemonic);
5228 }
5229 break;
5230 }
5231 }
5232
5233 if (!current_templates)
5234 {
5235 as_bad (_("no such instruction: `%s'"), token_start);
5236 return NULL;
5237 }
5238 }
5239
5240 if (current_templates->start->opcode_modifier.jump == JUMP
5241 || current_templates->start->opcode_modifier.jump == JUMP_BYTE)
5242 {
5243 /* Check for a branch hint. We allow ",pt" and ",pn" for
5244 predict taken and predict not taken respectively.
5245 I'm not sure that branch hints actually do anything on loop
5246 and jcxz insns (JumpByte) for current Pentium4 chips. They
5247 may work in the future and it doesn't hurt to accept them
5248 now. */
5249 if (l[0] == ',' && l[1] == 'p')
5250 {
5251 if (l[2] == 't')
5252 {
5253 if (!add_prefix (DS_PREFIX_OPCODE))
5254 return NULL;
5255 l += 3;
5256 }
5257 else if (l[2] == 'n')
5258 {
5259 if (!add_prefix (CS_PREFIX_OPCODE))
5260 return NULL;
5261 l += 3;
5262 }
5263 }
5264 }
5265 /* Any other comma loses. */
5266 if (*l == ',')
5267 {
5268 as_bad (_("invalid character %s in mnemonic"),
5269 output_invalid (*l));
5270 return NULL;
5271 }
5272
5273 /* Check if instruction is supported on specified architecture. */
5274 supported = 0;
5275 for (t = current_templates->start; t < current_templates->end; ++t)
5276 {
5277 supported |= cpu_flags_match (t);
5278 if (supported == CPU_FLAGS_PERFECT_MATCH)
5279 {
5280 if (!cpu_arch_flags.bitfield.cpui386 && (flag_code != CODE_16BIT))
5281 as_warn (_("use .code16 to ensure correct addressing mode"));
5282
5283 return l;
5284 }
5285 }
5286
5287 if (!(supported & CPU_FLAGS_64BIT_MATCH))
5288 as_bad (flag_code == CODE_64BIT
5289 ? _("`%s' is not supported in 64-bit mode")
5290 : _("`%s' is only supported in 64-bit mode"),
5291 current_templates->start->name);
5292 else
5293 as_bad (_("`%s' is not supported on `%s%s'"),
5294 current_templates->start->name,
5295 cpu_arch_name ? cpu_arch_name : default_arch,
5296 cpu_sub_arch_name ? cpu_sub_arch_name : "");
5297
5298 return NULL;
5299 }
5300
5301 static char *
5302 parse_operands (char *l, const char *mnemonic)
5303 {
5304 char *token_start;
5305
5306 /* 1 if operand is pending after ','. */
5307 unsigned int expecting_operand = 0;
5308
5309 /* Non-zero if operand parens not balanced. */
5310 unsigned int paren_not_balanced;
5311
5312 while (*l != END_OF_INSN)
5313 {
5314 /* Skip optional white space before operand. */
5315 if (is_space_char (*l))
5316 ++l;
5317 if (!is_operand_char (*l) && *l != END_OF_INSN && *l != '"')
5318 {
5319 as_bad (_("invalid character %s before operand %d"),
5320 output_invalid (*l),
5321 i.operands + 1);
5322 return NULL;
5323 }
5324 token_start = l; /* After white space. */
5325 paren_not_balanced = 0;
5326 while (paren_not_balanced || *l != ',')
5327 {
5328 if (*l == END_OF_INSN)
5329 {
5330 if (paren_not_balanced)
5331 {
5332 if (!intel_syntax)
5333 as_bad (_("unbalanced parenthesis in operand %d."),
5334 i.operands + 1);
5335 else
5336 as_bad (_("unbalanced brackets in operand %d."),
5337 i.operands + 1);
5338 return NULL;
5339 }
5340 else
5341 break; /* we are done */
5342 }
5343 else if (!is_operand_char (*l) && !is_space_char (*l) && *l != '"')
5344 {
5345 as_bad (_("invalid character %s in operand %d"),
5346 output_invalid (*l),
5347 i.operands + 1);
5348 return NULL;
5349 }
5350 if (!intel_syntax)
5351 {
5352 if (*l == '(')
5353 ++paren_not_balanced;
5354 if (*l == ')')
5355 --paren_not_balanced;
5356 }
5357 else
5358 {
5359 if (*l == '[')
5360 ++paren_not_balanced;
5361 if (*l == ']')
5362 --paren_not_balanced;
5363 }
5364 l++;
5365 }
5366 if (l != token_start)
5367 { /* Yes, we've read in another operand. */
5368 unsigned int operand_ok;
5369 this_operand = i.operands++;
5370 if (i.operands > MAX_OPERANDS)
5371 {
5372 as_bad (_("spurious operands; (%d operands/instruction max)"),
5373 MAX_OPERANDS);
5374 return NULL;
5375 }
5376 i.types[this_operand].bitfield.unspecified = 1;
5377 /* Now parse operand adding info to 'i' as we go along. */
5378 END_STRING_AND_SAVE (l);
5379
5380 if (i.mem_operands > 1)
5381 {
5382 as_bad (_("too many memory references for `%s'"),
5383 mnemonic);
5384 return 0;
5385 }
5386
5387 if (intel_syntax)
5388 operand_ok =
5389 i386_intel_operand (token_start,
5390 intel_float_operand (mnemonic));
5391 else
5392 operand_ok = i386_att_operand (token_start);
5393
5394 RESTORE_END_STRING (l);
5395 if (!operand_ok)
5396 return NULL;
5397 }
5398 else
5399 {
5400 if (expecting_operand)
5401 {
5402 expecting_operand_after_comma:
5403 as_bad (_("expecting operand after ','; got nothing"));
5404 return NULL;
5405 }
5406 if (*l == ',')
5407 {
5408 as_bad (_("expecting operand before ','; got nothing"));
5409 return NULL;
5410 }
5411 }
5412
5413 /* Now *l must be either ',' or END_OF_INSN. */
5414 if (*l == ',')
5415 {
5416 if (*++l == END_OF_INSN)
5417 {
5418 /* Just skip it, if it's \n complain. */
5419 goto expecting_operand_after_comma;
5420 }
5421 expecting_operand = 1;
5422 }
5423 }
5424 return l;
5425 }
5426
5427 static void
5428 swap_2_operands (int xchg1, int xchg2)
5429 {
5430 union i386_op temp_op;
5431 i386_operand_type temp_type;
5432 unsigned int temp_flags;
5433 enum bfd_reloc_code_real temp_reloc;
5434
5435 temp_type = i.types[xchg2];
5436 i.types[xchg2] = i.types[xchg1];
5437 i.types[xchg1] = temp_type;
5438
5439 temp_flags = i.flags[xchg2];
5440 i.flags[xchg2] = i.flags[xchg1];
5441 i.flags[xchg1] = temp_flags;
5442
5443 temp_op = i.op[xchg2];
5444 i.op[xchg2] = i.op[xchg1];
5445 i.op[xchg1] = temp_op;
5446
5447 temp_reloc = i.reloc[xchg2];
5448 i.reloc[xchg2] = i.reloc[xchg1];
5449 i.reloc[xchg1] = temp_reloc;
5450
5451 if (i.mask)
5452 {
5453 if (i.mask->operand == xchg1)
5454 i.mask->operand = xchg2;
5455 else if (i.mask->operand == xchg2)
5456 i.mask->operand = xchg1;
5457 }
5458 if (i.broadcast)
5459 {
5460 if (i.broadcast->operand == xchg1)
5461 i.broadcast->operand = xchg2;
5462 else if (i.broadcast->operand == xchg2)
5463 i.broadcast->operand = xchg1;
5464 }
5465 if (i.rounding)
5466 {
5467 if (i.rounding->operand == xchg1)
5468 i.rounding->operand = xchg2;
5469 else if (i.rounding->operand == xchg2)
5470 i.rounding->operand = xchg1;
5471 }
5472 }
5473
5474 static void
5475 swap_operands (void)
5476 {
5477 switch (i.operands)
5478 {
5479 case 5:
5480 case 4:
5481 swap_2_operands (1, i.operands - 2);
5482 /* Fall through. */
5483 case 3:
5484 case 2:
5485 swap_2_operands (0, i.operands - 1);
5486 break;
5487 default:
5488 abort ();
5489 }
5490
5491 if (i.mem_operands == 2)
5492 {
5493 const seg_entry *temp_seg;
5494 temp_seg = i.seg[0];
5495 i.seg[0] = i.seg[1];
5496 i.seg[1] = temp_seg;
5497 }
5498 }
5499
5500 /* Try to ensure constant immediates are represented in the smallest
5501 opcode possible. */
5502 static void
5503 optimize_imm (void)
5504 {
5505 char guess_suffix = 0;
5506 int op;
5507
5508 if (i.suffix)
5509 guess_suffix = i.suffix;
5510 else if (i.reg_operands)
5511 {
5512 /* Figure out a suffix from the last register operand specified.
5513 We can't do this properly yet, i.e. excluding special register
5514 instances, but the following works for instructions with
5515 immediates. In any case, we can't set i.suffix yet. */
5516 for (op = i.operands; --op >= 0;)
5517 if (i.types[op].bitfield.class != Reg)
5518 continue;
5519 else if (i.types[op].bitfield.byte)
5520 {
5521 guess_suffix = BYTE_MNEM_SUFFIX;
5522 break;
5523 }
5524 else if (i.types[op].bitfield.word)
5525 {
5526 guess_suffix = WORD_MNEM_SUFFIX;
5527 break;
5528 }
5529 else if (i.types[op].bitfield.dword)
5530 {
5531 guess_suffix = LONG_MNEM_SUFFIX;
5532 break;
5533 }
5534 else if (i.types[op].bitfield.qword)
5535 {
5536 guess_suffix = QWORD_MNEM_SUFFIX;
5537 break;
5538 }
5539 }
5540 else if ((flag_code == CODE_16BIT) ^ (i.prefix[DATA_PREFIX] != 0))
5541 guess_suffix = WORD_MNEM_SUFFIX;
5542
5543 for (op = i.operands; --op >= 0;)
5544 if (operand_type_check (i.types[op], imm))
5545 {
5546 switch (i.op[op].imms->X_op)
5547 {
5548 case O_constant:
5549 /* If a suffix is given, this operand may be shortened. */
5550 switch (guess_suffix)
5551 {
5552 case LONG_MNEM_SUFFIX:
5553 i.types[op].bitfield.imm32 = 1;
5554 i.types[op].bitfield.imm64 = 1;
5555 break;
5556 case WORD_MNEM_SUFFIX:
5557 i.types[op].bitfield.imm16 = 1;
5558 i.types[op].bitfield.imm32 = 1;
5559 i.types[op].bitfield.imm32s = 1;
5560 i.types[op].bitfield.imm64 = 1;
5561 break;
5562 case BYTE_MNEM_SUFFIX:
5563 i.types[op].bitfield.imm8 = 1;
5564 i.types[op].bitfield.imm8s = 1;
5565 i.types[op].bitfield.imm16 = 1;
5566 i.types[op].bitfield.imm32 = 1;
5567 i.types[op].bitfield.imm32s = 1;
5568 i.types[op].bitfield.imm64 = 1;
5569 break;
5570 }
5571
5572 /* If this operand is at most 16 bits, convert it
5573 to a signed 16 bit number before trying to see
5574 whether it will fit in an even smaller size.
5575 This allows a 16-bit operand such as $0xffe0 to
5576 be recognised as within Imm8S range. */
5577 if ((i.types[op].bitfield.imm16)
5578 && (i.op[op].imms->X_add_number & ~(offsetT) 0xffff) == 0)
5579 {
5580 i.op[op].imms->X_add_number =
5581 (((i.op[op].imms->X_add_number & 0xffff) ^ 0x8000) - 0x8000);
5582 }
5583 #ifdef BFD64
5584 /* Store 32-bit immediate in 64-bit for 64-bit BFD. */
5585 if ((i.types[op].bitfield.imm32)
5586 && ((i.op[op].imms->X_add_number & ~(((offsetT) 2 << 31) - 1))
5587 == 0))
5588 {
5589 i.op[op].imms->X_add_number = ((i.op[op].imms->X_add_number
5590 ^ ((offsetT) 1 << 31))
5591 - ((offsetT) 1 << 31));
5592 }
5593 #endif
5594 i.types[op]
5595 = operand_type_or (i.types[op],
5596 smallest_imm_type (i.op[op].imms->X_add_number));
5597
5598 /* We must avoid matching of Imm32 templates when 64bit
5599 only immediate is available. */
5600 if (guess_suffix == QWORD_MNEM_SUFFIX)
5601 i.types[op].bitfield.imm32 = 0;
5602 break;
5603
5604 case O_absent:
5605 case O_register:
5606 abort ();
5607
5608 /* Symbols and expressions. */
5609 default:
5610 /* Convert symbolic operand to proper sizes for matching, but don't
5611 prevent matching a set of insns that only supports sizes other
5612 than those matching the insn suffix. */
5613 {
5614 i386_operand_type mask, allowed;
5615 const insn_template *t;
5616
5617 operand_type_set (&mask, 0);
5618 operand_type_set (&allowed, 0);
5619
5620 for (t = current_templates->start;
5621 t < current_templates->end;
5622 ++t)
5623 {
5624 allowed = operand_type_or (allowed, t->operand_types[op]);
5625 allowed = operand_type_and (allowed, anyimm);
5626 }
5627 switch (guess_suffix)
5628 {
5629 case QWORD_MNEM_SUFFIX:
5630 mask.bitfield.imm64 = 1;
5631 mask.bitfield.imm32s = 1;
5632 break;
5633 case LONG_MNEM_SUFFIX:
5634 mask.bitfield.imm32 = 1;
5635 break;
5636 case WORD_MNEM_SUFFIX:
5637 mask.bitfield.imm16 = 1;
5638 break;
5639 case BYTE_MNEM_SUFFIX:
5640 mask.bitfield.imm8 = 1;
5641 break;
5642 default:
5643 break;
5644 }
5645 allowed = operand_type_and (mask, allowed);
5646 if (!operand_type_all_zero (&allowed))
5647 i.types[op] = operand_type_and (i.types[op], mask);
5648 }
5649 break;
5650 }
5651 }
5652 }
5653
5654 /* Try to use the smallest displacement type too. */
5655 static void
5656 optimize_disp (void)
5657 {
5658 int op;
5659
5660 for (op = i.operands; --op >= 0;)
5661 if (operand_type_check (i.types[op], disp))
5662 {
5663 if (i.op[op].disps->X_op == O_constant)
5664 {
5665 offsetT op_disp = i.op[op].disps->X_add_number;
5666
5667 if (i.types[op].bitfield.disp16
5668 && (op_disp & ~(offsetT) 0xffff) == 0)
5669 {
5670 /* If this operand is at most 16 bits, convert
5671 to a signed 16 bit number and don't use 64bit
5672 displacement. */
5673 op_disp = (((op_disp & 0xffff) ^ 0x8000) - 0x8000);
5674 i.types[op].bitfield.disp64 = 0;
5675 }
5676 #ifdef BFD64
5677 /* Optimize 64-bit displacement to 32-bit for 64-bit BFD. */
5678 if (i.types[op].bitfield.disp32
5679 && (op_disp & ~(((offsetT) 2 << 31) - 1)) == 0)
5680 {
5681 /* If this operand is at most 32 bits, convert
5682 to a signed 32 bit number and don't use 64bit
5683 displacement. */
5684 op_disp &= (((offsetT) 2 << 31) - 1);
5685 op_disp = (op_disp ^ ((offsetT) 1 << 31)) - ((addressT) 1 << 31);
5686 i.types[op].bitfield.disp64 = 0;
5687 }
5688 #endif
5689 if (!op_disp && i.types[op].bitfield.baseindex)
5690 {
5691 i.types[op].bitfield.disp8 = 0;
5692 i.types[op].bitfield.disp16 = 0;
5693 i.types[op].bitfield.disp32 = 0;
5694 i.types[op].bitfield.disp32s = 0;
5695 i.types[op].bitfield.disp64 = 0;
5696 i.op[op].disps = 0;
5697 i.disp_operands--;
5698 }
5699 else if (flag_code == CODE_64BIT)
5700 {
5701 if (fits_in_signed_long (op_disp))
5702 {
5703 i.types[op].bitfield.disp64 = 0;
5704 i.types[op].bitfield.disp32s = 1;
5705 }
5706 if (i.prefix[ADDR_PREFIX]
5707 && fits_in_unsigned_long (op_disp))
5708 i.types[op].bitfield.disp32 = 1;
5709 }
5710 if ((i.types[op].bitfield.disp32
5711 || i.types[op].bitfield.disp32s
5712 || i.types[op].bitfield.disp16)
5713 && fits_in_disp8 (op_disp))
5714 i.types[op].bitfield.disp8 = 1;
5715 }
5716 else if (i.reloc[op] == BFD_RELOC_386_TLS_DESC_CALL
5717 || i.reloc[op] == BFD_RELOC_X86_64_TLSDESC_CALL)
5718 {
5719 fix_new_exp (frag_now, frag_more (0) - frag_now->fr_literal, 0,
5720 i.op[op].disps, 0, i.reloc[op]);
5721 i.types[op].bitfield.disp8 = 0;
5722 i.types[op].bitfield.disp16 = 0;
5723 i.types[op].bitfield.disp32 = 0;
5724 i.types[op].bitfield.disp32s = 0;
5725 i.types[op].bitfield.disp64 = 0;
5726 }
5727 else
5728 /* We only support 64bit displacement on constants. */
5729 i.types[op].bitfield.disp64 = 0;
5730 }
5731 }
5732
5733 /* Return 1 if there is a match in broadcast bytes between operand
5734 GIVEN and instruction template T. */
5735
5736 static INLINE int
5737 match_broadcast_size (const insn_template *t, unsigned int given)
5738 {
5739 return ((t->opcode_modifier.broadcast == BYTE_BROADCAST
5740 && i.types[given].bitfield.byte)
5741 || (t->opcode_modifier.broadcast == WORD_BROADCAST
5742 && i.types[given].bitfield.word)
5743 || (t->opcode_modifier.broadcast == DWORD_BROADCAST
5744 && i.types[given].bitfield.dword)
5745 || (t->opcode_modifier.broadcast == QWORD_BROADCAST
5746 && i.types[given].bitfield.qword));
5747 }
5748
5749 /* Check if operands are valid for the instruction. */
5750
5751 static int
5752 check_VecOperands (const insn_template *t)
5753 {
5754 unsigned int op;
5755 i386_cpu_flags cpu;
5756
5757 /* Templates allowing for ZMMword as well as YMMword and/or XMMword for
5758 any one operand are implicity requiring AVX512VL support if the actual
5759 operand size is YMMword or XMMword. Since this function runs after
5760 template matching, there's no need to check for YMMword/XMMword in
5761 the template. */
5762 cpu = cpu_flags_and (t->cpu_flags, avx512);
5763 if (!cpu_flags_all_zero (&cpu)
5764 && !t->cpu_flags.bitfield.cpuavx512vl
5765 && !cpu_arch_flags.bitfield.cpuavx512vl)
5766 {
5767 for (op = 0; op < t->operands; ++op)
5768 {
5769 if (t->operand_types[op].bitfield.zmmword
5770 && (i.types[op].bitfield.ymmword
5771 || i.types[op].bitfield.xmmword))
5772 {
5773 i.error = unsupported;
5774 return 1;
5775 }
5776 }
5777 }
5778
5779 /* Without VSIB byte, we can't have a vector register for index. */
5780 if (!t->opcode_modifier.sib
5781 && i.index_reg
5782 && (i.index_reg->reg_type.bitfield.xmmword
5783 || i.index_reg->reg_type.bitfield.ymmword
5784 || i.index_reg->reg_type.bitfield.zmmword))
5785 {
5786 i.error = unsupported_vector_index_register;
5787 return 1;
5788 }
5789
5790 /* Check if default mask is allowed. */
5791 if (t->opcode_modifier.nodefmask
5792 && (!i.mask || i.mask->mask->reg_num == 0))
5793 {
5794 i.error = no_default_mask;
5795 return 1;
5796 }
5797
5798 /* For VSIB byte, we need a vector register for index, and all vector
5799 registers must be distinct. */
5800 if (t->opcode_modifier.sib && t->opcode_modifier.sib != SIBMEM)
5801 {
5802 if (!i.index_reg
5803 || !((t->opcode_modifier.sib == VECSIB128
5804 && i.index_reg->reg_type.bitfield.xmmword)
5805 || (t->opcode_modifier.sib == VECSIB256
5806 && i.index_reg->reg_type.bitfield.ymmword)
5807 || (t->opcode_modifier.sib == VECSIB512
5808 && i.index_reg->reg_type.bitfield.zmmword)))
5809 {
5810 i.error = invalid_vsib_address;
5811 return 1;
5812 }
5813
5814 gas_assert (i.reg_operands == 2 || i.mask);
5815 if (i.reg_operands == 2 && !i.mask)
5816 {
5817 gas_assert (i.types[0].bitfield.class == RegSIMD);
5818 gas_assert (i.types[0].bitfield.xmmword
5819 || i.types[0].bitfield.ymmword);
5820 gas_assert (i.types[2].bitfield.class == RegSIMD);
5821 gas_assert (i.types[2].bitfield.xmmword
5822 || i.types[2].bitfield.ymmword);
5823 if (operand_check == check_none)
5824 return 0;
5825 if (register_number (i.op[0].regs)
5826 != register_number (i.index_reg)
5827 && register_number (i.op[2].regs)
5828 != register_number (i.index_reg)
5829 && register_number (i.op[0].regs)
5830 != register_number (i.op[2].regs))
5831 return 0;
5832 if (operand_check == check_error)
5833 {
5834 i.error = invalid_vector_register_set;
5835 return 1;
5836 }
5837 as_warn (_("mask, index, and destination registers should be distinct"));
5838 }
5839 else if (i.reg_operands == 1 && i.mask)
5840 {
5841 if (i.types[1].bitfield.class == RegSIMD
5842 && (i.types[1].bitfield.xmmword
5843 || i.types[1].bitfield.ymmword
5844 || i.types[1].bitfield.zmmword)
5845 && (register_number (i.op[1].regs)
5846 == register_number (i.index_reg)))
5847 {
5848 if (operand_check == check_error)
5849 {
5850 i.error = invalid_vector_register_set;
5851 return 1;
5852 }
5853 if (operand_check != check_none)
5854 as_warn (_("index and destination registers should be distinct"));
5855 }
5856 }
5857 }
5858
5859 /* For AMX instructions with three tmmword operands, all tmmword operand must be
5860 distinct */
5861 if (t->operand_types[0].bitfield.tmmword
5862 && i.reg_operands == 3)
5863 {
5864 if (register_number (i.op[0].regs)
5865 == register_number (i.op[1].regs)
5866 || register_number (i.op[0].regs)
5867 == register_number (i.op[2].regs)
5868 || register_number (i.op[1].regs)
5869 == register_number (i.op[2].regs))
5870 {
5871 i.error = invalid_tmm_register_set;
5872 return 1;
5873 }
5874 }
5875
5876 /* Check if broadcast is supported by the instruction and is applied
5877 to the memory operand. */
5878 if (i.broadcast)
5879 {
5880 i386_operand_type type, overlap;
5881
5882 /* Check if specified broadcast is supported in this instruction,
5883 and its broadcast bytes match the memory operand. */
5884 op = i.broadcast->operand;
5885 if (!t->opcode_modifier.broadcast
5886 || !(i.flags[op] & Operand_Mem)
5887 || (!i.types[op].bitfield.unspecified
5888 && !match_broadcast_size (t, op)))
5889 {
5890 bad_broadcast:
5891 i.error = unsupported_broadcast;
5892 return 1;
5893 }
5894
5895 i.broadcast->bytes = ((1 << (t->opcode_modifier.broadcast - 1))
5896 * i.broadcast->type);
5897 operand_type_set (&type, 0);
5898 switch (i.broadcast->bytes)
5899 {
5900 case 2:
5901 type.bitfield.word = 1;
5902 break;
5903 case 4:
5904 type.bitfield.dword = 1;
5905 break;
5906 case 8:
5907 type.bitfield.qword = 1;
5908 break;
5909 case 16:
5910 type.bitfield.xmmword = 1;
5911 break;
5912 case 32:
5913 type.bitfield.ymmword = 1;
5914 break;
5915 case 64:
5916 type.bitfield.zmmword = 1;
5917 break;
5918 default:
5919 goto bad_broadcast;
5920 }
5921
5922 overlap = operand_type_and (type, t->operand_types[op]);
5923 if (t->operand_types[op].bitfield.class == RegSIMD
5924 && t->operand_types[op].bitfield.byte
5925 + t->operand_types[op].bitfield.word
5926 + t->operand_types[op].bitfield.dword
5927 + t->operand_types[op].bitfield.qword > 1)
5928 {
5929 overlap.bitfield.xmmword = 0;
5930 overlap.bitfield.ymmword = 0;
5931 overlap.bitfield.zmmword = 0;
5932 }
5933 if (operand_type_all_zero (&overlap))
5934 goto bad_broadcast;
5935
5936 if (t->opcode_modifier.checkregsize)
5937 {
5938 unsigned int j;
5939
5940 type.bitfield.baseindex = 1;
5941 for (j = 0; j < i.operands; ++j)
5942 {
5943 if (j != op
5944 && !operand_type_register_match(i.types[j],
5945 t->operand_types[j],
5946 type,
5947 t->operand_types[op]))
5948 goto bad_broadcast;
5949 }
5950 }
5951 }
5952 /* If broadcast is supported in this instruction, we need to check if
5953 operand of one-element size isn't specified without broadcast. */
5954 else if (t->opcode_modifier.broadcast && i.mem_operands)
5955 {
5956 /* Find memory operand. */
5957 for (op = 0; op < i.operands; op++)
5958 if (i.flags[op] & Operand_Mem)
5959 break;
5960 gas_assert (op < i.operands);
5961 /* Check size of the memory operand. */
5962 if (match_broadcast_size (t, op))
5963 {
5964 i.error = broadcast_needed;
5965 return 1;
5966 }
5967 }
5968 else
5969 op = MAX_OPERANDS - 1; /* Avoid uninitialized variable warning. */
5970
5971 /* Check if requested masking is supported. */
5972 if (i.mask)
5973 {
5974 switch (t->opcode_modifier.masking)
5975 {
5976 case BOTH_MASKING:
5977 break;
5978 case MERGING_MASKING:
5979 if (i.mask->zeroing)
5980 {
5981 case 0:
5982 i.error = unsupported_masking;
5983 return 1;
5984 }
5985 break;
5986 case DYNAMIC_MASKING:
5987 /* Memory destinations allow only merging masking. */
5988 if (i.mask->zeroing && i.mem_operands)
5989 {
5990 /* Find memory operand. */
5991 for (op = 0; op < i.operands; op++)
5992 if (i.flags[op] & Operand_Mem)
5993 break;
5994 gas_assert (op < i.operands);
5995 if (op == i.operands - 1)
5996 {
5997 i.error = unsupported_masking;
5998 return 1;
5999 }
6000 }
6001 break;
6002 default:
6003 abort ();
6004 }
6005 }
6006
6007 /* Check if masking is applied to dest operand. */
6008 if (i.mask && (i.mask->operand != (int) (i.operands - 1)))
6009 {
6010 i.error = mask_not_on_destination;
6011 return 1;
6012 }
6013
6014 /* Check RC/SAE. */
6015 if (i.rounding)
6016 {
6017 if (!t->opcode_modifier.sae
6018 || (i.rounding->type != saeonly && !t->opcode_modifier.staticrounding))
6019 {
6020 i.error = unsupported_rc_sae;
6021 return 1;
6022 }
6023 /* If the instruction has several immediate operands and one of
6024 them is rounding, the rounding operand should be the last
6025 immediate operand. */
6026 if (i.imm_operands > 1
6027 && i.rounding->operand != (int) (i.imm_operands - 1))
6028 {
6029 i.error = rc_sae_operand_not_last_imm;
6030 return 1;
6031 }
6032 }
6033
6034 /* Check the special Imm4 cases; must be the first operand. */
6035 if (t->cpu_flags.bitfield.cpuxop && t->operands == 5)
6036 {
6037 if (i.op[0].imms->X_op != O_constant
6038 || !fits_in_imm4 (i.op[0].imms->X_add_number))
6039 {
6040 i.error = bad_imm4;
6041 return 1;
6042 }
6043
6044 /* Turn off Imm<N> so that update_imm won't complain. */
6045 operand_type_set (&i.types[0], 0);
6046 }
6047
6048 /* Check vector Disp8 operand. */
6049 if (t->opcode_modifier.disp8memshift
6050 && i.disp_encoding != disp_encoding_32bit)
6051 {
6052 if (i.broadcast)
6053 i.memshift = t->opcode_modifier.broadcast - 1;
6054 else if (t->opcode_modifier.disp8memshift != DISP8_SHIFT_VL)
6055 i.memshift = t->opcode_modifier.disp8memshift;
6056 else
6057 {
6058 const i386_operand_type *type = NULL;
6059
6060 i.memshift = 0;
6061 for (op = 0; op < i.operands; op++)
6062 if (i.flags[op] & Operand_Mem)
6063 {
6064 if (t->opcode_modifier.evex == EVEXLIG)
6065 i.memshift = 2 + (i.suffix == QWORD_MNEM_SUFFIX);
6066 else if (t->operand_types[op].bitfield.xmmword
6067 + t->operand_types[op].bitfield.ymmword
6068 + t->operand_types[op].bitfield.zmmword <= 1)
6069 type = &t->operand_types[op];
6070 else if (!i.types[op].bitfield.unspecified)
6071 type = &i.types[op];
6072 }
6073 else if (i.types[op].bitfield.class == RegSIMD
6074 && t->opcode_modifier.evex != EVEXLIG)
6075 {
6076 if (i.types[op].bitfield.zmmword)
6077 i.memshift = 6;
6078 else if (i.types[op].bitfield.ymmword && i.memshift < 5)
6079 i.memshift = 5;
6080 else if (i.types[op].bitfield.xmmword && i.memshift < 4)
6081 i.memshift = 4;
6082 }
6083
6084 if (type)
6085 {
6086 if (type->bitfield.zmmword)
6087 i.memshift = 6;
6088 else if (type->bitfield.ymmword)
6089 i.memshift = 5;
6090 else if (type->bitfield.xmmword)
6091 i.memshift = 4;
6092 }
6093
6094 /* For the check in fits_in_disp8(). */
6095 if (i.memshift == 0)
6096 i.memshift = -1;
6097 }
6098
6099 for (op = 0; op < i.operands; op++)
6100 if (operand_type_check (i.types[op], disp)
6101 && i.op[op].disps->X_op == O_constant)
6102 {
6103 if (fits_in_disp8 (i.op[op].disps->X_add_number))
6104 {
6105 i.types[op].bitfield.disp8 = 1;
6106 return 0;
6107 }
6108 i.types[op].bitfield.disp8 = 0;
6109 }
6110 }
6111
6112 i.memshift = 0;
6113
6114 return 0;
6115 }
6116
6117 /* Check if encoding requirements are met by the instruction. */
6118
6119 static int
6120 VEX_check_encoding (const insn_template *t)
6121 {
6122 if (i.vec_encoding == vex_encoding_error)
6123 {
6124 i.error = unsupported;
6125 return 1;
6126 }
6127
6128 if (i.vec_encoding == vex_encoding_evex)
6129 {
6130 /* This instruction must be encoded with EVEX prefix. */
6131 if (!is_evex_encoding (t))
6132 {
6133 i.error = unsupported;
6134 return 1;
6135 }
6136 return 0;
6137 }
6138
6139 if (!t->opcode_modifier.vex)
6140 {
6141 /* This instruction template doesn't have VEX prefix. */
6142 if (i.vec_encoding != vex_encoding_default)
6143 {
6144 i.error = unsupported;
6145 return 1;
6146 }
6147 return 0;
6148 }
6149
6150 return 0;
6151 }
6152
6153 static const insn_template *
6154 match_template (char mnem_suffix)
6155 {
6156 /* Points to template once we've found it. */
6157 const insn_template *t;
6158 i386_operand_type overlap0, overlap1, overlap2, overlap3;
6159 i386_operand_type overlap4;
6160 unsigned int found_reverse_match;
6161 i386_opcode_modifier suffix_check;
6162 i386_operand_type operand_types [MAX_OPERANDS];
6163 int addr_prefix_disp;
6164 unsigned int j, size_match, check_register;
6165 enum i386_error specific_error = 0;
6166
6167 #if MAX_OPERANDS != 5
6168 # error "MAX_OPERANDS must be 5."
6169 #endif
6170
6171 found_reverse_match = 0;
6172 addr_prefix_disp = -1;
6173
6174 /* Prepare for mnemonic suffix check. */
6175 memset (&suffix_check, 0, sizeof (suffix_check));
6176 switch (mnem_suffix)
6177 {
6178 case BYTE_MNEM_SUFFIX:
6179 suffix_check.no_bsuf = 1;
6180 break;
6181 case WORD_MNEM_SUFFIX:
6182 suffix_check.no_wsuf = 1;
6183 break;
6184 case SHORT_MNEM_SUFFIX:
6185 suffix_check.no_ssuf = 1;
6186 break;
6187 case LONG_MNEM_SUFFIX:
6188 suffix_check.no_lsuf = 1;
6189 break;
6190 case QWORD_MNEM_SUFFIX:
6191 suffix_check.no_qsuf = 1;
6192 break;
6193 default:
6194 /* NB: In Intel syntax, normally we can check for memory operand
6195 size when there is no mnemonic suffix. But jmp and call have
6196 2 different encodings with Dword memory operand size, one with
6197 No_ldSuf and the other without. i.suffix is set to
6198 LONG_DOUBLE_MNEM_SUFFIX to skip the one with No_ldSuf. */
6199 if (i.suffix == LONG_DOUBLE_MNEM_SUFFIX)
6200 suffix_check.no_ldsuf = 1;
6201 }
6202
6203 /* Must have right number of operands. */
6204 i.error = number_of_operands_mismatch;
6205
6206 for (t = current_templates->start; t < current_templates->end; t++)
6207 {
6208 addr_prefix_disp = -1;
6209 found_reverse_match = 0;
6210
6211 if (i.operands != t->operands)
6212 continue;
6213
6214 /* Check processor support. */
6215 i.error = unsupported;
6216 if (cpu_flags_match (t) != CPU_FLAGS_PERFECT_MATCH)
6217 continue;
6218
6219 /* Check Pseudo Prefix. */
6220 i.error = unsupported;
6221 if (t->opcode_modifier.pseudovexprefix
6222 && !(i.vec_encoding == vex_encoding_vex
6223 || i.vec_encoding == vex_encoding_vex3))
6224 continue;
6225
6226 /* Check AT&T mnemonic. */
6227 i.error = unsupported_with_intel_mnemonic;
6228 if (intel_mnemonic && t->opcode_modifier.attmnemonic)
6229 continue;
6230
6231 /* Check AT&T/Intel syntax. */
6232 i.error = unsupported_syntax;
6233 if ((intel_syntax && t->opcode_modifier.attsyntax)
6234 || (!intel_syntax && t->opcode_modifier.intelsyntax))
6235 continue;
6236
6237 /* Check Intel64/AMD64 ISA. */
6238 switch (isa64)
6239 {
6240 default:
6241 /* Default: Don't accept Intel64. */
6242 if (t->opcode_modifier.isa64 == INTEL64)
6243 continue;
6244 break;
6245 case amd64:
6246 /* -mamd64: Don't accept Intel64 and Intel64 only. */
6247 if (t->opcode_modifier.isa64 >= INTEL64)
6248 continue;
6249 break;
6250 case intel64:
6251 /* -mintel64: Don't accept AMD64. */
6252 if (t->opcode_modifier.isa64 == AMD64 && flag_code == CODE_64BIT)
6253 continue;
6254 break;
6255 }
6256
6257 /* Check the suffix. */
6258 i.error = invalid_instruction_suffix;
6259 if ((t->opcode_modifier.no_bsuf && suffix_check.no_bsuf)
6260 || (t->opcode_modifier.no_wsuf && suffix_check.no_wsuf)
6261 || (t->opcode_modifier.no_lsuf && suffix_check.no_lsuf)
6262 || (t->opcode_modifier.no_ssuf && suffix_check.no_ssuf)
6263 || (t->opcode_modifier.no_qsuf && suffix_check.no_qsuf)
6264 || (t->opcode_modifier.no_ldsuf && suffix_check.no_ldsuf))
6265 continue;
6266
6267 size_match = operand_size_match (t);
6268 if (!size_match)
6269 continue;
6270
6271 /* This is intentionally not
6272
6273 if (i.jumpabsolute != (t->opcode_modifier.jump == JUMP_ABSOLUTE))
6274
6275 as the case of a missing * on the operand is accepted (perhaps with
6276 a warning, issued further down). */
6277 if (i.jumpabsolute && t->opcode_modifier.jump != JUMP_ABSOLUTE)
6278 {
6279 i.error = operand_type_mismatch;
6280 continue;
6281 }
6282
6283 for (j = 0; j < MAX_OPERANDS; j++)
6284 operand_types[j] = t->operand_types[j];
6285
6286 /* In general, don't allow
6287 - 64-bit operands outside of 64-bit mode,
6288 - 32-bit operands on pre-386. */
6289 j = i.imm_operands + (t->operands > i.imm_operands + 1);
6290 if (((i.suffix == QWORD_MNEM_SUFFIX
6291 && flag_code != CODE_64BIT
6292 && !(t->base_opcode == 0xfc7
6293 && t->opcode_modifier.opcodeprefix == PREFIX_NONE
6294 && t->extension_opcode == 1) /* cmpxchg8b */)
6295 || (i.suffix == LONG_MNEM_SUFFIX
6296 && !cpu_arch_flags.bitfield.cpui386))
6297 && (intel_syntax
6298 ? (t->opcode_modifier.mnemonicsize != IGNORESIZE
6299 && !intel_float_operand (t->name))
6300 : intel_float_operand (t->name) != 2)
6301 && (t->operands == i.imm_operands
6302 || (operand_types[i.imm_operands].bitfield.class != RegMMX
6303 && operand_types[i.imm_operands].bitfield.class != RegSIMD
6304 && operand_types[i.imm_operands].bitfield.class != RegMask)
6305 || (operand_types[j].bitfield.class != RegMMX
6306 && operand_types[j].bitfield.class != RegSIMD
6307 && operand_types[j].bitfield.class != RegMask))
6308 && !t->opcode_modifier.sib)
6309 continue;
6310
6311 /* Do not verify operands when there are none. */
6312 if (!t->operands)
6313 {
6314 if (VEX_check_encoding (t))
6315 {
6316 specific_error = i.error;
6317 continue;
6318 }
6319
6320 /* We've found a match; break out of loop. */
6321 break;
6322 }
6323
6324 if (!t->opcode_modifier.jump
6325 || t->opcode_modifier.jump == JUMP_ABSOLUTE)
6326 {
6327 /* There should be only one Disp operand. */
6328 for (j = 0; j < MAX_OPERANDS; j++)
6329 if (operand_type_check (operand_types[j], disp))
6330 break;
6331 if (j < MAX_OPERANDS)
6332 {
6333 bfd_boolean override = (i.prefix[ADDR_PREFIX] != 0);
6334
6335 addr_prefix_disp = j;
6336
6337 /* Address size prefix will turn Disp64/Disp32S/Disp32/Disp16
6338 operand into Disp32/Disp32/Disp16/Disp32 operand. */
6339 switch (flag_code)
6340 {
6341 case CODE_16BIT:
6342 override = !override;
6343 /* Fall through. */
6344 case CODE_32BIT:
6345 if (operand_types[j].bitfield.disp32
6346 && operand_types[j].bitfield.disp16)
6347 {
6348 operand_types[j].bitfield.disp16 = override;
6349 operand_types[j].bitfield.disp32 = !override;
6350 }
6351 operand_types[j].bitfield.disp32s = 0;
6352 operand_types[j].bitfield.disp64 = 0;
6353 break;
6354
6355 case CODE_64BIT:
6356 if (operand_types[j].bitfield.disp32s
6357 || operand_types[j].bitfield.disp64)
6358 {
6359 operand_types[j].bitfield.disp64 &= !override;
6360 operand_types[j].bitfield.disp32s &= !override;
6361 operand_types[j].bitfield.disp32 = override;
6362 }
6363 operand_types[j].bitfield.disp16 = 0;
6364 break;
6365 }
6366 }
6367 }
6368
6369 /* Force 0x8b encoding for "mov foo@GOT, %eax". */
6370 if (i.reloc[0] == BFD_RELOC_386_GOT32
6371 && t->base_opcode == 0xa0
6372 && t->opcode_modifier.opcodespace == SPACE_BASE)
6373 continue;
6374
6375 /* We check register size if needed. */
6376 if (t->opcode_modifier.checkregsize)
6377 {
6378 check_register = (1 << t->operands) - 1;
6379 if (i.broadcast)
6380 check_register &= ~(1 << i.broadcast->operand);
6381 }
6382 else
6383 check_register = 0;
6384
6385 overlap0 = operand_type_and (i.types[0], operand_types[0]);
6386 switch (t->operands)
6387 {
6388 case 1:
6389 if (!operand_type_match (overlap0, i.types[0]))
6390 continue;
6391 break;
6392 case 2:
6393 /* xchg %eax, %eax is a special case. It is an alias for nop
6394 only in 32bit mode and we can use opcode 0x90. In 64bit
6395 mode, we can't use 0x90 for xchg %eax, %eax since it should
6396 zero-extend %eax to %rax. */
6397 if (flag_code == CODE_64BIT
6398 && t->base_opcode == 0x90
6399 && t->opcode_modifier.opcodespace == SPACE_BASE
6400 && i.types[0].bitfield.instance == Accum
6401 && i.types[0].bitfield.dword
6402 && i.types[1].bitfield.instance == Accum
6403 && i.types[1].bitfield.dword)
6404 continue;
6405 /* xrelease mov %eax, <disp> is another special case. It must not
6406 match the accumulator-only encoding of mov. */
6407 if (flag_code != CODE_64BIT
6408 && i.hle_prefix
6409 && t->base_opcode == 0xa0
6410 && t->opcode_modifier.opcodespace == SPACE_BASE
6411 && i.types[0].bitfield.instance == Accum
6412 && (i.flags[1] & Operand_Mem))
6413 continue;
6414 /* Fall through. */
6415
6416 case 3:
6417 if (!(size_match & MATCH_STRAIGHT))
6418 goto check_reverse;
6419 /* Reverse direction of operands if swapping is possible in the first
6420 place (operands need to be symmetric) and
6421 - the load form is requested, and the template is a store form,
6422 - the store form is requested, and the template is a load form,
6423 - the non-default (swapped) form is requested. */
6424 overlap1 = operand_type_and (operand_types[0], operand_types[1]);
6425 if (t->opcode_modifier.d && i.reg_operands == i.operands
6426 && !operand_type_all_zero (&overlap1))
6427 switch (i.dir_encoding)
6428 {
6429 case dir_encoding_load:
6430 if (operand_type_check (operand_types[i.operands - 1], anymem)
6431 || t->opcode_modifier.regmem)
6432 goto check_reverse;
6433 break;
6434
6435 case dir_encoding_store:
6436 if (!operand_type_check (operand_types[i.operands - 1], anymem)
6437 && !t->opcode_modifier.regmem)
6438 goto check_reverse;
6439 break;
6440
6441 case dir_encoding_swap:
6442 goto check_reverse;
6443
6444 case dir_encoding_default:
6445 break;
6446 }
6447 /* If we want store form, we skip the current load. */
6448 if ((i.dir_encoding == dir_encoding_store
6449 || i.dir_encoding == dir_encoding_swap)
6450 && i.mem_operands == 0
6451 && t->opcode_modifier.load)
6452 continue;
6453 /* Fall through. */
6454 case 4:
6455 case 5:
6456 overlap1 = operand_type_and (i.types[1], operand_types[1]);
6457 if (!operand_type_match (overlap0, i.types[0])
6458 || !operand_type_match (overlap1, i.types[1])
6459 || ((check_register & 3) == 3
6460 && !operand_type_register_match (i.types[0],
6461 operand_types[0],
6462 i.types[1],
6463 operand_types[1])))
6464 {
6465 /* Check if other direction is valid ... */
6466 if (!t->opcode_modifier.d)
6467 continue;
6468
6469 check_reverse:
6470 if (!(size_match & MATCH_REVERSE))
6471 continue;
6472 /* Try reversing direction of operands. */
6473 overlap0 = operand_type_and (i.types[0], operand_types[i.operands - 1]);
6474 overlap1 = operand_type_and (i.types[i.operands - 1], operand_types[0]);
6475 if (!operand_type_match (overlap0, i.types[0])
6476 || !operand_type_match (overlap1, i.types[i.operands - 1])
6477 || (check_register
6478 && !operand_type_register_match (i.types[0],
6479 operand_types[i.operands - 1],
6480 i.types[i.operands - 1],
6481 operand_types[0])))
6482 {
6483 /* Does not match either direction. */
6484 continue;
6485 }
6486 /* found_reverse_match holds which of D or FloatR
6487 we've found. */
6488 if (!t->opcode_modifier.d)
6489 found_reverse_match = 0;
6490 else if (operand_types[0].bitfield.tbyte)
6491 found_reverse_match = Opcode_FloatD;
6492 else if (operand_types[0].bitfield.xmmword
6493 || operand_types[i.operands - 1].bitfield.xmmword
6494 || operand_types[0].bitfield.class == RegMMX
6495 || operand_types[i.operands - 1].bitfield.class == RegMMX
6496 || is_any_vex_encoding(t))
6497 found_reverse_match = (t->base_opcode & 0xee) != 0x6e
6498 ? Opcode_SIMD_FloatD : Opcode_SIMD_IntD;
6499 else
6500 found_reverse_match = Opcode_D;
6501 if (t->opcode_modifier.floatr)
6502 found_reverse_match |= Opcode_FloatR;
6503 }
6504 else
6505 {
6506 /* Found a forward 2 operand match here. */
6507 switch (t->operands)
6508 {
6509 case 5:
6510 overlap4 = operand_type_and (i.types[4],
6511 operand_types[4]);
6512 /* Fall through. */
6513 case 4:
6514 overlap3 = operand_type_and (i.types[3],
6515 operand_types[3]);
6516 /* Fall through. */
6517 case 3:
6518 overlap2 = operand_type_and (i.types[2],
6519 operand_types[2]);
6520 break;
6521 }
6522
6523 switch (t->operands)
6524 {
6525 case 5:
6526 if (!operand_type_match (overlap4, i.types[4])
6527 || !operand_type_register_match (i.types[3],
6528 operand_types[3],
6529 i.types[4],
6530 operand_types[4]))
6531 continue;
6532 /* Fall through. */
6533 case 4:
6534 if (!operand_type_match (overlap3, i.types[3])
6535 || ((check_register & 0xa) == 0xa
6536 && !operand_type_register_match (i.types[1],
6537 operand_types[1],
6538 i.types[3],
6539 operand_types[3]))
6540 || ((check_register & 0xc) == 0xc
6541 && !operand_type_register_match (i.types[2],
6542 operand_types[2],
6543 i.types[3],
6544 operand_types[3])))
6545 continue;
6546 /* Fall through. */
6547 case 3:
6548 /* Here we make use of the fact that there are no
6549 reverse match 3 operand instructions. */
6550 if (!operand_type_match (overlap2, i.types[2])
6551 || ((check_register & 5) == 5
6552 && !operand_type_register_match (i.types[0],
6553 operand_types[0],
6554 i.types[2],
6555 operand_types[2]))
6556 || ((check_register & 6) == 6
6557 && !operand_type_register_match (i.types[1],
6558 operand_types[1],
6559 i.types[2],
6560 operand_types[2])))
6561 continue;
6562 break;
6563 }
6564 }
6565 /* Found either forward/reverse 2, 3 or 4 operand match here:
6566 slip through to break. */
6567 }
6568
6569 /* Check if vector operands are valid. */
6570 if (check_VecOperands (t))
6571 {
6572 specific_error = i.error;
6573 continue;
6574 }
6575
6576 /* Check if VEX/EVEX encoding requirements can be satisfied. */
6577 if (VEX_check_encoding (t))
6578 {
6579 specific_error = i.error;
6580 continue;
6581 }
6582
6583 /* We've found a match; break out of loop. */
6584 break;
6585 }
6586
6587 if (t == current_templates->end)
6588 {
6589 /* We found no match. */
6590 const char *err_msg;
6591 switch (specific_error ? specific_error : i.error)
6592 {
6593 default:
6594 abort ();
6595 case operand_size_mismatch:
6596 err_msg = _("operand size mismatch");
6597 break;
6598 case operand_type_mismatch:
6599 err_msg = _("operand type mismatch");
6600 break;
6601 case register_type_mismatch:
6602 err_msg = _("register type mismatch");
6603 break;
6604 case number_of_operands_mismatch:
6605 err_msg = _("number of operands mismatch");
6606 break;
6607 case invalid_instruction_suffix:
6608 err_msg = _("invalid instruction suffix");
6609 break;
6610 case bad_imm4:
6611 err_msg = _("constant doesn't fit in 4 bits");
6612 break;
6613 case unsupported_with_intel_mnemonic:
6614 err_msg = _("unsupported with Intel mnemonic");
6615 break;
6616 case unsupported_syntax:
6617 err_msg = _("unsupported syntax");
6618 break;
6619 case unsupported:
6620 as_bad (_("unsupported instruction `%s'"),
6621 current_templates->start->name);
6622 return NULL;
6623 case invalid_sib_address:
6624 err_msg = _("invalid SIB address");
6625 break;
6626 case invalid_vsib_address:
6627 err_msg = _("invalid VSIB address");
6628 break;
6629 case invalid_vector_register_set:
6630 err_msg = _("mask, index, and destination registers must be distinct");
6631 break;
6632 case invalid_tmm_register_set:
6633 err_msg = _("all tmm registers must be distinct");
6634 break;
6635 case unsupported_vector_index_register:
6636 err_msg = _("unsupported vector index register");
6637 break;
6638 case unsupported_broadcast:
6639 err_msg = _("unsupported broadcast");
6640 break;
6641 case broadcast_needed:
6642 err_msg = _("broadcast is needed for operand of such type");
6643 break;
6644 case unsupported_masking:
6645 err_msg = _("unsupported masking");
6646 break;
6647 case mask_not_on_destination:
6648 err_msg = _("mask not on destination operand");
6649 break;
6650 case no_default_mask:
6651 err_msg = _("default mask isn't allowed");
6652 break;
6653 case unsupported_rc_sae:
6654 err_msg = _("unsupported static rounding/sae");
6655 break;
6656 case rc_sae_operand_not_last_imm:
6657 if (intel_syntax)
6658 err_msg = _("RC/SAE operand must precede immediate operands");
6659 else
6660 err_msg = _("RC/SAE operand must follow immediate operands");
6661 break;
6662 case invalid_register_operand:
6663 err_msg = _("invalid register operand");
6664 break;
6665 }
6666 as_bad (_("%s for `%s'"), err_msg,
6667 current_templates->start->name);
6668 return NULL;
6669 }
6670
6671 if (!quiet_warnings)
6672 {
6673 if (!intel_syntax
6674 && (i.jumpabsolute != (t->opcode_modifier.jump == JUMP_ABSOLUTE)))
6675 as_warn (_("indirect %s without `*'"), t->name);
6676
6677 if (t->opcode_modifier.isprefix
6678 && t->opcode_modifier.mnemonicsize == IGNORESIZE)
6679 {
6680 /* Warn them that a data or address size prefix doesn't
6681 affect assembly of the next line of code. */
6682 as_warn (_("stand-alone `%s' prefix"), t->name);
6683 }
6684 }
6685
6686 /* Copy the template we found. */
6687 install_template (t);
6688
6689 if (addr_prefix_disp != -1)
6690 i.tm.operand_types[addr_prefix_disp]
6691 = operand_types[addr_prefix_disp];
6692
6693 if (found_reverse_match)
6694 {
6695 /* If we found a reverse match we must alter the opcode direction
6696 bit and clear/flip the regmem modifier one. found_reverse_match
6697 holds bits to change (different for int & float insns). */
6698
6699 i.tm.base_opcode ^= found_reverse_match;
6700
6701 i.tm.operand_types[0] = operand_types[i.operands - 1];
6702 i.tm.operand_types[i.operands - 1] = operand_types[0];
6703
6704 /* Certain SIMD insns have their load forms specified in the opcode
6705 table, and hence we need to _set_ RegMem instead of clearing it.
6706 We need to avoid setting the bit though on insns like KMOVW. */
6707 i.tm.opcode_modifier.regmem
6708 = i.tm.opcode_modifier.modrm && i.tm.opcode_modifier.d
6709 && i.tm.operands > 2U - i.tm.opcode_modifier.sse2avx
6710 && !i.tm.opcode_modifier.regmem;
6711 }
6712
6713 return t;
6714 }
6715
6716 static int
6717 check_string (void)
6718 {
6719 unsigned int es_op = i.tm.opcode_modifier.isstring - IS_STRING_ES_OP0;
6720 unsigned int op = i.tm.operand_types[0].bitfield.baseindex ? es_op : 0;
6721
6722 if (i.seg[op] != NULL && i.seg[op] != &es)
6723 {
6724 as_bad (_("`%s' operand %u must use `%ses' segment"),
6725 i.tm.name,
6726 intel_syntax ? i.tm.operands - es_op : es_op + 1,
6727 register_prefix);
6728 return 0;
6729 }
6730
6731 /* There's only ever one segment override allowed per instruction.
6732 This instruction possibly has a legal segment override on the
6733 second operand, so copy the segment to where non-string
6734 instructions store it, allowing common code. */
6735 i.seg[op] = i.seg[1];
6736
6737 return 1;
6738 }
6739
6740 static int
6741 process_suffix (void)
6742 {
6743 bfd_boolean is_crc32 = FALSE;
6744
6745 /* If matched instruction specifies an explicit instruction mnemonic
6746 suffix, use it. */
6747 if (i.tm.opcode_modifier.size == SIZE16)
6748 i.suffix = WORD_MNEM_SUFFIX;
6749 else if (i.tm.opcode_modifier.size == SIZE32)
6750 i.suffix = LONG_MNEM_SUFFIX;
6751 else if (i.tm.opcode_modifier.size == SIZE64)
6752 i.suffix = QWORD_MNEM_SUFFIX;
6753 else if (i.reg_operands
6754 && (i.operands > 1 || i.types[0].bitfield.class == Reg)
6755 && !i.tm.opcode_modifier.addrprefixopreg)
6756 {
6757 unsigned int numop = i.operands;
6758 /* CRC32 */
6759 is_crc32 = (i.tm.base_opcode == 0xf38f0
6760 && i.tm.opcode_modifier.opcodeprefix == PREFIX_0XF2);
6761
6762 /* movsx/movzx want only their source operand considered here, for the
6763 ambiguity checking below. The suffix will be replaced afterwards
6764 to represent the destination (register). */
6765 if (((i.tm.base_opcode | 8) == 0xfbe && i.tm.opcode_modifier.w)
6766 || (i.tm.base_opcode == 0x63
6767 && i.tm.opcode_modifier.opcodespace == SPACE_BASE
6768 && i.tm.cpu_flags.bitfield.cpu64))
6769 --i.operands;
6770
6771 /* crc32 needs REX.W set regardless of suffix / source operand size. */
6772 if (is_crc32 && i.tm.operand_types[1].bitfield.qword)
6773 i.rex |= REX_W;
6774
6775 /* If there's no instruction mnemonic suffix we try to invent one
6776 based on GPR operands. */
6777 if (!i.suffix)
6778 {
6779 /* We take i.suffix from the last register operand specified,
6780 Destination register type is more significant than source
6781 register type. crc32 in SSE4.2 prefers source register
6782 type. */
6783 unsigned int op = is_crc32 ? 1 : i.operands;
6784
6785 while (op--)
6786 if (i.tm.operand_types[op].bitfield.instance == InstanceNone
6787 || i.tm.operand_types[op].bitfield.instance == Accum)
6788 {
6789 if (i.types[op].bitfield.class != Reg)
6790 continue;
6791 if (i.types[op].bitfield.byte)
6792 i.suffix = BYTE_MNEM_SUFFIX;
6793 else if (i.types[op].bitfield.word)
6794 i.suffix = WORD_MNEM_SUFFIX;
6795 else if (i.types[op].bitfield.dword)
6796 i.suffix = LONG_MNEM_SUFFIX;
6797 else if (i.types[op].bitfield.qword)
6798 i.suffix = QWORD_MNEM_SUFFIX;
6799 else
6800 continue;
6801 break;
6802 }
6803
6804 /* As an exception, movsx/movzx silently default to a byte source
6805 in AT&T mode. */
6806 if ((i.tm.base_opcode | 8) == 0xfbe && i.tm.opcode_modifier.w
6807 && !i.suffix && !intel_syntax)
6808 i.suffix = BYTE_MNEM_SUFFIX;
6809 }
6810 else if (i.suffix == BYTE_MNEM_SUFFIX)
6811 {
6812 if (intel_syntax
6813 && i.tm.opcode_modifier.mnemonicsize == IGNORESIZE
6814 && i.tm.opcode_modifier.no_bsuf)
6815 i.suffix = 0;
6816 else if (!check_byte_reg ())
6817 return 0;
6818 }
6819 else if (i.suffix == LONG_MNEM_SUFFIX)
6820 {
6821 if (intel_syntax
6822 && i.tm.opcode_modifier.mnemonicsize == IGNORESIZE
6823 && i.tm.opcode_modifier.no_lsuf
6824 && !i.tm.opcode_modifier.todword
6825 && !i.tm.opcode_modifier.toqword)
6826 i.suffix = 0;
6827 else if (!check_long_reg ())
6828 return 0;
6829 }
6830 else if (i.suffix == QWORD_MNEM_SUFFIX)
6831 {
6832 if (intel_syntax
6833 && i.tm.opcode_modifier.mnemonicsize == IGNORESIZE
6834 && i.tm.opcode_modifier.no_qsuf
6835 && !i.tm.opcode_modifier.todword
6836 && !i.tm.opcode_modifier.toqword)
6837 i.suffix = 0;
6838 else if (!check_qword_reg ())
6839 return 0;
6840 }
6841 else if (i.suffix == WORD_MNEM_SUFFIX)
6842 {
6843 if (intel_syntax
6844 && i.tm.opcode_modifier.mnemonicsize == IGNORESIZE
6845 && i.tm.opcode_modifier.no_wsuf)
6846 i.suffix = 0;
6847 else if (!check_word_reg ())
6848 return 0;
6849 }
6850 else if (intel_syntax
6851 && i.tm.opcode_modifier.mnemonicsize == IGNORESIZE)
6852 /* Do nothing if the instruction is going to ignore the prefix. */
6853 ;
6854 else
6855 abort ();
6856
6857 /* Undo the movsx/movzx change done above. */
6858 i.operands = numop;
6859 }
6860 else if (i.tm.opcode_modifier.mnemonicsize == DEFAULTSIZE
6861 && !i.suffix)
6862 {
6863 i.suffix = stackop_size;
6864 if (stackop_size == LONG_MNEM_SUFFIX)
6865 {
6866 /* stackop_size is set to LONG_MNEM_SUFFIX for the
6867 .code16gcc directive to support 16-bit mode with
6868 32-bit address. For IRET without a suffix, generate
6869 16-bit IRET (opcode 0xcf) to return from an interrupt
6870 handler. */
6871 if (i.tm.base_opcode == 0xcf)
6872 {
6873 i.suffix = WORD_MNEM_SUFFIX;
6874 as_warn (_("generating 16-bit `iret' for .code16gcc directive"));
6875 }
6876 /* Warn about changed behavior for segment register push/pop. */
6877 else if ((i.tm.base_opcode | 1) == 0x07)
6878 as_warn (_("generating 32-bit `%s', unlike earlier gas versions"),
6879 i.tm.name);
6880 }
6881 }
6882 else if (!i.suffix
6883 && (i.tm.opcode_modifier.jump == JUMP_ABSOLUTE
6884 || i.tm.opcode_modifier.jump == JUMP_BYTE
6885 || i.tm.opcode_modifier.jump == JUMP_INTERSEGMENT
6886 || (i.tm.base_opcode == 0x0f01 /* [ls][gi]dt */
6887 && i.tm.extension_opcode <= 3)))
6888 {
6889 switch (flag_code)
6890 {
6891 case CODE_64BIT:
6892 if (!i.tm.opcode_modifier.no_qsuf)
6893 {
6894 if (i.tm.opcode_modifier.jump == JUMP_BYTE
6895 || i.tm.opcode_modifier.no_lsuf)
6896 i.suffix = QWORD_MNEM_SUFFIX;
6897 break;
6898 }
6899 /* Fall through. */
6900 case CODE_32BIT:
6901 if (!i.tm.opcode_modifier.no_lsuf)
6902 i.suffix = LONG_MNEM_SUFFIX;
6903 break;
6904 case CODE_16BIT:
6905 if (!i.tm.opcode_modifier.no_wsuf)
6906 i.suffix = WORD_MNEM_SUFFIX;
6907 break;
6908 }
6909 }
6910
6911 if (!i.suffix
6912 && (i.tm.opcode_modifier.mnemonicsize != DEFAULTSIZE
6913 /* Also cover lret/retf/iret in 64-bit mode. */
6914 || (flag_code == CODE_64BIT
6915 && !i.tm.opcode_modifier.no_lsuf
6916 && !i.tm.opcode_modifier.no_qsuf))
6917 && i.tm.opcode_modifier.mnemonicsize != IGNORESIZE
6918 /* Explicit sizing prefixes are assumed to disambiguate insns. */
6919 && !i.prefix[DATA_PREFIX] && !(i.prefix[REX_PREFIX] & REX_W)
6920 /* Accept FLDENV et al without suffix. */
6921 && (i.tm.opcode_modifier.no_ssuf || i.tm.opcode_modifier.floatmf))
6922 {
6923 unsigned int suffixes, evex = 0;
6924
6925 suffixes = !i.tm.opcode_modifier.no_bsuf;
6926 if (!i.tm.opcode_modifier.no_wsuf)
6927 suffixes |= 1 << 1;
6928 if (!i.tm.opcode_modifier.no_lsuf)
6929 suffixes |= 1 << 2;
6930 if (!i.tm.opcode_modifier.no_ldsuf)
6931 suffixes |= 1 << 3;
6932 if (!i.tm.opcode_modifier.no_ssuf)
6933 suffixes |= 1 << 4;
6934 if (flag_code == CODE_64BIT && !i.tm.opcode_modifier.no_qsuf)
6935 suffixes |= 1 << 5;
6936
6937 /* For [XYZ]MMWORD operands inspect operand sizes. While generally
6938 also suitable for AT&T syntax mode, it was requested that this be
6939 restricted to just Intel syntax. */
6940 if (intel_syntax && is_any_vex_encoding (&i.tm) && !i.broadcast)
6941 {
6942 unsigned int op;
6943
6944 for (op = 0; op < i.tm.operands; ++op)
6945 {
6946 if (is_evex_encoding (&i.tm)
6947 && !cpu_arch_flags.bitfield.cpuavx512vl)
6948 {
6949 if (i.tm.operand_types[op].bitfield.ymmword)
6950 i.tm.operand_types[op].bitfield.xmmword = 0;
6951 if (i.tm.operand_types[op].bitfield.zmmword)
6952 i.tm.operand_types[op].bitfield.ymmword = 0;
6953 if (!i.tm.opcode_modifier.evex
6954 || i.tm.opcode_modifier.evex == EVEXDYN)
6955 i.tm.opcode_modifier.evex = EVEX512;
6956 }
6957
6958 if (i.tm.operand_types[op].bitfield.xmmword
6959 + i.tm.operand_types[op].bitfield.ymmword
6960 + i.tm.operand_types[op].bitfield.zmmword < 2)
6961 continue;
6962
6963 /* Any properly sized operand disambiguates the insn. */
6964 if (i.types[op].bitfield.xmmword
6965 || i.types[op].bitfield.ymmword
6966 || i.types[op].bitfield.zmmword)
6967 {
6968 suffixes &= ~(7 << 6);
6969 evex = 0;
6970 break;
6971 }
6972
6973 if ((i.flags[op] & Operand_Mem)
6974 && i.tm.operand_types[op].bitfield.unspecified)
6975 {
6976 if (i.tm.operand_types[op].bitfield.xmmword)
6977 suffixes |= 1 << 6;
6978 if (i.tm.operand_types[op].bitfield.ymmword)
6979 suffixes |= 1 << 7;
6980 if (i.tm.operand_types[op].bitfield.zmmword)
6981 suffixes |= 1 << 8;
6982 if (is_evex_encoding (&i.tm))
6983 evex = EVEX512;
6984 }
6985 }
6986 }
6987
6988 /* Are multiple suffixes / operand sizes allowed? */
6989 if (suffixes & (suffixes - 1))
6990 {
6991 if (intel_syntax
6992 && (i.tm.opcode_modifier.mnemonicsize != DEFAULTSIZE
6993 || operand_check == check_error))
6994 {
6995 as_bad (_("ambiguous operand size for `%s'"), i.tm.name);
6996 return 0;
6997 }
6998 if (operand_check == check_error)
6999 {
7000 as_bad (_("no instruction mnemonic suffix given and "
7001 "no register operands; can't size `%s'"), i.tm.name);
7002 return 0;
7003 }
7004 if (operand_check == check_warning)
7005 as_warn (_("%s; using default for `%s'"),
7006 intel_syntax
7007 ? _("ambiguous operand size")
7008 : _("no instruction mnemonic suffix given and "
7009 "no register operands"),
7010 i.tm.name);
7011
7012 if (i.tm.opcode_modifier.floatmf)
7013 i.suffix = SHORT_MNEM_SUFFIX;
7014 else if ((i.tm.base_opcode | 8) == 0xfbe
7015 || (i.tm.base_opcode == 0x63
7016 && i.tm.opcode_modifier.opcodespace == SPACE_BASE
7017 && i.tm.cpu_flags.bitfield.cpu64))
7018 /* handled below */;
7019 else if (evex)
7020 i.tm.opcode_modifier.evex = evex;
7021 else if (flag_code == CODE_16BIT)
7022 i.suffix = WORD_MNEM_SUFFIX;
7023 else if (!i.tm.opcode_modifier.no_lsuf)
7024 i.suffix = LONG_MNEM_SUFFIX;
7025 else
7026 i.suffix = QWORD_MNEM_SUFFIX;
7027 }
7028 }
7029
7030 if ((i.tm.base_opcode | 8) == 0xfbe
7031 || (i.tm.base_opcode == 0x63
7032 && i.tm.opcode_modifier.opcodespace == SPACE_BASE
7033 && i.tm.cpu_flags.bitfield.cpu64))
7034 {
7035 /* In Intel syntax, movsx/movzx must have a "suffix" (checked above).
7036 In AT&T syntax, if there is no suffix (warned about above), the default
7037 will be byte extension. */
7038 if (i.tm.opcode_modifier.w && i.suffix && i.suffix != BYTE_MNEM_SUFFIX)
7039 i.tm.base_opcode |= 1;
7040
7041 /* For further processing, the suffix should represent the destination
7042 (register). This is already the case when one was used with
7043 mov[sz][bw]*, but we need to replace it for mov[sz]x, or if there was
7044 no suffix to begin with. */
7045 if (i.tm.opcode_modifier.w || i.tm.base_opcode == 0x63 || !i.suffix)
7046 {
7047 if (i.types[1].bitfield.word)
7048 i.suffix = WORD_MNEM_SUFFIX;
7049 else if (i.types[1].bitfield.qword)
7050 i.suffix = QWORD_MNEM_SUFFIX;
7051 else
7052 i.suffix = LONG_MNEM_SUFFIX;
7053
7054 i.tm.opcode_modifier.w = 0;
7055 }
7056 }
7057
7058 if (!i.tm.opcode_modifier.modrm && i.reg_operands && i.tm.operands < 3)
7059 i.short_form = (i.tm.operand_types[0].bitfield.class == Reg)
7060 != (i.tm.operand_types[1].bitfield.class == Reg);
7061
7062 /* Change the opcode based on the operand size given by i.suffix. */
7063 switch (i.suffix)
7064 {
7065 /* Size floating point instruction. */
7066 case LONG_MNEM_SUFFIX:
7067 if (i.tm.opcode_modifier.floatmf)
7068 {
7069 i.tm.base_opcode ^= 4;
7070 break;
7071 }
7072 /* fall through */
7073 case WORD_MNEM_SUFFIX:
7074 case QWORD_MNEM_SUFFIX:
7075 /* It's not a byte, select word/dword operation. */
7076 if (i.tm.opcode_modifier.w)
7077 {
7078 if (i.short_form)
7079 i.tm.base_opcode |= 8;
7080 else
7081 i.tm.base_opcode |= 1;
7082 }
7083 /* fall through */
7084 case SHORT_MNEM_SUFFIX:
7085 /* Now select between word & dword operations via the operand
7086 size prefix, except for instructions that will ignore this
7087 prefix anyway. */
7088 if (i.suffix != QWORD_MNEM_SUFFIX
7089 && i.tm.opcode_modifier.mnemonicsize != IGNORESIZE
7090 && !i.tm.opcode_modifier.floatmf
7091 && !is_any_vex_encoding (&i.tm)
7092 && ((i.suffix == LONG_MNEM_SUFFIX) == (flag_code == CODE_16BIT)
7093 || (flag_code == CODE_64BIT
7094 && i.tm.opcode_modifier.jump == JUMP_BYTE)))
7095 {
7096 unsigned int prefix = DATA_PREFIX_OPCODE;
7097
7098 if (i.tm.opcode_modifier.jump == JUMP_BYTE) /* jcxz, loop */
7099 prefix = ADDR_PREFIX_OPCODE;
7100
7101 if (!add_prefix (prefix))
7102 return 0;
7103 }
7104
7105 /* Set mode64 for an operand. */
7106 if (i.suffix == QWORD_MNEM_SUFFIX
7107 && flag_code == CODE_64BIT
7108 && !i.tm.opcode_modifier.norex64
7109 && !i.tm.opcode_modifier.vexw
7110 /* Special case for xchg %rax,%rax. It is NOP and doesn't
7111 need rex64. */
7112 && ! (i.operands == 2
7113 && i.tm.base_opcode == 0x90
7114 && i.tm.extension_opcode == None
7115 && i.types[0].bitfield.instance == Accum
7116 && i.types[0].bitfield.qword
7117 && i.types[1].bitfield.instance == Accum
7118 && i.types[1].bitfield.qword))
7119 i.rex |= REX_W;
7120
7121 break;
7122
7123 case 0:
7124 /* Select word/dword/qword operation with explicit data sizing prefix
7125 when there are no suitable register operands. */
7126 if (i.tm.opcode_modifier.w
7127 && (i.prefix[DATA_PREFIX] || (i.prefix[REX_PREFIX] & REX_W))
7128 && (!i.reg_operands
7129 || (i.reg_operands == 1
7130 /* ShiftCount */
7131 && (i.tm.operand_types[0].bitfield.instance == RegC
7132 /* InOutPortReg */
7133 || i.tm.operand_types[0].bitfield.instance == RegD
7134 || i.tm.operand_types[1].bitfield.instance == RegD
7135 /* CRC32 */
7136 || is_crc32))))
7137 i.tm.base_opcode |= 1;
7138 break;
7139 }
7140
7141 if (i.tm.opcode_modifier.addrprefixopreg)
7142 {
7143 gas_assert (!i.suffix);
7144 gas_assert (i.reg_operands);
7145
7146 if (i.tm.operand_types[0].bitfield.instance == Accum
7147 || i.operands == 1)
7148 {
7149 /* The address size override prefix changes the size of the
7150 first operand. */
7151 if (flag_code == CODE_64BIT
7152 && i.op[0].regs->reg_type.bitfield.word)
7153 {
7154 as_bad (_("16-bit addressing unavailable for `%s'"),
7155 i.tm.name);
7156 return 0;
7157 }
7158
7159 if ((flag_code == CODE_32BIT
7160 ? i.op[0].regs->reg_type.bitfield.word
7161 : i.op[0].regs->reg_type.bitfield.dword)
7162 && !add_prefix (ADDR_PREFIX_OPCODE))
7163 return 0;
7164 }
7165 else
7166 {
7167 /* Check invalid register operand when the address size override
7168 prefix changes the size of register operands. */
7169 unsigned int op;
7170 enum { need_word, need_dword, need_qword } need;
7171
7172 /* Check the register operand for the address size prefix if
7173 the memory operand has no real registers, like symbol, DISP
7174 or bogus (x32-only) symbol(%rip) when symbol(%eip) is meant. */
7175 if (i.mem_operands == 1
7176 && i.reg_operands == 1
7177 && i.operands == 2
7178 && i.types[1].bitfield.class == Reg
7179 && (flag_code == CODE_32BIT
7180 ? i.op[1].regs->reg_type.bitfield.word
7181 : i.op[1].regs->reg_type.bitfield.dword)
7182 && ((i.base_reg == NULL && i.index_reg == NULL)
7183 #if defined (OBJ_MAYBE_ELF) || defined (OBJ_ELF)
7184 || (x86_elf_abi == X86_64_X32_ABI
7185 && i.base_reg
7186 && i.base_reg->reg_num == RegIP
7187 && i.base_reg->reg_type.bitfield.qword))
7188 #else
7189 || 0)
7190 #endif
7191 && !add_prefix (ADDR_PREFIX_OPCODE))
7192 return 0;
7193
7194 if (flag_code == CODE_32BIT)
7195 need = i.prefix[ADDR_PREFIX] ? need_word : need_dword;
7196 else if (i.prefix[ADDR_PREFIX])
7197 need = need_dword;
7198 else
7199 need = flag_code == CODE_64BIT ? need_qword : need_word;
7200
7201 for (op = 0; op < i.operands; op++)
7202 {
7203 if (i.types[op].bitfield.class != Reg)
7204 continue;
7205
7206 switch (need)
7207 {
7208 case need_word:
7209 if (i.op[op].regs->reg_type.bitfield.word)
7210 continue;
7211 break;
7212 case need_dword:
7213 if (i.op[op].regs->reg_type.bitfield.dword)
7214 continue;
7215 break;
7216 case need_qword:
7217 if (i.op[op].regs->reg_type.bitfield.qword)
7218 continue;
7219 break;
7220 }
7221
7222 as_bad (_("invalid register operand size for `%s'"),
7223 i.tm.name);
7224 return 0;
7225 }
7226 }
7227 }
7228
7229 return 1;
7230 }
7231
7232 static int
7233 check_byte_reg (void)
7234 {
7235 int op;
7236
7237 for (op = i.operands; --op >= 0;)
7238 {
7239 /* Skip non-register operands. */
7240 if (i.types[op].bitfield.class != Reg)
7241 continue;
7242
7243 /* If this is an eight bit register, it's OK. If it's the 16 or
7244 32 bit version of an eight bit register, we will just use the
7245 low portion, and that's OK too. */
7246 if (i.types[op].bitfield.byte)
7247 continue;
7248
7249 /* I/O port address operands are OK too. */
7250 if (i.tm.operand_types[op].bitfield.instance == RegD
7251 && i.tm.operand_types[op].bitfield.word)
7252 continue;
7253
7254 /* crc32 only wants its source operand checked here. */
7255 if (i.tm.base_opcode == 0xf38f0
7256 && i.tm.opcode_modifier.opcodeprefix == PREFIX_0XF2
7257 && op != 0)
7258 continue;
7259
7260 /* Any other register is bad. */
7261 as_bad (_("`%s%s' not allowed with `%s%c'"),
7262 register_prefix, i.op[op].regs->reg_name,
7263 i.tm.name, i.suffix);
7264 return 0;
7265 }
7266 return 1;
7267 }
7268
7269 static int
7270 check_long_reg (void)
7271 {
7272 int op;
7273
7274 for (op = i.operands; --op >= 0;)
7275 /* Skip non-register operands. */
7276 if (i.types[op].bitfield.class != Reg)
7277 continue;
7278 /* Reject eight bit registers, except where the template requires
7279 them. (eg. movzb) */
7280 else if (i.types[op].bitfield.byte
7281 && (i.tm.operand_types[op].bitfield.class == Reg
7282 || i.tm.operand_types[op].bitfield.instance == Accum)
7283 && (i.tm.operand_types[op].bitfield.word
7284 || i.tm.operand_types[op].bitfield.dword))
7285 {
7286 as_bad (_("`%s%s' not allowed with `%s%c'"),
7287 register_prefix,
7288 i.op[op].regs->reg_name,
7289 i.tm.name,
7290 i.suffix);
7291 return 0;
7292 }
7293 /* Error if the e prefix on a general reg is missing. */
7294 else if (i.types[op].bitfield.word
7295 && (i.tm.operand_types[op].bitfield.class == Reg
7296 || i.tm.operand_types[op].bitfield.instance == Accum)
7297 && i.tm.operand_types[op].bitfield.dword)
7298 {
7299 as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
7300 register_prefix, i.op[op].regs->reg_name,
7301 i.suffix);
7302 return 0;
7303 }
7304 /* Warn if the r prefix on a general reg is present. */
7305 else if (i.types[op].bitfield.qword
7306 && (i.tm.operand_types[op].bitfield.class == Reg
7307 || i.tm.operand_types[op].bitfield.instance == Accum)
7308 && i.tm.operand_types[op].bitfield.dword)
7309 {
7310 if (intel_syntax
7311 && i.tm.opcode_modifier.toqword
7312 && i.types[0].bitfield.class != RegSIMD)
7313 {
7314 /* Convert to QWORD. We want REX byte. */
7315 i.suffix = QWORD_MNEM_SUFFIX;
7316 }
7317 else
7318 {
7319 as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
7320 register_prefix, i.op[op].regs->reg_name,
7321 i.suffix);
7322 return 0;
7323 }
7324 }
7325 return 1;
7326 }
7327
7328 static int
7329 check_qword_reg (void)
7330 {
7331 int op;
7332
7333 for (op = i.operands; --op >= 0; )
7334 /* Skip non-register operands. */
7335 if (i.types[op].bitfield.class != Reg)
7336 continue;
7337 /* Reject eight bit registers, except where the template requires
7338 them. (eg. movzb) */
7339 else if (i.types[op].bitfield.byte
7340 && (i.tm.operand_types[op].bitfield.class == Reg
7341 || i.tm.operand_types[op].bitfield.instance == Accum)
7342 && (i.tm.operand_types[op].bitfield.word
7343 || i.tm.operand_types[op].bitfield.dword))
7344 {
7345 as_bad (_("`%s%s' not allowed with `%s%c'"),
7346 register_prefix,
7347 i.op[op].regs->reg_name,
7348 i.tm.name,
7349 i.suffix);
7350 return 0;
7351 }
7352 /* Warn if the r prefix on a general reg is missing. */
7353 else if ((i.types[op].bitfield.word
7354 || i.types[op].bitfield.dword)
7355 && (i.tm.operand_types[op].bitfield.class == Reg
7356 || i.tm.operand_types[op].bitfield.instance == Accum)
7357 && i.tm.operand_types[op].bitfield.qword)
7358 {
7359 /* Prohibit these changes in the 64bit mode, since the
7360 lowering is more complicated. */
7361 if (intel_syntax
7362 && i.tm.opcode_modifier.todword
7363 && i.types[0].bitfield.class != RegSIMD)
7364 {
7365 /* Convert to DWORD. We don't want REX byte. */
7366 i.suffix = LONG_MNEM_SUFFIX;
7367 }
7368 else
7369 {
7370 as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
7371 register_prefix, i.op[op].regs->reg_name,
7372 i.suffix);
7373 return 0;
7374 }
7375 }
7376 return 1;
7377 }
7378
7379 static int
7380 check_word_reg (void)
7381 {
7382 int op;
7383 for (op = i.operands; --op >= 0;)
7384 /* Skip non-register operands. */
7385 if (i.types[op].bitfield.class != Reg)
7386 continue;
7387 /* Reject eight bit registers, except where the template requires
7388 them. (eg. movzb) */
7389 else if (i.types[op].bitfield.byte
7390 && (i.tm.operand_types[op].bitfield.class == Reg
7391 || i.tm.operand_types[op].bitfield.instance == Accum)
7392 && (i.tm.operand_types[op].bitfield.word
7393 || i.tm.operand_types[op].bitfield.dword))
7394 {
7395 as_bad (_("`%s%s' not allowed with `%s%c'"),
7396 register_prefix,
7397 i.op[op].regs->reg_name,
7398 i.tm.name,
7399 i.suffix);
7400 return 0;
7401 }
7402 /* Error if the e or r prefix on a general reg is present. */
7403 else if ((i.types[op].bitfield.dword
7404 || i.types[op].bitfield.qword)
7405 && (i.tm.operand_types[op].bitfield.class == Reg
7406 || i.tm.operand_types[op].bitfield.instance == Accum)
7407 && i.tm.operand_types[op].bitfield.word)
7408 {
7409 as_bad (_("incorrect register `%s%s' used with `%c' suffix"),
7410 register_prefix, i.op[op].regs->reg_name,
7411 i.suffix);
7412 return 0;
7413 }
7414 return 1;
7415 }
7416
7417 static int
7418 update_imm (unsigned int j)
7419 {
7420 i386_operand_type overlap = i.types[j];
7421 if ((overlap.bitfield.imm8
7422 || overlap.bitfield.imm8s
7423 || overlap.bitfield.imm16
7424 || overlap.bitfield.imm32
7425 || overlap.bitfield.imm32s
7426 || overlap.bitfield.imm64)
7427 && !operand_type_equal (&overlap, &imm8)
7428 && !operand_type_equal (&overlap, &imm8s)
7429 && !operand_type_equal (&overlap, &imm16)
7430 && !operand_type_equal (&overlap, &imm32)
7431 && !operand_type_equal (&overlap, &imm32s)
7432 && !operand_type_equal (&overlap, &imm64))
7433 {
7434 if (i.suffix)
7435 {
7436 i386_operand_type temp;
7437
7438 operand_type_set (&temp, 0);
7439 if (i.suffix == BYTE_MNEM_SUFFIX)
7440 {
7441 temp.bitfield.imm8 = overlap.bitfield.imm8;
7442 temp.bitfield.imm8s = overlap.bitfield.imm8s;
7443 }
7444 else if (i.suffix == WORD_MNEM_SUFFIX)
7445 temp.bitfield.imm16 = overlap.bitfield.imm16;
7446 else if (i.suffix == QWORD_MNEM_SUFFIX)
7447 {
7448 temp.bitfield.imm64 = overlap.bitfield.imm64;
7449 temp.bitfield.imm32s = overlap.bitfield.imm32s;
7450 }
7451 else
7452 temp.bitfield.imm32 = overlap.bitfield.imm32;
7453 overlap = temp;
7454 }
7455 else if (operand_type_equal (&overlap, &imm16_32_32s)
7456 || operand_type_equal (&overlap, &imm16_32)
7457 || operand_type_equal (&overlap, &imm16_32s))
7458 {
7459 if ((flag_code == CODE_16BIT) ^ (i.prefix[DATA_PREFIX] != 0))
7460 overlap = imm16;
7461 else
7462 overlap = imm32s;
7463 }
7464 else if (i.prefix[REX_PREFIX] & REX_W)
7465 overlap = operand_type_and (overlap, imm32s);
7466 else if (i.prefix[DATA_PREFIX])
7467 overlap = operand_type_and (overlap,
7468 flag_code != CODE_16BIT ? imm16 : imm32);
7469 if (!operand_type_equal (&overlap, &imm8)
7470 && !operand_type_equal (&overlap, &imm8s)
7471 && !operand_type_equal (&overlap, &imm16)
7472 && !operand_type_equal (&overlap, &imm32)
7473 && !operand_type_equal (&overlap, &imm32s)
7474 && !operand_type_equal (&overlap, &imm64))
7475 {
7476 as_bad (_("no instruction mnemonic suffix given; "
7477 "can't determine immediate size"));
7478 return 0;
7479 }
7480 }
7481 i.types[j] = overlap;
7482
7483 return 1;
7484 }
7485
7486 static int
7487 finalize_imm (void)
7488 {
7489 unsigned int j, n;
7490
7491 /* Update the first 2 immediate operands. */
7492 n = i.operands > 2 ? 2 : i.operands;
7493 if (n)
7494 {
7495 for (j = 0; j < n; j++)
7496 if (update_imm (j) == 0)
7497 return 0;
7498
7499 /* The 3rd operand can't be immediate operand. */
7500 gas_assert (operand_type_check (i.types[2], imm) == 0);
7501 }
7502
7503 return 1;
7504 }
7505
7506 static int
7507 process_operands (void)
7508 {
7509 /* Default segment register this instruction will use for memory
7510 accesses. 0 means unknown. This is only for optimizing out
7511 unnecessary segment overrides. */
7512 const seg_entry *default_seg = 0;
7513
7514 if (i.tm.opcode_modifier.sse2avx)
7515 {
7516 /* Legacy encoded insns allow explicit REX prefixes, so these prefixes
7517 need converting. */
7518 i.rex |= i.prefix[REX_PREFIX] & (REX_W | REX_R | REX_X | REX_B);
7519 i.prefix[REX_PREFIX] = 0;
7520 i.rex_encoding = 0;
7521 }
7522 /* ImmExt should be processed after SSE2AVX. */
7523 else if (i.tm.opcode_modifier.immext)
7524 process_immext ();
7525
7526 if (i.tm.opcode_modifier.sse2avx && i.tm.opcode_modifier.vexvvvv)
7527 {
7528 unsigned int dupl = i.operands;
7529 unsigned int dest = dupl - 1;
7530 unsigned int j;
7531
7532 /* The destination must be an xmm register. */
7533 gas_assert (i.reg_operands
7534 && MAX_OPERANDS > dupl
7535 && operand_type_equal (&i.types[dest], &regxmm));
7536
7537 if (i.tm.operand_types[0].bitfield.instance == Accum
7538 && i.tm.operand_types[0].bitfield.xmmword)
7539 {
7540 if (i.tm.opcode_modifier.vexsources == VEX3SOURCES)
7541 {
7542 /* Keep xmm0 for instructions with VEX prefix and 3
7543 sources. */
7544 i.tm.operand_types[0].bitfield.instance = InstanceNone;
7545 i.tm.operand_types[0].bitfield.class = RegSIMD;
7546 goto duplicate;
7547 }
7548 else
7549 {
7550 /* We remove the first xmm0 and keep the number of
7551 operands unchanged, which in fact duplicates the
7552 destination. */
7553 for (j = 1; j < i.operands; j++)
7554 {
7555 i.op[j - 1] = i.op[j];
7556 i.types[j - 1] = i.types[j];
7557 i.tm.operand_types[j - 1] = i.tm.operand_types[j];
7558 i.flags[j - 1] = i.flags[j];
7559 }
7560 }
7561 }
7562 else if (i.tm.opcode_modifier.implicit1stxmm0)
7563 {
7564 gas_assert ((MAX_OPERANDS - 1) > dupl
7565 && (i.tm.opcode_modifier.vexsources
7566 == VEX3SOURCES));
7567
7568 /* Add the implicit xmm0 for instructions with VEX prefix
7569 and 3 sources. */
7570 for (j = i.operands; j > 0; j--)
7571 {
7572 i.op[j] = i.op[j - 1];
7573 i.types[j] = i.types[j - 1];
7574 i.tm.operand_types[j] = i.tm.operand_types[j - 1];
7575 i.flags[j] = i.flags[j - 1];
7576 }
7577 i.op[0].regs
7578 = (const reg_entry *) str_hash_find (reg_hash, "xmm0");
7579 i.types[0] = regxmm;
7580 i.tm.operand_types[0] = regxmm;
7581
7582 i.operands += 2;
7583 i.reg_operands += 2;
7584 i.tm.operands += 2;
7585
7586 dupl++;
7587 dest++;
7588 i.op[dupl] = i.op[dest];
7589 i.types[dupl] = i.types[dest];
7590 i.tm.operand_types[dupl] = i.tm.operand_types[dest];
7591 i.flags[dupl] = i.flags[dest];
7592 }
7593 else
7594 {
7595 duplicate:
7596 i.operands++;
7597 i.reg_operands++;
7598 i.tm.operands++;
7599
7600 i.op[dupl] = i.op[dest];
7601 i.types[dupl] = i.types[dest];
7602 i.tm.operand_types[dupl] = i.tm.operand_types[dest];
7603 i.flags[dupl] = i.flags[dest];
7604 }
7605
7606 if (i.tm.opcode_modifier.immext)
7607 process_immext ();
7608 }
7609 else if (i.tm.operand_types[0].bitfield.instance == Accum
7610 && i.tm.operand_types[0].bitfield.xmmword)
7611 {
7612 unsigned int j;
7613
7614 for (j = 1; j < i.operands; j++)
7615 {
7616 i.op[j - 1] = i.op[j];
7617 i.types[j - 1] = i.types[j];
7618
7619 /* We need to adjust fields in i.tm since they are used by
7620 build_modrm_byte. */
7621 i.tm.operand_types [j - 1] = i.tm.operand_types [j];
7622
7623 i.flags[j - 1] = i.flags[j];
7624 }
7625
7626 i.operands--;
7627 i.reg_operands--;
7628 i.tm.operands--;
7629 }
7630 else if (i.tm.opcode_modifier.implicitquadgroup)
7631 {
7632 unsigned int regnum, first_reg_in_group, last_reg_in_group;
7633
7634 /* The second operand must be {x,y,z}mmN, where N is a multiple of 4. */
7635 gas_assert (i.operands >= 2 && i.types[1].bitfield.class == RegSIMD);
7636 regnum = register_number (i.op[1].regs);
7637 first_reg_in_group = regnum & ~3;
7638 last_reg_in_group = first_reg_in_group + 3;
7639 if (regnum != first_reg_in_group)
7640 as_warn (_("source register `%s%s' implicitly denotes"
7641 " `%s%.3s%u' to `%s%.3s%u' source group in `%s'"),
7642 register_prefix, i.op[1].regs->reg_name,
7643 register_prefix, i.op[1].regs->reg_name, first_reg_in_group,
7644 register_prefix, i.op[1].regs->reg_name, last_reg_in_group,
7645 i.tm.name);
7646 }
7647 else if (i.tm.opcode_modifier.regkludge)
7648 {
7649 /* The imul $imm, %reg instruction is converted into
7650 imul $imm, %reg, %reg, and the clr %reg instruction
7651 is converted into xor %reg, %reg. */
7652
7653 unsigned int first_reg_op;
7654
7655 if (operand_type_check (i.types[0], reg))
7656 first_reg_op = 0;
7657 else
7658 first_reg_op = 1;
7659 /* Pretend we saw the extra register operand. */
7660 gas_assert (i.reg_operands == 1
7661 && i.op[first_reg_op + 1].regs == 0);
7662 i.op[first_reg_op + 1].regs = i.op[first_reg_op].regs;
7663 i.types[first_reg_op + 1] = i.types[first_reg_op];
7664 i.operands++;
7665 i.reg_operands++;
7666 }
7667
7668 if (i.tm.opcode_modifier.modrm)
7669 {
7670 /* The opcode is completed (modulo i.tm.extension_opcode which
7671 must be put into the modrm byte). Now, we make the modrm and
7672 index base bytes based on all the info we've collected. */
7673
7674 default_seg = build_modrm_byte ();
7675 }
7676 else if (i.types[0].bitfield.class == SReg)
7677 {
7678 if (flag_code != CODE_64BIT
7679 ? i.tm.base_opcode == POP_SEG_SHORT
7680 && i.op[0].regs->reg_num == 1
7681 : (i.tm.base_opcode | 1) == POP_SEG386_SHORT
7682 && i.op[0].regs->reg_num < 4)
7683 {
7684 as_bad (_("you can't `%s %s%s'"),
7685 i.tm.name, register_prefix, i.op[0].regs->reg_name);
7686 return 0;
7687 }
7688 if ( i.op[0].regs->reg_num > 3 && i.opcode_length == 1 )
7689 {
7690 i.tm.base_opcode ^= POP_SEG_SHORT ^ POP_SEG386_SHORT;
7691 i.opcode_length = 2;
7692 }
7693 i.tm.base_opcode |= (i.op[0].regs->reg_num << 3);
7694 }
7695 else if ((i.tm.base_opcode & ~0x3) == MOV_AX_DISP32)
7696 {
7697 default_seg = &ds;
7698 }
7699 else if (i.tm.opcode_modifier.isstring)
7700 {
7701 /* For the string instructions that allow a segment override
7702 on one of their operands, the default segment is ds. */
7703 default_seg = &ds;
7704 }
7705 else if (i.short_form)
7706 {
7707 /* The register or float register operand is in operand
7708 0 or 1. */
7709 unsigned int op = i.tm.operand_types[0].bitfield.class != Reg;
7710
7711 /* Register goes in low 3 bits of opcode. */
7712 i.tm.base_opcode |= i.op[op].regs->reg_num;
7713 if ((i.op[op].regs->reg_flags & RegRex) != 0)
7714 i.rex |= REX_B;
7715 if (!quiet_warnings && i.tm.opcode_modifier.ugh)
7716 {
7717 /* Warn about some common errors, but press on regardless.
7718 The first case can be generated by gcc (<= 2.8.1). */
7719 if (i.operands == 2)
7720 {
7721 /* Reversed arguments on faddp, fsubp, etc. */
7722 as_warn (_("translating to `%s %s%s,%s%s'"), i.tm.name,
7723 register_prefix, i.op[!intel_syntax].regs->reg_name,
7724 register_prefix, i.op[intel_syntax].regs->reg_name);
7725 }
7726 else
7727 {
7728 /* Extraneous `l' suffix on fp insn. */
7729 as_warn (_("translating to `%s %s%s'"), i.tm.name,
7730 register_prefix, i.op[0].regs->reg_name);
7731 }
7732 }
7733 }
7734
7735 if ((i.seg[0] || i.prefix[SEG_PREFIX])
7736 && i.tm.base_opcode == 0x8d /* lea */
7737 && i.tm.opcode_modifier.opcodespace == SPACE_BASE
7738 && !is_any_vex_encoding(&i.tm))
7739 {
7740 if (!quiet_warnings)
7741 as_warn (_("segment override on `%s' is ineffectual"), i.tm.name);
7742 if (optimize)
7743 {
7744 i.seg[0] = NULL;
7745 i.prefix[SEG_PREFIX] = 0;
7746 }
7747 }
7748
7749 /* If a segment was explicitly specified, and the specified segment
7750 is neither the default nor the one already recorded from a prefix,
7751 use an opcode prefix to select it. If we never figured out what
7752 the default segment is, then default_seg will be zero at this
7753 point, and the specified segment prefix will always be used. */
7754 if (i.seg[0]
7755 && i.seg[0] != default_seg
7756 && i.seg[0]->seg_prefix != i.prefix[SEG_PREFIX])
7757 {
7758 if (!add_prefix (i.seg[0]->seg_prefix))
7759 return 0;
7760 }
7761 return 1;
7762 }
7763
7764 static INLINE void set_rex_vrex (const reg_entry *r, unsigned int rex_bit,
7765 bfd_boolean do_sse2avx)
7766 {
7767 if (r->reg_flags & RegRex)
7768 {
7769 if (i.rex & rex_bit)
7770 as_bad (_("same type of prefix used twice"));
7771 i.rex |= rex_bit;
7772 }
7773 else if (do_sse2avx && (i.rex & rex_bit) && i.vex.register_specifier)
7774 {
7775 gas_assert (i.vex.register_specifier == r);
7776 i.vex.register_specifier += 8;
7777 }
7778
7779 if (r->reg_flags & RegVRex)
7780 i.vrex |= rex_bit;
7781 }
7782
7783 static const seg_entry *
7784 build_modrm_byte (void)
7785 {
7786 const seg_entry *default_seg = 0;
7787 unsigned int source, dest;
7788 int vex_3_sources;
7789
7790 vex_3_sources = i.tm.opcode_modifier.vexsources == VEX3SOURCES;
7791 if (vex_3_sources)
7792 {
7793 unsigned int nds, reg_slot;
7794 expressionS *exp;
7795
7796 dest = i.operands - 1;
7797 nds = dest - 1;
7798
7799 /* There are 2 kinds of instructions:
7800 1. 5 operands: 4 register operands or 3 register operands
7801 plus 1 memory operand plus one Imm4 operand, VexXDS, and
7802 VexW0 or VexW1. The destination must be either XMM, YMM or
7803 ZMM register.
7804 2. 4 operands: 4 register operands or 3 register operands
7805 plus 1 memory operand, with VexXDS. */
7806 gas_assert ((i.reg_operands == 4
7807 || (i.reg_operands == 3 && i.mem_operands == 1))
7808 && i.tm.opcode_modifier.vexvvvv == VEXXDS
7809 && i.tm.opcode_modifier.vexw
7810 && i.tm.operand_types[dest].bitfield.class == RegSIMD);
7811
7812 /* If VexW1 is set, the first non-immediate operand is the source and
7813 the second non-immediate one is encoded in the immediate operand. */
7814 if (i.tm.opcode_modifier.vexw == VEXW1)
7815 {
7816 source = i.imm_operands;
7817 reg_slot = i.imm_operands + 1;
7818 }
7819 else
7820 {
7821 source = i.imm_operands + 1;
7822 reg_slot = i.imm_operands;
7823 }
7824
7825 if (i.imm_operands == 0)
7826 {
7827 /* When there is no immediate operand, generate an 8bit
7828 immediate operand to encode the first operand. */
7829 exp = &im_expressions[i.imm_operands++];
7830 i.op[i.operands].imms = exp;
7831 i.types[i.operands] = imm8;
7832 i.operands++;
7833
7834 gas_assert (i.tm.operand_types[reg_slot].bitfield.class == RegSIMD);
7835 exp->X_op = O_constant;
7836 exp->X_add_number = register_number (i.op[reg_slot].regs) << 4;
7837 gas_assert ((i.op[reg_slot].regs->reg_flags & RegVRex) == 0);
7838 }
7839 else
7840 {
7841 gas_assert (i.imm_operands == 1);
7842 gas_assert (fits_in_imm4 (i.op[0].imms->X_add_number));
7843 gas_assert (!i.tm.opcode_modifier.immext);
7844
7845 /* Turn on Imm8 again so that output_imm will generate it. */
7846 i.types[0].bitfield.imm8 = 1;
7847
7848 gas_assert (i.tm.operand_types[reg_slot].bitfield.class == RegSIMD);
7849 i.op[0].imms->X_add_number
7850 |= register_number (i.op[reg_slot].regs) << 4;
7851 gas_assert ((i.op[reg_slot].regs->reg_flags & RegVRex) == 0);
7852 }
7853
7854 gas_assert (i.tm.operand_types[nds].bitfield.class == RegSIMD);
7855 i.vex.register_specifier = i.op[nds].regs;
7856 }
7857 else
7858 source = dest = 0;
7859
7860 /* i.reg_operands MUST be the number of real register operands;
7861 implicit registers do not count. If there are 3 register
7862 operands, it must be a instruction with VexNDS. For a
7863 instruction with VexNDD, the destination register is encoded
7864 in VEX prefix. If there are 4 register operands, it must be
7865 a instruction with VEX prefix and 3 sources. */
7866 if (i.mem_operands == 0
7867 && ((i.reg_operands == 2
7868 && i.tm.opcode_modifier.vexvvvv <= VEXXDS)
7869 || (i.reg_operands == 3
7870 && i.tm.opcode_modifier.vexvvvv == VEXXDS)
7871 || (i.reg_operands == 4 && vex_3_sources)))
7872 {
7873 switch (i.operands)
7874 {
7875 case 2:
7876 source = 0;
7877 break;
7878 case 3:
7879 /* When there are 3 operands, one of them may be immediate,
7880 which may be the first or the last operand. Otherwise,
7881 the first operand must be shift count register (cl) or it
7882 is an instruction with VexNDS. */
7883 gas_assert (i.imm_operands == 1
7884 || (i.imm_operands == 0
7885 && (i.tm.opcode_modifier.vexvvvv == VEXXDS
7886 || (i.types[0].bitfield.instance == RegC
7887 && i.types[0].bitfield.byte))));
7888 if (operand_type_check (i.types[0], imm)
7889 || (i.types[0].bitfield.instance == RegC
7890 && i.types[0].bitfield.byte))
7891 source = 1;
7892 else
7893 source = 0;
7894 break;
7895 case 4:
7896 /* When there are 4 operands, the first two must be 8bit
7897 immediate operands. The source operand will be the 3rd
7898 one.
7899
7900 For instructions with VexNDS, if the first operand
7901 an imm8, the source operand is the 2nd one. If the last
7902 operand is imm8, the source operand is the first one. */
7903 gas_assert ((i.imm_operands == 2
7904 && i.types[0].bitfield.imm8
7905 && i.types[1].bitfield.imm8)
7906 || (i.tm.opcode_modifier.vexvvvv == VEXXDS
7907 && i.imm_operands == 1
7908 && (i.types[0].bitfield.imm8
7909 || i.types[i.operands - 1].bitfield.imm8
7910 || i.rounding)));
7911 if (i.imm_operands == 2)
7912 source = 2;
7913 else
7914 {
7915 if (i.types[0].bitfield.imm8)
7916 source = 1;
7917 else
7918 source = 0;
7919 }
7920 break;
7921 case 5:
7922 if (is_evex_encoding (&i.tm))
7923 {
7924 /* For EVEX instructions, when there are 5 operands, the
7925 first one must be immediate operand. If the second one
7926 is immediate operand, the source operand is the 3th
7927 one. If the last one is immediate operand, the source
7928 operand is the 2nd one. */
7929 gas_assert (i.imm_operands == 2
7930 && i.tm.opcode_modifier.sae
7931 && operand_type_check (i.types[0], imm));
7932 if (operand_type_check (i.types[1], imm))
7933 source = 2;
7934 else if (operand_type_check (i.types[4], imm))
7935 source = 1;
7936 else
7937 abort ();
7938 }
7939 break;
7940 default:
7941 abort ();
7942 }
7943
7944 if (!vex_3_sources)
7945 {
7946 dest = source + 1;
7947
7948 /* RC/SAE operand could be between DEST and SRC. That happens
7949 when one operand is GPR and the other one is XMM/YMM/ZMM
7950 register. */
7951 if (i.rounding && i.rounding->operand == (int) dest)
7952 dest++;
7953
7954 if (i.tm.opcode_modifier.vexvvvv == VEXXDS)
7955 {
7956 /* For instructions with VexNDS, the register-only source
7957 operand must be a 32/64bit integer, XMM, YMM, ZMM, or mask
7958 register. It is encoded in VEX prefix. */
7959
7960 i386_operand_type op;
7961 unsigned int vvvv;
7962
7963 /* Swap two source operands if needed. */
7964 if (i.tm.opcode_modifier.swapsources)
7965 {
7966 vvvv = source;
7967 source = dest;
7968 }
7969 else
7970 vvvv = dest;
7971
7972 op = i.tm.operand_types[vvvv];
7973 if ((dest + 1) >= i.operands
7974 || ((op.bitfield.class != Reg
7975 || (!op.bitfield.dword && !op.bitfield.qword))
7976 && op.bitfield.class != RegSIMD
7977 && !operand_type_equal (&op, &regmask)))
7978 abort ();
7979 i.vex.register_specifier = i.op[vvvv].regs;
7980 dest++;
7981 }
7982 }
7983
7984 i.rm.mode = 3;
7985 /* One of the register operands will be encoded in the i.rm.reg
7986 field, the other in the combined i.rm.mode and i.rm.regmem
7987 fields. If no form of this instruction supports a memory
7988 destination operand, then we assume the source operand may
7989 sometimes be a memory operand and so we need to store the
7990 destination in the i.rm.reg field. */
7991 if (!i.tm.opcode_modifier.regmem
7992 && operand_type_check (i.tm.operand_types[dest], anymem) == 0)
7993 {
7994 i.rm.reg = i.op[dest].regs->reg_num;
7995 i.rm.regmem = i.op[source].regs->reg_num;
7996 set_rex_vrex (i.op[dest].regs, REX_R, i.tm.opcode_modifier.sse2avx);
7997 set_rex_vrex (i.op[source].regs, REX_B, FALSE);
7998 }
7999 else
8000 {
8001 i.rm.reg = i.op[source].regs->reg_num;
8002 i.rm.regmem = i.op[dest].regs->reg_num;
8003 set_rex_vrex (i.op[dest].regs, REX_B, i.tm.opcode_modifier.sse2avx);
8004 set_rex_vrex (i.op[source].regs, REX_R, FALSE);
8005 }
8006 if (flag_code != CODE_64BIT && (i.rex & REX_R))
8007 {
8008 if (i.types[!i.tm.opcode_modifier.regmem].bitfield.class != RegCR)
8009 abort ();
8010 i.rex &= ~REX_R;
8011 add_prefix (LOCK_PREFIX_OPCODE);
8012 }
8013 }
8014 else
8015 { /* If it's not 2 reg operands... */
8016 unsigned int mem;
8017
8018 if (i.mem_operands)
8019 {
8020 unsigned int fake_zero_displacement = 0;
8021 unsigned int op;
8022
8023 for (op = 0; op < i.operands; op++)
8024 if (i.flags[op] & Operand_Mem)
8025 break;
8026 gas_assert (op < i.operands);
8027
8028 if (i.tm.opcode_modifier.sib)
8029 {
8030 /* The index register of VSIB shouldn't be RegIZ. */
8031 if (i.tm.opcode_modifier.sib != SIBMEM
8032 && i.index_reg->reg_num == RegIZ)
8033 abort ();
8034
8035 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
8036 if (!i.base_reg)
8037 {
8038 i.sib.base = NO_BASE_REGISTER;
8039 i.sib.scale = i.log2_scale_factor;
8040 i.types[op].bitfield.disp8 = 0;
8041 i.types[op].bitfield.disp16 = 0;
8042 i.types[op].bitfield.disp64 = 0;
8043 if (flag_code != CODE_64BIT || i.prefix[ADDR_PREFIX])
8044 {
8045 /* Must be 32 bit */
8046 i.types[op].bitfield.disp32 = 1;
8047 i.types[op].bitfield.disp32s = 0;
8048 }
8049 else
8050 {
8051 i.types[op].bitfield.disp32 = 0;
8052 i.types[op].bitfield.disp32s = 1;
8053 }
8054 }
8055
8056 /* Since the mandatory SIB always has index register, so
8057 the code logic remains unchanged. The non-mandatory SIB
8058 without index register is allowed and will be handled
8059 later. */
8060 if (i.index_reg)
8061 {
8062 if (i.index_reg->reg_num == RegIZ)
8063 i.sib.index = NO_INDEX_REGISTER;
8064 else
8065 i.sib.index = i.index_reg->reg_num;
8066 set_rex_vrex (i.index_reg, REX_X, FALSE);
8067 }
8068 }
8069
8070 default_seg = &ds;
8071
8072 if (i.base_reg == 0)
8073 {
8074 i.rm.mode = 0;
8075 if (!i.disp_operands)
8076 fake_zero_displacement = 1;
8077 if (i.index_reg == 0)
8078 {
8079 i386_operand_type newdisp;
8080
8081 /* Both check for VSIB and mandatory non-vector SIB. */
8082 gas_assert (!i.tm.opcode_modifier.sib
8083 || i.tm.opcode_modifier.sib == SIBMEM);
8084 /* Operand is just <disp> */
8085 if (flag_code == CODE_64BIT)
8086 {
8087 /* 64bit mode overwrites the 32bit absolute
8088 addressing by RIP relative addressing and
8089 absolute addressing is encoded by one of the
8090 redundant SIB forms. */
8091 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
8092 i.sib.base = NO_BASE_REGISTER;
8093 i.sib.index = NO_INDEX_REGISTER;
8094 newdisp = (!i.prefix[ADDR_PREFIX] ? disp32s : disp32);
8095 }
8096 else if ((flag_code == CODE_16BIT)
8097 ^ (i.prefix[ADDR_PREFIX] != 0))
8098 {
8099 i.rm.regmem = NO_BASE_REGISTER_16;
8100 newdisp = disp16;
8101 }
8102 else
8103 {
8104 i.rm.regmem = NO_BASE_REGISTER;
8105 newdisp = disp32;
8106 }
8107 i.types[op] = operand_type_and_not (i.types[op], anydisp);
8108 i.types[op] = operand_type_or (i.types[op], newdisp);
8109 }
8110 else if (!i.tm.opcode_modifier.sib)
8111 {
8112 /* !i.base_reg && i.index_reg */
8113 if (i.index_reg->reg_num == RegIZ)
8114 i.sib.index = NO_INDEX_REGISTER;
8115 else
8116 i.sib.index = i.index_reg->reg_num;
8117 i.sib.base = NO_BASE_REGISTER;
8118 i.sib.scale = i.log2_scale_factor;
8119 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
8120 i.types[op].bitfield.disp8 = 0;
8121 i.types[op].bitfield.disp16 = 0;
8122 i.types[op].bitfield.disp64 = 0;
8123 if (flag_code != CODE_64BIT || i.prefix[ADDR_PREFIX])
8124 {
8125 /* Must be 32 bit */
8126 i.types[op].bitfield.disp32 = 1;
8127 i.types[op].bitfield.disp32s = 0;
8128 }
8129 else
8130 {
8131 i.types[op].bitfield.disp32 = 0;
8132 i.types[op].bitfield.disp32s = 1;
8133 }
8134 if ((i.index_reg->reg_flags & RegRex) != 0)
8135 i.rex |= REX_X;
8136 }
8137 }
8138 /* RIP addressing for 64bit mode. */
8139 else if (i.base_reg->reg_num == RegIP)
8140 {
8141 gas_assert (!i.tm.opcode_modifier.sib);
8142 i.rm.regmem = NO_BASE_REGISTER;
8143 i.types[op].bitfield.disp8 = 0;
8144 i.types[op].bitfield.disp16 = 0;
8145 i.types[op].bitfield.disp32 = 0;
8146 i.types[op].bitfield.disp32s = 1;
8147 i.types[op].bitfield.disp64 = 0;
8148 i.flags[op] |= Operand_PCrel;
8149 if (! i.disp_operands)
8150 fake_zero_displacement = 1;
8151 }
8152 else if (i.base_reg->reg_type.bitfield.word)
8153 {
8154 gas_assert (!i.tm.opcode_modifier.sib);
8155 switch (i.base_reg->reg_num)
8156 {
8157 case 3: /* (%bx) */
8158 if (i.index_reg == 0)
8159 i.rm.regmem = 7;
8160 else /* (%bx,%si) -> 0, or (%bx,%di) -> 1 */
8161 i.rm.regmem = i.index_reg->reg_num - 6;
8162 break;
8163 case 5: /* (%bp) */
8164 default_seg = &ss;
8165 if (i.index_reg == 0)
8166 {
8167 i.rm.regmem = 6;
8168 if (operand_type_check (i.types[op], disp) == 0)
8169 {
8170 /* fake (%bp) into 0(%bp) */
8171 if (i.disp_encoding == disp_encoding_16bit)
8172 i.types[op].bitfield.disp16 = 1;
8173 else
8174 i.types[op].bitfield.disp8 = 1;
8175 fake_zero_displacement = 1;
8176 }
8177 }
8178 else /* (%bp,%si) -> 2, or (%bp,%di) -> 3 */
8179 i.rm.regmem = i.index_reg->reg_num - 6 + 2;
8180 break;
8181 default: /* (%si) -> 4 or (%di) -> 5 */
8182 i.rm.regmem = i.base_reg->reg_num - 6 + 4;
8183 }
8184 if (!fake_zero_displacement
8185 && !i.disp_operands
8186 && i.disp_encoding)
8187 {
8188 fake_zero_displacement = 1;
8189 if (i.disp_encoding == disp_encoding_8bit)
8190 i.types[op].bitfield.disp8 = 1;
8191 else
8192 i.types[op].bitfield.disp16 = 1;
8193 }
8194 i.rm.mode = mode_from_disp_size (i.types[op]);
8195 }
8196 else /* i.base_reg and 32/64 bit mode */
8197 {
8198 if (flag_code == CODE_64BIT
8199 && operand_type_check (i.types[op], disp))
8200 {
8201 i.types[op].bitfield.disp16 = 0;
8202 i.types[op].bitfield.disp64 = 0;
8203 if (i.prefix[ADDR_PREFIX] == 0)
8204 {
8205 i.types[op].bitfield.disp32 = 0;
8206 i.types[op].bitfield.disp32s = 1;
8207 }
8208 else
8209 {
8210 i.types[op].bitfield.disp32 = 1;
8211 i.types[op].bitfield.disp32s = 0;
8212 }
8213 }
8214
8215 if (!i.tm.opcode_modifier.sib)
8216 i.rm.regmem = i.base_reg->reg_num;
8217 if ((i.base_reg->reg_flags & RegRex) != 0)
8218 i.rex |= REX_B;
8219 i.sib.base = i.base_reg->reg_num;
8220 /* x86-64 ignores REX prefix bit here to avoid decoder
8221 complications. */
8222 if (!(i.base_reg->reg_flags & RegRex)
8223 && (i.base_reg->reg_num == EBP_REG_NUM
8224 || i.base_reg->reg_num == ESP_REG_NUM))
8225 default_seg = &ss;
8226 if (i.base_reg->reg_num == 5 && i.disp_operands == 0)
8227 {
8228 fake_zero_displacement = 1;
8229 if (i.disp_encoding == disp_encoding_32bit)
8230 i.types[op].bitfield.disp32 = 1;
8231 else
8232 i.types[op].bitfield.disp8 = 1;
8233 }
8234 i.sib.scale = i.log2_scale_factor;
8235 if (i.index_reg == 0)
8236 {
8237 /* Only check for VSIB. */
8238 gas_assert (i.tm.opcode_modifier.sib != VECSIB128
8239 && i.tm.opcode_modifier.sib != VECSIB256
8240 && i.tm.opcode_modifier.sib != VECSIB512);
8241
8242 /* <disp>(%esp) becomes two byte modrm with no index
8243 register. We've already stored the code for esp
8244 in i.rm.regmem ie. ESCAPE_TO_TWO_BYTE_ADDRESSING.
8245 Any base register besides %esp will not use the
8246 extra modrm byte. */
8247 i.sib.index = NO_INDEX_REGISTER;
8248 }
8249 else if (!i.tm.opcode_modifier.sib)
8250 {
8251 if (i.index_reg->reg_num == RegIZ)
8252 i.sib.index = NO_INDEX_REGISTER;
8253 else
8254 i.sib.index = i.index_reg->reg_num;
8255 i.rm.regmem = ESCAPE_TO_TWO_BYTE_ADDRESSING;
8256 if ((i.index_reg->reg_flags & RegRex) != 0)
8257 i.rex |= REX_X;
8258 }
8259
8260 if (i.disp_operands
8261 && (i.reloc[op] == BFD_RELOC_386_TLS_DESC_CALL
8262 || i.reloc[op] == BFD_RELOC_X86_64_TLSDESC_CALL))
8263 i.rm.mode = 0;
8264 else
8265 {
8266 if (!fake_zero_displacement
8267 && !i.disp_operands
8268 && i.disp_encoding)
8269 {
8270 fake_zero_displacement = 1;
8271 if (i.disp_encoding == disp_encoding_8bit)
8272 i.types[op].bitfield.disp8 = 1;
8273 else
8274 i.types[op].bitfield.disp32 = 1;
8275 }
8276 i.rm.mode = mode_from_disp_size (i.types[op]);
8277 }
8278 }
8279
8280 if (fake_zero_displacement)
8281 {
8282 /* Fakes a zero displacement assuming that i.types[op]
8283 holds the correct displacement size. */
8284 expressionS *exp;
8285
8286 gas_assert (i.op[op].disps == 0);
8287 exp = &disp_expressions[i.disp_operands++];
8288 i.op[op].disps = exp;
8289 exp->X_op = O_constant;
8290 exp->X_add_number = 0;
8291 exp->X_add_symbol = (symbolS *) 0;
8292 exp->X_op_symbol = (symbolS *) 0;
8293 }
8294
8295 mem = op;
8296 }
8297 else
8298 mem = ~0;
8299
8300 if (i.tm.opcode_modifier.vexsources == XOP2SOURCES)
8301 {
8302 if (operand_type_check (i.types[0], imm))
8303 i.vex.register_specifier = NULL;
8304 else
8305 {
8306 /* VEX.vvvv encodes one of the sources when the first
8307 operand is not an immediate. */
8308 if (i.tm.opcode_modifier.vexw == VEXW0)
8309 i.vex.register_specifier = i.op[0].regs;
8310 else
8311 i.vex.register_specifier = i.op[1].regs;
8312 }
8313
8314 /* Destination is a XMM register encoded in the ModRM.reg
8315 and VEX.R bit. */
8316 i.rm.reg = i.op[2].regs->reg_num;
8317 if ((i.op[2].regs->reg_flags & RegRex) != 0)
8318 i.rex |= REX_R;
8319
8320 /* ModRM.rm and VEX.B encodes the other source. */
8321 if (!i.mem_operands)
8322 {
8323 i.rm.mode = 3;
8324
8325 if (i.tm.opcode_modifier.vexw == VEXW0)
8326 i.rm.regmem = i.op[1].regs->reg_num;
8327 else
8328 i.rm.regmem = i.op[0].regs->reg_num;
8329
8330 if ((i.op[1].regs->reg_flags & RegRex) != 0)
8331 i.rex |= REX_B;
8332 }
8333 }
8334 else if (i.tm.opcode_modifier.vexvvvv == VEXLWP)
8335 {
8336 i.vex.register_specifier = i.op[2].regs;
8337 if (!i.mem_operands)
8338 {
8339 i.rm.mode = 3;
8340 i.rm.regmem = i.op[1].regs->reg_num;
8341 if ((i.op[1].regs->reg_flags & RegRex) != 0)
8342 i.rex |= REX_B;
8343 }
8344 }
8345 /* Fill in i.rm.reg or i.rm.regmem field with register operand
8346 (if any) based on i.tm.extension_opcode. Again, we must be
8347 careful to make sure that segment/control/debug/test/MMX
8348 registers are coded into the i.rm.reg field. */
8349 else if (i.reg_operands)
8350 {
8351 unsigned int op;
8352 unsigned int vex_reg = ~0;
8353
8354 for (op = 0; op < i.operands; op++)
8355 if (i.types[op].bitfield.class == Reg
8356 || i.types[op].bitfield.class == RegBND
8357 || i.types[op].bitfield.class == RegMask
8358 || i.types[op].bitfield.class == SReg
8359 || i.types[op].bitfield.class == RegCR
8360 || i.types[op].bitfield.class == RegDR
8361 || i.types[op].bitfield.class == RegTR
8362 || i.types[op].bitfield.class == RegSIMD
8363 || i.types[op].bitfield.class == RegMMX)
8364 break;
8365
8366 if (vex_3_sources)
8367 op = dest;
8368 else if (i.tm.opcode_modifier.vexvvvv == VEXXDS)
8369 {
8370 /* For instructions with VexNDS, the register-only
8371 source operand is encoded in VEX prefix. */
8372 gas_assert (mem != (unsigned int) ~0);
8373
8374 if (op > mem)
8375 {
8376 vex_reg = op++;
8377 gas_assert (op < i.operands);
8378 }
8379 else
8380 {
8381 /* Check register-only source operand when two source
8382 operands are swapped. */
8383 if (!i.tm.operand_types[op].bitfield.baseindex
8384 && i.tm.operand_types[op + 1].bitfield.baseindex)
8385 {
8386 vex_reg = op;
8387 op += 2;
8388 gas_assert (mem == (vex_reg + 1)
8389 && op < i.operands);
8390 }
8391 else
8392 {
8393 vex_reg = op + 1;
8394 gas_assert (vex_reg < i.operands);
8395 }
8396 }
8397 }
8398 else if (i.tm.opcode_modifier.vexvvvv == VEXNDD)
8399 {
8400 /* For instructions with VexNDD, the register destination
8401 is encoded in VEX prefix. */
8402 if (i.mem_operands == 0)
8403 {
8404 /* There is no memory operand. */
8405 gas_assert ((op + 2) == i.operands);
8406 vex_reg = op + 1;
8407 }
8408 else
8409 {
8410 /* There are only 2 non-immediate operands. */
8411 gas_assert (op < i.imm_operands + 2
8412 && i.operands == i.imm_operands + 2);
8413 vex_reg = i.imm_operands + 1;
8414 }
8415 }
8416 else
8417 gas_assert (op < i.operands);
8418
8419 if (vex_reg != (unsigned int) ~0)
8420 {
8421 i386_operand_type *type = &i.tm.operand_types[vex_reg];
8422
8423 if ((type->bitfield.class != Reg
8424 || (!type->bitfield.dword && !type->bitfield.qword))
8425 && type->bitfield.class != RegSIMD
8426 && !operand_type_equal (type, &regmask))
8427 abort ();
8428
8429 i.vex.register_specifier = i.op[vex_reg].regs;
8430 }
8431
8432 /* Don't set OP operand twice. */
8433 if (vex_reg != op)
8434 {
8435 /* If there is an extension opcode to put here, the
8436 register number must be put into the regmem field. */
8437 if (i.tm.extension_opcode != None)
8438 {
8439 i.rm.regmem = i.op[op].regs->reg_num;
8440 set_rex_vrex (i.op[op].regs, REX_B,
8441 i.tm.opcode_modifier.sse2avx);
8442 }
8443 else
8444 {
8445 i.rm.reg = i.op[op].regs->reg_num;
8446 set_rex_vrex (i.op[op].regs, REX_R,
8447 i.tm.opcode_modifier.sse2avx);
8448 }
8449 }
8450
8451 /* Now, if no memory operand has set i.rm.mode = 0, 1, 2 we
8452 must set it to 3 to indicate this is a register operand
8453 in the regmem field. */
8454 if (!i.mem_operands)
8455 i.rm.mode = 3;
8456 }
8457
8458 /* Fill in i.rm.reg field with extension opcode (if any). */
8459 if (i.tm.extension_opcode != None)
8460 i.rm.reg = i.tm.extension_opcode;
8461 }
8462 return default_seg;
8463 }
8464
8465 static INLINE void
8466 frag_opcode_byte (unsigned char byte)
8467 {
8468 if (now_seg != absolute_section)
8469 FRAG_APPEND_1_CHAR (byte);
8470 else
8471 ++abs_section_offset;
8472 }
8473
8474 static unsigned int
8475 flip_code16 (unsigned int code16)
8476 {
8477 gas_assert (i.tm.operands == 1);
8478
8479 return !(i.prefix[REX_PREFIX] & REX_W)
8480 && (code16 ? i.tm.operand_types[0].bitfield.disp32
8481 || i.tm.operand_types[0].bitfield.disp32s
8482 : i.tm.operand_types[0].bitfield.disp16)
8483 ? CODE16 : 0;
8484 }
8485
8486 static void
8487 output_branch (void)
8488 {
8489 char *p;
8490 int size;
8491 int code16;
8492 int prefix;
8493 relax_substateT subtype;
8494 symbolS *sym;
8495 offsetT off;
8496
8497 if (now_seg == absolute_section)
8498 {
8499 as_bad (_("relaxable branches not supported in absolute section"));
8500 return;
8501 }
8502
8503 code16 = flag_code == CODE_16BIT ? CODE16 : 0;
8504 size = i.disp_encoding == disp_encoding_32bit ? BIG : SMALL;
8505
8506 prefix = 0;
8507 if (i.prefix[DATA_PREFIX] != 0)
8508 {
8509 prefix = 1;
8510 i.prefixes -= 1;
8511 code16 ^= flip_code16(code16);
8512 }
8513 /* Pentium4 branch hints. */
8514 if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE /* not taken */
8515 || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE /* taken */)
8516 {
8517 prefix++;
8518 i.prefixes--;
8519 }
8520 if (i.prefix[REX_PREFIX] != 0)
8521 {
8522 prefix++;
8523 i.prefixes--;
8524 }
8525
8526 /* BND prefixed jump. */
8527 if (i.prefix[BND_PREFIX] != 0)
8528 {
8529 prefix++;
8530 i.prefixes--;
8531 }
8532
8533 if (i.prefixes != 0)
8534 as_warn (_("skipping prefixes on `%s'"), i.tm.name);
8535
8536 /* It's always a symbol; End frag & setup for relax.
8537 Make sure there is enough room in this frag for the largest
8538 instruction we may generate in md_convert_frag. This is 2
8539 bytes for the opcode and room for the prefix and largest
8540 displacement. */
8541 frag_grow (prefix + 2 + 4);
8542 /* Prefix and 1 opcode byte go in fr_fix. */
8543 p = frag_more (prefix + 1);
8544 if (i.prefix[DATA_PREFIX] != 0)
8545 *p++ = DATA_PREFIX_OPCODE;
8546 if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE
8547 || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE)
8548 *p++ = i.prefix[SEG_PREFIX];
8549 if (i.prefix[BND_PREFIX] != 0)
8550 *p++ = BND_PREFIX_OPCODE;
8551 if (i.prefix[REX_PREFIX] != 0)
8552 *p++ = i.prefix[REX_PREFIX];
8553 *p = i.tm.base_opcode;
8554
8555 if ((unsigned char) *p == JUMP_PC_RELATIVE)
8556 subtype = ENCODE_RELAX_STATE (UNCOND_JUMP, size);
8557 else if (cpu_arch_flags.bitfield.cpui386)
8558 subtype = ENCODE_RELAX_STATE (COND_JUMP, size);
8559 else
8560 subtype = ENCODE_RELAX_STATE (COND_JUMP86, size);
8561 subtype |= code16;
8562
8563 sym = i.op[0].disps->X_add_symbol;
8564 off = i.op[0].disps->X_add_number;
8565
8566 if (i.op[0].disps->X_op != O_constant
8567 && i.op[0].disps->X_op != O_symbol)
8568 {
8569 /* Handle complex expressions. */
8570 sym = make_expr_symbol (i.op[0].disps);
8571 off = 0;
8572 }
8573
8574 /* 1 possible extra opcode + 4 byte displacement go in var part.
8575 Pass reloc in fr_var. */
8576 frag_var (rs_machine_dependent, 5, i.reloc[0], subtype, sym, off, p);
8577 }
8578
8579 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
8580 /* Return TRUE iff PLT32 relocation should be used for branching to
8581 symbol S. */
8582
8583 static bfd_boolean
8584 need_plt32_p (symbolS *s)
8585 {
8586 /* PLT32 relocation is ELF only. */
8587 if (!IS_ELF)
8588 return FALSE;
8589
8590 #ifdef TE_SOLARIS
8591 /* Don't emit PLT32 relocation on Solaris: neither native linker nor
8592 krtld support it. */
8593 return FALSE;
8594 #endif
8595
8596 /* Since there is no need to prepare for PLT branch on x86-64, we
8597 can generate R_X86_64_PLT32, instead of R_X86_64_PC32, which can
8598 be used as a marker for 32-bit PC-relative branches. */
8599 if (!object_64bit)
8600 return FALSE;
8601
8602 if (s == NULL)
8603 return FALSE;
8604
8605 /* Weak or undefined symbol need PLT32 relocation. */
8606 if (S_IS_WEAK (s) || !S_IS_DEFINED (s))
8607 return TRUE;
8608
8609 /* Non-global symbol doesn't need PLT32 relocation. */
8610 if (! S_IS_EXTERNAL (s))
8611 return FALSE;
8612
8613 /* Other global symbols need PLT32 relocation. NB: Symbol with
8614 non-default visibilities are treated as normal global symbol
8615 so that PLT32 relocation can be used as a marker for 32-bit
8616 PC-relative branches. It is useful for linker relaxation. */
8617 return TRUE;
8618 }
8619 #endif
8620
8621 static void
8622 output_jump (void)
8623 {
8624 char *p;
8625 int size;
8626 fixS *fixP;
8627 bfd_reloc_code_real_type jump_reloc = i.reloc[0];
8628
8629 if (i.tm.opcode_modifier.jump == JUMP_BYTE)
8630 {
8631 /* This is a loop or jecxz type instruction. */
8632 size = 1;
8633 if (i.prefix[ADDR_PREFIX] != 0)
8634 {
8635 frag_opcode_byte (ADDR_PREFIX_OPCODE);
8636 i.prefixes -= 1;
8637 }
8638 /* Pentium4 branch hints. */
8639 if (i.prefix[SEG_PREFIX] == CS_PREFIX_OPCODE /* not taken */
8640 || i.prefix[SEG_PREFIX] == DS_PREFIX_OPCODE /* taken */)
8641 {
8642 frag_opcode_byte (i.prefix[SEG_PREFIX]);
8643 i.prefixes--;
8644 }
8645 }
8646 else
8647 {
8648 int code16;
8649
8650 code16 = 0;
8651 if (flag_code == CODE_16BIT)
8652 code16 = CODE16;
8653
8654 if (i.prefix[DATA_PREFIX] != 0)
8655 {
8656 frag_opcode_byte (DATA_PREFIX_OPCODE);
8657 i.prefixes -= 1;
8658 code16 ^= flip_code16(code16);
8659 }
8660
8661 size = 4;
8662 if (code16)
8663 size = 2;
8664 }
8665
8666 /* BND prefixed jump. */
8667 if (i.prefix[BND_PREFIX] != 0)
8668 {
8669 frag_opcode_byte (i.prefix[BND_PREFIX]);
8670 i.prefixes -= 1;
8671 }
8672
8673 if (i.prefix[REX_PREFIX] != 0)
8674 {
8675 frag_opcode_byte (i.prefix[REX_PREFIX]);
8676 i.prefixes -= 1;
8677 }
8678
8679 if (i.prefixes != 0)
8680 as_warn (_("skipping prefixes on `%s'"), i.tm.name);
8681
8682 if (now_seg == absolute_section)
8683 {
8684 abs_section_offset += i.opcode_length + size;
8685 return;
8686 }
8687
8688 p = frag_more (i.opcode_length + size);
8689 switch (i.opcode_length)
8690 {
8691 case 2:
8692 *p++ = i.tm.base_opcode >> 8;
8693 /* Fall through. */
8694 case 1:
8695 *p++ = i.tm.base_opcode;
8696 break;
8697 default:
8698 abort ();
8699 }
8700
8701 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
8702 if (size == 4
8703 && jump_reloc == NO_RELOC
8704 && need_plt32_p (i.op[0].disps->X_add_symbol))
8705 jump_reloc = BFD_RELOC_X86_64_PLT32;
8706 #endif
8707
8708 jump_reloc = reloc (size, 1, 1, jump_reloc);
8709
8710 fixP = fix_new_exp (frag_now, p - frag_now->fr_literal, size,
8711 i.op[0].disps, 1, jump_reloc);
8712
8713 /* All jumps handled here are signed, but don't use a signed limit
8714 check for 32 and 16 bit jumps as we want to allow wrap around at
8715 4G and 64k respectively. */
8716 if (size == 1)
8717 fixP->fx_signed = 1;
8718 }
8719
8720 static void
8721 output_interseg_jump (void)
8722 {
8723 char *p;
8724 int size;
8725 int prefix;
8726 int code16;
8727
8728 code16 = 0;
8729 if (flag_code == CODE_16BIT)
8730 code16 = CODE16;
8731
8732 prefix = 0;
8733 if (i.prefix[DATA_PREFIX] != 0)
8734 {
8735 prefix = 1;
8736 i.prefixes -= 1;
8737 code16 ^= CODE16;
8738 }
8739
8740 gas_assert (!i.prefix[REX_PREFIX]);
8741
8742 size = 4;
8743 if (code16)
8744 size = 2;
8745
8746 if (i.prefixes != 0)
8747 as_warn (_("skipping prefixes on `%s'"), i.tm.name);
8748
8749 if (now_seg == absolute_section)
8750 {
8751 abs_section_offset += prefix + 1 + 2 + size;
8752 return;
8753 }
8754
8755 /* 1 opcode; 2 segment; offset */
8756 p = frag_more (prefix + 1 + 2 + size);
8757
8758 if (i.prefix[DATA_PREFIX] != 0)
8759 *p++ = DATA_PREFIX_OPCODE;
8760
8761 if (i.prefix[REX_PREFIX] != 0)
8762 *p++ = i.prefix[REX_PREFIX];
8763
8764 *p++ = i.tm.base_opcode;
8765 if (i.op[1].imms->X_op == O_constant)
8766 {
8767 offsetT n = i.op[1].imms->X_add_number;
8768
8769 if (size == 2
8770 && !fits_in_unsigned_word (n)
8771 && !fits_in_signed_word (n))
8772 {
8773 as_bad (_("16-bit jump out of range"));
8774 return;
8775 }
8776 md_number_to_chars (p, n, size);
8777 }
8778 else
8779 fix_new_exp (frag_now, p - frag_now->fr_literal, size,
8780 i.op[1].imms, 0, reloc (size, 0, 0, i.reloc[1]));
8781
8782 p += size;
8783 if (i.op[0].imms->X_op == O_constant)
8784 md_number_to_chars (p, (valueT) i.op[0].imms->X_add_number, 2);
8785 else
8786 fix_new_exp (frag_now, p - frag_now->fr_literal, 2,
8787 i.op[0].imms, 0, reloc (2, 0, 0, i.reloc[0]));
8788 }
8789
8790 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
8791 void
8792 x86_cleanup (void)
8793 {
8794 char *p;
8795 asection *seg = now_seg;
8796 subsegT subseg = now_subseg;
8797 asection *sec;
8798 unsigned int alignment, align_size_1;
8799 unsigned int isa_1_descsz, feature_2_descsz, descsz;
8800 unsigned int isa_1_descsz_raw, feature_2_descsz_raw;
8801 unsigned int padding;
8802
8803 if (!IS_ELF || !x86_used_note)
8804 return;
8805
8806 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_X86;
8807
8808 /* The .note.gnu.property section layout:
8809
8810 Field Length Contents
8811 ---- ---- ----
8812 n_namsz 4 4
8813 n_descsz 4 The note descriptor size
8814 n_type 4 NT_GNU_PROPERTY_TYPE_0
8815 n_name 4 "GNU"
8816 n_desc n_descsz The program property array
8817 .... .... ....
8818 */
8819
8820 /* Create the .note.gnu.property section. */
8821 sec = subseg_new (NOTE_GNU_PROPERTY_SECTION_NAME, 0);
8822 bfd_set_section_flags (sec,
8823 (SEC_ALLOC
8824 | SEC_LOAD
8825 | SEC_DATA
8826 | SEC_HAS_CONTENTS
8827 | SEC_READONLY));
8828
8829 if (get_elf_backend_data (stdoutput)->s->elfclass == ELFCLASS64)
8830 {
8831 align_size_1 = 7;
8832 alignment = 3;
8833 }
8834 else
8835 {
8836 align_size_1 = 3;
8837 alignment = 2;
8838 }
8839
8840 bfd_set_section_alignment (sec, alignment);
8841 elf_section_type (sec) = SHT_NOTE;
8842
8843 /* GNU_PROPERTY_X86_ISA_1_USED: 4-byte type + 4-byte data size
8844 + 4-byte data */
8845 isa_1_descsz_raw = 4 + 4 + 4;
8846 /* Align GNU_PROPERTY_X86_ISA_1_USED. */
8847 isa_1_descsz = (isa_1_descsz_raw + align_size_1) & ~align_size_1;
8848
8849 feature_2_descsz_raw = isa_1_descsz;
8850 /* GNU_PROPERTY_X86_FEATURE_2_USED: 4-byte type + 4-byte data size
8851 + 4-byte data */
8852 feature_2_descsz_raw += 4 + 4 + 4;
8853 /* Align GNU_PROPERTY_X86_FEATURE_2_USED. */
8854 feature_2_descsz = ((feature_2_descsz_raw + align_size_1)
8855 & ~align_size_1);
8856
8857 descsz = feature_2_descsz;
8858 /* Section size: n_namsz + n_descsz + n_type + n_name + n_descsz. */
8859 p = frag_more (4 + 4 + 4 + 4 + descsz);
8860
8861 /* Write n_namsz. */
8862 md_number_to_chars (p, (valueT) 4, 4);
8863
8864 /* Write n_descsz. */
8865 md_number_to_chars (p + 4, (valueT) descsz, 4);
8866
8867 /* Write n_type. */
8868 md_number_to_chars (p + 4 * 2, (valueT) NT_GNU_PROPERTY_TYPE_0, 4);
8869
8870 /* Write n_name. */
8871 memcpy (p + 4 * 3, "GNU", 4);
8872
8873 /* Write 4-byte type. */
8874 md_number_to_chars (p + 4 * 4,
8875 (valueT) GNU_PROPERTY_X86_ISA_1_USED, 4);
8876
8877 /* Write 4-byte data size. */
8878 md_number_to_chars (p + 4 * 5, (valueT) 4, 4);
8879
8880 /* Write 4-byte data. */
8881 md_number_to_chars (p + 4 * 6, (valueT) x86_isa_1_used, 4);
8882
8883 /* Zero out paddings. */
8884 padding = isa_1_descsz - isa_1_descsz_raw;
8885 if (padding)
8886 memset (p + 4 * 7, 0, padding);
8887
8888 /* Write 4-byte type. */
8889 md_number_to_chars (p + isa_1_descsz + 4 * 4,
8890 (valueT) GNU_PROPERTY_X86_FEATURE_2_USED, 4);
8891
8892 /* Write 4-byte data size. */
8893 md_number_to_chars (p + isa_1_descsz + 4 * 5, (valueT) 4, 4);
8894
8895 /* Write 4-byte data. */
8896 md_number_to_chars (p + isa_1_descsz + 4 * 6,
8897 (valueT) x86_feature_2_used, 4);
8898
8899 /* Zero out paddings. */
8900 padding = feature_2_descsz - feature_2_descsz_raw;
8901 if (padding)
8902 memset (p + isa_1_descsz + 4 * 7, 0, padding);
8903
8904 /* We probably can't restore the current segment, for there likely
8905 isn't one yet... */
8906 if (seg && subseg)
8907 subseg_set (seg, subseg);
8908 }
8909 #endif
8910
8911 static unsigned int
8912 encoding_length (const fragS *start_frag, offsetT start_off,
8913 const char *frag_now_ptr)
8914 {
8915 unsigned int len = 0;
8916
8917 if (start_frag != frag_now)
8918 {
8919 const fragS *fr = start_frag;
8920
8921 do {
8922 len += fr->fr_fix;
8923 fr = fr->fr_next;
8924 } while (fr && fr != frag_now);
8925 }
8926
8927 return len - start_off + (frag_now_ptr - frag_now->fr_literal);
8928 }
8929
8930 /* Return 1 for test, and, cmp, add, sub, inc and dec which may
8931 be macro-fused with conditional jumps.
8932 NB: If TEST/AND/CMP/ADD/SUB/INC/DEC is of RIP relative address,
8933 or is one of the following format:
8934
8935 cmp m, imm
8936 add m, imm
8937 sub m, imm
8938 test m, imm
8939 and m, imm
8940 inc m
8941 dec m
8942
8943 it is unfusible. */
8944
8945 static int
8946 maybe_fused_with_jcc_p (enum mf_cmp_kind* mf_cmp_p)
8947 {
8948 /* No RIP address. */
8949 if (i.base_reg && i.base_reg->reg_num == RegIP)
8950 return 0;
8951
8952 /* No VEX/EVEX encoding. */
8953 if (is_any_vex_encoding (&i.tm))
8954 return 0;
8955
8956 /* add, sub without add/sub m, imm. */
8957 if (i.tm.base_opcode <= 5
8958 || (i.tm.base_opcode >= 0x28 && i.tm.base_opcode <= 0x2d)
8959 || ((i.tm.base_opcode | 3) == 0x83
8960 && (i.tm.extension_opcode == 0x5
8961 || i.tm.extension_opcode == 0x0)))
8962 {
8963 *mf_cmp_p = mf_cmp_alu_cmp;
8964 return !(i.mem_operands && i.imm_operands);
8965 }
8966
8967 /* and without and m, imm. */
8968 if ((i.tm.base_opcode >= 0x20 && i.tm.base_opcode <= 0x25)
8969 || ((i.tm.base_opcode | 3) == 0x83
8970 && i.tm.extension_opcode == 0x4))
8971 {
8972 *mf_cmp_p = mf_cmp_test_and;
8973 return !(i.mem_operands && i.imm_operands);
8974 }
8975
8976 /* test without test m imm. */
8977 if ((i.tm.base_opcode | 1) == 0x85
8978 || (i.tm.base_opcode | 1) == 0xa9
8979 || ((i.tm.base_opcode | 1) == 0xf7
8980 && i.tm.extension_opcode == 0))
8981 {
8982 *mf_cmp_p = mf_cmp_test_and;
8983 return !(i.mem_operands && i.imm_operands);
8984 }
8985
8986 /* cmp without cmp m, imm. */
8987 if ((i.tm.base_opcode >= 0x38 && i.tm.base_opcode <= 0x3d)
8988 || ((i.tm.base_opcode | 3) == 0x83
8989 && (i.tm.extension_opcode == 0x7)))
8990 {
8991 *mf_cmp_p = mf_cmp_alu_cmp;
8992 return !(i.mem_operands && i.imm_operands);
8993 }
8994
8995 /* inc, dec without inc/dec m. */
8996 if ((i.tm.cpu_flags.bitfield.cpuno64
8997 && (i.tm.base_opcode | 0xf) == 0x4f)
8998 || ((i.tm.base_opcode | 1) == 0xff
8999 && i.tm.extension_opcode <= 0x1))
9000 {
9001 *mf_cmp_p = mf_cmp_incdec;
9002 return !i.mem_operands;
9003 }
9004
9005 return 0;
9006 }
9007
9008 /* Return 1 if a FUSED_JCC_PADDING frag should be generated. */
9009
9010 static int
9011 add_fused_jcc_padding_frag_p (enum mf_cmp_kind* mf_cmp_p)
9012 {
9013 /* NB: Don't work with COND_JUMP86 without i386. */
9014 if (!align_branch_power
9015 || now_seg == absolute_section
9016 || !cpu_arch_flags.bitfield.cpui386
9017 || !(align_branch & align_branch_fused_bit))
9018 return 0;
9019
9020 if (maybe_fused_with_jcc_p (mf_cmp_p))
9021 {
9022 if (last_insn.kind == last_insn_other
9023 || last_insn.seg != now_seg)
9024 return 1;
9025 if (flag_debug)
9026 as_warn_where (last_insn.file, last_insn.line,
9027 _("`%s` skips -malign-branch-boundary on `%s`"),
9028 last_insn.name, i.tm.name);
9029 }
9030
9031 return 0;
9032 }
9033
9034 /* Return 1 if a BRANCH_PREFIX frag should be generated. */
9035
9036 static int
9037 add_branch_prefix_frag_p (void)
9038 {
9039 /* NB: Don't work with COND_JUMP86 without i386. Don't add prefix
9040 to PadLock instructions since they include prefixes in opcode. */
9041 if (!align_branch_power
9042 || !align_branch_prefix_size
9043 || now_seg == absolute_section
9044 || i.tm.cpu_flags.bitfield.cpupadlock
9045 || !cpu_arch_flags.bitfield.cpui386)
9046 return 0;
9047
9048 /* Don't add prefix if it is a prefix or there is no operand in case
9049 that segment prefix is special. */
9050 if (!i.operands || i.tm.opcode_modifier.isprefix)
9051 return 0;
9052
9053 if (last_insn.kind == last_insn_other
9054 || last_insn.seg != now_seg)
9055 return 1;
9056
9057 if (flag_debug)
9058 as_warn_where (last_insn.file, last_insn.line,
9059 _("`%s` skips -malign-branch-boundary on `%s`"),
9060 last_insn.name, i.tm.name);
9061
9062 return 0;
9063 }
9064
9065 /* Return 1 if a BRANCH_PADDING frag should be generated. */
9066
9067 static int
9068 add_branch_padding_frag_p (enum align_branch_kind *branch_p,
9069 enum mf_jcc_kind *mf_jcc_p)
9070 {
9071 int add_padding;
9072
9073 /* NB: Don't work with COND_JUMP86 without i386. */
9074 if (!align_branch_power
9075 || now_seg == absolute_section
9076 || !cpu_arch_flags.bitfield.cpui386)
9077 return 0;
9078
9079 add_padding = 0;
9080
9081 /* Check for jcc and direct jmp. */
9082 if (i.tm.opcode_modifier.jump == JUMP)
9083 {
9084 if (i.tm.base_opcode == JUMP_PC_RELATIVE)
9085 {
9086 *branch_p = align_branch_jmp;
9087 add_padding = align_branch & align_branch_jmp_bit;
9088 }
9089 else
9090 {
9091 /* Because J<cc> and JN<cc> share same group in macro-fusible table,
9092 igore the lowest bit. */
9093 *mf_jcc_p = (i.tm.base_opcode & 0x0e) >> 1;
9094 *branch_p = align_branch_jcc;
9095 if ((align_branch & align_branch_jcc_bit))
9096 add_padding = 1;
9097 }
9098 }
9099 else if (is_any_vex_encoding (&i.tm))
9100 return 0;
9101 else if ((i.tm.base_opcode | 1) == 0xc3)
9102 {
9103 /* Near ret. */
9104 *branch_p = align_branch_ret;
9105 if ((align_branch & align_branch_ret_bit))
9106 add_padding = 1;
9107 }
9108 else
9109 {
9110 /* Check for indirect jmp, direct and indirect calls. */
9111 if (i.tm.base_opcode == 0xe8)
9112 {
9113 /* Direct call. */
9114 *branch_p = align_branch_call;
9115 if ((align_branch & align_branch_call_bit))
9116 add_padding = 1;
9117 }
9118 else if (i.tm.base_opcode == 0xff
9119 && (i.tm.extension_opcode == 2
9120 || i.tm.extension_opcode == 4))
9121 {
9122 /* Indirect call and jmp. */
9123 *branch_p = align_branch_indirect;
9124 if ((align_branch & align_branch_indirect_bit))
9125 add_padding = 1;
9126 }
9127
9128 if (add_padding
9129 && i.disp_operands
9130 && tls_get_addr
9131 && (i.op[0].disps->X_op == O_symbol
9132 || (i.op[0].disps->X_op == O_subtract
9133 && i.op[0].disps->X_op_symbol == GOT_symbol)))
9134 {
9135 symbolS *s = i.op[0].disps->X_add_symbol;
9136 /* No padding to call to global or undefined tls_get_addr. */
9137 if ((S_IS_EXTERNAL (s) || !S_IS_DEFINED (s))
9138 && strcmp (S_GET_NAME (s), tls_get_addr) == 0)
9139 return 0;
9140 }
9141 }
9142
9143 if (add_padding
9144 && last_insn.kind != last_insn_other
9145 && last_insn.seg == now_seg)
9146 {
9147 if (flag_debug)
9148 as_warn_where (last_insn.file, last_insn.line,
9149 _("`%s` skips -malign-branch-boundary on `%s`"),
9150 last_insn.name, i.tm.name);
9151 return 0;
9152 }
9153
9154 return add_padding;
9155 }
9156
9157 static void
9158 output_insn (void)
9159 {
9160 fragS *insn_start_frag;
9161 offsetT insn_start_off;
9162 fragS *fragP = NULL;
9163 enum align_branch_kind branch = align_branch_none;
9164 /* The initializer is arbitrary just to avoid uninitialized error.
9165 it's actually either assigned in add_branch_padding_frag_p
9166 or never be used. */
9167 enum mf_jcc_kind mf_jcc = mf_jcc_jo;
9168
9169 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
9170 if (IS_ELF && x86_used_note && now_seg != absolute_section)
9171 {
9172 if ((i.xstate & xstate_tmm) == xstate_tmm
9173 || i.tm.cpu_flags.bitfield.cpuamx_tile)
9174 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_TMM;
9175
9176 if (i.tm.cpu_flags.bitfield.cpu8087
9177 || i.tm.cpu_flags.bitfield.cpu287
9178 || i.tm.cpu_flags.bitfield.cpu387
9179 || i.tm.cpu_flags.bitfield.cpu687
9180 || i.tm.cpu_flags.bitfield.cpufisttp)
9181 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_X87;
9182
9183 if ((i.xstate & xstate_mmx)
9184 || i.tm.base_opcode == 0xf77 /* emms */
9185 || i.tm.base_opcode == 0xf0e /* femms */)
9186 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_MMX;
9187
9188 if (i.index_reg)
9189 {
9190 if (i.index_reg->reg_type.bitfield.zmmword)
9191 i.xstate |= xstate_zmm;
9192 else if (i.index_reg->reg_type.bitfield.ymmword)
9193 i.xstate |= xstate_ymm;
9194 else if (i.index_reg->reg_type.bitfield.xmmword)
9195 i.xstate |= xstate_xmm;
9196 }
9197
9198 /* vzeroall / vzeroupper */
9199 if (i.tm.base_opcode == 0x77 && i.tm.cpu_flags.bitfield.cpuavx)
9200 i.xstate |= xstate_ymm;
9201
9202 if ((i.xstate & xstate_xmm)
9203 /* ldmxcsr / stmxcsr */
9204 || (i.tm.base_opcode == 0xfae && i.tm.cpu_flags.bitfield.cpusse)
9205 /* vldmxcsr / vstmxcsr */
9206 || (i.tm.base_opcode == 0xae && i.tm.cpu_flags.bitfield.cpuavx)
9207 || i.tm.cpu_flags.bitfield.cpuwidekl
9208 || i.tm.cpu_flags.bitfield.cpukl)
9209 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XMM;
9210
9211 if ((i.xstate & xstate_ymm) == xstate_ymm)
9212 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_YMM;
9213 if ((i.xstate & xstate_zmm) == xstate_zmm)
9214 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_ZMM;
9215 if (i.mask || (i.xstate & xstate_mask) == xstate_mask)
9216 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_MASK;
9217 if (i.tm.cpu_flags.bitfield.cpufxsr)
9218 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_FXSR;
9219 if (i.tm.cpu_flags.bitfield.cpuxsave)
9220 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XSAVE;
9221 if (i.tm.cpu_flags.bitfield.cpuxsaveopt)
9222 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XSAVEOPT;
9223 if (i.tm.cpu_flags.bitfield.cpuxsavec)
9224 x86_feature_2_used |= GNU_PROPERTY_X86_FEATURE_2_XSAVEC;
9225
9226 if (x86_feature_2_used
9227 || i.tm.cpu_flags.bitfield.cpucmov
9228 || i.tm.cpu_flags.bitfield.cpusyscall
9229 || (i.tm.base_opcode == 0xfc7
9230 && i.tm.opcode_modifier.opcodeprefix == PREFIX_NONE
9231 && i.tm.extension_opcode == 1) /* cmpxchg8b */)
9232 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_BASELINE;
9233 if (i.tm.cpu_flags.bitfield.cpusse3
9234 || i.tm.cpu_flags.bitfield.cpussse3
9235 || i.tm.cpu_flags.bitfield.cpusse4_1
9236 || i.tm.cpu_flags.bitfield.cpusse4_2
9237 || i.tm.cpu_flags.bitfield.cpucx16
9238 || i.tm.cpu_flags.bitfield.cpupopcnt
9239 /* LAHF-SAHF insns in 64-bit mode. */
9240 || (flag_code == CODE_64BIT
9241 && (i.tm.base_opcode | 1) == 0x9f
9242 && i.tm.opcode_modifier.opcodespace == SPACE_BASE))
9243 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_V2;
9244 if (i.tm.cpu_flags.bitfield.cpuavx
9245 || i.tm.cpu_flags.bitfield.cpuavx2
9246 /* Any VEX encoded insns execpt for CpuAVX512F, CpuAVX512BW,
9247 CpuAVX512DQ, LPW, TBM and AMX. */
9248 || (i.tm.opcode_modifier.vex
9249 && !i.tm.cpu_flags.bitfield.cpuavx512f
9250 && !i.tm.cpu_flags.bitfield.cpuavx512bw
9251 && !i.tm.cpu_flags.bitfield.cpuavx512dq
9252 && !i.tm.cpu_flags.bitfield.cpulwp
9253 && !i.tm.cpu_flags.bitfield.cputbm
9254 && !(x86_feature_2_used & GNU_PROPERTY_X86_FEATURE_2_TMM))
9255 || i.tm.cpu_flags.bitfield.cpuf16c
9256 || i.tm.cpu_flags.bitfield.cpufma
9257 || i.tm.cpu_flags.bitfield.cpulzcnt
9258 || i.tm.cpu_flags.bitfield.cpumovbe
9259 || i.tm.cpu_flags.bitfield.cpuxsaves
9260 || (x86_feature_2_used
9261 & (GNU_PROPERTY_X86_FEATURE_2_XSAVE
9262 | GNU_PROPERTY_X86_FEATURE_2_XSAVEOPT
9263 | GNU_PROPERTY_X86_FEATURE_2_XSAVEC)) != 0)
9264 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_V3;
9265 if (i.tm.cpu_flags.bitfield.cpuavx512f
9266 || i.tm.cpu_flags.bitfield.cpuavx512bw
9267 || i.tm.cpu_flags.bitfield.cpuavx512dq
9268 || i.tm.cpu_flags.bitfield.cpuavx512vl
9269 /* Any EVEX encoded insns except for AVX512ER, AVX512PF and
9270 VNNIW. */
9271 || (i.tm.opcode_modifier.evex
9272 && !i.tm.cpu_flags.bitfield.cpuavx512er
9273 && !i.tm.cpu_flags.bitfield.cpuavx512pf
9274 && !i.tm.cpu_flags.bitfield.cpuavx512_4vnniw))
9275 x86_isa_1_used |= GNU_PROPERTY_X86_ISA_1_V4;
9276 }
9277 #endif
9278
9279 /* Tie dwarf2 debug info to the address at the start of the insn.
9280 We can't do this after the insn has been output as the current
9281 frag may have been closed off. eg. by frag_var. */
9282 dwarf2_emit_insn (0);
9283
9284 insn_start_frag = frag_now;
9285 insn_start_off = frag_now_fix ();
9286
9287 if (add_branch_padding_frag_p (&branch, &mf_jcc))
9288 {
9289 char *p;
9290 /* Branch can be 8 bytes. Leave some room for prefixes. */
9291 unsigned int max_branch_padding_size = 14;
9292
9293 /* Align section to boundary. */
9294 record_alignment (now_seg, align_branch_power);
9295
9296 /* Make room for padding. */
9297 frag_grow (max_branch_padding_size);
9298
9299 /* Start of the padding. */
9300 p = frag_more (0);
9301
9302 fragP = frag_now;
9303
9304 frag_var (rs_machine_dependent, max_branch_padding_size, 0,
9305 ENCODE_RELAX_STATE (BRANCH_PADDING, 0),
9306 NULL, 0, p);
9307
9308 fragP->tc_frag_data.mf_type = mf_jcc;
9309 fragP->tc_frag_data.branch_type = branch;
9310 fragP->tc_frag_data.max_bytes = max_branch_padding_size;
9311 }
9312
9313 /* Output jumps. */
9314 if (i.tm.opcode_modifier.jump == JUMP)
9315 output_branch ();
9316 else if (i.tm.opcode_modifier.jump == JUMP_BYTE
9317 || i.tm.opcode_modifier.jump == JUMP_DWORD)
9318 output_jump ();
9319 else if (i.tm.opcode_modifier.jump == JUMP_INTERSEGMENT)
9320 output_interseg_jump ();
9321 else
9322 {
9323 /* Output normal instructions here. */
9324 char *p;
9325 unsigned char *q;
9326 unsigned int j;
9327 enum mf_cmp_kind mf_cmp;
9328
9329 if (avoid_fence
9330 && (i.tm.base_opcode == 0xfaee8
9331 || i.tm.base_opcode == 0xfaef0
9332 || i.tm.base_opcode == 0xfaef8))
9333 {
9334 /* Encode lfence, mfence, and sfence as
9335 f0 83 04 24 00 lock addl $0x0, (%{re}sp). */
9336 if (now_seg != absolute_section)
9337 {
9338 offsetT val = 0x240483f0ULL;
9339
9340 p = frag_more (5);
9341 md_number_to_chars (p, val, 5);
9342 }
9343 else
9344 abs_section_offset += 5;
9345 return;
9346 }
9347
9348 /* Some processors fail on LOCK prefix. This options makes
9349 assembler ignore LOCK prefix and serves as a workaround. */
9350 if (omit_lock_prefix)
9351 {
9352 if (i.tm.base_opcode == LOCK_PREFIX_OPCODE
9353 && i.tm.opcode_modifier.isprefix)
9354 return;
9355 i.prefix[LOCK_PREFIX] = 0;
9356 }
9357
9358 if (branch)
9359 /* Skip if this is a branch. */
9360 ;
9361 else if (add_fused_jcc_padding_frag_p (&mf_cmp))
9362 {
9363 /* Make room for padding. */
9364 frag_grow (MAX_FUSED_JCC_PADDING_SIZE);
9365 p = frag_more (0);
9366
9367 fragP = frag_now;
9368
9369 frag_var (rs_machine_dependent, MAX_FUSED_JCC_PADDING_SIZE, 0,
9370 ENCODE_RELAX_STATE (FUSED_JCC_PADDING, 0),
9371 NULL, 0, p);
9372
9373 fragP->tc_frag_data.mf_type = mf_cmp;
9374 fragP->tc_frag_data.branch_type = align_branch_fused;
9375 fragP->tc_frag_data.max_bytes = MAX_FUSED_JCC_PADDING_SIZE;
9376 }
9377 else if (add_branch_prefix_frag_p ())
9378 {
9379 unsigned int max_prefix_size = align_branch_prefix_size;
9380
9381 /* Make room for padding. */
9382 frag_grow (max_prefix_size);
9383 p = frag_more (0);
9384
9385 fragP = frag_now;
9386
9387 frag_var (rs_machine_dependent, max_prefix_size, 0,
9388 ENCODE_RELAX_STATE (BRANCH_PREFIX, 0),
9389 NULL, 0, p);
9390
9391 fragP->tc_frag_data.max_bytes = max_prefix_size;
9392 }
9393
9394 /* Since the VEX/EVEX prefix contains the implicit prefix, we
9395 don't need the explicit prefix. */
9396 if (!i.tm.opcode_modifier.vex && !i.tm.opcode_modifier.evex)
9397 {
9398 switch (i.tm.opcode_modifier.opcodeprefix)
9399 {
9400 case PREFIX_0X66:
9401 add_prefix (0x66);
9402 break;
9403 case PREFIX_0XF2:
9404 add_prefix (0xf2);
9405 break;
9406 case PREFIX_0XF3:
9407 if (!i.tm.cpu_flags.bitfield.cpupadlock
9408 || (i.prefix[REP_PREFIX] != 0xf3))
9409 add_prefix (0xf3);
9410 break;
9411 case PREFIX_NONE:
9412 switch (i.opcode_length)
9413 {
9414 case 3:
9415 case 2:
9416 break;
9417 case 1:
9418 /* Check for pseudo prefixes. */
9419 if (!i.tm.opcode_modifier.isprefix || i.tm.base_opcode)
9420 break;
9421 as_bad_where (insn_start_frag->fr_file,
9422 insn_start_frag->fr_line,
9423 _("pseudo prefix without instruction"));
9424 return;
9425 default:
9426 abort ();
9427 }
9428 break;
9429 default:
9430 abort ();
9431 }
9432
9433 #if defined (OBJ_MAYBE_ELF) || defined (OBJ_ELF)
9434 /* For x32, add a dummy REX_OPCODE prefix for mov/add with
9435 R_X86_64_GOTTPOFF relocation so that linker can safely
9436 perform IE->LE optimization. A dummy REX_OPCODE prefix
9437 is also needed for lea with R_X86_64_GOTPC32_TLSDESC
9438 relocation for GDesc -> IE/LE optimization. */
9439 if (x86_elf_abi == X86_64_X32_ABI
9440 && i.operands == 2
9441 && (i.reloc[0] == BFD_RELOC_X86_64_GOTTPOFF
9442 || i.reloc[0] == BFD_RELOC_X86_64_GOTPC32_TLSDESC)
9443 && i.prefix[REX_PREFIX] == 0)
9444 add_prefix (REX_OPCODE);
9445 #endif
9446
9447 /* The prefix bytes. */
9448 for (j = ARRAY_SIZE (i.prefix), q = i.prefix; j > 0; j--, q++)
9449 if (*q)
9450 frag_opcode_byte (*q);
9451 }
9452 else
9453 {
9454 for (j = 0, q = i.prefix; j < ARRAY_SIZE (i.prefix); j++, q++)
9455 if (*q)
9456 switch (j)
9457 {
9458 case SEG_PREFIX:
9459 case ADDR_PREFIX:
9460 frag_opcode_byte (*q);
9461 break;
9462 default:
9463 /* There should be no other prefixes for instructions
9464 with VEX prefix. */
9465 abort ();
9466 }
9467
9468 /* For EVEX instructions i.vrex should become 0 after
9469 build_evex_prefix. For VEX instructions upper 16 registers
9470 aren't available, so VREX should be 0. */
9471 if (i.vrex)
9472 abort ();
9473 /* Now the VEX prefix. */
9474 if (now_seg != absolute_section)
9475 {
9476 p = frag_more (i.vex.length);
9477 for (j = 0; j < i.vex.length; j++)
9478 p[j] = i.vex.bytes[j];
9479 }
9480 else
9481 abs_section_offset += i.vex.length;
9482 }
9483
9484 /* Now the opcode; be careful about word order here! */
9485 if (now_seg == absolute_section)
9486 abs_section_offset += i.opcode_length;
9487 else if (i.opcode_length == 1)
9488 {
9489 FRAG_APPEND_1_CHAR (i.tm.base_opcode);
9490 }
9491 else
9492 {
9493 switch (i.opcode_length)
9494 {
9495 case 4:
9496 p = frag_more (4);
9497 *p++ = (i.tm.base_opcode >> 24) & 0xff;
9498 *p++ = (i.tm.base_opcode >> 16) & 0xff;
9499 break;
9500 case 3:
9501 p = frag_more (3);
9502 *p++ = (i.tm.base_opcode >> 16) & 0xff;
9503 break;
9504 case 2:
9505 p = frag_more (2);
9506 break;
9507 default:
9508 abort ();
9509 break;
9510 }
9511
9512 /* Put out high byte first: can't use md_number_to_chars! */
9513 *p++ = (i.tm.base_opcode >> 8) & 0xff;
9514 *p = i.tm.base_opcode & 0xff;
9515 }
9516
9517 /* Now the modrm byte and sib byte (if present). */
9518 if (i.tm.opcode_modifier.modrm)
9519 {
9520 frag_opcode_byte ((i.rm.regmem << 0)
9521 | (i.rm.reg << 3)
9522 | (i.rm.mode << 6));
9523 /* If i.rm.regmem == ESP (4)
9524 && i.rm.mode != (Register mode)
9525 && not 16 bit
9526 ==> need second modrm byte. */
9527 if (i.rm.regmem == ESCAPE_TO_TWO_BYTE_ADDRESSING
9528 && i.rm.mode != 3
9529 && !(i.base_reg && i.base_reg->reg_type.bitfield.word))
9530 frag_opcode_byte ((i.sib.base << 0)
9531 | (i.sib.index << 3)
9532 | (i.sib.scale << 6));
9533 }
9534
9535 if (i.disp_operands)
9536 output_disp (insn_start_frag, insn_start_off);
9537
9538 if (i.imm_operands)
9539 output_imm (insn_start_frag, insn_start_off);
9540
9541 /*
9542 * frag_now_fix () returning plain abs_section_offset when we're in the
9543 * absolute section, and abs_section_offset not getting updated as data
9544 * gets added to the frag breaks the logic below.
9545 */
9546 if (now_seg != absolute_section)
9547 {
9548 j = encoding_length (insn_start_frag, insn_start_off, frag_more (0));
9549 if (j > 15)
9550 as_warn (_("instruction length of %u bytes exceeds the limit of 15"),
9551 j);
9552 else if (fragP)
9553 {
9554 /* NB: Don't add prefix with GOTPC relocation since
9555 output_disp() above depends on the fixed encoding
9556 length. Can't add prefix with TLS relocation since
9557 it breaks TLS linker optimization. */
9558 unsigned int max = i.has_gotpc_tls_reloc ? 0 : 15 - j;
9559 /* Prefix count on the current instruction. */
9560 unsigned int count = i.vex.length;
9561 unsigned int k;
9562 for (k = 0; k < ARRAY_SIZE (i.prefix); k++)
9563 /* REX byte is encoded in VEX/EVEX prefix. */
9564 if (i.prefix[k] && (k != REX_PREFIX || !i.vex.length))
9565 count++;
9566
9567 /* Count prefixes for extended opcode maps. */
9568 if (!i.vex.length)
9569 switch (i.opcode_length)
9570 {
9571 case 3:
9572 if (((i.tm.base_opcode >> 16) & 0xff) == 0xf)
9573 {
9574 count++;
9575 switch ((i.tm.base_opcode >> 8) & 0xff)
9576 {
9577 case 0x38:
9578 case 0x3a:
9579 count++;
9580 break;
9581 default:
9582 break;
9583 }
9584 }
9585 break;
9586 case 2:
9587 if (((i.tm.base_opcode >> 8) & 0xff) == 0xf)
9588 count++;
9589 break;
9590 case 1:
9591 break;
9592 default:
9593 abort ();
9594 }
9595
9596 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype)
9597 == BRANCH_PREFIX)
9598 {
9599 /* Set the maximum prefix size in BRANCH_PREFIX
9600 frag. */
9601 if (fragP->tc_frag_data.max_bytes > max)
9602 fragP->tc_frag_data.max_bytes = max;
9603 if (fragP->tc_frag_data.max_bytes > count)
9604 fragP->tc_frag_data.max_bytes -= count;
9605 else
9606 fragP->tc_frag_data.max_bytes = 0;
9607 }
9608 else
9609 {
9610 /* Remember the maximum prefix size in FUSED_JCC_PADDING
9611 frag. */
9612 unsigned int max_prefix_size;
9613 if (align_branch_prefix_size > max)
9614 max_prefix_size = max;
9615 else
9616 max_prefix_size = align_branch_prefix_size;
9617 if (max_prefix_size > count)
9618 fragP->tc_frag_data.max_prefix_length
9619 = max_prefix_size - count;
9620 }
9621
9622 /* Use existing segment prefix if possible. Use CS
9623 segment prefix in 64-bit mode. In 32-bit mode, use SS
9624 segment prefix with ESP/EBP base register and use DS
9625 segment prefix without ESP/EBP base register. */
9626 if (i.prefix[SEG_PREFIX])
9627 fragP->tc_frag_data.default_prefix = i.prefix[SEG_PREFIX];
9628 else if (flag_code == CODE_64BIT)
9629 fragP->tc_frag_data.default_prefix = CS_PREFIX_OPCODE;
9630 else if (i.base_reg
9631 && (i.base_reg->reg_num == 4
9632 || i.base_reg->reg_num == 5))
9633 fragP->tc_frag_data.default_prefix = SS_PREFIX_OPCODE;
9634 else
9635 fragP->tc_frag_data.default_prefix = DS_PREFIX_OPCODE;
9636 }
9637 }
9638 }
9639
9640 /* NB: Don't work with COND_JUMP86 without i386. */
9641 if (align_branch_power
9642 && now_seg != absolute_section
9643 && cpu_arch_flags.bitfield.cpui386)
9644 {
9645 /* Terminate each frag so that we can add prefix and check for
9646 fused jcc. */
9647 frag_wane (frag_now);
9648 frag_new (0);
9649 }
9650
9651 #ifdef DEBUG386
9652 if (flag_debug)
9653 {
9654 pi ("" /*line*/, &i);
9655 }
9656 #endif /* DEBUG386 */
9657 }
9658
9659 /* Return the size of the displacement operand N. */
9660
9661 static int
9662 disp_size (unsigned int n)
9663 {
9664 int size = 4;
9665
9666 if (i.types[n].bitfield.disp64)
9667 size = 8;
9668 else if (i.types[n].bitfield.disp8)
9669 size = 1;
9670 else if (i.types[n].bitfield.disp16)
9671 size = 2;
9672 return size;
9673 }
9674
9675 /* Return the size of the immediate operand N. */
9676
9677 static int
9678 imm_size (unsigned int n)
9679 {
9680 int size = 4;
9681 if (i.types[n].bitfield.imm64)
9682 size = 8;
9683 else if (i.types[n].bitfield.imm8 || i.types[n].bitfield.imm8s)
9684 size = 1;
9685 else if (i.types[n].bitfield.imm16)
9686 size = 2;
9687 return size;
9688 }
9689
9690 static void
9691 output_disp (fragS *insn_start_frag, offsetT insn_start_off)
9692 {
9693 char *p;
9694 unsigned int n;
9695
9696 for (n = 0; n < i.operands; n++)
9697 {
9698 if (operand_type_check (i.types[n], disp))
9699 {
9700 int size = disp_size (n);
9701
9702 if (now_seg == absolute_section)
9703 abs_section_offset += size;
9704 else if (i.op[n].disps->X_op == O_constant)
9705 {
9706 offsetT val = i.op[n].disps->X_add_number;
9707
9708 val = offset_in_range (val >> (size == 1 ? i.memshift : 0),
9709 size);
9710 p = frag_more (size);
9711 md_number_to_chars (p, val, size);
9712 }
9713 else
9714 {
9715 enum bfd_reloc_code_real reloc_type;
9716 int sign = i.types[n].bitfield.disp32s;
9717 int pcrel = (i.flags[n] & Operand_PCrel) != 0;
9718 fixS *fixP;
9719
9720 /* We can't have 8 bit displacement here. */
9721 gas_assert (!i.types[n].bitfield.disp8);
9722
9723 /* The PC relative address is computed relative
9724 to the instruction boundary, so in case immediate
9725 fields follows, we need to adjust the value. */
9726 if (pcrel && i.imm_operands)
9727 {
9728 unsigned int n1;
9729 int sz = 0;
9730
9731 for (n1 = 0; n1 < i.operands; n1++)
9732 if (operand_type_check (i.types[n1], imm))
9733 {
9734 /* Only one immediate is allowed for PC
9735 relative address. */
9736 gas_assert (sz == 0);
9737 sz = imm_size (n1);
9738 i.op[n].disps->X_add_number -= sz;
9739 }
9740 /* We should find the immediate. */
9741 gas_assert (sz != 0);
9742 }
9743
9744 p = frag_more (size);
9745 reloc_type = reloc (size, pcrel, sign, i.reloc[n]);
9746 if (GOT_symbol
9747 && GOT_symbol == i.op[n].disps->X_add_symbol
9748 && (((reloc_type == BFD_RELOC_32
9749 || reloc_type == BFD_RELOC_X86_64_32S
9750 || (reloc_type == BFD_RELOC_64
9751 && object_64bit))
9752 && (i.op[n].disps->X_op == O_symbol
9753 || (i.op[n].disps->X_op == O_add
9754 && ((symbol_get_value_expression
9755 (i.op[n].disps->X_op_symbol)->X_op)
9756 == O_subtract))))
9757 || reloc_type == BFD_RELOC_32_PCREL))
9758 {
9759 if (!object_64bit)
9760 {
9761 reloc_type = BFD_RELOC_386_GOTPC;
9762 i.has_gotpc_tls_reloc = TRUE;
9763 i.op[n].imms->X_add_number +=
9764 encoding_length (insn_start_frag, insn_start_off, p);
9765 }
9766 else if (reloc_type == BFD_RELOC_64)
9767 reloc_type = BFD_RELOC_X86_64_GOTPC64;
9768 else
9769 /* Don't do the adjustment for x86-64, as there
9770 the pcrel addressing is relative to the _next_
9771 insn, and that is taken care of in other code. */
9772 reloc_type = BFD_RELOC_X86_64_GOTPC32;
9773 }
9774 else if (align_branch_power)
9775 {
9776 switch (reloc_type)
9777 {
9778 case BFD_RELOC_386_TLS_GD:
9779 case BFD_RELOC_386_TLS_LDM:
9780 case BFD_RELOC_386_TLS_IE:
9781 case BFD_RELOC_386_TLS_IE_32:
9782 case BFD_RELOC_386_TLS_GOTIE:
9783 case BFD_RELOC_386_TLS_GOTDESC:
9784 case BFD_RELOC_386_TLS_DESC_CALL:
9785 case BFD_RELOC_X86_64_TLSGD:
9786 case BFD_RELOC_X86_64_TLSLD:
9787 case BFD_RELOC_X86_64_GOTTPOFF:
9788 case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
9789 case BFD_RELOC_X86_64_TLSDESC_CALL:
9790 i.has_gotpc_tls_reloc = TRUE;
9791 default:
9792 break;
9793 }
9794 }
9795 fixP = fix_new_exp (frag_now, p - frag_now->fr_literal,
9796 size, i.op[n].disps, pcrel,
9797 reloc_type);
9798 /* Check for "call/jmp *mem", "mov mem, %reg",
9799 "test %reg, mem" and "binop mem, %reg" where binop
9800 is one of adc, add, and, cmp, or, sbb, sub, xor
9801 instructions without data prefix. Always generate
9802 R_386_GOT32X for "sym*GOT" operand in 32-bit mode. */
9803 if (i.prefix[DATA_PREFIX] == 0
9804 && (generate_relax_relocations
9805 || (!object_64bit
9806 && i.rm.mode == 0
9807 && i.rm.regmem == 5))
9808 && (i.rm.mode == 2
9809 || (i.rm.mode == 0 && i.rm.regmem == 5))
9810 && !is_any_vex_encoding(&i.tm)
9811 && ((i.operands == 1
9812 && i.tm.base_opcode == 0xff
9813 && (i.rm.reg == 2 || i.rm.reg == 4))
9814 || (i.operands == 2
9815 && (i.tm.base_opcode == 0x8b
9816 || i.tm.base_opcode == 0x85
9817 || (i.tm.base_opcode & ~0x38) == 0x03))))
9818 {
9819 if (object_64bit)
9820 {
9821 fixP->fx_tcbit = i.rex != 0;
9822 if (i.base_reg
9823 && (i.base_reg->reg_num == RegIP))
9824 fixP->fx_tcbit2 = 1;
9825 }
9826 else
9827 fixP->fx_tcbit2 = 1;
9828 }
9829 }
9830 }
9831 }
9832 }
9833
9834 static void
9835 output_imm (fragS *insn_start_frag, offsetT insn_start_off)
9836 {
9837 char *p;
9838 unsigned int n;
9839
9840 for (n = 0; n < i.operands; n++)
9841 {
9842 /* Skip SAE/RC Imm operand in EVEX. They are already handled. */
9843 if (i.rounding && (int) n == i.rounding->operand)
9844 continue;
9845
9846 if (operand_type_check (i.types[n], imm))
9847 {
9848 int size = imm_size (n);
9849
9850 if (now_seg == absolute_section)
9851 abs_section_offset += size;
9852 else if (i.op[n].imms->X_op == O_constant)
9853 {
9854 offsetT val;
9855
9856 val = offset_in_range (i.op[n].imms->X_add_number,
9857 size);
9858 p = frag_more (size);
9859 md_number_to_chars (p, val, size);
9860 }
9861 else
9862 {
9863 /* Not absolute_section.
9864 Need a 32-bit fixup (don't support 8bit
9865 non-absolute imms). Try to support other
9866 sizes ... */
9867 enum bfd_reloc_code_real reloc_type;
9868 int sign;
9869
9870 if (i.types[n].bitfield.imm32s
9871 && (i.suffix == QWORD_MNEM_SUFFIX
9872 || (!i.suffix && i.tm.opcode_modifier.no_lsuf)))
9873 sign = 1;
9874 else
9875 sign = 0;
9876
9877 p = frag_more (size);
9878 reloc_type = reloc (size, 0, sign, i.reloc[n]);
9879
9880 /* This is tough to explain. We end up with this one if we
9881 * have operands that look like
9882 * "_GLOBAL_OFFSET_TABLE_+[.-.L284]". The goal here is to
9883 * obtain the absolute address of the GOT, and it is strongly
9884 * preferable from a performance point of view to avoid using
9885 * a runtime relocation for this. The actual sequence of
9886 * instructions often look something like:
9887 *
9888 * call .L66
9889 * .L66:
9890 * popl %ebx
9891 * addl $_GLOBAL_OFFSET_TABLE_+[.-.L66],%ebx
9892 *
9893 * The call and pop essentially return the absolute address
9894 * of the label .L66 and store it in %ebx. The linker itself
9895 * will ultimately change the first operand of the addl so
9896 * that %ebx points to the GOT, but to keep things simple, the
9897 * .o file must have this operand set so that it generates not
9898 * the absolute address of .L66, but the absolute address of
9899 * itself. This allows the linker itself simply treat a GOTPC
9900 * relocation as asking for a pcrel offset to the GOT to be
9901 * added in, and the addend of the relocation is stored in the
9902 * operand field for the instruction itself.
9903 *
9904 * Our job here is to fix the operand so that it would add
9905 * the correct offset so that %ebx would point to itself. The
9906 * thing that is tricky is that .-.L66 will point to the
9907 * beginning of the instruction, so we need to further modify
9908 * the operand so that it will point to itself. There are
9909 * other cases where you have something like:
9910 *
9911 * .long $_GLOBAL_OFFSET_TABLE_+[.-.L66]
9912 *
9913 * and here no correction would be required. Internally in
9914 * the assembler we treat operands of this form as not being
9915 * pcrel since the '.' is explicitly mentioned, and I wonder
9916 * whether it would simplify matters to do it this way. Who
9917 * knows. In earlier versions of the PIC patches, the
9918 * pcrel_adjust field was used to store the correction, but
9919 * since the expression is not pcrel, I felt it would be
9920 * confusing to do it this way. */
9921
9922 if ((reloc_type == BFD_RELOC_32
9923 || reloc_type == BFD_RELOC_X86_64_32S
9924 || reloc_type == BFD_RELOC_64)
9925 && GOT_symbol
9926 && GOT_symbol == i.op[n].imms->X_add_symbol
9927 && (i.op[n].imms->X_op == O_symbol
9928 || (i.op[n].imms->X_op == O_add
9929 && ((symbol_get_value_expression
9930 (i.op[n].imms->X_op_symbol)->X_op)
9931 == O_subtract))))
9932 {
9933 if (!object_64bit)
9934 reloc_type = BFD_RELOC_386_GOTPC;
9935 else if (size == 4)
9936 reloc_type = BFD_RELOC_X86_64_GOTPC32;
9937 else if (size == 8)
9938 reloc_type = BFD_RELOC_X86_64_GOTPC64;
9939 i.has_gotpc_tls_reloc = TRUE;
9940 i.op[n].imms->X_add_number +=
9941 encoding_length (insn_start_frag, insn_start_off, p);
9942 }
9943 fix_new_exp (frag_now, p - frag_now->fr_literal, size,
9944 i.op[n].imms, 0, reloc_type);
9945 }
9946 }
9947 }
9948 }
9949 \f
9950 /* x86_cons_fix_new is called via the expression parsing code when a
9951 reloc is needed. We use this hook to get the correct .got reloc. */
9952 static int cons_sign = -1;
9953
9954 void
9955 x86_cons_fix_new (fragS *frag, unsigned int off, unsigned int len,
9956 expressionS *exp, bfd_reloc_code_real_type r)
9957 {
9958 r = reloc (len, 0, cons_sign, r);
9959
9960 #ifdef TE_PE
9961 if (exp->X_op == O_secrel)
9962 {
9963 exp->X_op = O_symbol;
9964 r = BFD_RELOC_32_SECREL;
9965 }
9966 #endif
9967
9968 fix_new_exp (frag, off, len, exp, 0, r);
9969 }
9970
9971 /* Export the ABI address size for use by TC_ADDRESS_BYTES for the
9972 purpose of the `.dc.a' internal pseudo-op. */
9973
9974 int
9975 x86_address_bytes (void)
9976 {
9977 if ((stdoutput->arch_info->mach & bfd_mach_x64_32))
9978 return 4;
9979 return stdoutput->arch_info->bits_per_address / 8;
9980 }
9981
9982 #if !(defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) || defined (OBJ_MACH_O)) \
9983 || defined (LEX_AT)
9984 # define lex_got(reloc, adjust, types) NULL
9985 #else
9986 /* Parse operands of the form
9987 <symbol>@GOTOFF+<nnn>
9988 and similar .plt or .got references.
9989
9990 If we find one, set up the correct relocation in RELOC and copy the
9991 input string, minus the `@GOTOFF' into a malloc'd buffer for
9992 parsing by the calling routine. Return this buffer, and if ADJUST
9993 is non-null set it to the length of the string we removed from the
9994 input line. Otherwise return NULL. */
9995 static char *
9996 lex_got (enum bfd_reloc_code_real *rel,
9997 int *adjust,
9998 i386_operand_type *types)
9999 {
10000 /* Some of the relocations depend on the size of what field is to
10001 be relocated. But in our callers i386_immediate and i386_displacement
10002 we don't yet know the operand size (this will be set by insn
10003 matching). Hence we record the word32 relocation here,
10004 and adjust the reloc according to the real size in reloc(). */
10005 static const struct {
10006 const char *str;
10007 int len;
10008 const enum bfd_reloc_code_real rel[2];
10009 const i386_operand_type types64;
10010 bfd_boolean need_GOT_symbol;
10011 } gotrel[] = {
10012 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
10013 { STRING_COMMA_LEN ("SIZE"), { BFD_RELOC_SIZE32,
10014 BFD_RELOC_SIZE32 },
10015 OPERAND_TYPE_IMM32_64, FALSE },
10016 #endif
10017 { STRING_COMMA_LEN ("PLTOFF"), { _dummy_first_bfd_reloc_code_real,
10018 BFD_RELOC_X86_64_PLTOFF64 },
10019 OPERAND_TYPE_IMM64, TRUE },
10020 { STRING_COMMA_LEN ("PLT"), { BFD_RELOC_386_PLT32,
10021 BFD_RELOC_X86_64_PLT32 },
10022 OPERAND_TYPE_IMM32_32S_DISP32, FALSE },
10023 { STRING_COMMA_LEN ("GOTPLT"), { _dummy_first_bfd_reloc_code_real,
10024 BFD_RELOC_X86_64_GOTPLT64 },
10025 OPERAND_TYPE_IMM64_DISP64, TRUE },
10026 { STRING_COMMA_LEN ("GOTOFF"), { BFD_RELOC_386_GOTOFF,
10027 BFD_RELOC_X86_64_GOTOFF64 },
10028 OPERAND_TYPE_IMM64_DISP64, TRUE },
10029 { STRING_COMMA_LEN ("GOTPCREL"), { _dummy_first_bfd_reloc_code_real,
10030 BFD_RELOC_X86_64_GOTPCREL },
10031 OPERAND_TYPE_IMM32_32S_DISP32, TRUE },
10032 { STRING_COMMA_LEN ("TLSGD"), { BFD_RELOC_386_TLS_GD,
10033 BFD_RELOC_X86_64_TLSGD },
10034 OPERAND_TYPE_IMM32_32S_DISP32, TRUE },
10035 { STRING_COMMA_LEN ("TLSLDM"), { BFD_RELOC_386_TLS_LDM,
10036 _dummy_first_bfd_reloc_code_real },
10037 OPERAND_TYPE_NONE, TRUE },
10038 { STRING_COMMA_LEN ("TLSLD"), { _dummy_first_bfd_reloc_code_real,
10039 BFD_RELOC_X86_64_TLSLD },
10040 OPERAND_TYPE_IMM32_32S_DISP32, TRUE },
10041 { STRING_COMMA_LEN ("GOTTPOFF"), { BFD_RELOC_386_TLS_IE_32,
10042 BFD_RELOC_X86_64_GOTTPOFF },
10043 OPERAND_TYPE_IMM32_32S_DISP32, TRUE },
10044 { STRING_COMMA_LEN ("TPOFF"), { BFD_RELOC_386_TLS_LE_32,
10045 BFD_RELOC_X86_64_TPOFF32 },
10046 OPERAND_TYPE_IMM32_32S_64_DISP32_64, TRUE },
10047 { STRING_COMMA_LEN ("NTPOFF"), { BFD_RELOC_386_TLS_LE,
10048 _dummy_first_bfd_reloc_code_real },
10049 OPERAND_TYPE_NONE, TRUE },
10050 { STRING_COMMA_LEN ("DTPOFF"), { BFD_RELOC_386_TLS_LDO_32,
10051 BFD_RELOC_X86_64_DTPOFF32 },
10052 OPERAND_TYPE_IMM32_32S_64_DISP32_64, TRUE },
10053 { STRING_COMMA_LEN ("GOTNTPOFF"),{ BFD_RELOC_386_TLS_GOTIE,
10054 _dummy_first_bfd_reloc_code_real },
10055 OPERAND_TYPE_NONE, TRUE },
10056 { STRING_COMMA_LEN ("INDNTPOFF"),{ BFD_RELOC_386_TLS_IE,
10057 _dummy_first_bfd_reloc_code_real },
10058 OPERAND_TYPE_NONE, TRUE },
10059 { STRING_COMMA_LEN ("GOT"), { BFD_RELOC_386_GOT32,
10060 BFD_RELOC_X86_64_GOT32 },
10061 OPERAND_TYPE_IMM32_32S_64_DISP32, TRUE },
10062 { STRING_COMMA_LEN ("TLSDESC"), { BFD_RELOC_386_TLS_GOTDESC,
10063 BFD_RELOC_X86_64_GOTPC32_TLSDESC },
10064 OPERAND_TYPE_IMM32_32S_DISP32, TRUE },
10065 { STRING_COMMA_LEN ("TLSCALL"), { BFD_RELOC_386_TLS_DESC_CALL,
10066 BFD_RELOC_X86_64_TLSDESC_CALL },
10067 OPERAND_TYPE_IMM32_32S_DISP32, TRUE },
10068 };
10069 char *cp;
10070 unsigned int j;
10071
10072 #if defined (OBJ_MAYBE_ELF)
10073 if (!IS_ELF)
10074 return NULL;
10075 #endif
10076
10077 for (cp = input_line_pointer; *cp != '@'; cp++)
10078 if (is_end_of_line[(unsigned char) *cp] || *cp == ',')
10079 return NULL;
10080
10081 for (j = 0; j < ARRAY_SIZE (gotrel); j++)
10082 {
10083 int len = gotrel[j].len;
10084 if (strncasecmp (cp + 1, gotrel[j].str, len) == 0)
10085 {
10086 if (gotrel[j].rel[object_64bit] != 0)
10087 {
10088 int first, second;
10089 char *tmpbuf, *past_reloc;
10090
10091 *rel = gotrel[j].rel[object_64bit];
10092
10093 if (types)
10094 {
10095 if (flag_code != CODE_64BIT)
10096 {
10097 types->bitfield.imm32 = 1;
10098 types->bitfield.disp32 = 1;
10099 }
10100 else
10101 *types = gotrel[j].types64;
10102 }
10103
10104 if (gotrel[j].need_GOT_symbol && GOT_symbol == NULL)
10105 GOT_symbol = symbol_find_or_make (GLOBAL_OFFSET_TABLE_NAME);
10106
10107 /* The length of the first part of our input line. */
10108 first = cp - input_line_pointer;
10109
10110 /* The second part goes from after the reloc token until
10111 (and including) an end_of_line char or comma. */
10112 past_reloc = cp + 1 + len;
10113 cp = past_reloc;
10114 while (!is_end_of_line[(unsigned char) *cp] && *cp != ',')
10115 ++cp;
10116 second = cp + 1 - past_reloc;
10117
10118 /* Allocate and copy string. The trailing NUL shouldn't
10119 be necessary, but be safe. */
10120 tmpbuf = XNEWVEC (char, first + second + 2);
10121 memcpy (tmpbuf, input_line_pointer, first);
10122 if (second != 0 && *past_reloc != ' ')
10123 /* Replace the relocation token with ' ', so that
10124 errors like foo@GOTOFF1 will be detected. */
10125 tmpbuf[first++] = ' ';
10126 else
10127 /* Increment length by 1 if the relocation token is
10128 removed. */
10129 len++;
10130 if (adjust)
10131 *adjust = len;
10132 memcpy (tmpbuf + first, past_reloc, second);
10133 tmpbuf[first + second] = '\0';
10134 return tmpbuf;
10135 }
10136
10137 as_bad (_("@%s reloc is not supported with %d-bit output format"),
10138 gotrel[j].str, 1 << (5 + object_64bit));
10139 return NULL;
10140 }
10141 }
10142
10143 /* Might be a symbol version string. Don't as_bad here. */
10144 return NULL;
10145 }
10146 #endif
10147
10148 #ifdef TE_PE
10149 #ifdef lex_got
10150 #undef lex_got
10151 #endif
10152 /* Parse operands of the form
10153 <symbol>@SECREL32+<nnn>
10154
10155 If we find one, set up the correct relocation in RELOC and copy the
10156 input string, minus the `@SECREL32' into a malloc'd buffer for
10157 parsing by the calling routine. Return this buffer, and if ADJUST
10158 is non-null set it to the length of the string we removed from the
10159 input line. Otherwise return NULL.
10160
10161 This function is copied from the ELF version above adjusted for PE targets. */
10162
10163 static char *
10164 lex_got (enum bfd_reloc_code_real *rel ATTRIBUTE_UNUSED,
10165 int *adjust ATTRIBUTE_UNUSED,
10166 i386_operand_type *types)
10167 {
10168 static const struct
10169 {
10170 const char *str;
10171 int len;
10172 const enum bfd_reloc_code_real rel[2];
10173 const i386_operand_type types64;
10174 }
10175 gotrel[] =
10176 {
10177 { STRING_COMMA_LEN ("SECREL32"), { BFD_RELOC_32_SECREL,
10178 BFD_RELOC_32_SECREL },
10179 OPERAND_TYPE_IMM32_32S_64_DISP32_64 },
10180 };
10181
10182 char *cp;
10183 unsigned j;
10184
10185 for (cp = input_line_pointer; *cp != '@'; cp++)
10186 if (is_end_of_line[(unsigned char) *cp] || *cp == ',')
10187 return NULL;
10188
10189 for (j = 0; j < ARRAY_SIZE (gotrel); j++)
10190 {
10191 int len = gotrel[j].len;
10192
10193 if (strncasecmp (cp + 1, gotrel[j].str, len) == 0)
10194 {
10195 if (gotrel[j].rel[object_64bit] != 0)
10196 {
10197 int first, second;
10198 char *tmpbuf, *past_reloc;
10199
10200 *rel = gotrel[j].rel[object_64bit];
10201 if (adjust)
10202 *adjust = len;
10203
10204 if (types)
10205 {
10206 if (flag_code != CODE_64BIT)
10207 {
10208 types->bitfield.imm32 = 1;
10209 types->bitfield.disp32 = 1;
10210 }
10211 else
10212 *types = gotrel[j].types64;
10213 }
10214
10215 /* The length of the first part of our input line. */
10216 first = cp - input_line_pointer;
10217
10218 /* The second part goes from after the reloc token until
10219 (and including) an end_of_line char or comma. */
10220 past_reloc = cp + 1 + len;
10221 cp = past_reloc;
10222 while (!is_end_of_line[(unsigned char) *cp] && *cp != ',')
10223 ++cp;
10224 second = cp + 1 - past_reloc;
10225
10226 /* Allocate and copy string. The trailing NUL shouldn't
10227 be necessary, but be safe. */
10228 tmpbuf = XNEWVEC (char, first + second + 2);
10229 memcpy (tmpbuf, input_line_pointer, first);
10230 if (second != 0 && *past_reloc != ' ')
10231 /* Replace the relocation token with ' ', so that
10232 errors like foo@SECLREL321 will be detected. */
10233 tmpbuf[first++] = ' ';
10234 memcpy (tmpbuf + first, past_reloc, second);
10235 tmpbuf[first + second] = '\0';
10236 return tmpbuf;
10237 }
10238
10239 as_bad (_("@%s reloc is not supported with %d-bit output format"),
10240 gotrel[j].str, 1 << (5 + object_64bit));
10241 return NULL;
10242 }
10243 }
10244
10245 /* Might be a symbol version string. Don't as_bad here. */
10246 return NULL;
10247 }
10248
10249 #endif /* TE_PE */
10250
10251 bfd_reloc_code_real_type
10252 x86_cons (expressionS *exp, int size)
10253 {
10254 bfd_reloc_code_real_type got_reloc = NO_RELOC;
10255
10256 intel_syntax = -intel_syntax;
10257
10258 exp->X_md = 0;
10259 if (size == 4 || (object_64bit && size == 8))
10260 {
10261 /* Handle @GOTOFF and the like in an expression. */
10262 char *save;
10263 char *gotfree_input_line;
10264 int adjust = 0;
10265
10266 save = input_line_pointer;
10267 gotfree_input_line = lex_got (&got_reloc, &adjust, NULL);
10268 if (gotfree_input_line)
10269 input_line_pointer = gotfree_input_line;
10270
10271 expression (exp);
10272
10273 if (gotfree_input_line)
10274 {
10275 /* expression () has merrily parsed up to the end of line,
10276 or a comma - in the wrong buffer. Transfer how far
10277 input_line_pointer has moved to the right buffer. */
10278 input_line_pointer = (save
10279 + (input_line_pointer - gotfree_input_line)
10280 + adjust);
10281 free (gotfree_input_line);
10282 if (exp->X_op == O_constant
10283 || exp->X_op == O_absent
10284 || exp->X_op == O_illegal
10285 || exp->X_op == O_register
10286 || exp->X_op == O_big)
10287 {
10288 char c = *input_line_pointer;
10289 *input_line_pointer = 0;
10290 as_bad (_("missing or invalid expression `%s'"), save);
10291 *input_line_pointer = c;
10292 }
10293 else if ((got_reloc == BFD_RELOC_386_PLT32
10294 || got_reloc == BFD_RELOC_X86_64_PLT32)
10295 && exp->X_op != O_symbol)
10296 {
10297 char c = *input_line_pointer;
10298 *input_line_pointer = 0;
10299 as_bad (_("invalid PLT expression `%s'"), save);
10300 *input_line_pointer = c;
10301 }
10302 }
10303 }
10304 else
10305 expression (exp);
10306
10307 intel_syntax = -intel_syntax;
10308
10309 if (intel_syntax)
10310 i386_intel_simplify (exp);
10311
10312 return got_reloc;
10313 }
10314
10315 static void
10316 signed_cons (int size)
10317 {
10318 if (flag_code == CODE_64BIT)
10319 cons_sign = 1;
10320 cons (size);
10321 cons_sign = -1;
10322 }
10323
10324 #ifdef TE_PE
10325 static void
10326 pe_directive_secrel (int dummy ATTRIBUTE_UNUSED)
10327 {
10328 expressionS exp;
10329
10330 do
10331 {
10332 expression (&exp);
10333 if (exp.X_op == O_symbol)
10334 exp.X_op = O_secrel;
10335
10336 emit_expr (&exp, 4);
10337 }
10338 while (*input_line_pointer++ == ',');
10339
10340 input_line_pointer--;
10341 demand_empty_rest_of_line ();
10342 }
10343 #endif
10344
10345 /* Handle Vector operations. */
10346
10347 static char *
10348 check_VecOperations (char *op_string, char *op_end)
10349 {
10350 const reg_entry *mask;
10351 const char *saved;
10352 char *end_op;
10353
10354 while (*op_string
10355 && (op_end == NULL || op_string < op_end))
10356 {
10357 saved = op_string;
10358 if (*op_string == '{')
10359 {
10360 op_string++;
10361
10362 /* Check broadcasts. */
10363 if (strncmp (op_string, "1to", 3) == 0)
10364 {
10365 int bcst_type;
10366
10367 if (i.broadcast)
10368 goto duplicated_vec_op;
10369
10370 op_string += 3;
10371 if (*op_string == '8')
10372 bcst_type = 8;
10373 else if (*op_string == '4')
10374 bcst_type = 4;
10375 else if (*op_string == '2')
10376 bcst_type = 2;
10377 else if (*op_string == '1'
10378 && *(op_string+1) == '6')
10379 {
10380 bcst_type = 16;
10381 op_string++;
10382 }
10383 else
10384 {
10385 as_bad (_("Unsupported broadcast: `%s'"), saved);
10386 return NULL;
10387 }
10388 op_string++;
10389
10390 broadcast_op.type = bcst_type;
10391 broadcast_op.operand = this_operand;
10392 broadcast_op.bytes = 0;
10393 i.broadcast = &broadcast_op;
10394 }
10395 /* Check masking operation. */
10396 else if ((mask = parse_register (op_string, &end_op)) != NULL)
10397 {
10398 if (mask == &bad_reg)
10399 return NULL;
10400
10401 /* k0 can't be used for write mask. */
10402 if (mask->reg_type.bitfield.class != RegMask || !mask->reg_num)
10403 {
10404 as_bad (_("`%s%s' can't be used for write mask"),
10405 register_prefix, mask->reg_name);
10406 return NULL;
10407 }
10408
10409 if (!i.mask)
10410 {
10411 mask_op.mask = mask;
10412 mask_op.zeroing = 0;
10413 mask_op.operand = this_operand;
10414 i.mask = &mask_op;
10415 }
10416 else
10417 {
10418 if (i.mask->mask)
10419 goto duplicated_vec_op;
10420
10421 i.mask->mask = mask;
10422
10423 /* Only "{z}" is allowed here. No need to check
10424 zeroing mask explicitly. */
10425 if (i.mask->operand != this_operand)
10426 {
10427 as_bad (_("invalid write mask `%s'"), saved);
10428 return NULL;
10429 }
10430 }
10431
10432 op_string = end_op;
10433 }
10434 /* Check zeroing-flag for masking operation. */
10435 else if (*op_string == 'z')
10436 {
10437 if (!i.mask)
10438 {
10439 mask_op.mask = NULL;
10440 mask_op.zeroing = 1;
10441 mask_op.operand = this_operand;
10442 i.mask = &mask_op;
10443 }
10444 else
10445 {
10446 if (i.mask->zeroing)
10447 {
10448 duplicated_vec_op:
10449 as_bad (_("duplicated `%s'"), saved);
10450 return NULL;
10451 }
10452
10453 i.mask->zeroing = 1;
10454
10455 /* Only "{%k}" is allowed here. No need to check mask
10456 register explicitly. */
10457 if (i.mask->operand != this_operand)
10458 {
10459 as_bad (_("invalid zeroing-masking `%s'"),
10460 saved);
10461 return NULL;
10462 }
10463 }
10464
10465 op_string++;
10466 }
10467 else
10468 goto unknown_vec_op;
10469
10470 if (*op_string != '}')
10471 {
10472 as_bad (_("missing `}' in `%s'"), saved);
10473 return NULL;
10474 }
10475 op_string++;
10476
10477 /* Strip whitespace since the addition of pseudo prefixes
10478 changed how the scrubber treats '{'. */
10479 if (is_space_char (*op_string))
10480 ++op_string;
10481
10482 continue;
10483 }
10484 unknown_vec_op:
10485 /* We don't know this one. */
10486 as_bad (_("unknown vector operation: `%s'"), saved);
10487 return NULL;
10488 }
10489
10490 if (i.mask && i.mask->zeroing && !i.mask->mask)
10491 {
10492 as_bad (_("zeroing-masking only allowed with write mask"));
10493 return NULL;
10494 }
10495
10496 return op_string;
10497 }
10498
10499 static int
10500 i386_immediate (char *imm_start)
10501 {
10502 char *save_input_line_pointer;
10503 char *gotfree_input_line;
10504 segT exp_seg = 0;
10505 expressionS *exp;
10506 i386_operand_type types;
10507
10508 operand_type_set (&types, ~0);
10509
10510 if (i.imm_operands == MAX_IMMEDIATE_OPERANDS)
10511 {
10512 as_bad (_("at most %d immediate operands are allowed"),
10513 MAX_IMMEDIATE_OPERANDS);
10514 return 0;
10515 }
10516
10517 exp = &im_expressions[i.imm_operands++];
10518 i.op[this_operand].imms = exp;
10519
10520 if (is_space_char (*imm_start))
10521 ++imm_start;
10522
10523 save_input_line_pointer = input_line_pointer;
10524 input_line_pointer = imm_start;
10525
10526 gotfree_input_line = lex_got (&i.reloc[this_operand], NULL, &types);
10527 if (gotfree_input_line)
10528 input_line_pointer = gotfree_input_line;
10529
10530 exp_seg = expression (exp);
10531
10532 SKIP_WHITESPACE ();
10533
10534 /* Handle vector operations. */
10535 if (*input_line_pointer == '{')
10536 {
10537 input_line_pointer = check_VecOperations (input_line_pointer,
10538 NULL);
10539 if (input_line_pointer == NULL)
10540 return 0;
10541 }
10542
10543 if (*input_line_pointer)
10544 as_bad (_("junk `%s' after expression"), input_line_pointer);
10545
10546 input_line_pointer = save_input_line_pointer;
10547 if (gotfree_input_line)
10548 {
10549 free (gotfree_input_line);
10550
10551 if (exp->X_op == O_constant || exp->X_op == O_register)
10552 exp->X_op = O_illegal;
10553 }
10554
10555 return i386_finalize_immediate (exp_seg, exp, types, imm_start);
10556 }
10557
10558 static int
10559 i386_finalize_immediate (segT exp_seg ATTRIBUTE_UNUSED, expressionS *exp,
10560 i386_operand_type types, const char *imm_start)
10561 {
10562 if (exp->X_op == O_absent || exp->X_op == O_illegal || exp->X_op == O_big)
10563 {
10564 if (imm_start)
10565 as_bad (_("missing or invalid immediate expression `%s'"),
10566 imm_start);
10567 return 0;
10568 }
10569 else if (exp->X_op == O_constant)
10570 {
10571 /* Size it properly later. */
10572 i.types[this_operand].bitfield.imm64 = 1;
10573 /* If not 64bit, sign extend val. */
10574 if (flag_code != CODE_64BIT
10575 && (exp->X_add_number & ~(((addressT) 2 << 31) - 1)) == 0)
10576 exp->X_add_number
10577 = (exp->X_add_number ^ ((addressT) 1 << 31)) - ((addressT) 1 << 31);
10578 }
10579 #if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
10580 else if (OUTPUT_FLAVOR == bfd_target_aout_flavour
10581 && exp_seg != absolute_section
10582 && exp_seg != text_section
10583 && exp_seg != data_section
10584 && exp_seg != bss_section
10585 && exp_seg != undefined_section
10586 && !bfd_is_com_section (exp_seg))
10587 {
10588 as_bad (_("unimplemented segment %s in operand"), exp_seg->name);
10589 return 0;
10590 }
10591 #endif
10592 else if (!intel_syntax && exp_seg == reg_section)
10593 {
10594 if (imm_start)
10595 as_bad (_("illegal immediate register operand %s"), imm_start);
10596 return 0;
10597 }
10598 else
10599 {
10600 /* This is an address. The size of the address will be
10601 determined later, depending on destination register,
10602 suffix, or the default for the section. */
10603 i.types[this_operand].bitfield.imm8 = 1;
10604 i.types[this_operand].bitfield.imm16 = 1;
10605 i.types[this_operand].bitfield.imm32 = 1;
10606 i.types[this_operand].bitfield.imm32s = 1;
10607 i.types[this_operand].bitfield.imm64 = 1;
10608 i.types[this_operand] = operand_type_and (i.types[this_operand],
10609 types);
10610 }
10611
10612 return 1;
10613 }
10614
10615 static char *
10616 i386_scale (char *scale)
10617 {
10618 offsetT val;
10619 char *save = input_line_pointer;
10620
10621 input_line_pointer = scale;
10622 val = get_absolute_expression ();
10623
10624 switch (val)
10625 {
10626 case 1:
10627 i.log2_scale_factor = 0;
10628 break;
10629 case 2:
10630 i.log2_scale_factor = 1;
10631 break;
10632 case 4:
10633 i.log2_scale_factor = 2;
10634 break;
10635 case 8:
10636 i.log2_scale_factor = 3;
10637 break;
10638 default:
10639 {
10640 char sep = *input_line_pointer;
10641
10642 *input_line_pointer = '\0';
10643 as_bad (_("expecting scale factor of 1, 2, 4, or 8: got `%s'"),
10644 scale);
10645 *input_line_pointer = sep;
10646 input_line_pointer = save;
10647 return NULL;
10648 }
10649 }
10650 if (i.log2_scale_factor != 0 && i.index_reg == 0)
10651 {
10652 as_warn (_("scale factor of %d without an index register"),
10653 1 << i.log2_scale_factor);
10654 i.log2_scale_factor = 0;
10655 }
10656 scale = input_line_pointer;
10657 input_line_pointer = save;
10658 return scale;
10659 }
10660
10661 static int
10662 i386_displacement (char *disp_start, char *disp_end)
10663 {
10664 expressionS *exp;
10665 segT exp_seg = 0;
10666 char *save_input_line_pointer;
10667 char *gotfree_input_line;
10668 int override;
10669 i386_operand_type bigdisp, types = anydisp;
10670 int ret;
10671
10672 if (i.disp_operands == MAX_MEMORY_OPERANDS)
10673 {
10674 as_bad (_("at most %d displacement operands are allowed"),
10675 MAX_MEMORY_OPERANDS);
10676 return 0;
10677 }
10678
10679 operand_type_set (&bigdisp, 0);
10680 if (i.jumpabsolute
10681 || i.types[this_operand].bitfield.baseindex
10682 || (current_templates->start->opcode_modifier.jump != JUMP
10683 && current_templates->start->opcode_modifier.jump != JUMP_DWORD))
10684 {
10685 i386_addressing_mode ();
10686 override = (i.prefix[ADDR_PREFIX] != 0);
10687 if (flag_code == CODE_64BIT)
10688 {
10689 if (!override)
10690 {
10691 bigdisp.bitfield.disp32s = 1;
10692 bigdisp.bitfield.disp64 = 1;
10693 }
10694 else
10695 bigdisp.bitfield.disp32 = 1;
10696 }
10697 else if ((flag_code == CODE_16BIT) ^ override)
10698 bigdisp.bitfield.disp16 = 1;
10699 else
10700 bigdisp.bitfield.disp32 = 1;
10701 }
10702 else
10703 {
10704 /* For PC-relative branches, the width of the displacement may be
10705 dependent upon data size, but is never dependent upon address size.
10706 Also make sure to not unintentionally match against a non-PC-relative
10707 branch template. */
10708 static templates aux_templates;
10709 const insn_template *t = current_templates->start;
10710 bfd_boolean has_intel64 = FALSE;
10711
10712 aux_templates.start = t;
10713 while (++t < current_templates->end)
10714 {
10715 if (t->opcode_modifier.jump
10716 != current_templates->start->opcode_modifier.jump)
10717 break;
10718 if ((t->opcode_modifier.isa64 >= INTEL64))
10719 has_intel64 = TRUE;
10720 }
10721 if (t < current_templates->end)
10722 {
10723 aux_templates.end = t;
10724 current_templates = &aux_templates;
10725 }
10726
10727 override = (i.prefix[DATA_PREFIX] != 0);
10728 if (flag_code == CODE_64BIT)
10729 {
10730 if ((override || i.suffix == WORD_MNEM_SUFFIX)
10731 && (!intel64 || !has_intel64))
10732 bigdisp.bitfield.disp16 = 1;
10733 else
10734 bigdisp.bitfield.disp32s = 1;
10735 }
10736 else
10737 {
10738 if (!override)
10739 override = (i.suffix == (flag_code != CODE_16BIT
10740 ? WORD_MNEM_SUFFIX
10741 : LONG_MNEM_SUFFIX));
10742 bigdisp.bitfield.disp32 = 1;
10743 if ((flag_code == CODE_16BIT) ^ override)
10744 {
10745 bigdisp.bitfield.disp32 = 0;
10746 bigdisp.bitfield.disp16 = 1;
10747 }
10748 }
10749 }
10750 i.types[this_operand] = operand_type_or (i.types[this_operand],
10751 bigdisp);
10752
10753 exp = &disp_expressions[i.disp_operands];
10754 i.op[this_operand].disps = exp;
10755 i.disp_operands++;
10756 save_input_line_pointer = input_line_pointer;
10757 input_line_pointer = disp_start;
10758 END_STRING_AND_SAVE (disp_end);
10759
10760 #ifndef GCC_ASM_O_HACK
10761 #define GCC_ASM_O_HACK 0
10762 #endif
10763 #if GCC_ASM_O_HACK
10764 END_STRING_AND_SAVE (disp_end + 1);
10765 if (i.types[this_operand].bitfield.baseIndex
10766 && displacement_string_end[-1] == '+')
10767 {
10768 /* This hack is to avoid a warning when using the "o"
10769 constraint within gcc asm statements.
10770 For instance:
10771
10772 #define _set_tssldt_desc(n,addr,limit,type) \
10773 __asm__ __volatile__ ( \
10774 "movw %w2,%0\n\t" \
10775 "movw %w1,2+%0\n\t" \
10776 "rorl $16,%1\n\t" \
10777 "movb %b1,4+%0\n\t" \
10778 "movb %4,5+%0\n\t" \
10779 "movb $0,6+%0\n\t" \
10780 "movb %h1,7+%0\n\t" \
10781 "rorl $16,%1" \
10782 : "=o"(*(n)) : "q" (addr), "ri"(limit), "i"(type))
10783
10784 This works great except that the output assembler ends
10785 up looking a bit weird if it turns out that there is
10786 no offset. You end up producing code that looks like:
10787
10788 #APP
10789 movw $235,(%eax)
10790 movw %dx,2+(%eax)
10791 rorl $16,%edx
10792 movb %dl,4+(%eax)
10793 movb $137,5+(%eax)
10794 movb $0,6+(%eax)
10795 movb %dh,7+(%eax)
10796 rorl $16,%edx
10797 #NO_APP
10798
10799 So here we provide the missing zero. */
10800
10801 *displacement_string_end = '0';
10802 }
10803 #endif
10804 gotfree_input_line = lex_got (&i.reloc[this_operand], NULL, &types);
10805 if (gotfree_input_line)
10806 input_line_pointer = gotfree_input_line;
10807
10808 exp_seg = expression (exp);
10809
10810 SKIP_WHITESPACE ();
10811 if (*input_line_pointer)
10812 as_bad (_("junk `%s' after expression"), input_line_pointer);
10813 #if GCC_ASM_O_HACK
10814 RESTORE_END_STRING (disp_end + 1);
10815 #endif
10816 input_line_pointer = save_input_line_pointer;
10817 if (gotfree_input_line)
10818 {
10819 free (gotfree_input_line);
10820
10821 if (exp->X_op == O_constant || exp->X_op == O_register)
10822 exp->X_op = O_illegal;
10823 }
10824
10825 ret = i386_finalize_displacement (exp_seg, exp, types, disp_start);
10826
10827 RESTORE_END_STRING (disp_end);
10828
10829 return ret;
10830 }
10831
10832 static int
10833 i386_finalize_displacement (segT exp_seg ATTRIBUTE_UNUSED, expressionS *exp,
10834 i386_operand_type types, const char *disp_start)
10835 {
10836 i386_operand_type bigdisp;
10837 int ret = 1;
10838
10839 /* We do this to make sure that the section symbol is in
10840 the symbol table. We will ultimately change the relocation
10841 to be relative to the beginning of the section. */
10842 if (i.reloc[this_operand] == BFD_RELOC_386_GOTOFF
10843 || i.reloc[this_operand] == BFD_RELOC_X86_64_GOTPCREL
10844 || i.reloc[this_operand] == BFD_RELOC_X86_64_GOTOFF64)
10845 {
10846 if (exp->X_op != O_symbol)
10847 goto inv_disp;
10848
10849 if (S_IS_LOCAL (exp->X_add_symbol)
10850 && S_GET_SEGMENT (exp->X_add_symbol) != undefined_section
10851 && S_GET_SEGMENT (exp->X_add_symbol) != expr_section)
10852 section_symbol (S_GET_SEGMENT (exp->X_add_symbol));
10853 exp->X_op = O_subtract;
10854 exp->X_op_symbol = GOT_symbol;
10855 if (i.reloc[this_operand] == BFD_RELOC_X86_64_GOTPCREL)
10856 i.reloc[this_operand] = BFD_RELOC_32_PCREL;
10857 else if (i.reloc[this_operand] == BFD_RELOC_X86_64_GOTOFF64)
10858 i.reloc[this_operand] = BFD_RELOC_64;
10859 else
10860 i.reloc[this_operand] = BFD_RELOC_32;
10861 }
10862
10863 else if (exp->X_op == O_absent
10864 || exp->X_op == O_illegal
10865 || exp->X_op == O_big)
10866 {
10867 inv_disp:
10868 as_bad (_("missing or invalid displacement expression `%s'"),
10869 disp_start);
10870 ret = 0;
10871 }
10872
10873 else if (flag_code == CODE_64BIT
10874 && !i.prefix[ADDR_PREFIX]
10875 && exp->X_op == O_constant)
10876 {
10877 /* Since displacement is signed extended to 64bit, don't allow
10878 disp32 and turn off disp32s if they are out of range. */
10879 i.types[this_operand].bitfield.disp32 = 0;
10880 if (!fits_in_signed_long (exp->X_add_number))
10881 {
10882 i.types[this_operand].bitfield.disp32s = 0;
10883 if (i.types[this_operand].bitfield.baseindex)
10884 {
10885 as_bad (_("0x%lx out range of signed 32bit displacement"),
10886 (long) exp->X_add_number);
10887 ret = 0;
10888 }
10889 }
10890 }
10891
10892 #if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
10893 else if (exp->X_op != O_constant
10894 && OUTPUT_FLAVOR == bfd_target_aout_flavour
10895 && exp_seg != absolute_section
10896 && exp_seg != text_section
10897 && exp_seg != data_section
10898 && exp_seg != bss_section
10899 && exp_seg != undefined_section
10900 && !bfd_is_com_section (exp_seg))
10901 {
10902 as_bad (_("unimplemented segment %s in operand"), exp_seg->name);
10903 ret = 0;
10904 }
10905 #endif
10906
10907 if (current_templates->start->opcode_modifier.jump == JUMP_BYTE
10908 /* Constants get taken care of by optimize_disp(). */
10909 && exp->X_op != O_constant)
10910 i.types[this_operand].bitfield.disp8 = 1;
10911
10912 /* Check if this is a displacement only operand. */
10913 bigdisp = i.types[this_operand];
10914 bigdisp.bitfield.disp8 = 0;
10915 bigdisp.bitfield.disp16 = 0;
10916 bigdisp.bitfield.disp32 = 0;
10917 bigdisp.bitfield.disp32s = 0;
10918 bigdisp.bitfield.disp64 = 0;
10919 if (operand_type_all_zero (&bigdisp))
10920 i.types[this_operand] = operand_type_and (i.types[this_operand],
10921 types);
10922
10923 return ret;
10924 }
10925
10926 /* Return the active addressing mode, taking address override and
10927 registers forming the address into consideration. Update the
10928 address override prefix if necessary. */
10929
10930 static enum flag_code
10931 i386_addressing_mode (void)
10932 {
10933 enum flag_code addr_mode;
10934
10935 if (i.prefix[ADDR_PREFIX])
10936 addr_mode = flag_code == CODE_32BIT ? CODE_16BIT : CODE_32BIT;
10937 else if (flag_code == CODE_16BIT
10938 && current_templates->start->cpu_flags.bitfield.cpumpx
10939 /* Avoid replacing the "16-bit addressing not allowed" diagnostic
10940 from md_assemble() by "is not a valid base/index expression"
10941 when there is a base and/or index. */
10942 && !i.types[this_operand].bitfield.baseindex)
10943 {
10944 /* MPX insn memory operands with neither base nor index must be forced
10945 to use 32-bit addressing in 16-bit mode. */
10946 addr_mode = CODE_32BIT;
10947 i.prefix[ADDR_PREFIX] = ADDR_PREFIX_OPCODE;
10948 ++i.prefixes;
10949 gas_assert (!i.types[this_operand].bitfield.disp16);
10950 gas_assert (!i.types[this_operand].bitfield.disp32);
10951 }
10952 else
10953 {
10954 addr_mode = flag_code;
10955
10956 #if INFER_ADDR_PREFIX
10957 if (i.mem_operands == 0)
10958 {
10959 /* Infer address prefix from the first memory operand. */
10960 const reg_entry *addr_reg = i.base_reg;
10961
10962 if (addr_reg == NULL)
10963 addr_reg = i.index_reg;
10964
10965 if (addr_reg)
10966 {
10967 if (addr_reg->reg_type.bitfield.dword)
10968 addr_mode = CODE_32BIT;
10969 else if (flag_code != CODE_64BIT
10970 && addr_reg->reg_type.bitfield.word)
10971 addr_mode = CODE_16BIT;
10972
10973 if (addr_mode != flag_code)
10974 {
10975 i.prefix[ADDR_PREFIX] = ADDR_PREFIX_OPCODE;
10976 i.prefixes += 1;
10977 /* Change the size of any displacement too. At most one
10978 of Disp16 or Disp32 is set.
10979 FIXME. There doesn't seem to be any real need for
10980 separate Disp16 and Disp32 flags. The same goes for
10981 Imm16 and Imm32. Removing them would probably clean
10982 up the code quite a lot. */
10983 if (flag_code != CODE_64BIT
10984 && (i.types[this_operand].bitfield.disp16
10985 || i.types[this_operand].bitfield.disp32))
10986 i.types[this_operand]
10987 = operand_type_xor (i.types[this_operand], disp16_32);
10988 }
10989 }
10990 }
10991 #endif
10992 }
10993
10994 return addr_mode;
10995 }
10996
10997 /* Make sure the memory operand we've been dealt is valid.
10998 Return 1 on success, 0 on a failure. */
10999
11000 static int
11001 i386_index_check (const char *operand_string)
11002 {
11003 const char *kind = "base/index";
11004 enum flag_code addr_mode = i386_addressing_mode ();
11005 const insn_template *t = current_templates->start;
11006
11007 if (t->opcode_modifier.isstring
11008 && !t->cpu_flags.bitfield.cpupadlock
11009 && (current_templates->end[-1].opcode_modifier.isstring
11010 || i.mem_operands))
11011 {
11012 /* Memory operands of string insns are special in that they only allow
11013 a single register (rDI, rSI, or rBX) as their memory address. */
11014 const reg_entry *expected_reg;
11015 static const char *di_si[][2] =
11016 {
11017 { "esi", "edi" },
11018 { "si", "di" },
11019 { "rsi", "rdi" }
11020 };
11021 static const char *bx[] = { "ebx", "bx", "rbx" };
11022
11023 kind = "string address";
11024
11025 if (t->opcode_modifier.prefixok == PrefixRep)
11026 {
11027 int es_op = current_templates->end[-1].opcode_modifier.isstring
11028 - IS_STRING_ES_OP0;
11029 int op = 0;
11030
11031 if (!current_templates->end[-1].operand_types[0].bitfield.baseindex
11032 || ((!i.mem_operands != !intel_syntax)
11033 && current_templates->end[-1].operand_types[1]
11034 .bitfield.baseindex))
11035 op = 1;
11036 expected_reg
11037 = (const reg_entry *) str_hash_find (reg_hash,
11038 di_si[addr_mode][op == es_op]);
11039 }
11040 else
11041 expected_reg
11042 = (const reg_entry *)str_hash_find (reg_hash, bx[addr_mode]);
11043
11044 if (i.base_reg != expected_reg
11045 || i.index_reg
11046 || operand_type_check (i.types[this_operand], disp))
11047 {
11048 /* The second memory operand must have the same size as
11049 the first one. */
11050 if (i.mem_operands
11051 && i.base_reg
11052 && !((addr_mode == CODE_64BIT
11053 && i.base_reg->reg_type.bitfield.qword)
11054 || (addr_mode == CODE_32BIT
11055 ? i.base_reg->reg_type.bitfield.dword
11056 : i.base_reg->reg_type.bitfield.word)))
11057 goto bad_address;
11058
11059 as_warn (_("`%s' is not valid here (expected `%c%s%s%c')"),
11060 operand_string,
11061 intel_syntax ? '[' : '(',
11062 register_prefix,
11063 expected_reg->reg_name,
11064 intel_syntax ? ']' : ')');
11065 return 1;
11066 }
11067 else
11068 return 1;
11069
11070 bad_address:
11071 as_bad (_("`%s' is not a valid %s expression"),
11072 operand_string, kind);
11073 return 0;
11074 }
11075 else
11076 {
11077 if (addr_mode != CODE_16BIT)
11078 {
11079 /* 32-bit/64-bit checks. */
11080 if (i.disp_encoding == disp_encoding_16bit)
11081 {
11082 bad_disp:
11083 as_bad (_("invalid `%s' prefix"),
11084 addr_mode == CODE_16BIT ? "{disp32}" : "{disp16}");
11085 return 0;
11086 }
11087
11088 if ((i.base_reg
11089 && ((addr_mode == CODE_64BIT
11090 ? !i.base_reg->reg_type.bitfield.qword
11091 : !i.base_reg->reg_type.bitfield.dword)
11092 || (i.index_reg && i.base_reg->reg_num == RegIP)
11093 || i.base_reg->reg_num == RegIZ))
11094 || (i.index_reg
11095 && !i.index_reg->reg_type.bitfield.xmmword
11096 && !i.index_reg->reg_type.bitfield.ymmword
11097 && !i.index_reg->reg_type.bitfield.zmmword
11098 && ((addr_mode == CODE_64BIT
11099 ? !i.index_reg->reg_type.bitfield.qword
11100 : !i.index_reg->reg_type.bitfield.dword)
11101 || !i.index_reg->reg_type.bitfield.baseindex)))
11102 goto bad_address;
11103
11104 /* bndmk, bndldx, bndstx and mandatory non-vector SIB have special restrictions. */
11105 if ((t->opcode_modifier.opcodeprefix == PREFIX_0XF3
11106 && t->base_opcode == 0x0f1b)
11107 || (t->opcode_modifier.opcodeprefix == PREFIX_NONE
11108 && (t->base_opcode & ~1) == 0x0f1a)
11109 || t->opcode_modifier.sib == SIBMEM)
11110 {
11111 /* They cannot use RIP-relative addressing. */
11112 if (i.base_reg && i.base_reg->reg_num == RegIP)
11113 {
11114 as_bad (_("`%s' cannot be used here"), operand_string);
11115 return 0;
11116 }
11117
11118 /* bndldx and bndstx ignore their scale factor. */
11119 if (t->opcode_modifier.opcodeprefix == PREFIX_NONE
11120 && (t->base_opcode & ~1) == 0x0f1a
11121 && i.log2_scale_factor)
11122 as_warn (_("register scaling is being ignored here"));
11123 }
11124 }
11125 else
11126 {
11127 /* 16-bit checks. */
11128 if (i.disp_encoding == disp_encoding_32bit)
11129 goto bad_disp;
11130
11131 if ((i.base_reg
11132 && (!i.base_reg->reg_type.bitfield.word
11133 || !i.base_reg->reg_type.bitfield.baseindex))
11134 || (i.index_reg
11135 && (!i.index_reg->reg_type.bitfield.word
11136 || !i.index_reg->reg_type.bitfield.baseindex
11137 || !(i.base_reg
11138 && i.base_reg->reg_num < 6
11139 && i.index_reg->reg_num >= 6
11140 && i.log2_scale_factor == 0))))
11141 goto bad_address;
11142 }
11143 }
11144 return 1;
11145 }
11146
11147 /* Handle vector immediates. */
11148
11149 static int
11150 RC_SAE_immediate (const char *imm_start)
11151 {
11152 unsigned int match_found, j;
11153 const char *pstr = imm_start;
11154 expressionS *exp;
11155
11156 if (*pstr != '{')
11157 return 0;
11158
11159 pstr++;
11160 match_found = 0;
11161 for (j = 0; j < ARRAY_SIZE (RC_NamesTable); j++)
11162 {
11163 if (!strncmp (pstr, RC_NamesTable[j].name, RC_NamesTable[j].len))
11164 {
11165 if (!i.rounding)
11166 {
11167 rc_op.type = RC_NamesTable[j].type;
11168 rc_op.operand = this_operand;
11169 i.rounding = &rc_op;
11170 }
11171 else
11172 {
11173 as_bad (_("duplicated `%s'"), imm_start);
11174 return 0;
11175 }
11176 pstr += RC_NamesTable[j].len;
11177 match_found = 1;
11178 break;
11179 }
11180 }
11181 if (!match_found)
11182 return 0;
11183
11184 if (*pstr++ != '}')
11185 {
11186 as_bad (_("Missing '}': '%s'"), imm_start);
11187 return 0;
11188 }
11189 /* RC/SAE immediate string should contain nothing more. */;
11190 if (*pstr != 0)
11191 {
11192 as_bad (_("Junk after '}': '%s'"), imm_start);
11193 return 0;
11194 }
11195
11196 exp = &im_expressions[i.imm_operands++];
11197 i.op[this_operand].imms = exp;
11198
11199 exp->X_op = O_constant;
11200 exp->X_add_number = 0;
11201 exp->X_add_symbol = (symbolS *) 0;
11202 exp->X_op_symbol = (symbolS *) 0;
11203
11204 i.types[this_operand].bitfield.imm8 = 1;
11205 return 1;
11206 }
11207
11208 /* Only string instructions can have a second memory operand, so
11209 reduce current_templates to just those if it contains any. */
11210 static int
11211 maybe_adjust_templates (void)
11212 {
11213 const insn_template *t;
11214
11215 gas_assert (i.mem_operands == 1);
11216
11217 for (t = current_templates->start; t < current_templates->end; ++t)
11218 if (t->opcode_modifier.isstring)
11219 break;
11220
11221 if (t < current_templates->end)
11222 {
11223 static templates aux_templates;
11224 bfd_boolean recheck;
11225
11226 aux_templates.start = t;
11227 for (; t < current_templates->end; ++t)
11228 if (!t->opcode_modifier.isstring)
11229 break;
11230 aux_templates.end = t;
11231
11232 /* Determine whether to re-check the first memory operand. */
11233 recheck = (aux_templates.start != current_templates->start
11234 || t != current_templates->end);
11235
11236 current_templates = &aux_templates;
11237
11238 if (recheck)
11239 {
11240 i.mem_operands = 0;
11241 if (i.memop1_string != NULL
11242 && i386_index_check (i.memop1_string) == 0)
11243 return 0;
11244 i.mem_operands = 1;
11245 }
11246 }
11247
11248 return 1;
11249 }
11250
11251 /* Parse OPERAND_STRING into the i386_insn structure I. Returns zero
11252 on error. */
11253
11254 static int
11255 i386_att_operand (char *operand_string)
11256 {
11257 const reg_entry *r;
11258 char *end_op;
11259 char *op_string = operand_string;
11260
11261 if (is_space_char (*op_string))
11262 ++op_string;
11263
11264 /* We check for an absolute prefix (differentiating,
11265 for example, 'jmp pc_relative_label' from 'jmp *absolute_label'. */
11266 if (*op_string == ABSOLUTE_PREFIX)
11267 {
11268 ++op_string;
11269 if (is_space_char (*op_string))
11270 ++op_string;
11271 i.jumpabsolute = TRUE;
11272 }
11273
11274 /* Check if operand is a register. */
11275 if ((r = parse_register (op_string, &end_op)) != NULL)
11276 {
11277 i386_operand_type temp;
11278
11279 if (r == &bad_reg)
11280 return 0;
11281
11282 /* Check for a segment override by searching for ':' after a
11283 segment register. */
11284 op_string = end_op;
11285 if (is_space_char (*op_string))
11286 ++op_string;
11287 if (*op_string == ':' && r->reg_type.bitfield.class == SReg)
11288 {
11289 switch (r->reg_num)
11290 {
11291 case 0:
11292 i.seg[i.mem_operands] = &es;
11293 break;
11294 case 1:
11295 i.seg[i.mem_operands] = &cs;
11296 break;
11297 case 2:
11298 i.seg[i.mem_operands] = &ss;
11299 break;
11300 case 3:
11301 i.seg[i.mem_operands] = &ds;
11302 break;
11303 case 4:
11304 i.seg[i.mem_operands] = &fs;
11305 break;
11306 case 5:
11307 i.seg[i.mem_operands] = &gs;
11308 break;
11309 }
11310
11311 /* Skip the ':' and whitespace. */
11312 ++op_string;
11313 if (is_space_char (*op_string))
11314 ++op_string;
11315
11316 if (!is_digit_char (*op_string)
11317 && !is_identifier_char (*op_string)
11318 && *op_string != '('
11319 && *op_string != ABSOLUTE_PREFIX)
11320 {
11321 as_bad (_("bad memory operand `%s'"), op_string);
11322 return 0;
11323 }
11324 /* Handle case of %es:*foo. */
11325 if (*op_string == ABSOLUTE_PREFIX)
11326 {
11327 ++op_string;
11328 if (is_space_char (*op_string))
11329 ++op_string;
11330 i.jumpabsolute = TRUE;
11331 }
11332 goto do_memory_reference;
11333 }
11334
11335 /* Handle vector operations. */
11336 if (*op_string == '{')
11337 {
11338 op_string = check_VecOperations (op_string, NULL);
11339 if (op_string == NULL)
11340 return 0;
11341 }
11342
11343 if (*op_string)
11344 {
11345 as_bad (_("junk `%s' after register"), op_string);
11346 return 0;
11347 }
11348 temp = r->reg_type;
11349 temp.bitfield.baseindex = 0;
11350 i.types[this_operand] = operand_type_or (i.types[this_operand],
11351 temp);
11352 i.types[this_operand].bitfield.unspecified = 0;
11353 i.op[this_operand].regs = r;
11354 i.reg_operands++;
11355 }
11356 else if (*op_string == REGISTER_PREFIX)
11357 {
11358 as_bad (_("bad register name `%s'"), op_string);
11359 return 0;
11360 }
11361 else if (*op_string == IMMEDIATE_PREFIX)
11362 {
11363 ++op_string;
11364 if (i.jumpabsolute)
11365 {
11366 as_bad (_("immediate operand illegal with absolute jump"));
11367 return 0;
11368 }
11369 if (!i386_immediate (op_string))
11370 return 0;
11371 }
11372 else if (RC_SAE_immediate (operand_string))
11373 {
11374 /* If it is a RC or SAE immediate, do nothing. */
11375 ;
11376 }
11377 else if (is_digit_char (*op_string)
11378 || is_identifier_char (*op_string)
11379 || *op_string == '"'
11380 || *op_string == '(')
11381 {
11382 /* This is a memory reference of some sort. */
11383 char *base_string;
11384
11385 /* Start and end of displacement string expression (if found). */
11386 char *displacement_string_start;
11387 char *displacement_string_end;
11388 char *vop_start;
11389
11390 do_memory_reference:
11391 if (i.mem_operands == 1 && !maybe_adjust_templates ())
11392 return 0;
11393 if ((i.mem_operands == 1
11394 && !current_templates->start->opcode_modifier.isstring)
11395 || i.mem_operands == 2)
11396 {
11397 as_bad (_("too many memory references for `%s'"),
11398 current_templates->start->name);
11399 return 0;
11400 }
11401
11402 /* Check for base index form. We detect the base index form by
11403 looking for an ')' at the end of the operand, searching
11404 for the '(' matching it, and finding a REGISTER_PREFIX or ','
11405 after the '('. */
11406 base_string = op_string + strlen (op_string);
11407
11408 /* Handle vector operations. */
11409 vop_start = strchr (op_string, '{');
11410 if (vop_start && vop_start < base_string)
11411 {
11412 if (check_VecOperations (vop_start, base_string) == NULL)
11413 return 0;
11414 base_string = vop_start;
11415 }
11416
11417 --base_string;
11418 if (is_space_char (*base_string))
11419 --base_string;
11420
11421 /* If we only have a displacement, set-up for it to be parsed later. */
11422 displacement_string_start = op_string;
11423 displacement_string_end = base_string + 1;
11424
11425 if (*base_string == ')')
11426 {
11427 char *temp_string;
11428 unsigned int parens_balanced = 1;
11429 /* We've already checked that the number of left & right ()'s are
11430 equal, so this loop will not be infinite. */
11431 do
11432 {
11433 base_string--;
11434 if (*base_string == ')')
11435 parens_balanced++;
11436 if (*base_string == '(')
11437 parens_balanced--;
11438 }
11439 while (parens_balanced);
11440
11441 temp_string = base_string;
11442
11443 /* Skip past '(' and whitespace. */
11444 ++base_string;
11445 if (is_space_char (*base_string))
11446 ++base_string;
11447
11448 if (*base_string == ','
11449 || ((i.base_reg = parse_register (base_string, &end_op))
11450 != NULL))
11451 {
11452 displacement_string_end = temp_string;
11453
11454 i.types[this_operand].bitfield.baseindex = 1;
11455
11456 if (i.base_reg)
11457 {
11458 if (i.base_reg == &bad_reg)
11459 return 0;
11460 base_string = end_op;
11461 if (is_space_char (*base_string))
11462 ++base_string;
11463 }
11464
11465 /* There may be an index reg or scale factor here. */
11466 if (*base_string == ',')
11467 {
11468 ++base_string;
11469 if (is_space_char (*base_string))
11470 ++base_string;
11471
11472 if ((i.index_reg = parse_register (base_string, &end_op))
11473 != NULL)
11474 {
11475 if (i.index_reg == &bad_reg)
11476 return 0;
11477 base_string = end_op;
11478 if (is_space_char (*base_string))
11479 ++base_string;
11480 if (*base_string == ',')
11481 {
11482 ++base_string;
11483 if (is_space_char (*base_string))
11484 ++base_string;
11485 }
11486 else if (*base_string != ')')
11487 {
11488 as_bad (_("expecting `,' or `)' "
11489 "after index register in `%s'"),
11490 operand_string);
11491 return 0;
11492 }
11493 }
11494 else if (*base_string == REGISTER_PREFIX)
11495 {
11496 end_op = strchr (base_string, ',');
11497 if (end_op)
11498 *end_op = '\0';
11499 as_bad (_("bad register name `%s'"), base_string);
11500 return 0;
11501 }
11502
11503 /* Check for scale factor. */
11504 if (*base_string != ')')
11505 {
11506 char *end_scale = i386_scale (base_string);
11507
11508 if (!end_scale)
11509 return 0;
11510
11511 base_string = end_scale;
11512 if (is_space_char (*base_string))
11513 ++base_string;
11514 if (*base_string != ')')
11515 {
11516 as_bad (_("expecting `)' "
11517 "after scale factor in `%s'"),
11518 operand_string);
11519 return 0;
11520 }
11521 }
11522 else if (!i.index_reg)
11523 {
11524 as_bad (_("expecting index register or scale factor "
11525 "after `,'; got '%c'"),
11526 *base_string);
11527 return 0;
11528 }
11529 }
11530 else if (*base_string != ')')
11531 {
11532 as_bad (_("expecting `,' or `)' "
11533 "after base register in `%s'"),
11534 operand_string);
11535 return 0;
11536 }
11537 }
11538 else if (*base_string == REGISTER_PREFIX)
11539 {
11540 end_op = strchr (base_string, ',');
11541 if (end_op)
11542 *end_op = '\0';
11543 as_bad (_("bad register name `%s'"), base_string);
11544 return 0;
11545 }
11546 }
11547
11548 /* If there's an expression beginning the operand, parse it,
11549 assuming displacement_string_start and
11550 displacement_string_end are meaningful. */
11551 if (displacement_string_start != displacement_string_end)
11552 {
11553 if (!i386_displacement (displacement_string_start,
11554 displacement_string_end))
11555 return 0;
11556 }
11557
11558 /* Special case for (%dx) while doing input/output op. */
11559 if (i.base_reg
11560 && i.base_reg->reg_type.bitfield.instance == RegD
11561 && i.base_reg->reg_type.bitfield.word
11562 && i.index_reg == 0
11563 && i.log2_scale_factor == 0
11564 && i.seg[i.mem_operands] == 0
11565 && !operand_type_check (i.types[this_operand], disp))
11566 {
11567 i.types[this_operand] = i.base_reg->reg_type;
11568 return 1;
11569 }
11570
11571 if (i386_index_check (operand_string) == 0)
11572 return 0;
11573 i.flags[this_operand] |= Operand_Mem;
11574 if (i.mem_operands == 0)
11575 i.memop1_string = xstrdup (operand_string);
11576 i.mem_operands++;
11577 }
11578 else
11579 {
11580 /* It's not a memory operand; argh! */
11581 as_bad (_("invalid char %s beginning operand %d `%s'"),
11582 output_invalid (*op_string),
11583 this_operand + 1,
11584 op_string);
11585 return 0;
11586 }
11587 return 1; /* Normal return. */
11588 }
11589 \f
11590 /* Calculate the maximum variable size (i.e., excluding fr_fix)
11591 that an rs_machine_dependent frag may reach. */
11592
11593 unsigned int
11594 i386_frag_max_var (fragS *frag)
11595 {
11596 /* The only relaxable frags are for jumps.
11597 Unconditional jumps can grow by 4 bytes and others by 5 bytes. */
11598 gas_assert (frag->fr_type == rs_machine_dependent);
11599 return TYPE_FROM_RELAX_STATE (frag->fr_subtype) == UNCOND_JUMP ? 4 : 5;
11600 }
11601
11602 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
11603 static int
11604 elf_symbol_resolved_in_segment_p (symbolS *fr_symbol, offsetT fr_var)
11605 {
11606 /* STT_GNU_IFUNC symbol must go through PLT. */
11607 if ((symbol_get_bfdsym (fr_symbol)->flags
11608 & BSF_GNU_INDIRECT_FUNCTION) != 0)
11609 return 0;
11610
11611 if (!S_IS_EXTERNAL (fr_symbol))
11612 /* Symbol may be weak or local. */
11613 return !S_IS_WEAK (fr_symbol);
11614
11615 /* Global symbols with non-default visibility can't be preempted. */
11616 if (ELF_ST_VISIBILITY (S_GET_OTHER (fr_symbol)) != STV_DEFAULT)
11617 return 1;
11618
11619 if (fr_var != NO_RELOC)
11620 switch ((enum bfd_reloc_code_real) fr_var)
11621 {
11622 case BFD_RELOC_386_PLT32:
11623 case BFD_RELOC_X86_64_PLT32:
11624 /* Symbol with PLT relocation may be preempted. */
11625 return 0;
11626 default:
11627 abort ();
11628 }
11629
11630 /* Global symbols with default visibility in a shared library may be
11631 preempted by another definition. */
11632 return !shared;
11633 }
11634 #endif
11635
11636 /* Table 3-2. Macro-Fusible Instructions in Haswell Microarchitecture
11637 Note also work for Skylake and Cascadelake.
11638 ---------------------------------------------------------------------
11639 | JCC | ADD/SUB/CMP | INC/DEC | TEST/AND |
11640 | ------ | ----------- | ------- | -------- |
11641 | Jo | N | N | Y |
11642 | Jno | N | N | Y |
11643 | Jc/Jb | Y | N | Y |
11644 | Jae/Jnb | Y | N | Y |
11645 | Je/Jz | Y | Y | Y |
11646 | Jne/Jnz | Y | Y | Y |
11647 | Jna/Jbe | Y | N | Y |
11648 | Ja/Jnbe | Y | N | Y |
11649 | Js | N | N | Y |
11650 | Jns | N | N | Y |
11651 | Jp/Jpe | N | N | Y |
11652 | Jnp/Jpo | N | N | Y |
11653 | Jl/Jnge | Y | Y | Y |
11654 | Jge/Jnl | Y | Y | Y |
11655 | Jle/Jng | Y | Y | Y |
11656 | Jg/Jnle | Y | Y | Y |
11657 --------------------------------------------------------------------- */
11658 static int
11659 i386_macro_fusible_p (enum mf_cmp_kind mf_cmp, enum mf_jcc_kind mf_jcc)
11660 {
11661 if (mf_cmp == mf_cmp_alu_cmp)
11662 return ((mf_jcc >= mf_jcc_jc && mf_jcc <= mf_jcc_jna)
11663 || mf_jcc == mf_jcc_jl || mf_jcc == mf_jcc_jle);
11664 if (mf_cmp == mf_cmp_incdec)
11665 return (mf_jcc == mf_jcc_je || mf_jcc == mf_jcc_jl
11666 || mf_jcc == mf_jcc_jle);
11667 if (mf_cmp == mf_cmp_test_and)
11668 return 1;
11669 return 0;
11670 }
11671
11672 /* Return the next non-empty frag. */
11673
11674 static fragS *
11675 i386_next_non_empty_frag (fragS *fragP)
11676 {
11677 /* There may be a frag with a ".fill 0" when there is no room in
11678 the current frag for frag_grow in output_insn. */
11679 for (fragP = fragP->fr_next;
11680 (fragP != NULL
11681 && fragP->fr_type == rs_fill
11682 && fragP->fr_fix == 0);
11683 fragP = fragP->fr_next)
11684 ;
11685 return fragP;
11686 }
11687
11688 /* Return the next jcc frag after BRANCH_PADDING. */
11689
11690 static fragS *
11691 i386_next_fusible_jcc_frag (fragS *maybe_cmp_fragP, fragS *pad_fragP)
11692 {
11693 fragS *branch_fragP;
11694 if (!pad_fragP)
11695 return NULL;
11696
11697 if (pad_fragP->fr_type == rs_machine_dependent
11698 && (TYPE_FROM_RELAX_STATE (pad_fragP->fr_subtype)
11699 == BRANCH_PADDING))
11700 {
11701 branch_fragP = i386_next_non_empty_frag (pad_fragP);
11702 if (branch_fragP->fr_type != rs_machine_dependent)
11703 return NULL;
11704 if (TYPE_FROM_RELAX_STATE (branch_fragP->fr_subtype) == COND_JUMP
11705 && i386_macro_fusible_p (maybe_cmp_fragP->tc_frag_data.mf_type,
11706 pad_fragP->tc_frag_data.mf_type))
11707 return branch_fragP;
11708 }
11709
11710 return NULL;
11711 }
11712
11713 /* Classify BRANCH_PADDING, BRANCH_PREFIX and FUSED_JCC_PADDING frags. */
11714
11715 static void
11716 i386_classify_machine_dependent_frag (fragS *fragP)
11717 {
11718 fragS *cmp_fragP;
11719 fragS *pad_fragP;
11720 fragS *branch_fragP;
11721 fragS *next_fragP;
11722 unsigned int max_prefix_length;
11723
11724 if (fragP->tc_frag_data.classified)
11725 return;
11726
11727 /* First scan for BRANCH_PADDING and FUSED_JCC_PADDING. Convert
11728 FUSED_JCC_PADDING and merge BRANCH_PADDING. */
11729 for (next_fragP = fragP;
11730 next_fragP != NULL;
11731 next_fragP = next_fragP->fr_next)
11732 {
11733 next_fragP->tc_frag_data.classified = 1;
11734 if (next_fragP->fr_type == rs_machine_dependent)
11735 switch (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype))
11736 {
11737 case BRANCH_PADDING:
11738 /* The BRANCH_PADDING frag must be followed by a branch
11739 frag. */
11740 branch_fragP = i386_next_non_empty_frag (next_fragP);
11741 next_fragP->tc_frag_data.u.branch_fragP = branch_fragP;
11742 break;
11743 case FUSED_JCC_PADDING:
11744 /* Check if this is a fused jcc:
11745 FUSED_JCC_PADDING
11746 CMP like instruction
11747 BRANCH_PADDING
11748 COND_JUMP
11749 */
11750 cmp_fragP = i386_next_non_empty_frag (next_fragP);
11751 pad_fragP = i386_next_non_empty_frag (cmp_fragP);
11752 branch_fragP = i386_next_fusible_jcc_frag (next_fragP, pad_fragP);
11753 if (branch_fragP)
11754 {
11755 /* The BRANCH_PADDING frag is merged with the
11756 FUSED_JCC_PADDING frag. */
11757 next_fragP->tc_frag_data.u.branch_fragP = branch_fragP;
11758 /* CMP like instruction size. */
11759 next_fragP->tc_frag_data.cmp_size = cmp_fragP->fr_fix;
11760 frag_wane (pad_fragP);
11761 /* Skip to branch_fragP. */
11762 next_fragP = branch_fragP;
11763 }
11764 else if (next_fragP->tc_frag_data.max_prefix_length)
11765 {
11766 /* Turn FUSED_JCC_PADDING into BRANCH_PREFIX if it isn't
11767 a fused jcc. */
11768 next_fragP->fr_subtype
11769 = ENCODE_RELAX_STATE (BRANCH_PREFIX, 0);
11770 next_fragP->tc_frag_data.max_bytes
11771 = next_fragP->tc_frag_data.max_prefix_length;
11772 /* This will be updated in the BRANCH_PREFIX scan. */
11773 next_fragP->tc_frag_data.max_prefix_length = 0;
11774 }
11775 else
11776 frag_wane (next_fragP);
11777 break;
11778 }
11779 }
11780
11781 /* Stop if there is no BRANCH_PREFIX. */
11782 if (!align_branch_prefix_size)
11783 return;
11784
11785 /* Scan for BRANCH_PREFIX. */
11786 for (; fragP != NULL; fragP = fragP->fr_next)
11787 {
11788 if (fragP->fr_type != rs_machine_dependent
11789 || (TYPE_FROM_RELAX_STATE (fragP->fr_subtype)
11790 != BRANCH_PREFIX))
11791 continue;
11792
11793 /* Count all BRANCH_PREFIX frags before BRANCH_PADDING and
11794 COND_JUMP_PREFIX. */
11795 max_prefix_length = 0;
11796 for (next_fragP = fragP;
11797 next_fragP != NULL;
11798 next_fragP = next_fragP->fr_next)
11799 {
11800 if (next_fragP->fr_type == rs_fill)
11801 /* Skip rs_fill frags. */
11802 continue;
11803 else if (next_fragP->fr_type != rs_machine_dependent)
11804 /* Stop for all other frags. */
11805 break;
11806
11807 /* rs_machine_dependent frags. */
11808 if (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
11809 == BRANCH_PREFIX)
11810 {
11811 /* Count BRANCH_PREFIX frags. */
11812 if (max_prefix_length >= MAX_FUSED_JCC_PADDING_SIZE)
11813 {
11814 max_prefix_length = MAX_FUSED_JCC_PADDING_SIZE;
11815 frag_wane (next_fragP);
11816 }
11817 else
11818 max_prefix_length
11819 += next_fragP->tc_frag_data.max_bytes;
11820 }
11821 else if ((TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
11822 == BRANCH_PADDING)
11823 || (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
11824 == FUSED_JCC_PADDING))
11825 {
11826 /* Stop at BRANCH_PADDING and FUSED_JCC_PADDING. */
11827 fragP->tc_frag_data.u.padding_fragP = next_fragP;
11828 break;
11829 }
11830 else
11831 /* Stop for other rs_machine_dependent frags. */
11832 break;
11833 }
11834
11835 fragP->tc_frag_data.max_prefix_length = max_prefix_length;
11836
11837 /* Skip to the next frag. */
11838 fragP = next_fragP;
11839 }
11840 }
11841
11842 /* Compute padding size for
11843
11844 FUSED_JCC_PADDING
11845 CMP like instruction
11846 BRANCH_PADDING
11847 COND_JUMP/UNCOND_JUMP
11848
11849 or
11850
11851 BRANCH_PADDING
11852 COND_JUMP/UNCOND_JUMP
11853 */
11854
11855 static int
11856 i386_branch_padding_size (fragS *fragP, offsetT address)
11857 {
11858 unsigned int offset, size, padding_size;
11859 fragS *branch_fragP = fragP->tc_frag_data.u.branch_fragP;
11860
11861 /* The start address of the BRANCH_PADDING or FUSED_JCC_PADDING frag. */
11862 if (!address)
11863 address = fragP->fr_address;
11864 address += fragP->fr_fix;
11865
11866 /* CMP like instrunction size. */
11867 size = fragP->tc_frag_data.cmp_size;
11868
11869 /* The base size of the branch frag. */
11870 size += branch_fragP->fr_fix;
11871
11872 /* Add opcode and displacement bytes for the rs_machine_dependent
11873 branch frag. */
11874 if (branch_fragP->fr_type == rs_machine_dependent)
11875 size += md_relax_table[branch_fragP->fr_subtype].rlx_length;
11876
11877 /* Check if branch is within boundary and doesn't end at the last
11878 byte. */
11879 offset = address & ((1U << align_branch_power) - 1);
11880 if ((offset + size) >= (1U << align_branch_power))
11881 /* Padding needed to avoid crossing boundary. */
11882 padding_size = (1U << align_branch_power) - offset;
11883 else
11884 /* No padding needed. */
11885 padding_size = 0;
11886
11887 /* The return value may be saved in tc_frag_data.length which is
11888 unsigned byte. */
11889 if (!fits_in_unsigned_byte (padding_size))
11890 abort ();
11891
11892 return padding_size;
11893 }
11894
11895 /* i386_generic_table_relax_frag()
11896
11897 Handle BRANCH_PADDING, BRANCH_PREFIX and FUSED_JCC_PADDING frags to
11898 grow/shrink padding to align branch frags. Hand others to
11899 relax_frag(). */
11900
11901 long
11902 i386_generic_table_relax_frag (segT segment, fragS *fragP, long stretch)
11903 {
11904 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PADDING
11905 || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == FUSED_JCC_PADDING)
11906 {
11907 long padding_size = i386_branch_padding_size (fragP, 0);
11908 long grow = padding_size - fragP->tc_frag_data.length;
11909
11910 /* When the BRANCH_PREFIX frag is used, the computed address
11911 must match the actual address and there should be no padding. */
11912 if (fragP->tc_frag_data.padding_address
11913 && (fragP->tc_frag_data.padding_address != fragP->fr_address
11914 || padding_size))
11915 abort ();
11916
11917 /* Update the padding size. */
11918 if (grow)
11919 fragP->tc_frag_data.length = padding_size;
11920
11921 return grow;
11922 }
11923 else if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PREFIX)
11924 {
11925 fragS *padding_fragP, *next_fragP;
11926 long padding_size, left_size, last_size;
11927
11928 padding_fragP = fragP->tc_frag_data.u.padding_fragP;
11929 if (!padding_fragP)
11930 /* Use the padding set by the leading BRANCH_PREFIX frag. */
11931 return (fragP->tc_frag_data.length
11932 - fragP->tc_frag_data.last_length);
11933
11934 /* Compute the relative address of the padding frag in the very
11935 first time where the BRANCH_PREFIX frag sizes are zero. */
11936 if (!fragP->tc_frag_data.padding_address)
11937 fragP->tc_frag_data.padding_address
11938 = padding_fragP->fr_address - (fragP->fr_address - stretch);
11939
11940 /* First update the last length from the previous interation. */
11941 left_size = fragP->tc_frag_data.prefix_length;
11942 for (next_fragP = fragP;
11943 next_fragP != padding_fragP;
11944 next_fragP = next_fragP->fr_next)
11945 if (next_fragP->fr_type == rs_machine_dependent
11946 && (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
11947 == BRANCH_PREFIX))
11948 {
11949 if (left_size)
11950 {
11951 int max = next_fragP->tc_frag_data.max_bytes;
11952 if (max)
11953 {
11954 int size;
11955 if (max > left_size)
11956 size = left_size;
11957 else
11958 size = max;
11959 left_size -= size;
11960 next_fragP->tc_frag_data.last_length = size;
11961 }
11962 }
11963 else
11964 next_fragP->tc_frag_data.last_length = 0;
11965 }
11966
11967 /* Check the padding size for the padding frag. */
11968 padding_size = i386_branch_padding_size
11969 (padding_fragP, (fragP->fr_address
11970 + fragP->tc_frag_data.padding_address));
11971
11972 last_size = fragP->tc_frag_data.prefix_length;
11973 /* Check if there is change from the last interation. */
11974 if (padding_size == last_size)
11975 {
11976 /* Update the expected address of the padding frag. */
11977 padding_fragP->tc_frag_data.padding_address
11978 = (fragP->fr_address + padding_size
11979 + fragP->tc_frag_data.padding_address);
11980 return 0;
11981 }
11982
11983 if (padding_size > fragP->tc_frag_data.max_prefix_length)
11984 {
11985 /* No padding if there is no sufficient room. Clear the
11986 expected address of the padding frag. */
11987 padding_fragP->tc_frag_data.padding_address = 0;
11988 padding_size = 0;
11989 }
11990 else
11991 /* Store the expected address of the padding frag. */
11992 padding_fragP->tc_frag_data.padding_address
11993 = (fragP->fr_address + padding_size
11994 + fragP->tc_frag_data.padding_address);
11995
11996 fragP->tc_frag_data.prefix_length = padding_size;
11997
11998 /* Update the length for the current interation. */
11999 left_size = padding_size;
12000 for (next_fragP = fragP;
12001 next_fragP != padding_fragP;
12002 next_fragP = next_fragP->fr_next)
12003 if (next_fragP->fr_type == rs_machine_dependent
12004 && (TYPE_FROM_RELAX_STATE (next_fragP->fr_subtype)
12005 == BRANCH_PREFIX))
12006 {
12007 if (left_size)
12008 {
12009 int max = next_fragP->tc_frag_data.max_bytes;
12010 if (max)
12011 {
12012 int size;
12013 if (max > left_size)
12014 size = left_size;
12015 else
12016 size = max;
12017 left_size -= size;
12018 next_fragP->tc_frag_data.length = size;
12019 }
12020 }
12021 else
12022 next_fragP->tc_frag_data.length = 0;
12023 }
12024
12025 return (fragP->tc_frag_data.length
12026 - fragP->tc_frag_data.last_length);
12027 }
12028 return relax_frag (segment, fragP, stretch);
12029 }
12030
12031 /* md_estimate_size_before_relax()
12032
12033 Called just before relax() for rs_machine_dependent frags. The x86
12034 assembler uses these frags to handle variable size jump
12035 instructions.
12036
12037 Any symbol that is now undefined will not become defined.
12038 Return the correct fr_subtype in the frag.
12039 Return the initial "guess for variable size of frag" to caller.
12040 The guess is actually the growth beyond the fixed part. Whatever
12041 we do to grow the fixed or variable part contributes to our
12042 returned value. */
12043
12044 int
12045 md_estimate_size_before_relax (fragS *fragP, segT segment)
12046 {
12047 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PADDING
12048 || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PREFIX
12049 || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == FUSED_JCC_PADDING)
12050 {
12051 i386_classify_machine_dependent_frag (fragP);
12052 return fragP->tc_frag_data.length;
12053 }
12054
12055 /* We've already got fragP->fr_subtype right; all we have to do is
12056 check for un-relaxable symbols. On an ELF system, we can't relax
12057 an externally visible symbol, because it may be overridden by a
12058 shared library. */
12059 if (S_GET_SEGMENT (fragP->fr_symbol) != segment
12060 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12061 || (IS_ELF
12062 && !elf_symbol_resolved_in_segment_p (fragP->fr_symbol,
12063 fragP->fr_var))
12064 #endif
12065 #if defined (OBJ_COFF) && defined (TE_PE)
12066 || (OUTPUT_FLAVOR == bfd_target_coff_flavour
12067 && S_IS_WEAK (fragP->fr_symbol))
12068 #endif
12069 )
12070 {
12071 /* Symbol is undefined in this segment, or we need to keep a
12072 reloc so that weak symbols can be overridden. */
12073 int size = (fragP->fr_subtype & CODE16) ? 2 : 4;
12074 enum bfd_reloc_code_real reloc_type;
12075 unsigned char *opcode;
12076 int old_fr_fix;
12077
12078 if (fragP->fr_var != NO_RELOC)
12079 reloc_type = (enum bfd_reloc_code_real) fragP->fr_var;
12080 else if (size == 2)
12081 reloc_type = BFD_RELOC_16_PCREL;
12082 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12083 else if (need_plt32_p (fragP->fr_symbol))
12084 reloc_type = BFD_RELOC_X86_64_PLT32;
12085 #endif
12086 else
12087 reloc_type = BFD_RELOC_32_PCREL;
12088
12089 old_fr_fix = fragP->fr_fix;
12090 opcode = (unsigned char *) fragP->fr_opcode;
12091
12092 switch (TYPE_FROM_RELAX_STATE (fragP->fr_subtype))
12093 {
12094 case UNCOND_JUMP:
12095 /* Make jmp (0xeb) a (d)word displacement jump. */
12096 opcode[0] = 0xe9;
12097 fragP->fr_fix += size;
12098 fix_new (fragP, old_fr_fix, size,
12099 fragP->fr_symbol,
12100 fragP->fr_offset, 1,
12101 reloc_type);
12102 break;
12103
12104 case COND_JUMP86:
12105 if (size == 2
12106 && (!no_cond_jump_promotion || fragP->fr_var != NO_RELOC))
12107 {
12108 /* Negate the condition, and branch past an
12109 unconditional jump. */
12110 opcode[0] ^= 1;
12111 opcode[1] = 3;
12112 /* Insert an unconditional jump. */
12113 opcode[2] = 0xe9;
12114 /* We added two extra opcode bytes, and have a two byte
12115 offset. */
12116 fragP->fr_fix += 2 + 2;
12117 fix_new (fragP, old_fr_fix + 2, 2,
12118 fragP->fr_symbol,
12119 fragP->fr_offset, 1,
12120 reloc_type);
12121 break;
12122 }
12123 /* Fall through. */
12124
12125 case COND_JUMP:
12126 if (no_cond_jump_promotion && fragP->fr_var == NO_RELOC)
12127 {
12128 fixS *fixP;
12129
12130 fragP->fr_fix += 1;
12131 fixP = fix_new (fragP, old_fr_fix, 1,
12132 fragP->fr_symbol,
12133 fragP->fr_offset, 1,
12134 BFD_RELOC_8_PCREL);
12135 fixP->fx_signed = 1;
12136 break;
12137 }
12138
12139 /* This changes the byte-displacement jump 0x7N
12140 to the (d)word-displacement jump 0x0f,0x8N. */
12141 opcode[1] = opcode[0] + 0x10;
12142 opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
12143 /* We've added an opcode byte. */
12144 fragP->fr_fix += 1 + size;
12145 fix_new (fragP, old_fr_fix + 1, size,
12146 fragP->fr_symbol,
12147 fragP->fr_offset, 1,
12148 reloc_type);
12149 break;
12150
12151 default:
12152 BAD_CASE (fragP->fr_subtype);
12153 break;
12154 }
12155 frag_wane (fragP);
12156 return fragP->fr_fix - old_fr_fix;
12157 }
12158
12159 /* Guess size depending on current relax state. Initially the relax
12160 state will correspond to a short jump and we return 1, because
12161 the variable part of the frag (the branch offset) is one byte
12162 long. However, we can relax a section more than once and in that
12163 case we must either set fr_subtype back to the unrelaxed state,
12164 or return the value for the appropriate branch. */
12165 return md_relax_table[fragP->fr_subtype].rlx_length;
12166 }
12167
12168 /* Called after relax() is finished.
12169
12170 In: Address of frag.
12171 fr_type == rs_machine_dependent.
12172 fr_subtype is what the address relaxed to.
12173
12174 Out: Any fixSs and constants are set up.
12175 Caller will turn frag into a ".space 0". */
12176
12177 void
12178 md_convert_frag (bfd *abfd ATTRIBUTE_UNUSED, segT sec ATTRIBUTE_UNUSED,
12179 fragS *fragP)
12180 {
12181 unsigned char *opcode;
12182 unsigned char *where_to_put_displacement = NULL;
12183 offsetT target_address;
12184 offsetT opcode_address;
12185 unsigned int extension = 0;
12186 offsetT displacement_from_opcode_start;
12187
12188 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PADDING
12189 || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == FUSED_JCC_PADDING
12190 || TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PREFIX)
12191 {
12192 /* Generate nop padding. */
12193 unsigned int size = fragP->tc_frag_data.length;
12194 if (size)
12195 {
12196 if (size > fragP->tc_frag_data.max_bytes)
12197 abort ();
12198
12199 if (flag_debug)
12200 {
12201 const char *msg;
12202 const char *branch = "branch";
12203 const char *prefix = "";
12204 fragS *padding_fragP;
12205 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype)
12206 == BRANCH_PREFIX)
12207 {
12208 padding_fragP = fragP->tc_frag_data.u.padding_fragP;
12209 switch (fragP->tc_frag_data.default_prefix)
12210 {
12211 default:
12212 abort ();
12213 break;
12214 case CS_PREFIX_OPCODE:
12215 prefix = " cs";
12216 break;
12217 case DS_PREFIX_OPCODE:
12218 prefix = " ds";
12219 break;
12220 case ES_PREFIX_OPCODE:
12221 prefix = " es";
12222 break;
12223 case FS_PREFIX_OPCODE:
12224 prefix = " fs";
12225 break;
12226 case GS_PREFIX_OPCODE:
12227 prefix = " gs";
12228 break;
12229 case SS_PREFIX_OPCODE:
12230 prefix = " ss";
12231 break;
12232 }
12233 if (padding_fragP)
12234 msg = _("%s:%u: add %d%s at 0x%llx to align "
12235 "%s within %d-byte boundary\n");
12236 else
12237 msg = _("%s:%u: add additional %d%s at 0x%llx to "
12238 "align %s within %d-byte boundary\n");
12239 }
12240 else
12241 {
12242 padding_fragP = fragP;
12243 msg = _("%s:%u: add %d%s-byte nop at 0x%llx to align "
12244 "%s within %d-byte boundary\n");
12245 }
12246
12247 if (padding_fragP)
12248 switch (padding_fragP->tc_frag_data.branch_type)
12249 {
12250 case align_branch_jcc:
12251 branch = "jcc";
12252 break;
12253 case align_branch_fused:
12254 branch = "fused jcc";
12255 break;
12256 case align_branch_jmp:
12257 branch = "jmp";
12258 break;
12259 case align_branch_call:
12260 branch = "call";
12261 break;
12262 case align_branch_indirect:
12263 branch = "indiret branch";
12264 break;
12265 case align_branch_ret:
12266 branch = "ret";
12267 break;
12268 default:
12269 break;
12270 }
12271
12272 fprintf (stdout, msg,
12273 fragP->fr_file, fragP->fr_line, size, prefix,
12274 (long long) fragP->fr_address, branch,
12275 1 << align_branch_power);
12276 }
12277 if (TYPE_FROM_RELAX_STATE (fragP->fr_subtype) == BRANCH_PREFIX)
12278 memset (fragP->fr_opcode,
12279 fragP->tc_frag_data.default_prefix, size);
12280 else
12281 i386_generate_nops (fragP, (char *) fragP->fr_opcode,
12282 size, 0);
12283 fragP->fr_fix += size;
12284 }
12285 return;
12286 }
12287
12288 opcode = (unsigned char *) fragP->fr_opcode;
12289
12290 /* Address we want to reach in file space. */
12291 target_address = S_GET_VALUE (fragP->fr_symbol) + fragP->fr_offset;
12292
12293 /* Address opcode resides at in file space. */
12294 opcode_address = fragP->fr_address + fragP->fr_fix;
12295
12296 /* Displacement from opcode start to fill into instruction. */
12297 displacement_from_opcode_start = target_address - opcode_address;
12298
12299 if ((fragP->fr_subtype & BIG) == 0)
12300 {
12301 /* Don't have to change opcode. */
12302 extension = 1; /* 1 opcode + 1 displacement */
12303 where_to_put_displacement = &opcode[1];
12304 }
12305 else
12306 {
12307 if (no_cond_jump_promotion
12308 && TYPE_FROM_RELAX_STATE (fragP->fr_subtype) != UNCOND_JUMP)
12309 as_warn_where (fragP->fr_file, fragP->fr_line,
12310 _("long jump required"));
12311
12312 switch (fragP->fr_subtype)
12313 {
12314 case ENCODE_RELAX_STATE (UNCOND_JUMP, BIG):
12315 extension = 4; /* 1 opcode + 4 displacement */
12316 opcode[0] = 0xe9;
12317 where_to_put_displacement = &opcode[1];
12318 break;
12319
12320 case ENCODE_RELAX_STATE (UNCOND_JUMP, BIG16):
12321 extension = 2; /* 1 opcode + 2 displacement */
12322 opcode[0] = 0xe9;
12323 where_to_put_displacement = &opcode[1];
12324 break;
12325
12326 case ENCODE_RELAX_STATE (COND_JUMP, BIG):
12327 case ENCODE_RELAX_STATE (COND_JUMP86, BIG):
12328 extension = 5; /* 2 opcode + 4 displacement */
12329 opcode[1] = opcode[0] + 0x10;
12330 opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
12331 where_to_put_displacement = &opcode[2];
12332 break;
12333
12334 case ENCODE_RELAX_STATE (COND_JUMP, BIG16):
12335 extension = 3; /* 2 opcode + 2 displacement */
12336 opcode[1] = opcode[0] + 0x10;
12337 opcode[0] = TWO_BYTE_OPCODE_ESCAPE;
12338 where_to_put_displacement = &opcode[2];
12339 break;
12340
12341 case ENCODE_RELAX_STATE (COND_JUMP86, BIG16):
12342 extension = 4;
12343 opcode[0] ^= 1;
12344 opcode[1] = 3;
12345 opcode[2] = 0xe9;
12346 where_to_put_displacement = &opcode[3];
12347 break;
12348
12349 default:
12350 BAD_CASE (fragP->fr_subtype);
12351 break;
12352 }
12353 }
12354
12355 /* If size if less then four we are sure that the operand fits,
12356 but if it's 4, then it could be that the displacement is larger
12357 then -/+ 2GB. */
12358 if (DISP_SIZE_FROM_RELAX_STATE (fragP->fr_subtype) == 4
12359 && object_64bit
12360 && ((addressT) (displacement_from_opcode_start - extension
12361 + ((addressT) 1 << 31))
12362 > (((addressT) 2 << 31) - 1)))
12363 {
12364 as_bad_where (fragP->fr_file, fragP->fr_line,
12365 _("jump target out of range"));
12366 /* Make us emit 0. */
12367 displacement_from_opcode_start = extension;
12368 }
12369 /* Now put displacement after opcode. */
12370 md_number_to_chars ((char *) where_to_put_displacement,
12371 (valueT) (displacement_from_opcode_start - extension),
12372 DISP_SIZE_FROM_RELAX_STATE (fragP->fr_subtype));
12373 fragP->fr_fix += extension;
12374 }
12375 \f
12376 /* Apply a fixup (fixP) to segment data, once it has been determined
12377 by our caller that we have all the info we need to fix it up.
12378
12379 Parameter valP is the pointer to the value of the bits.
12380
12381 On the 386, immediates, displacements, and data pointers are all in
12382 the same (little-endian) format, so we don't need to care about which
12383 we are handling. */
12384
12385 void
12386 md_apply_fix (fixS *fixP, valueT *valP, segT seg ATTRIBUTE_UNUSED)
12387 {
12388 char *p = fixP->fx_where + fixP->fx_frag->fr_literal;
12389 valueT value = *valP;
12390
12391 #if !defined (TE_Mach)
12392 if (fixP->fx_pcrel)
12393 {
12394 switch (fixP->fx_r_type)
12395 {
12396 default:
12397 break;
12398
12399 case BFD_RELOC_64:
12400 fixP->fx_r_type = BFD_RELOC_64_PCREL;
12401 break;
12402 case BFD_RELOC_32:
12403 case BFD_RELOC_X86_64_32S:
12404 fixP->fx_r_type = BFD_RELOC_32_PCREL;
12405 break;
12406 case BFD_RELOC_16:
12407 fixP->fx_r_type = BFD_RELOC_16_PCREL;
12408 break;
12409 case BFD_RELOC_8:
12410 fixP->fx_r_type = BFD_RELOC_8_PCREL;
12411 break;
12412 }
12413 }
12414
12415 if (fixP->fx_addsy != NULL
12416 && (fixP->fx_r_type == BFD_RELOC_32_PCREL
12417 || fixP->fx_r_type == BFD_RELOC_64_PCREL
12418 || fixP->fx_r_type == BFD_RELOC_16_PCREL
12419 || fixP->fx_r_type == BFD_RELOC_8_PCREL)
12420 && !use_rela_relocations)
12421 {
12422 /* This is a hack. There should be a better way to handle this.
12423 This covers for the fact that bfd_install_relocation will
12424 subtract the current location (for partial_inplace, PC relative
12425 relocations); see more below. */
12426 #ifndef OBJ_AOUT
12427 if (IS_ELF
12428 #ifdef TE_PE
12429 || OUTPUT_FLAVOR == bfd_target_coff_flavour
12430 #endif
12431 )
12432 value += fixP->fx_where + fixP->fx_frag->fr_address;
12433 #endif
12434 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12435 if (IS_ELF)
12436 {
12437 segT sym_seg = S_GET_SEGMENT (fixP->fx_addsy);
12438
12439 if ((sym_seg == seg
12440 || (symbol_section_p (fixP->fx_addsy)
12441 && sym_seg != absolute_section))
12442 && !generic_force_reloc (fixP))
12443 {
12444 /* Yes, we add the values in twice. This is because
12445 bfd_install_relocation subtracts them out again. I think
12446 bfd_install_relocation is broken, but I don't dare change
12447 it. FIXME. */
12448 value += fixP->fx_where + fixP->fx_frag->fr_address;
12449 }
12450 }
12451 #endif
12452 #if defined (OBJ_COFF) && defined (TE_PE)
12453 /* For some reason, the PE format does not store a
12454 section address offset for a PC relative symbol. */
12455 if (S_GET_SEGMENT (fixP->fx_addsy) != seg
12456 || S_IS_WEAK (fixP->fx_addsy))
12457 value += md_pcrel_from (fixP);
12458 #endif
12459 }
12460 #if defined (OBJ_COFF) && defined (TE_PE)
12461 if (fixP->fx_addsy != NULL
12462 && S_IS_WEAK (fixP->fx_addsy)
12463 /* PR 16858: Do not modify weak function references. */
12464 && ! fixP->fx_pcrel)
12465 {
12466 #if !defined (TE_PEP)
12467 /* For x86 PE weak function symbols are neither PC-relative
12468 nor do they set S_IS_FUNCTION. So the only reliable way
12469 to detect them is to check the flags of their containing
12470 section. */
12471 if (S_GET_SEGMENT (fixP->fx_addsy) != NULL
12472 && S_GET_SEGMENT (fixP->fx_addsy)->flags & SEC_CODE)
12473 ;
12474 else
12475 #endif
12476 value -= S_GET_VALUE (fixP->fx_addsy);
12477 }
12478 #endif
12479
12480 /* Fix a few things - the dynamic linker expects certain values here,
12481 and we must not disappoint it. */
12482 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12483 if (IS_ELF && fixP->fx_addsy)
12484 switch (fixP->fx_r_type)
12485 {
12486 case BFD_RELOC_386_PLT32:
12487 case BFD_RELOC_X86_64_PLT32:
12488 /* Make the jump instruction point to the address of the operand.
12489 At runtime we merely add the offset to the actual PLT entry.
12490 NB: Subtract the offset size only for jump instructions. */
12491 if (fixP->fx_pcrel)
12492 value = -4;
12493 break;
12494
12495 case BFD_RELOC_386_TLS_GD:
12496 case BFD_RELOC_386_TLS_LDM:
12497 case BFD_RELOC_386_TLS_IE_32:
12498 case BFD_RELOC_386_TLS_IE:
12499 case BFD_RELOC_386_TLS_GOTIE:
12500 case BFD_RELOC_386_TLS_GOTDESC:
12501 case BFD_RELOC_X86_64_TLSGD:
12502 case BFD_RELOC_X86_64_TLSLD:
12503 case BFD_RELOC_X86_64_GOTTPOFF:
12504 case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
12505 value = 0; /* Fully resolved at runtime. No addend. */
12506 /* Fallthrough */
12507 case BFD_RELOC_386_TLS_LE:
12508 case BFD_RELOC_386_TLS_LDO_32:
12509 case BFD_RELOC_386_TLS_LE_32:
12510 case BFD_RELOC_X86_64_DTPOFF32:
12511 case BFD_RELOC_X86_64_DTPOFF64:
12512 case BFD_RELOC_X86_64_TPOFF32:
12513 case BFD_RELOC_X86_64_TPOFF64:
12514 S_SET_THREAD_LOCAL (fixP->fx_addsy);
12515 break;
12516
12517 case BFD_RELOC_386_TLS_DESC_CALL:
12518 case BFD_RELOC_X86_64_TLSDESC_CALL:
12519 value = 0; /* Fully resolved at runtime. No addend. */
12520 S_SET_THREAD_LOCAL (fixP->fx_addsy);
12521 fixP->fx_done = 0;
12522 return;
12523
12524 case BFD_RELOC_VTABLE_INHERIT:
12525 case BFD_RELOC_VTABLE_ENTRY:
12526 fixP->fx_done = 0;
12527 return;
12528
12529 default:
12530 break;
12531 }
12532 #endif /* defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) */
12533 *valP = value;
12534 #endif /* !defined (TE_Mach) */
12535
12536 /* Are we finished with this relocation now? */
12537 if (fixP->fx_addsy == NULL)
12538 fixP->fx_done = 1;
12539 #if defined (OBJ_COFF) && defined (TE_PE)
12540 else if (fixP->fx_addsy != NULL && S_IS_WEAK (fixP->fx_addsy))
12541 {
12542 fixP->fx_done = 0;
12543 /* Remember value for tc_gen_reloc. */
12544 fixP->fx_addnumber = value;
12545 /* Clear out the frag for now. */
12546 value = 0;
12547 }
12548 #endif
12549 else if (use_rela_relocations)
12550 {
12551 fixP->fx_no_overflow = 1;
12552 /* Remember value for tc_gen_reloc. */
12553 fixP->fx_addnumber = value;
12554 value = 0;
12555 }
12556
12557 md_number_to_chars (p, value, fixP->fx_size);
12558 }
12559 \f
12560 const char *
12561 md_atof (int type, char *litP, int *sizeP)
12562 {
12563 /* This outputs the LITTLENUMs in REVERSE order;
12564 in accord with the bigendian 386. */
12565 return ieee_md_atof (type, litP, sizeP, FALSE);
12566 }
12567 \f
12568 static char output_invalid_buf[sizeof (unsigned char) * 2 + 6];
12569
12570 static char *
12571 output_invalid (int c)
12572 {
12573 if (ISPRINT (c))
12574 snprintf (output_invalid_buf, sizeof (output_invalid_buf),
12575 "'%c'", c);
12576 else
12577 snprintf (output_invalid_buf, sizeof (output_invalid_buf),
12578 "(0x%x)", (unsigned char) c);
12579 return output_invalid_buf;
12580 }
12581
12582 /* Verify that @r can be used in the current context. */
12583
12584 static bfd_boolean check_register (const reg_entry *r)
12585 {
12586 if (allow_pseudo_reg)
12587 return TRUE;
12588
12589 if (operand_type_all_zero (&r->reg_type))
12590 return FALSE;
12591
12592 if ((r->reg_type.bitfield.dword
12593 || (r->reg_type.bitfield.class == SReg && r->reg_num > 3)
12594 || r->reg_type.bitfield.class == RegCR
12595 || r->reg_type.bitfield.class == RegDR)
12596 && !cpu_arch_flags.bitfield.cpui386)
12597 return FALSE;
12598
12599 if (r->reg_type.bitfield.class == RegTR
12600 && (flag_code == CODE_64BIT
12601 || !cpu_arch_flags.bitfield.cpui386
12602 || cpu_arch_isa_flags.bitfield.cpui586
12603 || cpu_arch_isa_flags.bitfield.cpui686))
12604 return FALSE;
12605
12606 if (r->reg_type.bitfield.class == RegMMX && !cpu_arch_flags.bitfield.cpummx)
12607 return FALSE;
12608
12609 if (!cpu_arch_flags.bitfield.cpuavx512f)
12610 {
12611 if (r->reg_type.bitfield.zmmword
12612 || r->reg_type.bitfield.class == RegMask)
12613 return FALSE;
12614
12615 if (!cpu_arch_flags.bitfield.cpuavx)
12616 {
12617 if (r->reg_type.bitfield.ymmword)
12618 return FALSE;
12619
12620 if (!cpu_arch_flags.bitfield.cpusse && r->reg_type.bitfield.xmmword)
12621 return FALSE;
12622 }
12623 }
12624
12625 if (r->reg_type.bitfield.tmmword
12626 && (!cpu_arch_flags.bitfield.cpuamx_tile
12627 || flag_code != CODE_64BIT))
12628 return FALSE;
12629
12630 if (r->reg_type.bitfield.class == RegBND && !cpu_arch_flags.bitfield.cpumpx)
12631 return FALSE;
12632
12633 /* Don't allow fake index register unless allow_index_reg isn't 0. */
12634 if (!allow_index_reg && r->reg_num == RegIZ)
12635 return FALSE;
12636
12637 /* Upper 16 vector registers are only available with VREX in 64bit
12638 mode, and require EVEX encoding. */
12639 if (r->reg_flags & RegVRex)
12640 {
12641 if (!cpu_arch_flags.bitfield.cpuavx512f
12642 || flag_code != CODE_64BIT)
12643 return FALSE;
12644
12645 if (i.vec_encoding == vex_encoding_default)
12646 i.vec_encoding = vex_encoding_evex;
12647 else if (i.vec_encoding != vex_encoding_evex)
12648 i.vec_encoding = vex_encoding_error;
12649 }
12650
12651 if (((r->reg_flags & (RegRex64 | RegRex)) || r->reg_type.bitfield.qword)
12652 && (!cpu_arch_flags.bitfield.cpulm || r->reg_type.bitfield.class != RegCR)
12653 && flag_code != CODE_64BIT)
12654 return FALSE;
12655
12656 if (r->reg_type.bitfield.class == SReg && r->reg_num == RegFlat
12657 && !intel_syntax)
12658 return FALSE;
12659
12660 return TRUE;
12661 }
12662
12663 /* REG_STRING starts *before* REGISTER_PREFIX. */
12664
12665 static const reg_entry *
12666 parse_real_register (char *reg_string, char **end_op)
12667 {
12668 char *s = reg_string;
12669 char *p;
12670 char reg_name_given[MAX_REG_NAME_SIZE + 1];
12671 const reg_entry *r;
12672
12673 /* Skip possible REGISTER_PREFIX and possible whitespace. */
12674 if (*s == REGISTER_PREFIX)
12675 ++s;
12676
12677 if (is_space_char (*s))
12678 ++s;
12679
12680 p = reg_name_given;
12681 while ((*p++ = register_chars[(unsigned char) *s]) != '\0')
12682 {
12683 if (p >= reg_name_given + MAX_REG_NAME_SIZE)
12684 return (const reg_entry *) NULL;
12685 s++;
12686 }
12687
12688 /* For naked regs, make sure that we are not dealing with an identifier.
12689 This prevents confusing an identifier like `eax_var' with register
12690 `eax'. */
12691 if (allow_naked_reg && identifier_chars[(unsigned char) *s])
12692 return (const reg_entry *) NULL;
12693
12694 *end_op = s;
12695
12696 r = (const reg_entry *) str_hash_find (reg_hash, reg_name_given);
12697
12698 /* Handle floating point regs, allowing spaces in the (i) part. */
12699 if (r == i386_regtab /* %st is first entry of table */)
12700 {
12701 if (!cpu_arch_flags.bitfield.cpu8087
12702 && !cpu_arch_flags.bitfield.cpu287
12703 && !cpu_arch_flags.bitfield.cpu387
12704 && !allow_pseudo_reg)
12705 return (const reg_entry *) NULL;
12706
12707 if (is_space_char (*s))
12708 ++s;
12709 if (*s == '(')
12710 {
12711 ++s;
12712 if (is_space_char (*s))
12713 ++s;
12714 if (*s >= '0' && *s <= '7')
12715 {
12716 int fpr = *s - '0';
12717 ++s;
12718 if (is_space_char (*s))
12719 ++s;
12720 if (*s == ')')
12721 {
12722 *end_op = s + 1;
12723 r = (const reg_entry *) str_hash_find (reg_hash, "st(0)");
12724 know (r);
12725 return r + fpr;
12726 }
12727 }
12728 /* We have "%st(" then garbage. */
12729 return (const reg_entry *) NULL;
12730 }
12731 }
12732
12733 return r && check_register (r) ? r : NULL;
12734 }
12735
12736 /* REG_STRING starts *before* REGISTER_PREFIX. */
12737
12738 static const reg_entry *
12739 parse_register (char *reg_string, char **end_op)
12740 {
12741 const reg_entry *r;
12742
12743 if (*reg_string == REGISTER_PREFIX || allow_naked_reg)
12744 r = parse_real_register (reg_string, end_op);
12745 else
12746 r = NULL;
12747 if (!r)
12748 {
12749 char *save = input_line_pointer;
12750 char c;
12751 symbolS *symbolP;
12752
12753 input_line_pointer = reg_string;
12754 c = get_symbol_name (&reg_string);
12755 symbolP = symbol_find (reg_string);
12756 if (symbolP && S_GET_SEGMENT (symbolP) == reg_section)
12757 {
12758 const expressionS *e = symbol_get_value_expression (symbolP);
12759
12760 know (e->X_op == O_register);
12761 know (e->X_add_number >= 0
12762 && (valueT) e->X_add_number < i386_regtab_size);
12763 r = i386_regtab + e->X_add_number;
12764 if (!check_register (r))
12765 {
12766 as_bad (_("register '%s%s' cannot be used here"),
12767 register_prefix, r->reg_name);
12768 r = &bad_reg;
12769 }
12770 *end_op = input_line_pointer;
12771 }
12772 *input_line_pointer = c;
12773 input_line_pointer = save;
12774 }
12775 return r;
12776 }
12777
12778 int
12779 i386_parse_name (char *name, expressionS *e, char *nextcharP)
12780 {
12781 const reg_entry *r;
12782 char *end = input_line_pointer;
12783
12784 *end = *nextcharP;
12785 r = parse_register (name, &input_line_pointer);
12786 if (r && end <= input_line_pointer)
12787 {
12788 *nextcharP = *input_line_pointer;
12789 *input_line_pointer = 0;
12790 if (r != &bad_reg)
12791 {
12792 e->X_op = O_register;
12793 e->X_add_number = r - i386_regtab;
12794 }
12795 else
12796 e->X_op = O_illegal;
12797 return 1;
12798 }
12799 input_line_pointer = end;
12800 *end = 0;
12801 return intel_syntax ? i386_intel_parse_name (name, e) : 0;
12802 }
12803
12804 void
12805 md_operand (expressionS *e)
12806 {
12807 char *end;
12808 const reg_entry *r;
12809
12810 switch (*input_line_pointer)
12811 {
12812 case REGISTER_PREFIX:
12813 r = parse_real_register (input_line_pointer, &end);
12814 if (r)
12815 {
12816 e->X_op = O_register;
12817 e->X_add_number = r - i386_regtab;
12818 input_line_pointer = end;
12819 }
12820 break;
12821
12822 case '[':
12823 gas_assert (intel_syntax);
12824 end = input_line_pointer++;
12825 expression (e);
12826 if (*input_line_pointer == ']')
12827 {
12828 ++input_line_pointer;
12829 e->X_op_symbol = make_expr_symbol (e);
12830 e->X_add_symbol = NULL;
12831 e->X_add_number = 0;
12832 e->X_op = O_index;
12833 }
12834 else
12835 {
12836 e->X_op = O_absent;
12837 input_line_pointer = end;
12838 }
12839 break;
12840 }
12841 }
12842
12843 \f
12844 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12845 const char *md_shortopts = "kVQ:sqnO::";
12846 #else
12847 const char *md_shortopts = "qnO::";
12848 #endif
12849
12850 #define OPTION_32 (OPTION_MD_BASE + 0)
12851 #define OPTION_64 (OPTION_MD_BASE + 1)
12852 #define OPTION_DIVIDE (OPTION_MD_BASE + 2)
12853 #define OPTION_MARCH (OPTION_MD_BASE + 3)
12854 #define OPTION_MTUNE (OPTION_MD_BASE + 4)
12855 #define OPTION_MMNEMONIC (OPTION_MD_BASE + 5)
12856 #define OPTION_MSYNTAX (OPTION_MD_BASE + 6)
12857 #define OPTION_MINDEX_REG (OPTION_MD_BASE + 7)
12858 #define OPTION_MNAKED_REG (OPTION_MD_BASE + 8)
12859 #define OPTION_MRELAX_RELOCATIONS (OPTION_MD_BASE + 9)
12860 #define OPTION_MSSE2AVX (OPTION_MD_BASE + 10)
12861 #define OPTION_MSSE_CHECK (OPTION_MD_BASE + 11)
12862 #define OPTION_MOPERAND_CHECK (OPTION_MD_BASE + 12)
12863 #define OPTION_MAVXSCALAR (OPTION_MD_BASE + 13)
12864 #define OPTION_X32 (OPTION_MD_BASE + 14)
12865 #define OPTION_MADD_BND_PREFIX (OPTION_MD_BASE + 15)
12866 #define OPTION_MEVEXLIG (OPTION_MD_BASE + 16)
12867 #define OPTION_MEVEXWIG (OPTION_MD_BASE + 17)
12868 #define OPTION_MBIG_OBJ (OPTION_MD_BASE + 18)
12869 #define OPTION_MOMIT_LOCK_PREFIX (OPTION_MD_BASE + 19)
12870 #define OPTION_MEVEXRCIG (OPTION_MD_BASE + 20)
12871 #define OPTION_MSHARED (OPTION_MD_BASE + 21)
12872 #define OPTION_MAMD64 (OPTION_MD_BASE + 22)
12873 #define OPTION_MINTEL64 (OPTION_MD_BASE + 23)
12874 #define OPTION_MFENCE_AS_LOCK_ADD (OPTION_MD_BASE + 24)
12875 #define OPTION_X86_USED_NOTE (OPTION_MD_BASE + 25)
12876 #define OPTION_MVEXWIG (OPTION_MD_BASE + 26)
12877 #define OPTION_MALIGN_BRANCH_BOUNDARY (OPTION_MD_BASE + 27)
12878 #define OPTION_MALIGN_BRANCH_PREFIX_SIZE (OPTION_MD_BASE + 28)
12879 #define OPTION_MALIGN_BRANCH (OPTION_MD_BASE + 29)
12880 #define OPTION_MBRANCHES_WITH_32B_BOUNDARIES (OPTION_MD_BASE + 30)
12881 #define OPTION_MLFENCE_AFTER_LOAD (OPTION_MD_BASE + 31)
12882 #define OPTION_MLFENCE_BEFORE_INDIRECT_BRANCH (OPTION_MD_BASE + 32)
12883 #define OPTION_MLFENCE_BEFORE_RET (OPTION_MD_BASE + 33)
12884
12885 struct option md_longopts[] =
12886 {
12887 {"32", no_argument, NULL, OPTION_32},
12888 #if (defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
12889 || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
12890 {"64", no_argument, NULL, OPTION_64},
12891 #endif
12892 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12893 {"x32", no_argument, NULL, OPTION_X32},
12894 {"mshared", no_argument, NULL, OPTION_MSHARED},
12895 {"mx86-used-note", required_argument, NULL, OPTION_X86_USED_NOTE},
12896 #endif
12897 {"divide", no_argument, NULL, OPTION_DIVIDE},
12898 {"march", required_argument, NULL, OPTION_MARCH},
12899 {"mtune", required_argument, NULL, OPTION_MTUNE},
12900 {"mmnemonic", required_argument, NULL, OPTION_MMNEMONIC},
12901 {"msyntax", required_argument, NULL, OPTION_MSYNTAX},
12902 {"mindex-reg", no_argument, NULL, OPTION_MINDEX_REG},
12903 {"mnaked-reg", no_argument, NULL, OPTION_MNAKED_REG},
12904 {"msse2avx", no_argument, NULL, OPTION_MSSE2AVX},
12905 {"msse-check", required_argument, NULL, OPTION_MSSE_CHECK},
12906 {"moperand-check", required_argument, NULL, OPTION_MOPERAND_CHECK},
12907 {"mavxscalar", required_argument, NULL, OPTION_MAVXSCALAR},
12908 {"mvexwig", required_argument, NULL, OPTION_MVEXWIG},
12909 {"madd-bnd-prefix", no_argument, NULL, OPTION_MADD_BND_PREFIX},
12910 {"mevexlig", required_argument, NULL, OPTION_MEVEXLIG},
12911 {"mevexwig", required_argument, NULL, OPTION_MEVEXWIG},
12912 # if defined (TE_PE) || defined (TE_PEP)
12913 {"mbig-obj", no_argument, NULL, OPTION_MBIG_OBJ},
12914 #endif
12915 {"momit-lock-prefix", required_argument, NULL, OPTION_MOMIT_LOCK_PREFIX},
12916 {"mfence-as-lock-add", required_argument, NULL, OPTION_MFENCE_AS_LOCK_ADD},
12917 {"mrelax-relocations", required_argument, NULL, OPTION_MRELAX_RELOCATIONS},
12918 {"mevexrcig", required_argument, NULL, OPTION_MEVEXRCIG},
12919 {"malign-branch-boundary", required_argument, NULL, OPTION_MALIGN_BRANCH_BOUNDARY},
12920 {"malign-branch-prefix-size", required_argument, NULL, OPTION_MALIGN_BRANCH_PREFIX_SIZE},
12921 {"malign-branch", required_argument, NULL, OPTION_MALIGN_BRANCH},
12922 {"mbranches-within-32B-boundaries", no_argument, NULL, OPTION_MBRANCHES_WITH_32B_BOUNDARIES},
12923 {"mlfence-after-load", required_argument, NULL, OPTION_MLFENCE_AFTER_LOAD},
12924 {"mlfence-before-indirect-branch", required_argument, NULL,
12925 OPTION_MLFENCE_BEFORE_INDIRECT_BRANCH},
12926 {"mlfence-before-ret", required_argument, NULL, OPTION_MLFENCE_BEFORE_RET},
12927 {"mamd64", no_argument, NULL, OPTION_MAMD64},
12928 {"mintel64", no_argument, NULL, OPTION_MINTEL64},
12929 {NULL, no_argument, NULL, 0}
12930 };
12931 size_t md_longopts_size = sizeof (md_longopts);
12932
12933 int
12934 md_parse_option (int c, const char *arg)
12935 {
12936 unsigned int j;
12937 char *arch, *next, *saved, *type;
12938
12939 switch (c)
12940 {
12941 case 'n':
12942 optimize_align_code = 0;
12943 break;
12944
12945 case 'q':
12946 quiet_warnings = 1;
12947 break;
12948
12949 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
12950 /* -Qy, -Qn: SVR4 arguments controlling whether a .comment section
12951 should be emitted or not. FIXME: Not implemented. */
12952 case 'Q':
12953 if ((arg[0] != 'y' && arg[0] != 'n') || arg[1])
12954 return 0;
12955 break;
12956
12957 /* -V: SVR4 argument to print version ID. */
12958 case 'V':
12959 print_version_id ();
12960 break;
12961
12962 /* -k: Ignore for FreeBSD compatibility. */
12963 case 'k':
12964 break;
12965
12966 case 's':
12967 /* -s: On i386 Solaris, this tells the native assembler to use
12968 .stab instead of .stab.excl. We always use .stab anyhow. */
12969 break;
12970
12971 case OPTION_MSHARED:
12972 shared = 1;
12973 break;
12974
12975 case OPTION_X86_USED_NOTE:
12976 if (strcasecmp (arg, "yes") == 0)
12977 x86_used_note = 1;
12978 else if (strcasecmp (arg, "no") == 0)
12979 x86_used_note = 0;
12980 else
12981 as_fatal (_("invalid -mx86-used-note= option: `%s'"), arg);
12982 break;
12983
12984
12985 #endif
12986 #if (defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
12987 || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
12988 case OPTION_64:
12989 {
12990 const char **list, **l;
12991
12992 list = bfd_target_list ();
12993 for (l = list; *l != NULL; l++)
12994 if (startswith (*l, "elf64-x86-64")
12995 || strcmp (*l, "coff-x86-64") == 0
12996 || strcmp (*l, "pe-x86-64") == 0
12997 || strcmp (*l, "pei-x86-64") == 0
12998 || strcmp (*l, "mach-o-x86-64") == 0)
12999 {
13000 default_arch = "x86_64";
13001 break;
13002 }
13003 if (*l == NULL)
13004 as_fatal (_("no compiled in support for x86_64"));
13005 free (list);
13006 }
13007 break;
13008 #endif
13009
13010 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13011 case OPTION_X32:
13012 if (IS_ELF)
13013 {
13014 const char **list, **l;
13015
13016 list = bfd_target_list ();
13017 for (l = list; *l != NULL; l++)
13018 if (startswith (*l, "elf32-x86-64"))
13019 {
13020 default_arch = "x86_64:32";
13021 break;
13022 }
13023 if (*l == NULL)
13024 as_fatal (_("no compiled in support for 32bit x86_64"));
13025 free (list);
13026 }
13027 else
13028 as_fatal (_("32bit x86_64 is only supported for ELF"));
13029 break;
13030 #endif
13031
13032 case OPTION_32:
13033 default_arch = "i386";
13034 break;
13035
13036 case OPTION_DIVIDE:
13037 #ifdef SVR4_COMMENT_CHARS
13038 {
13039 char *n, *t;
13040 const char *s;
13041
13042 n = XNEWVEC (char, strlen (i386_comment_chars) + 1);
13043 t = n;
13044 for (s = i386_comment_chars; *s != '\0'; s++)
13045 if (*s != '/')
13046 *t++ = *s;
13047 *t = '\0';
13048 i386_comment_chars = n;
13049 }
13050 #endif
13051 break;
13052
13053 case OPTION_MARCH:
13054 saved = xstrdup (arg);
13055 arch = saved;
13056 /* Allow -march=+nosse. */
13057 if (*arch == '+')
13058 arch++;
13059 do
13060 {
13061 if (*arch == '.')
13062 as_fatal (_("invalid -march= option: `%s'"), arg);
13063 next = strchr (arch, '+');
13064 if (next)
13065 *next++ = '\0';
13066 for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
13067 {
13068 if (strcmp (arch, cpu_arch [j].name) == 0)
13069 {
13070 /* Processor. */
13071 if (! cpu_arch[j].flags.bitfield.cpui386)
13072 continue;
13073
13074 cpu_arch_name = cpu_arch[j].name;
13075 cpu_sub_arch_name = NULL;
13076 cpu_arch_flags = cpu_arch[j].flags;
13077 cpu_arch_isa = cpu_arch[j].type;
13078 cpu_arch_isa_flags = cpu_arch[j].flags;
13079 if (!cpu_arch_tune_set)
13080 {
13081 cpu_arch_tune = cpu_arch_isa;
13082 cpu_arch_tune_flags = cpu_arch_isa_flags;
13083 }
13084 break;
13085 }
13086 else if (*cpu_arch [j].name == '.'
13087 && strcmp (arch, cpu_arch [j].name + 1) == 0)
13088 {
13089 /* ISA extension. */
13090 i386_cpu_flags flags;
13091
13092 flags = cpu_flags_or (cpu_arch_flags,
13093 cpu_arch[j].flags);
13094
13095 if (!cpu_flags_equal (&flags, &cpu_arch_flags))
13096 {
13097 if (cpu_sub_arch_name)
13098 {
13099 char *name = cpu_sub_arch_name;
13100 cpu_sub_arch_name = concat (name,
13101 cpu_arch[j].name,
13102 (const char *) NULL);
13103 free (name);
13104 }
13105 else
13106 cpu_sub_arch_name = xstrdup (cpu_arch[j].name);
13107 cpu_arch_flags = flags;
13108 cpu_arch_isa_flags = flags;
13109 }
13110 else
13111 cpu_arch_isa_flags
13112 = cpu_flags_or (cpu_arch_isa_flags,
13113 cpu_arch[j].flags);
13114 break;
13115 }
13116 }
13117
13118 if (j >= ARRAY_SIZE (cpu_arch))
13119 {
13120 /* Disable an ISA extension. */
13121 for (j = 0; j < ARRAY_SIZE (cpu_noarch); j++)
13122 if (strcmp (arch, cpu_noarch [j].name) == 0)
13123 {
13124 i386_cpu_flags flags;
13125
13126 flags = cpu_flags_and_not (cpu_arch_flags,
13127 cpu_noarch[j].flags);
13128 if (!cpu_flags_equal (&flags, &cpu_arch_flags))
13129 {
13130 if (cpu_sub_arch_name)
13131 {
13132 char *name = cpu_sub_arch_name;
13133 cpu_sub_arch_name = concat (arch,
13134 (const char *) NULL);
13135 free (name);
13136 }
13137 else
13138 cpu_sub_arch_name = xstrdup (arch);
13139 cpu_arch_flags = flags;
13140 cpu_arch_isa_flags = flags;
13141 }
13142 break;
13143 }
13144
13145 if (j >= ARRAY_SIZE (cpu_noarch))
13146 j = ARRAY_SIZE (cpu_arch);
13147 }
13148
13149 if (j >= ARRAY_SIZE (cpu_arch))
13150 as_fatal (_("invalid -march= option: `%s'"), arg);
13151
13152 arch = next;
13153 }
13154 while (next != NULL);
13155 free (saved);
13156 break;
13157
13158 case OPTION_MTUNE:
13159 if (*arg == '.')
13160 as_fatal (_("invalid -mtune= option: `%s'"), arg);
13161 for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
13162 {
13163 if (strcmp (arg, cpu_arch [j].name) == 0)
13164 {
13165 cpu_arch_tune_set = 1;
13166 cpu_arch_tune = cpu_arch [j].type;
13167 cpu_arch_tune_flags = cpu_arch[j].flags;
13168 break;
13169 }
13170 }
13171 if (j >= ARRAY_SIZE (cpu_arch))
13172 as_fatal (_("invalid -mtune= option: `%s'"), arg);
13173 break;
13174
13175 case OPTION_MMNEMONIC:
13176 if (strcasecmp (arg, "att") == 0)
13177 intel_mnemonic = 0;
13178 else if (strcasecmp (arg, "intel") == 0)
13179 intel_mnemonic = 1;
13180 else
13181 as_fatal (_("invalid -mmnemonic= option: `%s'"), arg);
13182 break;
13183
13184 case OPTION_MSYNTAX:
13185 if (strcasecmp (arg, "att") == 0)
13186 intel_syntax = 0;
13187 else if (strcasecmp (arg, "intel") == 0)
13188 intel_syntax = 1;
13189 else
13190 as_fatal (_("invalid -msyntax= option: `%s'"), arg);
13191 break;
13192
13193 case OPTION_MINDEX_REG:
13194 allow_index_reg = 1;
13195 break;
13196
13197 case OPTION_MNAKED_REG:
13198 allow_naked_reg = 1;
13199 break;
13200
13201 case OPTION_MSSE2AVX:
13202 sse2avx = 1;
13203 break;
13204
13205 case OPTION_MSSE_CHECK:
13206 if (strcasecmp (arg, "error") == 0)
13207 sse_check = check_error;
13208 else if (strcasecmp (arg, "warning") == 0)
13209 sse_check = check_warning;
13210 else if (strcasecmp (arg, "none") == 0)
13211 sse_check = check_none;
13212 else
13213 as_fatal (_("invalid -msse-check= option: `%s'"), arg);
13214 break;
13215
13216 case OPTION_MOPERAND_CHECK:
13217 if (strcasecmp (arg, "error") == 0)
13218 operand_check = check_error;
13219 else if (strcasecmp (arg, "warning") == 0)
13220 operand_check = check_warning;
13221 else if (strcasecmp (arg, "none") == 0)
13222 operand_check = check_none;
13223 else
13224 as_fatal (_("invalid -moperand-check= option: `%s'"), arg);
13225 break;
13226
13227 case OPTION_MAVXSCALAR:
13228 if (strcasecmp (arg, "128") == 0)
13229 avxscalar = vex128;
13230 else if (strcasecmp (arg, "256") == 0)
13231 avxscalar = vex256;
13232 else
13233 as_fatal (_("invalid -mavxscalar= option: `%s'"), arg);
13234 break;
13235
13236 case OPTION_MVEXWIG:
13237 if (strcmp (arg, "0") == 0)
13238 vexwig = vexw0;
13239 else if (strcmp (arg, "1") == 0)
13240 vexwig = vexw1;
13241 else
13242 as_fatal (_("invalid -mvexwig= option: `%s'"), arg);
13243 break;
13244
13245 case OPTION_MADD_BND_PREFIX:
13246 add_bnd_prefix = 1;
13247 break;
13248
13249 case OPTION_MEVEXLIG:
13250 if (strcmp (arg, "128") == 0)
13251 evexlig = evexl128;
13252 else if (strcmp (arg, "256") == 0)
13253 evexlig = evexl256;
13254 else if (strcmp (arg, "512") == 0)
13255 evexlig = evexl512;
13256 else
13257 as_fatal (_("invalid -mevexlig= option: `%s'"), arg);
13258 break;
13259
13260 case OPTION_MEVEXRCIG:
13261 if (strcmp (arg, "rne") == 0)
13262 evexrcig = rne;
13263 else if (strcmp (arg, "rd") == 0)
13264 evexrcig = rd;
13265 else if (strcmp (arg, "ru") == 0)
13266 evexrcig = ru;
13267 else if (strcmp (arg, "rz") == 0)
13268 evexrcig = rz;
13269 else
13270 as_fatal (_("invalid -mevexrcig= option: `%s'"), arg);
13271 break;
13272
13273 case OPTION_MEVEXWIG:
13274 if (strcmp (arg, "0") == 0)
13275 evexwig = evexw0;
13276 else if (strcmp (arg, "1") == 0)
13277 evexwig = evexw1;
13278 else
13279 as_fatal (_("invalid -mevexwig= option: `%s'"), arg);
13280 break;
13281
13282 # if defined (TE_PE) || defined (TE_PEP)
13283 case OPTION_MBIG_OBJ:
13284 use_big_obj = 1;
13285 break;
13286 #endif
13287
13288 case OPTION_MOMIT_LOCK_PREFIX:
13289 if (strcasecmp (arg, "yes") == 0)
13290 omit_lock_prefix = 1;
13291 else if (strcasecmp (arg, "no") == 0)
13292 omit_lock_prefix = 0;
13293 else
13294 as_fatal (_("invalid -momit-lock-prefix= option: `%s'"), arg);
13295 break;
13296
13297 case OPTION_MFENCE_AS_LOCK_ADD:
13298 if (strcasecmp (arg, "yes") == 0)
13299 avoid_fence = 1;
13300 else if (strcasecmp (arg, "no") == 0)
13301 avoid_fence = 0;
13302 else
13303 as_fatal (_("invalid -mfence-as-lock-add= option: `%s'"), arg);
13304 break;
13305
13306 case OPTION_MLFENCE_AFTER_LOAD:
13307 if (strcasecmp (arg, "yes") == 0)
13308 lfence_after_load = 1;
13309 else if (strcasecmp (arg, "no") == 0)
13310 lfence_after_load = 0;
13311 else
13312 as_fatal (_("invalid -mlfence-after-load= option: `%s'"), arg);
13313 break;
13314
13315 case OPTION_MLFENCE_BEFORE_INDIRECT_BRANCH:
13316 if (strcasecmp (arg, "all") == 0)
13317 {
13318 lfence_before_indirect_branch = lfence_branch_all;
13319 if (lfence_before_ret == lfence_before_ret_none)
13320 lfence_before_ret = lfence_before_ret_shl;
13321 }
13322 else if (strcasecmp (arg, "memory") == 0)
13323 lfence_before_indirect_branch = lfence_branch_memory;
13324 else if (strcasecmp (arg, "register") == 0)
13325 lfence_before_indirect_branch = lfence_branch_register;
13326 else if (strcasecmp (arg, "none") == 0)
13327 lfence_before_indirect_branch = lfence_branch_none;
13328 else
13329 as_fatal (_("invalid -mlfence-before-indirect-branch= option: `%s'"),
13330 arg);
13331 break;
13332
13333 case OPTION_MLFENCE_BEFORE_RET:
13334 if (strcasecmp (arg, "or") == 0)
13335 lfence_before_ret = lfence_before_ret_or;
13336 else if (strcasecmp (arg, "not") == 0)
13337 lfence_before_ret = lfence_before_ret_not;
13338 else if (strcasecmp (arg, "shl") == 0 || strcasecmp (arg, "yes") == 0)
13339 lfence_before_ret = lfence_before_ret_shl;
13340 else if (strcasecmp (arg, "none") == 0)
13341 lfence_before_ret = lfence_before_ret_none;
13342 else
13343 as_fatal (_("invalid -mlfence-before-ret= option: `%s'"),
13344 arg);
13345 break;
13346
13347 case OPTION_MRELAX_RELOCATIONS:
13348 if (strcasecmp (arg, "yes") == 0)
13349 generate_relax_relocations = 1;
13350 else if (strcasecmp (arg, "no") == 0)
13351 generate_relax_relocations = 0;
13352 else
13353 as_fatal (_("invalid -mrelax-relocations= option: `%s'"), arg);
13354 break;
13355
13356 case OPTION_MALIGN_BRANCH_BOUNDARY:
13357 {
13358 char *end;
13359 long int align = strtoul (arg, &end, 0);
13360 if (*end == '\0')
13361 {
13362 if (align == 0)
13363 {
13364 align_branch_power = 0;
13365 break;
13366 }
13367 else if (align >= 16)
13368 {
13369 int align_power;
13370 for (align_power = 0;
13371 (align & 1) == 0;
13372 align >>= 1, align_power++)
13373 continue;
13374 /* Limit alignment power to 31. */
13375 if (align == 1 && align_power < 32)
13376 {
13377 align_branch_power = align_power;
13378 break;
13379 }
13380 }
13381 }
13382 as_fatal (_("invalid -malign-branch-boundary= value: %s"), arg);
13383 }
13384 break;
13385
13386 case OPTION_MALIGN_BRANCH_PREFIX_SIZE:
13387 {
13388 char *end;
13389 int align = strtoul (arg, &end, 0);
13390 /* Some processors only support 5 prefixes. */
13391 if (*end == '\0' && align >= 0 && align < 6)
13392 {
13393 align_branch_prefix_size = align;
13394 break;
13395 }
13396 as_fatal (_("invalid -malign-branch-prefix-size= value: %s"),
13397 arg);
13398 }
13399 break;
13400
13401 case OPTION_MALIGN_BRANCH:
13402 align_branch = 0;
13403 saved = xstrdup (arg);
13404 type = saved;
13405 do
13406 {
13407 next = strchr (type, '+');
13408 if (next)
13409 *next++ = '\0';
13410 if (strcasecmp (type, "jcc") == 0)
13411 align_branch |= align_branch_jcc_bit;
13412 else if (strcasecmp (type, "fused") == 0)
13413 align_branch |= align_branch_fused_bit;
13414 else if (strcasecmp (type, "jmp") == 0)
13415 align_branch |= align_branch_jmp_bit;
13416 else if (strcasecmp (type, "call") == 0)
13417 align_branch |= align_branch_call_bit;
13418 else if (strcasecmp (type, "ret") == 0)
13419 align_branch |= align_branch_ret_bit;
13420 else if (strcasecmp (type, "indirect") == 0)
13421 align_branch |= align_branch_indirect_bit;
13422 else
13423 as_fatal (_("invalid -malign-branch= option: `%s'"), arg);
13424 type = next;
13425 }
13426 while (next != NULL);
13427 free (saved);
13428 break;
13429
13430 case OPTION_MBRANCHES_WITH_32B_BOUNDARIES:
13431 align_branch_power = 5;
13432 align_branch_prefix_size = 5;
13433 align_branch = (align_branch_jcc_bit
13434 | align_branch_fused_bit
13435 | align_branch_jmp_bit);
13436 break;
13437
13438 case OPTION_MAMD64:
13439 isa64 = amd64;
13440 break;
13441
13442 case OPTION_MINTEL64:
13443 isa64 = intel64;
13444 break;
13445
13446 case 'O':
13447 if (arg == NULL)
13448 {
13449 optimize = 1;
13450 /* Turn off -Os. */
13451 optimize_for_space = 0;
13452 }
13453 else if (*arg == 's')
13454 {
13455 optimize_for_space = 1;
13456 /* Turn on all encoding optimizations. */
13457 optimize = INT_MAX;
13458 }
13459 else
13460 {
13461 optimize = atoi (arg);
13462 /* Turn off -Os. */
13463 optimize_for_space = 0;
13464 }
13465 break;
13466
13467 default:
13468 return 0;
13469 }
13470 return 1;
13471 }
13472
13473 #define MESSAGE_TEMPLATE \
13474 " "
13475
13476 static char *
13477 output_message (FILE *stream, char *p, char *message, char *start,
13478 int *left_p, const char *name, int len)
13479 {
13480 int size = sizeof (MESSAGE_TEMPLATE);
13481 int left = *left_p;
13482
13483 /* Reserve 2 spaces for ", " or ",\0" */
13484 left -= len + 2;
13485
13486 /* Check if there is any room. */
13487 if (left >= 0)
13488 {
13489 if (p != start)
13490 {
13491 *p++ = ',';
13492 *p++ = ' ';
13493 }
13494 p = mempcpy (p, name, len);
13495 }
13496 else
13497 {
13498 /* Output the current message now and start a new one. */
13499 *p++ = ',';
13500 *p = '\0';
13501 fprintf (stream, "%s\n", message);
13502 p = start;
13503 left = size - (start - message) - len - 2;
13504
13505 gas_assert (left >= 0);
13506
13507 p = mempcpy (p, name, len);
13508 }
13509
13510 *left_p = left;
13511 return p;
13512 }
13513
13514 static void
13515 show_arch (FILE *stream, int ext, int check)
13516 {
13517 static char message[] = MESSAGE_TEMPLATE;
13518 char *start = message + 27;
13519 char *p;
13520 int size = sizeof (MESSAGE_TEMPLATE);
13521 int left;
13522 const char *name;
13523 int len;
13524 unsigned int j;
13525
13526 p = start;
13527 left = size - (start - message);
13528 for (j = 0; j < ARRAY_SIZE (cpu_arch); j++)
13529 {
13530 /* Should it be skipped? */
13531 if (cpu_arch [j].skip)
13532 continue;
13533
13534 name = cpu_arch [j].name;
13535 len = cpu_arch [j].len;
13536 if (*name == '.')
13537 {
13538 /* It is an extension. Skip if we aren't asked to show it. */
13539 if (ext)
13540 {
13541 name++;
13542 len--;
13543 }
13544 else
13545 continue;
13546 }
13547 else if (ext)
13548 {
13549 /* It is an processor. Skip if we show only extension. */
13550 continue;
13551 }
13552 else if (check && ! cpu_arch[j].flags.bitfield.cpui386)
13553 {
13554 /* It is an impossible processor - skip. */
13555 continue;
13556 }
13557
13558 p = output_message (stream, p, message, start, &left, name, len);
13559 }
13560
13561 /* Display disabled extensions. */
13562 if (ext)
13563 for (j = 0; j < ARRAY_SIZE (cpu_noarch); j++)
13564 {
13565 name = cpu_noarch [j].name;
13566 len = cpu_noarch [j].len;
13567 p = output_message (stream, p, message, start, &left, name,
13568 len);
13569 }
13570
13571 *p = '\0';
13572 fprintf (stream, "%s\n", message);
13573 }
13574
13575 void
13576 md_show_usage (FILE *stream)
13577 {
13578 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13579 fprintf (stream, _("\
13580 -Qy, -Qn ignored\n\
13581 -V print assembler version number\n\
13582 -k ignored\n"));
13583 #endif
13584 fprintf (stream, _("\
13585 -n Do not optimize code alignment\n\
13586 -q quieten some warnings\n"));
13587 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13588 fprintf (stream, _("\
13589 -s ignored\n"));
13590 #endif
13591 #if defined BFD64 && (defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
13592 || defined (TE_PE) || defined (TE_PEP))
13593 fprintf (stream, _("\
13594 --32/--64/--x32 generate 32bit/64bit/x32 code\n"));
13595 #endif
13596 #ifdef SVR4_COMMENT_CHARS
13597 fprintf (stream, _("\
13598 --divide do not treat `/' as a comment character\n"));
13599 #else
13600 fprintf (stream, _("\
13601 --divide ignored\n"));
13602 #endif
13603 fprintf (stream, _("\
13604 -march=CPU[,+EXTENSION...]\n\
13605 generate code for CPU and EXTENSION, CPU is one of:\n"));
13606 show_arch (stream, 0, 1);
13607 fprintf (stream, _("\
13608 EXTENSION is combination of:\n"));
13609 show_arch (stream, 1, 0);
13610 fprintf (stream, _("\
13611 -mtune=CPU optimize for CPU, CPU is one of:\n"));
13612 show_arch (stream, 0, 0);
13613 fprintf (stream, _("\
13614 -msse2avx encode SSE instructions with VEX prefix\n"));
13615 fprintf (stream, _("\
13616 -msse-check=[none|error|warning] (default: warning)\n\
13617 check SSE instructions\n"));
13618 fprintf (stream, _("\
13619 -moperand-check=[none|error|warning] (default: warning)\n\
13620 check operand combinations for validity\n"));
13621 fprintf (stream, _("\
13622 -mavxscalar=[128|256] (default: 128)\n\
13623 encode scalar AVX instructions with specific vector\n\
13624 length\n"));
13625 fprintf (stream, _("\
13626 -mvexwig=[0|1] (default: 0)\n\
13627 encode VEX instructions with specific VEX.W value\n\
13628 for VEX.W bit ignored instructions\n"));
13629 fprintf (stream, _("\
13630 -mevexlig=[128|256|512] (default: 128)\n\
13631 encode scalar EVEX instructions with specific vector\n\
13632 length\n"));
13633 fprintf (stream, _("\
13634 -mevexwig=[0|1] (default: 0)\n\
13635 encode EVEX instructions with specific EVEX.W value\n\
13636 for EVEX.W bit ignored instructions\n"));
13637 fprintf (stream, _("\
13638 -mevexrcig=[rne|rd|ru|rz] (default: rne)\n\
13639 encode EVEX instructions with specific EVEX.RC value\n\
13640 for SAE-only ignored instructions\n"));
13641 fprintf (stream, _("\
13642 -mmnemonic=[att|intel] "));
13643 if (SYSV386_COMPAT)
13644 fprintf (stream, _("(default: att)\n"));
13645 else
13646 fprintf (stream, _("(default: intel)\n"));
13647 fprintf (stream, _("\
13648 use AT&T/Intel mnemonic\n"));
13649 fprintf (stream, _("\
13650 -msyntax=[att|intel] (default: att)\n\
13651 use AT&T/Intel syntax\n"));
13652 fprintf (stream, _("\
13653 -mindex-reg support pseudo index registers\n"));
13654 fprintf (stream, _("\
13655 -mnaked-reg don't require `%%' prefix for registers\n"));
13656 fprintf (stream, _("\
13657 -madd-bnd-prefix add BND prefix for all valid branches\n"));
13658 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13659 fprintf (stream, _("\
13660 -mshared disable branch optimization for shared code\n"));
13661 fprintf (stream, _("\
13662 -mx86-used-note=[no|yes] "));
13663 if (DEFAULT_X86_USED_NOTE)
13664 fprintf (stream, _("(default: yes)\n"));
13665 else
13666 fprintf (stream, _("(default: no)\n"));
13667 fprintf (stream, _("\
13668 generate x86 used ISA and feature properties\n"));
13669 #endif
13670 #if defined (TE_PE) || defined (TE_PEP)
13671 fprintf (stream, _("\
13672 -mbig-obj generate big object files\n"));
13673 #endif
13674 fprintf (stream, _("\
13675 -momit-lock-prefix=[no|yes] (default: no)\n\
13676 strip all lock prefixes\n"));
13677 fprintf (stream, _("\
13678 -mfence-as-lock-add=[no|yes] (default: no)\n\
13679 encode lfence, mfence and sfence as\n\
13680 lock addl $0x0, (%%{re}sp)\n"));
13681 fprintf (stream, _("\
13682 -mrelax-relocations=[no|yes] "));
13683 if (DEFAULT_GENERATE_X86_RELAX_RELOCATIONS)
13684 fprintf (stream, _("(default: yes)\n"));
13685 else
13686 fprintf (stream, _("(default: no)\n"));
13687 fprintf (stream, _("\
13688 generate relax relocations\n"));
13689 fprintf (stream, _("\
13690 -malign-branch-boundary=NUM (default: 0)\n\
13691 align branches within NUM byte boundary\n"));
13692 fprintf (stream, _("\
13693 -malign-branch=TYPE[+TYPE...] (default: jcc+fused+jmp)\n\
13694 TYPE is combination of jcc, fused, jmp, call, ret,\n\
13695 indirect\n\
13696 specify types of branches to align\n"));
13697 fprintf (stream, _("\
13698 -malign-branch-prefix-size=NUM (default: 5)\n\
13699 align branches with NUM prefixes per instruction\n"));
13700 fprintf (stream, _("\
13701 -mbranches-within-32B-boundaries\n\
13702 align branches within 32 byte boundary\n"));
13703 fprintf (stream, _("\
13704 -mlfence-after-load=[no|yes] (default: no)\n\
13705 generate lfence after load\n"));
13706 fprintf (stream, _("\
13707 -mlfence-before-indirect-branch=[none|all|register|memory] (default: none)\n\
13708 generate lfence before indirect near branch\n"));
13709 fprintf (stream, _("\
13710 -mlfence-before-ret=[none|or|not|shl|yes] (default: none)\n\
13711 generate lfence before ret\n"));
13712 fprintf (stream, _("\
13713 -mamd64 accept only AMD64 ISA [default]\n"));
13714 fprintf (stream, _("\
13715 -mintel64 accept only Intel64 ISA\n"));
13716 }
13717
13718 #if ((defined (OBJ_MAYBE_COFF) && defined (OBJ_MAYBE_AOUT)) \
13719 || defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF) \
13720 || defined (TE_PE) || defined (TE_PEP) || defined (OBJ_MACH_O))
13721
13722 /* Pick the target format to use. */
13723
13724 const char *
13725 i386_target_format (void)
13726 {
13727 if (!strncmp (default_arch, "x86_64", 6))
13728 {
13729 update_code_flag (CODE_64BIT, 1);
13730 if (default_arch[6] == '\0')
13731 x86_elf_abi = X86_64_ABI;
13732 else
13733 x86_elf_abi = X86_64_X32_ABI;
13734 }
13735 else if (!strcmp (default_arch, "i386"))
13736 update_code_flag (CODE_32BIT, 1);
13737 else if (!strcmp (default_arch, "iamcu"))
13738 {
13739 update_code_flag (CODE_32BIT, 1);
13740 if (cpu_arch_isa == PROCESSOR_UNKNOWN)
13741 {
13742 static const i386_cpu_flags iamcu_flags = CPU_IAMCU_FLAGS;
13743 cpu_arch_name = "iamcu";
13744 cpu_sub_arch_name = NULL;
13745 cpu_arch_flags = iamcu_flags;
13746 cpu_arch_isa = PROCESSOR_IAMCU;
13747 cpu_arch_isa_flags = iamcu_flags;
13748 if (!cpu_arch_tune_set)
13749 {
13750 cpu_arch_tune = cpu_arch_isa;
13751 cpu_arch_tune_flags = cpu_arch_isa_flags;
13752 }
13753 }
13754 else if (cpu_arch_isa != PROCESSOR_IAMCU)
13755 as_fatal (_("Intel MCU doesn't support `%s' architecture"),
13756 cpu_arch_name);
13757 }
13758 else
13759 as_fatal (_("unknown architecture"));
13760
13761 if (cpu_flags_all_zero (&cpu_arch_isa_flags))
13762 cpu_arch_isa_flags = cpu_arch[flag_code == CODE_64BIT].flags;
13763 if (cpu_flags_all_zero (&cpu_arch_tune_flags))
13764 cpu_arch_tune_flags = cpu_arch[flag_code == CODE_64BIT].flags;
13765
13766 switch (OUTPUT_FLAVOR)
13767 {
13768 #if defined (OBJ_MAYBE_AOUT) || defined (OBJ_AOUT)
13769 case bfd_target_aout_flavour:
13770 return AOUT_TARGET_FORMAT;
13771 #endif
13772 #if defined (OBJ_MAYBE_COFF) || defined (OBJ_COFF)
13773 # if defined (TE_PE) || defined (TE_PEP)
13774 case bfd_target_coff_flavour:
13775 if (flag_code == CODE_64BIT)
13776 return use_big_obj ? "pe-bigobj-x86-64" : "pe-x86-64";
13777 else
13778 return use_big_obj ? "pe-bigobj-i386" : "pe-i386";
13779 # elif defined (TE_GO32)
13780 case bfd_target_coff_flavour:
13781 return "coff-go32";
13782 # else
13783 case bfd_target_coff_flavour:
13784 return "coff-i386";
13785 # endif
13786 #endif
13787 #if defined (OBJ_MAYBE_ELF) || defined (OBJ_ELF)
13788 case bfd_target_elf_flavour:
13789 {
13790 const char *format;
13791
13792 switch (x86_elf_abi)
13793 {
13794 default:
13795 format = ELF_TARGET_FORMAT;
13796 #ifndef TE_SOLARIS
13797 tls_get_addr = "___tls_get_addr";
13798 #endif
13799 break;
13800 case X86_64_ABI:
13801 use_rela_relocations = 1;
13802 object_64bit = 1;
13803 #ifndef TE_SOLARIS
13804 tls_get_addr = "__tls_get_addr";
13805 #endif
13806 format = ELF_TARGET_FORMAT64;
13807 break;
13808 case X86_64_X32_ABI:
13809 use_rela_relocations = 1;
13810 object_64bit = 1;
13811 #ifndef TE_SOLARIS
13812 tls_get_addr = "__tls_get_addr";
13813 #endif
13814 disallow_64bit_reloc = 1;
13815 format = ELF_TARGET_FORMAT32;
13816 break;
13817 }
13818 if (cpu_arch_isa == PROCESSOR_L1OM)
13819 {
13820 if (x86_elf_abi != X86_64_ABI)
13821 as_fatal (_("Intel L1OM is 64bit only"));
13822 return ELF_TARGET_L1OM_FORMAT;
13823 }
13824 else if (cpu_arch_isa == PROCESSOR_K1OM)
13825 {
13826 if (x86_elf_abi != X86_64_ABI)
13827 as_fatal (_("Intel K1OM is 64bit only"));
13828 return ELF_TARGET_K1OM_FORMAT;
13829 }
13830 else if (cpu_arch_isa == PROCESSOR_IAMCU)
13831 {
13832 if (x86_elf_abi != I386_ABI)
13833 as_fatal (_("Intel MCU is 32bit only"));
13834 return ELF_TARGET_IAMCU_FORMAT;
13835 }
13836 else
13837 return format;
13838 }
13839 #endif
13840 #if defined (OBJ_MACH_O)
13841 case bfd_target_mach_o_flavour:
13842 if (flag_code == CODE_64BIT)
13843 {
13844 use_rela_relocations = 1;
13845 object_64bit = 1;
13846 return "mach-o-x86-64";
13847 }
13848 else
13849 return "mach-o-i386";
13850 #endif
13851 default:
13852 abort ();
13853 return NULL;
13854 }
13855 }
13856
13857 #endif /* OBJ_MAYBE_ more than one */
13858 \f
13859 symbolS *
13860 md_undefined_symbol (char *name)
13861 {
13862 if (name[0] == GLOBAL_OFFSET_TABLE_NAME[0]
13863 && name[1] == GLOBAL_OFFSET_TABLE_NAME[1]
13864 && name[2] == GLOBAL_OFFSET_TABLE_NAME[2]
13865 && strcmp (name, GLOBAL_OFFSET_TABLE_NAME) == 0)
13866 {
13867 if (!GOT_symbol)
13868 {
13869 if (symbol_find (name))
13870 as_bad (_("GOT already in symbol table"));
13871 GOT_symbol = symbol_new (name, undefined_section,
13872 &zero_address_frag, 0);
13873 };
13874 return GOT_symbol;
13875 }
13876 return 0;
13877 }
13878
13879 /* Round up a section size to the appropriate boundary. */
13880
13881 valueT
13882 md_section_align (segT segment ATTRIBUTE_UNUSED, valueT size)
13883 {
13884 #if (defined (OBJ_AOUT) || defined (OBJ_MAYBE_AOUT))
13885 if (OUTPUT_FLAVOR == bfd_target_aout_flavour)
13886 {
13887 /* For a.out, force the section size to be aligned. If we don't do
13888 this, BFD will align it for us, but it will not write out the
13889 final bytes of the section. This may be a bug in BFD, but it is
13890 easier to fix it here since that is how the other a.out targets
13891 work. */
13892 int align;
13893
13894 align = bfd_section_alignment (segment);
13895 size = ((size + (1 << align) - 1) & (-((valueT) 1 << align)));
13896 }
13897 #endif
13898
13899 return size;
13900 }
13901
13902 /* On the i386, PC-relative offsets are relative to the start of the
13903 next instruction. That is, the address of the offset, plus its
13904 size, since the offset is always the last part of the insn. */
13905
13906 long
13907 md_pcrel_from (fixS *fixP)
13908 {
13909 return fixP->fx_size + fixP->fx_where + fixP->fx_frag->fr_address;
13910 }
13911
13912 #ifndef I386COFF
13913
13914 static void
13915 s_bss (int ignore ATTRIBUTE_UNUSED)
13916 {
13917 int temp;
13918
13919 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13920 if (IS_ELF)
13921 obj_elf_section_change_hook ();
13922 #endif
13923 temp = get_absolute_expression ();
13924 subseg_set (bss_section, (subsegT) temp);
13925 demand_empty_rest_of_line ();
13926 }
13927
13928 #endif
13929
13930 /* Remember constant directive. */
13931
13932 void
13933 i386_cons_align (int ignore ATTRIBUTE_UNUSED)
13934 {
13935 if (last_insn.kind != last_insn_directive
13936 && (bfd_section_flags (now_seg) & SEC_CODE))
13937 {
13938 last_insn.seg = now_seg;
13939 last_insn.kind = last_insn_directive;
13940 last_insn.name = "constant directive";
13941 last_insn.file = as_where (&last_insn.line);
13942 if (lfence_before_ret != lfence_before_ret_none)
13943 {
13944 if (lfence_before_indirect_branch != lfence_branch_none)
13945 as_warn (_("constant directive skips -mlfence-before-ret "
13946 "and -mlfence-before-indirect-branch"));
13947 else
13948 as_warn (_("constant directive skips -mlfence-before-ret"));
13949 }
13950 else if (lfence_before_indirect_branch != lfence_branch_none)
13951 as_warn (_("constant directive skips -mlfence-before-indirect-branch"));
13952 }
13953 }
13954
13955 void
13956 i386_validate_fix (fixS *fixp)
13957 {
13958 if (fixp->fx_subsy)
13959 {
13960 if (fixp->fx_subsy == GOT_symbol)
13961 {
13962 if (fixp->fx_r_type == BFD_RELOC_32_PCREL)
13963 {
13964 if (!object_64bit)
13965 abort ();
13966 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13967 if (fixp->fx_tcbit2)
13968 fixp->fx_r_type = (fixp->fx_tcbit
13969 ? BFD_RELOC_X86_64_REX_GOTPCRELX
13970 : BFD_RELOC_X86_64_GOTPCRELX);
13971 else
13972 #endif
13973 fixp->fx_r_type = BFD_RELOC_X86_64_GOTPCREL;
13974 }
13975 else
13976 {
13977 if (!object_64bit)
13978 fixp->fx_r_type = BFD_RELOC_386_GOTOFF;
13979 else
13980 fixp->fx_r_type = BFD_RELOC_X86_64_GOTOFF64;
13981 }
13982 fixp->fx_subsy = 0;
13983 }
13984 }
13985 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
13986 else
13987 {
13988 /* NB: Commit 292676c1 resolved PLT32 reloc aganst local symbol
13989 to section. Since PLT32 relocation must be against symbols,
13990 turn such PLT32 relocation into PC32 relocation. */
13991 if (fixp->fx_addsy
13992 && (fixp->fx_r_type == BFD_RELOC_386_PLT32
13993 || fixp->fx_r_type == BFD_RELOC_X86_64_PLT32)
13994 && symbol_section_p (fixp->fx_addsy))
13995 fixp->fx_r_type = BFD_RELOC_32_PCREL;
13996 if (!object_64bit)
13997 {
13998 if (fixp->fx_r_type == BFD_RELOC_386_GOT32
13999 && fixp->fx_tcbit2)
14000 fixp->fx_r_type = BFD_RELOC_386_GOT32X;
14001 }
14002 }
14003 #endif
14004 }
14005
14006 arelent *
14007 tc_gen_reloc (asection *section ATTRIBUTE_UNUSED, fixS *fixp)
14008 {
14009 arelent *rel;
14010 bfd_reloc_code_real_type code;
14011
14012 switch (fixp->fx_r_type)
14013 {
14014 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
14015 case BFD_RELOC_SIZE32:
14016 case BFD_RELOC_SIZE64:
14017 if (S_IS_DEFINED (fixp->fx_addsy)
14018 && !S_IS_EXTERNAL (fixp->fx_addsy))
14019 {
14020 /* Resolve size relocation against local symbol to size of
14021 the symbol plus addend. */
14022 valueT value = S_GET_SIZE (fixp->fx_addsy) + fixp->fx_offset;
14023 if (fixp->fx_r_type == BFD_RELOC_SIZE32
14024 && !fits_in_unsigned_long (value))
14025 as_bad_where (fixp->fx_file, fixp->fx_line,
14026 _("symbol size computation overflow"));
14027 fixp->fx_addsy = NULL;
14028 fixp->fx_subsy = NULL;
14029 md_apply_fix (fixp, (valueT *) &value, NULL);
14030 return NULL;
14031 }
14032 #endif
14033 /* Fall through. */
14034
14035 case BFD_RELOC_X86_64_PLT32:
14036 case BFD_RELOC_X86_64_GOT32:
14037 case BFD_RELOC_X86_64_GOTPCREL:
14038 case BFD_RELOC_X86_64_GOTPCRELX:
14039 case BFD_RELOC_X86_64_REX_GOTPCRELX:
14040 case BFD_RELOC_386_PLT32:
14041 case BFD_RELOC_386_GOT32:
14042 case BFD_RELOC_386_GOT32X:
14043 case BFD_RELOC_386_GOTOFF:
14044 case BFD_RELOC_386_GOTPC:
14045 case BFD_RELOC_386_TLS_GD:
14046 case BFD_RELOC_386_TLS_LDM:
14047 case BFD_RELOC_386_TLS_LDO_32:
14048 case BFD_RELOC_386_TLS_IE_32:
14049 case BFD_RELOC_386_TLS_IE:
14050 case BFD_RELOC_386_TLS_GOTIE:
14051 case BFD_RELOC_386_TLS_LE_32:
14052 case BFD_RELOC_386_TLS_LE:
14053 case BFD_RELOC_386_TLS_GOTDESC:
14054 case BFD_RELOC_386_TLS_DESC_CALL:
14055 case BFD_RELOC_X86_64_TLSGD:
14056 case BFD_RELOC_X86_64_TLSLD:
14057 case BFD_RELOC_X86_64_DTPOFF32:
14058 case BFD_RELOC_X86_64_DTPOFF64:
14059 case BFD_RELOC_X86_64_GOTTPOFF:
14060 case BFD_RELOC_X86_64_TPOFF32:
14061 case BFD_RELOC_X86_64_TPOFF64:
14062 case BFD_RELOC_X86_64_GOTOFF64:
14063 case BFD_RELOC_X86_64_GOTPC32:
14064 case BFD_RELOC_X86_64_GOT64:
14065 case BFD_RELOC_X86_64_GOTPCREL64:
14066 case BFD_RELOC_X86_64_GOTPC64:
14067 case BFD_RELOC_X86_64_GOTPLT64:
14068 case BFD_RELOC_X86_64_PLTOFF64:
14069 case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
14070 case BFD_RELOC_X86_64_TLSDESC_CALL:
14071 case BFD_RELOC_RVA:
14072 case BFD_RELOC_VTABLE_ENTRY:
14073 case BFD_RELOC_VTABLE_INHERIT:
14074 #ifdef TE_PE
14075 case BFD_RELOC_32_SECREL:
14076 #endif
14077 code = fixp->fx_r_type;
14078 break;
14079 case BFD_RELOC_X86_64_32S:
14080 if (!fixp->fx_pcrel)
14081 {
14082 /* Don't turn BFD_RELOC_X86_64_32S into BFD_RELOC_32. */
14083 code = fixp->fx_r_type;
14084 break;
14085 }
14086 /* Fall through. */
14087 default:
14088 if (fixp->fx_pcrel)
14089 {
14090 switch (fixp->fx_size)
14091 {
14092 default:
14093 as_bad_where (fixp->fx_file, fixp->fx_line,
14094 _("can not do %d byte pc-relative relocation"),
14095 fixp->fx_size);
14096 code = BFD_RELOC_32_PCREL;
14097 break;
14098 case 1: code = BFD_RELOC_8_PCREL; break;
14099 case 2: code = BFD_RELOC_16_PCREL; break;
14100 case 4: code = BFD_RELOC_32_PCREL; break;
14101 #ifdef BFD64
14102 case 8: code = BFD_RELOC_64_PCREL; break;
14103 #endif
14104 }
14105 }
14106 else
14107 {
14108 switch (fixp->fx_size)
14109 {
14110 default:
14111 as_bad_where (fixp->fx_file, fixp->fx_line,
14112 _("can not do %d byte relocation"),
14113 fixp->fx_size);
14114 code = BFD_RELOC_32;
14115 break;
14116 case 1: code = BFD_RELOC_8; break;
14117 case 2: code = BFD_RELOC_16; break;
14118 case 4: code = BFD_RELOC_32; break;
14119 #ifdef BFD64
14120 case 8: code = BFD_RELOC_64; break;
14121 #endif
14122 }
14123 }
14124 break;
14125 }
14126
14127 if ((code == BFD_RELOC_32
14128 || code == BFD_RELOC_32_PCREL
14129 || code == BFD_RELOC_X86_64_32S)
14130 && GOT_symbol
14131 && fixp->fx_addsy == GOT_symbol)
14132 {
14133 if (!object_64bit)
14134 code = BFD_RELOC_386_GOTPC;
14135 else
14136 code = BFD_RELOC_X86_64_GOTPC32;
14137 }
14138 if ((code == BFD_RELOC_64 || code == BFD_RELOC_64_PCREL)
14139 && GOT_symbol
14140 && fixp->fx_addsy == GOT_symbol)
14141 {
14142 code = BFD_RELOC_X86_64_GOTPC64;
14143 }
14144
14145 rel = XNEW (arelent);
14146 rel->sym_ptr_ptr = XNEW (asymbol *);
14147 *rel->sym_ptr_ptr = symbol_get_bfdsym (fixp->fx_addsy);
14148
14149 rel->address = fixp->fx_frag->fr_address + fixp->fx_where;
14150
14151 if (!use_rela_relocations)
14152 {
14153 /* HACK: Since i386 ELF uses Rel instead of Rela, encode the
14154 vtable entry to be used in the relocation's section offset. */
14155 if (fixp->fx_r_type == BFD_RELOC_VTABLE_ENTRY)
14156 rel->address = fixp->fx_offset;
14157 #if defined (OBJ_COFF) && defined (TE_PE)
14158 else if (fixp->fx_addsy && S_IS_WEAK (fixp->fx_addsy))
14159 rel->addend = fixp->fx_addnumber - (S_GET_VALUE (fixp->fx_addsy) * 2);
14160 else
14161 #endif
14162 rel->addend = 0;
14163 }
14164 /* Use the rela in 64bit mode. */
14165 else
14166 {
14167 if (disallow_64bit_reloc)
14168 switch (code)
14169 {
14170 case BFD_RELOC_X86_64_DTPOFF64:
14171 case BFD_RELOC_X86_64_TPOFF64:
14172 case BFD_RELOC_64_PCREL:
14173 case BFD_RELOC_X86_64_GOTOFF64:
14174 case BFD_RELOC_X86_64_GOT64:
14175 case BFD_RELOC_X86_64_GOTPCREL64:
14176 case BFD_RELOC_X86_64_GOTPC64:
14177 case BFD_RELOC_X86_64_GOTPLT64:
14178 case BFD_RELOC_X86_64_PLTOFF64:
14179 as_bad_where (fixp->fx_file, fixp->fx_line,
14180 _("cannot represent relocation type %s in x32 mode"),
14181 bfd_get_reloc_code_name (code));
14182 break;
14183 default:
14184 break;
14185 }
14186
14187 if (!fixp->fx_pcrel)
14188 rel->addend = fixp->fx_offset;
14189 else
14190 switch (code)
14191 {
14192 case BFD_RELOC_X86_64_PLT32:
14193 case BFD_RELOC_X86_64_GOT32:
14194 case BFD_RELOC_X86_64_GOTPCREL:
14195 case BFD_RELOC_X86_64_GOTPCRELX:
14196 case BFD_RELOC_X86_64_REX_GOTPCRELX:
14197 case BFD_RELOC_X86_64_TLSGD:
14198 case BFD_RELOC_X86_64_TLSLD:
14199 case BFD_RELOC_X86_64_GOTTPOFF:
14200 case BFD_RELOC_X86_64_GOTPC32_TLSDESC:
14201 case BFD_RELOC_X86_64_TLSDESC_CALL:
14202 rel->addend = fixp->fx_offset - fixp->fx_size;
14203 break;
14204 default:
14205 rel->addend = (section->vma
14206 - fixp->fx_size
14207 + fixp->fx_addnumber
14208 + md_pcrel_from (fixp));
14209 break;
14210 }
14211 }
14212
14213 rel->howto = bfd_reloc_type_lookup (stdoutput, code);
14214 if (rel->howto == NULL)
14215 {
14216 as_bad_where (fixp->fx_file, fixp->fx_line,
14217 _("cannot represent relocation type %s"),
14218 bfd_get_reloc_code_name (code));
14219 /* Set howto to a garbage value so that we can keep going. */
14220 rel->howto = bfd_reloc_type_lookup (stdoutput, BFD_RELOC_32);
14221 gas_assert (rel->howto != NULL);
14222 }
14223
14224 return rel;
14225 }
14226
14227 #include "tc-i386-intel.c"
14228
14229 void
14230 tc_x86_parse_to_dw2regnum (expressionS *exp)
14231 {
14232 int saved_naked_reg;
14233 char saved_register_dot;
14234
14235 saved_naked_reg = allow_naked_reg;
14236 allow_naked_reg = 1;
14237 saved_register_dot = register_chars['.'];
14238 register_chars['.'] = '.';
14239 allow_pseudo_reg = 1;
14240 expression_and_evaluate (exp);
14241 allow_pseudo_reg = 0;
14242 register_chars['.'] = saved_register_dot;
14243 allow_naked_reg = saved_naked_reg;
14244
14245 if (exp->X_op == O_register && exp->X_add_number >= 0)
14246 {
14247 if ((addressT) exp->X_add_number < i386_regtab_size)
14248 {
14249 exp->X_op = O_constant;
14250 exp->X_add_number = i386_regtab[exp->X_add_number]
14251 .dw2_regnum[flag_code >> 1];
14252 }
14253 else
14254 exp->X_op = O_illegal;
14255 }
14256 }
14257
14258 void
14259 tc_x86_frame_initial_instructions (void)
14260 {
14261 static unsigned int sp_regno[2];
14262
14263 if (!sp_regno[flag_code >> 1])
14264 {
14265 char *saved_input = input_line_pointer;
14266 char sp[][4] = {"esp", "rsp"};
14267 expressionS exp;
14268
14269 input_line_pointer = sp[flag_code >> 1];
14270 tc_x86_parse_to_dw2regnum (&exp);
14271 gas_assert (exp.X_op == O_constant);
14272 sp_regno[flag_code >> 1] = exp.X_add_number;
14273 input_line_pointer = saved_input;
14274 }
14275
14276 cfi_add_CFA_def_cfa (sp_regno[flag_code >> 1], -x86_cie_data_alignment);
14277 cfi_add_CFA_offset (x86_dwarf2_return_column, x86_cie_data_alignment);
14278 }
14279
14280 int
14281 x86_dwarf2_addr_size (void)
14282 {
14283 #if defined (OBJ_MAYBE_ELF) || defined (OBJ_ELF)
14284 if (x86_elf_abi == X86_64_X32_ABI)
14285 return 4;
14286 #endif
14287 return bfd_arch_bits_per_address (stdoutput) / 8;
14288 }
14289
14290 int
14291 i386_elf_section_type (const char *str, size_t len)
14292 {
14293 if (flag_code == CODE_64BIT
14294 && len == sizeof ("unwind") - 1
14295 && strncmp (str, "unwind", 6) == 0)
14296 return SHT_X86_64_UNWIND;
14297
14298 return -1;
14299 }
14300
14301 #ifdef TE_SOLARIS
14302 void
14303 i386_solaris_fix_up_eh_frame (segT sec)
14304 {
14305 if (flag_code == CODE_64BIT)
14306 elf_section_type (sec) = SHT_X86_64_UNWIND;
14307 }
14308 #endif
14309
14310 #ifdef TE_PE
14311 void
14312 tc_pe_dwarf2_emit_offset (symbolS *symbol, unsigned int size)
14313 {
14314 expressionS exp;
14315
14316 exp.X_op = O_secrel;
14317 exp.X_add_symbol = symbol;
14318 exp.X_add_number = 0;
14319 emit_expr (&exp, size);
14320 }
14321 #endif
14322
14323 #if defined (OBJ_ELF) || defined (OBJ_MAYBE_ELF)
14324 /* For ELF on x86-64, add support for SHF_X86_64_LARGE. */
14325
14326 bfd_vma
14327 x86_64_section_letter (int letter, const char **ptr_msg)
14328 {
14329 if (flag_code == CODE_64BIT)
14330 {
14331 if (letter == 'l')
14332 return SHF_X86_64_LARGE;
14333
14334 *ptr_msg = _("bad .section directive: want a,l,w,x,M,S,G,T in string");
14335 }
14336 else
14337 *ptr_msg = _("bad .section directive: want a,w,x,M,S,G,T in string");
14338 return -1;
14339 }
14340
14341 bfd_vma
14342 x86_64_section_word (char *str, size_t len)
14343 {
14344 if (len == 5 && flag_code == CODE_64BIT && startswith (str, "large"))
14345 return SHF_X86_64_LARGE;
14346
14347 return -1;
14348 }
14349
14350 static void
14351 handle_large_common (int small ATTRIBUTE_UNUSED)
14352 {
14353 if (flag_code != CODE_64BIT)
14354 {
14355 s_comm_internal (0, elf_common_parse);
14356 as_warn (_(".largecomm supported only in 64bit mode, producing .comm"));
14357 }
14358 else
14359 {
14360 static segT lbss_section;
14361 asection *saved_com_section_ptr = elf_com_section_ptr;
14362 asection *saved_bss_section = bss_section;
14363
14364 if (lbss_section == NULL)
14365 {
14366 flagword applicable;
14367 segT seg = now_seg;
14368 subsegT subseg = now_subseg;
14369
14370 /* The .lbss section is for local .largecomm symbols. */
14371 lbss_section = subseg_new (".lbss", 0);
14372 applicable = bfd_applicable_section_flags (stdoutput);
14373 bfd_set_section_flags (lbss_section, applicable & SEC_ALLOC);
14374 seg_info (lbss_section)->bss = 1;
14375
14376 subseg_set (seg, subseg);
14377 }
14378
14379 elf_com_section_ptr = &_bfd_elf_large_com_section;
14380 bss_section = lbss_section;
14381
14382 s_comm_internal (0, elf_common_parse);
14383
14384 elf_com_section_ptr = saved_com_section_ptr;
14385 bss_section = saved_bss_section;
14386 }
14387 }
14388 #endif /* OBJ_ELF || OBJ_MAYBE_ELF */